{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "774ce7da",
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "import numpy as np"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "33c0553e",
   "metadata": {},
   "source": [
    "## PubHealth processing"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "b02bd9eb",
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "     claim_id                                              claim  \\\n",
      "0       15661  \"The money the Clinton Foundation took from fr...   \n",
      "1        9893    Annual Mammograms May Have More False-Positives   \n",
      "2       11358  SBRT Offers Prostate Cancer Patients High Canc...   \n",
      "3       10166  Study: Vaccine for Breast, Ovarian Cancer Has ...   \n",
      "4       11276  Some appendicitis cases may not require ’emerg...   \n",
      "...       ...                                                ...   \n",
      "9827    35948  The Sturgis motorcycle rally in 2020 resulted ...   \n",
      "9828      401  AstraZeneca's infant respiratory drug prioriti...   \n",
      "9829     2023  Testicular cancer deaths double with after 40 ...   \n",
      "9830    38118   The FDA published “conclusive proof” that the...   \n",
      "9831    24750  On whether he wrote a provision that allowed A...   \n",
      "\n",
      "          date_published                                        explanation  \\\n",
      "0         April 26, 2015  \"Gingrich said the Clinton Foundation \"\"took m...   \n",
      "1       October 18, 2011  This article reports on the results of a study...   \n",
      "2     September 28, 2016  This news release describes five-year outcomes...   \n",
      "3       November 8, 2011  While the story does many things well, the ove...   \n",
      "4     September 20, 2010  We really don’t understand why only a handful ...   \n",
      "...                  ...                                                ...   \n",
      "9827  September 10, 2020  They want to know if mass-events (protests, co...   \n",
      "9828  September 25, 1995  Britain’s AstraZeneca said a potential medicin...   \n",
      "9829   February 10, 2011  Men diagnosed with testicular cancer at 40 yea...   \n",
      "9830   November 22, 2017  FDA Confirms DTaP Vaccine Causes Autism in Nov...   \n",
      "9831      March 23, 2009  Dodd flip-flopped on whether he changed amendm...   \n",
      "\n",
      "                                          fact_checkers  \\\n",
      "0                                         Katie Sanders   \n",
      "1                                                         \n",
      "2     Mary Chris Jaklevic,Steven J. Atlas, MD, MPH,K...   \n",
      "3                                                         \n",
      "4                                                         \n",
      "...                                                 ...   \n",
      "9827                                           Dan Evon   \n",
      "9828                                                      \n",
      "9829                                                      \n",
      "9830                              Rich Buhler & Staff     \n",
      "9831                                     Alexander Lane   \n",
      "\n",
      "                                              main_text  \\\n",
      "0     \"Hillary Clinton is in the political crosshair...   \n",
      "1     While the financial costs of screening mammogr...   \n",
      "2     The news release quotes lead researcher Robert...   \n",
      "3     The story does discuss costs, but the framing ...   \n",
      "4     \"Although the story didn’t cite the cost of ap...   \n",
      "...                                                 ...   \n",
      "9827  In September 2020, social media was abuzz over...   \n",
      "9828  The “Breakthrough Therapy” and “Prime” designa...   \n",
      "9829  This was true even when initial treatment and ...   \n",
      "9830  The FDA hasn’t confirmed a link between DTaP v...   \n",
      "9831  \"Sen. Chris Dodd has been  widely panned  as t...   \n",
      "\n",
      "                                                sources     label  \\\n",
      "0     https://www.wsj.com/articles/clinton-foundatio...     false   \n",
      "1                                                         mixture   \n",
      "2     https://www.healthnewsreview.org/wp-content/up...   mixture   \n",
      "3     http://clinicaltrials.gov/ct2/results?term=can...      true   \n",
      "4                                                            true   \n",
      "...                                                 ...       ...   \n",
      "9827                                                     unproven   \n",
      "9828                                                         true   \n",
      "9829                               http://bit.ly/fGNEw9      true   \n",
      "9830  https://www.truthorfiction.com/marshall-kamena...     false   \n",
      "9831  https://www.nytimes.com/2009/03/20/nyregion/20...     false   \n",
      "\n",
      "                                         subjects  \n",
      "0     Foreign Policy, PunditFact, Newt Gingrich,   \n",
      "1                  Screening,WebMD,women's health  \n",
      "2         Association/Society news release,Cancer  \n",
      "3                     Cancer,WebMD,women's health  \n",
      "4                                                  \n",
      "...                                           ...  \n",
      "9827                   Politics Medical, COVID-19  \n",
      "9828                                  Health News  \n",
      "9829                                  Health News  \n",
      "9830                                      Medical  \n",
      "9831              National, Economy, Chris Dodd,   \n",
      "\n",
      "[9832 rows x 9 columns]\n"
     ]
    }
   ],
   "source": [
    "import pandas as pd\n",
    "\n",
    "df = pd.read_csv('PUBHEALTH/train.tsv', sep='\\t')\n",
    "print(df)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "973f5f33",
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "      Unnamed: 0  claim_id                                              claim  \\\n",
      "0              0     33456  A mother revealed to her child in a letter aft...   \n",
      "1              1      2542  Study says too many Americans still drink too ...   \n",
      "2              2     26678  Viral image Says 80% of novel coronavirus case...   \n",
      "3              3     40705  An email says that 9-year old Craig Shergold o...   \n",
      "4              4     35718  Employees at a Five Guys restaurant in Daphne,...   \n",
      "...          ...       ...                                                ...   \n",
      "1230        1230      3295  Christmas miracle for Florida dog whose heart ...   \n",
      "1231        1231      6904  Another dolphin dies at Arizona aquatic facility.   \n",
      "1232        1232     13874  What the facts say\" is ... \"the best scenario ...   \n",
      "1233        1233      2847  FDA advisory panel rejects J&J drug for acute ...   \n",
      "1234        1234      7394  Gene-editing Chinese scientist kept much of hi...   \n",
      "\n",
      "         date_published                                        explanation  \\\n",
      "0      November 6, 2011  The one-eyed mother story expounds upon two mo...   \n",
      "1     February 25, 2013  On any given day in the United States, 18 perc...   \n",
      "2        March 13, 2020  The website Information is Beautiful published...   \n",
      "3        March 16, 2015  Send greeting or business cards to cancer vict...   \n",
      "4         July 15, 2020  What's undetermined: As of this writing, Five ...   \n",
      "...                 ...                                                ...   \n",
      "1230                NaN  A Florida man was hoping for a Christmas mirac...   \n",
      "1231                NaN  A fourth dolphin has died at a Phoenix-area aq...   \n",
      "1232      July 17, 2016  Priebus said, \"What the facts say\" is ... \"the...   \n",
      "1233   January 16, 2014  Johnson & Johnson’s anticoagulant Xarelto shou...   \n",
      "1234                NaN  The Chinese scientist who says he helped make ...   \n",
      "\n",
      "                fact_checkers  \\\n",
      "0             David Mikkelson   \n",
      "1                               \n",
      "2                 Paul Specht   \n",
      "3       Rich Buhler & Staff     \n",
      "4                Dan MacGuill   \n",
      "...                       ...   \n",
      "1230         Associated Press   \n",
      "1231                            \n",
      "1232           Lauren Carroll   \n",
      "1233                            \n",
      "1234         Christina Larson   \n",
      "\n",
      "                                              main_text  \\\n",
      "0     In April 2005, we spotted a tearjerker on the ...   \n",
      "1     That means the great majority of Americans sta...   \n",
      "2     Amid the spread of the novel coronavirus, many...   \n",
      "3     Craig Shergold is real and             in 1989...   \n",
      "4     In July 2020, amid a new wave of nationwide pr...   \n",
      "...                                                 ...   \n",
      "1230  The heart of Gerald Ford’s 1-year-old French b...   \n",
      "1231  A statement from Dolphinaris Arizona in Scotts...   \n",
      "1232  Republican National Committee chairman Reince ...   \n",
      "1233  The panel voted 10 to 0, with one abstention, ...   \n",
      "1234  He Jiankui’s outsized aspirations began to tak...   \n",
      "\n",
      "                                                sources     label  \\\n",
      "0                                                           false   \n",
      "1                                  http://bit.ly/X1NVtW      true   \n",
      "2     https://www.facebook.com/informationisbeautifu...      true   \n",
      "3     https://www.reddit.com/submit?url=https%3A%2F%...     false   \n",
      "4                                                        unproven   \n",
      "...                                                 ...       ...   \n",
      "1230  https://www.gainesville.com/news/20200102/holi...      true   \n",
      "1231                                                         true   \n",
      "1232  https://www.nytimes.com/2016/07/13/us/politics...     false   \n",
      "1233                                                         true   \n",
      "1234  https://twitter.com/larsonchristina,http://bit...      true   \n",
      "\n",
      "                                               subjects  \n",
      "0                                        Glurge Gallery  \n",
      "1                                           Health News  \n",
      "2      Facebook Fact-checks, Coronavirus, Viral image,   \n",
      "3                                  Inspirational, Pleas  \n",
      "4                                       Law Enforcement  \n",
      "...                                                 ...  \n",
      "1230  Animals, Health, Florida, General News, Gaines...  \n",
      "1231        Arizona, Animals, Phoenix, Health, Dolphins  \n",
      "1232  National, Children, Race and Ethnicity, Reince...  \n",
      "1233                                        Health News  \n",
      "1234  AP Top News, Health, Genetic Frontiers, Medica...  \n",
      "\n",
      "[1235 rows x 10 columns]\n"
     ]
    }
   ],
   "source": [
    "import pandas as pd\n",
    "\n",
    "df = pd.read_csv('PUBHEALTH/test.tsv', sep='\\t')\n",
    "\n",
    "print(df)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "42add563",
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "     claim_id                                              claim  \\\n",
      "0       34656   A baby died at an unnamed medical facility be...   \n",
      "1        3632  Bat from Shawnee County tests positive for rab...   \n",
      "2       29558  Germany has banned pork from school canteens b...   \n",
      "3        8416  Coronavirus prompts Canada to roll out safe dr...   \n",
      "4        7169  Wayne National Forest plans fires for tree, wi...   \n",
      "...       ...                                                ...   \n",
      "1216    39818   There are reports of suicides   and even murd...   \n",
      "1217    15793  The state of Florida has seen \"double-digit dr...   \n",
      "1218     5271  Officials probe respiratory illness at Quincy ...   \n",
      "1219     9002  Sylentis announces the results of tivanisiran ...   \n",
      "1220     4459  US regulators clear path for genetically modif...   \n",
      "\n",
      "         date_published                                        explanation  \\\n",
      "0     November 10, 2015  Fellow Twitter users suggested @FierceFemtivis...   \n",
      "1                   NaN  A bat found in northeastern Kansas has tested ...   \n",
      "2         March 7, 2016  What's true: Some politicians complained that ...   \n",
      "3        April 16, 2020  Canada’s Pacific province of British Columbia ...   \n",
      "4                   NaN  Nearly 2,000 acres of Wayne National Forest in...   \n",
      "...                 ...                                                ...   \n",
      "1216     March 17, 2015  Deadly Aftermath of Harold Camping's May 21, 2...   \n",
      "1217     March 18, 2015  Pitman said Florida has seen \"double-digit dro...   \n",
      "1218                NaN  State officials are investigating several case...   \n",
      "1219       May 10, 2018  This news release focuses on a study of a new ...   \n",
      "1220                NaN  U.S. regulators on Friday gave the green light...   \n",
      "\n",
      "                                          fact_checkers  \\\n",
      "0                                          Kim LaCapria   \n",
      "1                                                         \n",
      "2                                          Kim LaCapria   \n",
      "3                                        Tessa Vikander   \n",
      "4                                                         \n",
      "...                                                 ...   \n",
      "1216                        \\n\\nRich Buhler & Staff\\n\\n   \n",
      "1217                                      Joshua Gillin   \n",
      "1218                                                      \n",
      "1219  Earle Holland,Harold J. DeMonaco, MS,Kathlyn S...   \n",
      "1220                                       Candice Choi   \n",
      "\n",
      "                                              main_text  \\\n",
      "0     On 8 November 2015, former Twitter user @Fierc...   \n",
      "1     Topeka television station KSNT reports that th...   \n",
      "2     On 7 March 2016, British tabloid Express repor...   \n",
      "3     In March, the Canadian government urged provin...   \n",
      "4     Forest officials say scientists who study nati...   \n",
      "...                                                 ...   \n",
      "1216  Harold Camping is a   self-taught Bible teache...   \n",
      "1217  As the Legislature considers changing rules fo...   \n",
      "1218  The (Quincy) Herald-Whig reports the departmen...   \n",
      "1219  There is no discussion of the potential cost o...   \n",
      "1220  The Food and Drug Administration said it lifte...   \n",
      "\n",
      "                                                sources     label  \\\n",
      "0     http://webcache.googleusercontent.com/search?q...  unproven   \n",
      "1     https://www.ksnt.com/news/bat-tests-positive-f...      true   \n",
      "2     http://bnp.org.uk/news/regional/bnp-victory-br...     false   \n",
      "3                                                            true   \n",
      "4                                                            true   \n",
      "...                                                 ...       ...   \n",
      "1216  https://www.truthorfiction.com/category/crime-...   mixture   \n",
      "1217  http://www.cdc.gov/mmwr/pdf/ss/ss6304.pdf, htt...      true   \n",
      "1218  https://www.whig.com/20190817/agencies-report-...      true   \n",
      "1219  https://www.healthnewsreview.org/wp-content/up...   mixture   \n",
      "1220  https://www.ap.org/press-releases/2018/ap-hhmi...      true   \n",
      "\n",
      "                                               subjects  \n",
      "0                     Politics, fiercefemtivist, racism  \n",
      "1     Rabies, Health, General News, Kansas, Bats, To...  \n",
      "2                                              Politics  \n",
      "3                                           Health News  \n",
      "4     Plants, Wildlife, Health, Wildlife health, For...  \n",
      "...                                                 ...  \n",
      "1216                          Crime / Police, Religious  \n",
      "1217         Alcohol, Children, Florida, Susan Pitman,   \n",
      "1218  Quincy, Health, General News, Legionnaires dis...  \n",
      "1219                                  dry eye,Pharmamar  \n",
      "1220  Genetics, Health, Fish, Salmon, North America,...  \n",
      "\n",
      "[1221 rows x 9 columns]\n"
     ]
    }
   ],
   "source": [
    "import pandas as pd\n",
    "\n",
    "df = pd.read_csv('dev.tsv', sep='\\t')\n",
    "print(df)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "736315eb",
   "metadata": {},
   "outputs": [],
   "source": [
    "df_true_or_false=df.loc[(df['label'] =='true')|(df['label']== 'false')]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "1bbd4792",
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "     claim_id                                              claim  \\\n",
      "0       15661  \"The money the Clinton Foundation took from fr...   \n",
      "3       10166  Study: Vaccine for Breast, Ovarian Cancer Has ...   \n",
      "4       11276  Some appendicitis cases may not require ’emerg...   \n",
      "5        8713  Britain to reveal trial criteria for coronavir...   \n",
      "6        9851  Angioplasty through the wrist backed by new study   \n",
      "...       ...                                                ...   \n",
      "9826     8197  Venezuela expands quarantine as number of coro...   \n",
      "9828      401  AstraZeneca's infant respiratory drug prioriti...   \n",
      "9829     2023  Testicular cancer deaths double with after 40 ...   \n",
      "9830    38118   The FDA published “conclusive proof” that the...   \n",
      "9831    24750  On whether he wrote a provision that allowed A...   \n",
      "\n",
      "          date_published                                        explanation  \\\n",
      "0         April 26, 2015  \"Gingrich said the Clinton Foundation \"\"took m...   \n",
      "3       November 8, 2011  While the story does many things well, the ove...   \n",
      "4     September 20, 2010  We really don’t understand why only a handful ...   \n",
      "5          April 7, 2020  British regulators will this week reveal appro...   \n",
      "6        August 18, 2008  This is a good piece of reporting about a rece...   \n",
      "...                  ...                                                ...   \n",
      "9826      March 16, 2020  Venezuela will implement a nationwide quaranti...   \n",
      "9828  September 25, 1995  Britain’s AstraZeneca said a potential medicin...   \n",
      "9829   February 10, 2011  Men diagnosed with testicular cancer at 40 yea...   \n",
      "9830   November 22, 2017  FDA Confirms DTaP Vaccine Causes Autism in Nov...   \n",
      "9831      March 23, 2009  Dodd flip-flopped on whether he changed amendm...   \n",
      "\n",
      "                               fact_checkers  \\\n",
      "0                              Katie Sanders   \n",
      "3                                              \n",
      "4                                              \n",
      "5                             Alistair Smout   \n",
      "6                                              \n",
      "...                                      ...   \n",
      "9826  Angus Berwick, Luc Cohen, Mariela Nava   \n",
      "9828                                           \n",
      "9829                                           \n",
      "9830                   Rich Buhler & Staff     \n",
      "9831                          Alexander Lane   \n",
      "\n",
      "                                              main_text  \\\n",
      "0     \"Hillary Clinton is in the political crosshair...   \n",
      "3     The story does discuss costs, but the framing ...   \n",
      "4     \"Although the story didn’t cite the cost of ap...   \n",
      "5     Antibody tests show whether whether people hav...   \n",
      "6     The story did not provide cost estimates for e...   \n",
      "...                                                 ...   \n",
      "9826  The country began a quarantine on Monday in a ...   \n",
      "9828  The “Breakthrough Therapy” and “Prime” designa...   \n",
      "9829  This was true even when initial treatment and ...   \n",
      "9830  The FDA hasn’t confirmed a link between DTaP v...   \n",
      "9831  \"Sen. Chris Dodd has been  widely panned  as t...   \n",
      "\n",
      "                                                sources  label  \\\n",
      "0     https://www.wsj.com/articles/clinton-foundatio...  false   \n",
      "3     http://clinicaltrials.gov/ct2/results?term=can...   true   \n",
      "4                                                         true   \n",
      "5                                                         true   \n",
      "6                                                         true   \n",
      "...                                                 ...    ...   \n",
      "9826                                                      true   \n",
      "9828                                                      true   \n",
      "9829                               http://bit.ly/fGNEw9   true   \n",
      "9830  https://www.truthorfiction.com/marshall-kamena...  false   \n",
      "9831  https://www.nytimes.com/2009/03/20/nyregion/20...  false   \n",
      "\n",
      "                                         subjects  \n",
      "0     Foreign Policy, PunditFact, Newt Gingrich,   \n",
      "3                     Cancer,WebMD,women's health  \n",
      "4                                                  \n",
      "5                                     Health News  \n",
      "6                                                  \n",
      "...                                           ...  \n",
      "9826                                  Health News  \n",
      "9828                                  Health News  \n",
      "9829                                  Health News  \n",
      "9830                                      Medical  \n",
      "9831              National, Economy, Chris Dodd,   \n",
      "\n",
      "[8079 rows x 9 columns]\n"
     ]
    }
   ],
   "source": [
    "print(df_true_or_false)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "a0dcac6f",
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "      Unnamed: 0  claim_id                                              claim  \\\n",
      "4              4     35718  Employees at a Five Guys restaurant in Daphne,...   \n",
      "5              5     34271  FBI agent Peter Strzok II grew up in Iran; had...   \n",
      "9              9     34562  The new supplement InteliGEN can boost brain f...   \n",
      "17            17     34219  Nathan Phillips falsely claimed to be a U.S. m...   \n",
      "59            59     41644  Spending on mental health went up by £575 mill...   \n",
      "74            74     41802  Last month, 20,000 migrant children were illeg...   \n",
      "82            82     34717  Talk radio host Rush Limbaugh was disqualified...   \n",
      "112          112     34694  Deborah Harry was nearly abducted by serial ki...   \n",
      "120          120     34703   Photographs show a new Chinese aircraft carrier.   \n",
      "123          123     34356  During the August 2017 solar eclipse, some peo...   \n",
      "138          138     34213  Arminas Pileckas was murdered because he was t...   \n",
      "180          180     34392  The FBI foiled a Muslim Brotherhood plot to ta...   \n",
      "183          183     34546  Russian president Vladimir Putin slammed Weste...   \n",
      "194          194     34674  Huggies Snug and Dry brand diapers commonly ca...   \n",
      "217          217     34534  Marijuana legalization has led to an increase ...   \n",
      "238          238     36565  You can be fined $999 and have your license su...   \n",
      "251          251     37027   Senator Harry Reid said that he was injured i...   \n",
      "262          262     34554  Donald Trump divorced Ivana Trump because her ...   \n",
      "310          310     41650         1,000 GP practices have closed since 2010.   \n",
      "325          325     34627  A woman encountered kidnapping scouts at a Hou...   \n",
      "370          370     34196  An employee at a women's health center in Bron...   \n",
      "379          379     34442  Policies that legalize recreational marijuana ...   \n",
      "445          445     39291         A young boy fell asleep wearing a Spide...   \n",
      "446          446     34429  An immigrant put peanut butter in a little gir...   \n",
      "480          480     34241  Drinking one diet drink a day triples a person...   \n",
      "488          488     34704  A daily regimen of ingesting gin-soaked raisin...   \n",
      "504          504     37518  Clout-chasing teenagers are participating in t...   \n",
      "507          507     41320  Polysorbate 80 and 20 are in vaccines and caus...   \n",
      "508          508     41037  It can survive for 6-12 hours on fabric and wi...   \n",
      "525          525     41890  Business associates of\" William Browder \"sent ...   \n",
      "614          614     37561  According to an unnamed critical care physicia...   \n",
      "660          660     34329  Elephants think of humans as \"cute,\" in the sa...   \n",
      "755          755     41048  The symptoms of Covid-19 are a sore throat las...   \n",
      "812          812     36514  Modern caesarean sections were invented by mid...   \n",
      "859          859     36828   Reports out of Texas that voting machines are...   \n",
      "914          914     34698  The American ambassador in Libya was raped and...   \n",
      "916          916     34427  After passing a bill to make consuming raw mil...   \n",
      "956          956     34418  Women’s menstrual cycles synchronize when they...   \n",
      "1019        1019     34626  A photograph shows two children holding a 'F*C...   \n",
      "1046        1046     41069  If someone with the new coronavirus sneezes, i...   \n",
      "1066        1066     34491  A Tennessee boy died in the arms of a local ma...   \n",
      "1085        1085     35946  Chris Christie advised U.S. President Donald T...   \n",
      "1117        1117     34655  Tidy Cats Lightweight brand cat litter causes ...   \n",
      "1158        1158     41318  Neomycin sulphate, an antibiotic, is in vaccin...   \n",
      "1199        1199     41819  Three border agents in San Diego \"were very ba...   \n",
      "\n",
      "          date_published                                        explanation  \\\n",
      "4          July 15, 2020  What's undetermined: As of this writing, Five ...   \n",
      "5          July 23, 2018  Peter Strzok spent several years of his childh...   \n",
      "9     September 30, 2016  Tens of thousands of holiday makers fled seasi...   \n",
      "17      January 23, 2019  What's true: Native American activist Nathan P...   \n",
      "59     December 19, 2017  This refers to the increase in spending by Cli...   \n",
      "74       January 9, 2019  In a national address, President Donald Trump ...   \n",
      "82     December 16, 2002  There is, of course, a huge difference between...   \n",
      "112     February 3, 2000  Details of the Blondie singer's claim of a clo...   \n",
      "120      August 11, 2011  Do photographs show a new Chinese aircraft car...   \n",
      "123    September 5, 2017  Interestingly, two ophthalmologists told us th...   \n",
      "138     January 31, 2019  We have reached out to Swedish police to see i...   \n",
      "180         June 8, 2017  Although Al-Qaradawi is a well-known figure in...   \n",
      "183     October 21, 2016  In May 2016, the National Academies of Science...   \n",
      "194     November 6, 2013  Many explanations are possible for these types...   \n",
      "217                  NaN  Mr. Morrissey takes no political position on a...   \n",
      "238     January 14, 2019  Can You Now Be Fined $999 for Holding a Phone ...   \n",
      "251        April 6, 2015  Harry Reid Was Injured in a Fight With His Bro...   \n",
      "262     October 11, 2016  It’s certainly possible that some version of t...   \n",
      "310         May 17, 2018  Malaysia will push its Southeast Asian neighbo...   \n",
      "325       March 16, 2016  Yet another Facebook user claimed she narrowly...   \n",
      "370       March 22, 2019  What's undetermined: The exact meaning and int...   \n",
      "379    February 23, 2017  However, as noted in the the National Academie...   \n",
      "445       March 17, 2015  Boy Suffered Chemical Burns from Spider-Man Wa...   \n",
      "446                  NaN  Although it is possible the peanut butter coul...   \n",
      "480     October 31, 2018  Some studies show an association between incre...   \n",
      "488     January 11, 2011  Gin has been featured in non-raisin arthritis ...   \n",
      "504       March 26, 2020  Is a ‘Coronavirus Challenge’ on Social Media P...   \n",
      "507       April 26, 2019  Tiny amounts of Polysorbate 80 is in a type of...   \n",
      "508       March 20, 2020  There’s no evidence the virus can survive in c...   \n",
      "525        July 18, 2018  Russian President Vladimir Putin made several ...   \n",
      "614       March 11, 2020  Unsourced ‘Intensivist’ Thread Spreads on Twit...   \n",
      "660    December 27, 2017  We found that tamed African elephants preferen...   \n",
      "755       March 20, 2020  This is a roughly accurate description of the ...   \n",
      "812     February 7, 2019  Were Modern Caesarean Sections Invented in Afr...   \n",
      "859     October 25, 2016  Texas Vote Switching Fuels Speculation About R...   \n",
      "914   September 18, 2012  As of this writing, the U.S. government has st...   \n",
      "916        April 5, 2017  Philippine President Rodrigo Duterte’s war on ...   \n",
      "956       April 18, 2017  We rate this claim as unproven due to an incre...   \n",
      "1019      March 21, 2016  On the east side of Houston, the white plumes ...   \n",
      "1046       March 5, 2020  How far the droplets spread from a sneeze depe...   \n",
      "1066   December 13, 2016  In this way, this particular Santa tale served...   \n",
      "1085     October 6, 2020  If you know and love a stutterer and you watch...   \n",
      "1117   November 18, 2015  We are cat-lovers too, and our number one comm...   \n",
      "1158      April 26, 2019  Trace amounts of this antibiotic may end up in...   \n",
      "1199   November 27, 2018  After a group of migrants tried to breach the ...   \n",
      "\n",
      "                                  fact_checkers  \\\n",
      "4                                  Dan MacGuill   \n",
      "5                                   David Emery   \n",
      "9                                Bethania Palma   \n",
      "17                                     Dan Evon   \n",
      "59                                 Claire Milne   \n",
      "74                                 Eugene Kiely   \n",
      "82                              David Mikkelson   \n",
      "112                             David Mikkelson   \n",
      "120                             David Mikkelson   \n",
      "123                                Dan MacGuill   \n",
      "138                              Bethania Palma   \n",
      "180                              Bethania Palma   \n",
      "183                              Bethania Palma   \n",
      "194                             David Mikkelson   \n",
      "217                               Arturo Garcia   \n",
      "238                              Kim LaCapria     \n",
      "251                       Rich Buhler & Staff     \n",
      "262                                Kim LaCapria   \n",
      "310                Joël Reland and Grace Rahman   \n",
      "325                                Kim LaCapria   \n",
      "370                                Dan MacGuill   \n",
      "379                                Alex Kasprak   \n",
      "445                 \\n\\nRich Buhler & Staff\\n\\n   \n",
      "446                              Bethania Palma   \n",
      "480                                Alex Kasprak   \n",
      "488                                Snopes Staff   \n",
      "504                              Kim LaCapria     \n",
      "507                                Grace Rahman   \n",
      "508                         Pippa Allen-Kinross   \n",
      "525                              Lori Robertson   \n",
      "614                             Arturo Garcia     \n",
      "660                               Arturo Garcia   \n",
      "755   Grace Rahman, Rachael Krishna, Kate Lewis   \n",
      "812                              Kim LaCapria     \n",
      "859                       Rich Buhler & Staff     \n",
      "914                             David Mikkelson   \n",
      "916                                 David Emery   \n",
      "956                                Alex Kasprak   \n",
      "1019                                   Dan Evon   \n",
      "1046                               Grace Rahman   \n",
      "1066                              Arturo Garcia   \n",
      "1085                               Dan MacGuill   \n",
      "1117                               Kim LaCapria   \n",
      "1158                               Grace Rahman   \n",
      "1199                             Lori Robertson   \n",
      "\n",
      "                                              main_text  \\\n",
      "4     In July 2020, amid a new wave of nationwide pr...   \n",
      "5     Longtime FBI agent Peter Strzok II, who until ...   \n",
      "9     Fueled by searing temperatures and high winds,...   \n",
      "17    As a video showing an altercation between Nath...   \n",
      "59    Spending on mental health went up by £575 mill...   \n",
      "74    In a national address, President Donald Trump ...   \n",
      "82    Vitriolic “hawk vs. dove” debates are a standa...   \n",
      "112   Deborah Harry, the lead singer of the 1970s ne...   \n",
      "120   In August 2011, China’s first aircraft carrier...   \n",
      "123   After the solar eclipse that crossed the Unite...   \n",
      "138   In late January 2019, a meme that referenced a...   \n",
      "180   In early June 2017, conspiracy-oriented web si...   \n",
      "183   In January 2016, dubious web sites began posti...   \n",
      "194   An item (originally circulated in November 201...   \n",
      "217   On 18 October 2016, the Citizens Against Legal...   \n",
      "238   On January 7 2019, the following status update...   \n",
      "251   This is an unproven conspiracy theory about ho...   \n",
      "262   An early October 2016 audio leak of Donald Tru...   \n",
      "310   In the past few weeks, Malaysia and neighborin...   \n",
      "325   On 15 March 2016, a Facebook user published th...   \n",
      "370   An undercover video shot at a Bronx women’s he...   \n",
      "379   On 23 February 2017, White House Press Secreta...   \n",
      "445   Our investigation into a report that a Spider-...   \n",
      "446   On 7 June 2016, AmericasFreedomFighters.com po...   \n",
      "480   High-sugar beverages such as soda are uncontro...   \n",
      "488   Arthritis is an auto-immune disease that cause...   \n",
      "504   Amid wall-to-wall reporting on a novel coronav...   \n",
      "507   Beta-Propiolactone is in vaccines and is known...   \n",
      "508   If you have a runny nose and sputum, you have ...   \n",
      "525   Russian President Vladimir Putin made several ...   \n",
      "614   In March 2020, as more nations grappled with a...   \n",
      "660   In December 2017, college student Julia Hass h...   \n",
      "755   If the new coronavirus gets into your mouth, d...   \n",
      "812   On February 6 2019, a Facebook post circulated...   \n",
      "859   Local officials say that scattered reports of ...   \n",
      "914   Examples:[Collected via e-mail, September 2012...   \n",
      "916   Thousands of suspected drug traffickers and us...   \n",
      "956   The idea that women living or working in proxi...   \n",
      "1019  Late at night or early in the morning when pla...   \n",
      "1046  Coronavirus pneumonia is a dry cough with no r...   \n",
      "1066  A heartwarming story set in an East Tennessee ...   \n",
      "1085  In October 2020, many readers asked Snopes to ...   \n",
      "1117  In November 2015, social media rumors claimed ...   \n",
      "1158  Beta-Propiolactone is in vaccines and is known...   \n",
      "1199  After a group of migrants tried to breach the ...   \n",
      "\n",
      "                                                sources     label  \\\n",
      "4                                                        unproven   \n",
      "5                                                        unproven   \n",
      "9                                                        unproven   \n",
      "17                                                       unproven   \n",
      "59    https://twitter.com/Jeremy_Hunt/status/9326058...  unproven   \n",
      "74    https://bepp.wharton.upenn.edu/profile/smetter...  unproven   \n",
      "82    http://www.amazon.com/exec/obidos/ISBN=0440508...  unproven   \n",
      "112   https://www.pinterest.com/pin/301248662550467424/  unproven   \n",
      "120   http://www.forbes.com/feeds/ap/2011/08/10/gene...  unproven   \n",
      "123   http://archive.is/IxBM6, http://archive.is/UKt...  unproven   \n",
      "138                                                      unproven   \n",
      "180                                                      unproven   \n",
      "183                                                      unproven   \n",
      "194                                                      unproven   \n",
      "217   http://www.denverpost.com/2013/07/30/denver-da...  unproven   \n",
      "238   https://archive.fo/IrohP, https://www.truthorf...  unproven   \n",
      "251   https://www.reddit.com/submit?url=https%3A%2F%...  unproven   \n",
      "262                                                      unproven   \n",
      "310   https://www.facebook.com/blocuk/photos/a.15044...  unproven   \n",
      "325   https://polarisproject.org/recognize-signs, ht...  unproven   \n",
      "370                                                      unproven   \n",
      "379                                                      unproven   \n",
      "445   https://www.truthorfiction.com/category/health...  unproven   \n",
      "446                                                      unproven   \n",
      "480                                                      unproven   \n",
      "488                                                      unproven   \n",
      "504   https://twitter.com/GabrielSlaybau1/status/124...  unproven   \n",
      "507   https://www.facebook.com/photo.php?fbid=305629...  unproven   \n",
      "508   https://www.nhs.uk/conditions/coronavirus-covi...  unproven   \n",
      "525   https://www.npr.org/2018/07/16/629462401/trans...  unproven   \n",
      "614   https://www.ecodibergamo.it/stories/bergamo-ci...  unproven   \n",
      "660                                                      unproven   \n",
      "755   https://www.nhs.uk/conditions/coronavirus-covi...  unproven   \n",
      "812   https://fn.bmj.com/content/fetalneonatal/80/3/...  unproven   \n",
      "859   https://www.linkedin.com/cws/share?url=https%3...  unproven   \n",
      "914                                                      unproven   \n",
      "916                                                      unproven   \n",
      "956                                                      unproven   \n",
      "1019  https://www.snopes.com/tachyon/2016/03/2540663...  unproven   \n",
      "1046  https://www.facebook.com/1432920145/posts/1021...  unproven   \n",
      "1066                                                     unproven   \n",
      "1085                                                     unproven   \n",
      "1117  https://twitter.com/howdycuz2, https://twitter...  unproven   \n",
      "1158  https://www.facebook.com/photo.php?fbid=305629...  unproven   \n",
      "1199  https://www.factcheck.org/2018/04/has-the-bord...  unproven   \n",
      "\n",
      "                                               subjects  \n",
      "4                                       Law Enforcement  \n",
      "5                       Politics, deep state, fbi, iran  \n",
      "9             Fraud & Scams, health, Health Care, scams  \n",
      "17                            Politics, nathan phillips  \n",
      "59                                               health  \n",
      "74                   Illegal immigration, immigration,   \n",
      "82                              Politics, rush limbaugh  \n",
      "112                       Entertainment, Artists, music  \n",
      "120   Fauxtography, aircraft carrier, china, fauxtog...  \n",
      "123         Medical, california, eclipse, solar eclipse  \n",
      "138                                            Politics  \n",
      "180       Uncategorized, fake news, islam, Islamophobia  \n",
      "183                    Junk News, gmo, russia, vaccines  \n",
      "194   Inboxer Rebellion, diaper rash, huggies, Toxin...  \n",
      "217                  Crime, colorado, denver, marijuana  \n",
      "238                          Fact Checks, Viral Content  \n",
      "251                                            Politics  \n",
      "262   Politics Ballot Box, breast implants, donald t...  \n",
      "310                                              health  \n",
      "325   Uncategorized, houston, kidnapping warnings, s...  \n",
      "370                                            Politics  \n",
      "379           Politics, marijuana, opioids, sean spicer  \n",
      "445                                    Health / Medical  \n",
      "446           Uncategorized, immigrants, peanut allergy  \n",
      "480                                  Medical, aspartame  \n",
      "488                                 Medical, Home Cures  \n",
      "504                          Fact Checks, Viral Content  \n",
      "507                                              online  \n",
      "508                                              online  \n",
      "525            campaign finance, Russia investigation,   \n",
      "614                          Fact Checks, Viral Content  \n",
      "660                          Critter Country, elephants  \n",
      "755                                              online  \n",
      "812                          Fact Checks, Viral Content  \n",
      "859                                            Politics  \n",
      "914                                       Uncategorized  \n",
      "916                    Medical, raw milk, west virginia  \n",
      "956          Medical, menstrual periods, periods, women  \n",
      "1019                        Uncategorized, donald trump  \n",
      "1046                                             online  \n",
      "1066     Glurge Gallery, christmas, glurge, santa claus  \n",
      "1085                            Politics, 2020 election  \n",
      "1117                                    Critter Country  \n",
      "1158                                             online  \n",
      "1199                     border security, immigration,   \n"
     ]
    }
   ],
   "source": [
    "df1 = pd.read_csv('PUBHEALTH/test.tsv', sep='\\t')\n",
    "df1_true_or_false=df1.loc[(df1['label'] =='true')|(df1['label']== 'false')]#\n",
    "print(df1_true_or_false)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "id": "22a90721",
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "                                               claim_id  \\\n",
      "0                                                 34656   \n",
      "15                                                40007   \n",
      "16                                  Rich Buhler & Staff   \n",
      "17    \\tDr. Sam Vaknin told   TruthorFiction.com tha...   \n",
      "42                                                34583   \n",
      "65                                                34690   \n",
      "109                                               34474   \n",
      "127                                               41314   \n",
      "133                                               34507   \n",
      "206                                               34669   \n",
      "208                                               34480   \n",
      "217                                               41317   \n",
      "227                                               37294   \n",
      "228                                 Rich Buhler & Staff   \n",
      "229   \\tThis eRumor began circulating   more than a ...   \n",
      "239                                               34307   \n",
      "272                                               36380   \n",
      "306                                               41046   \n",
      "338                                               36391   \n",
      "358                                               38800   \n",
      "376                                               36725   \n",
      "380                                               34349   \n",
      "418                                               35712   \n",
      "453                                               37402   \n",
      "462                                               35060   \n",
      "476                                               41205   \n",
      "498                                               34577   \n",
      "509                                               34671   \n",
      "537                                               34361   \n",
      "550                                               34403   \n",
      "581                                               34635   \n",
      "638                                               35949   \n",
      "642                                               36857   \n",
      "654                                               34591   \n",
      "724                                               34298   \n",
      "750                                               41316   \n",
      "806                                               37510   \n",
      "849                                               34399   \n",
      "900                                               34525   \n",
      "964                                               34582   \n",
      "996                                               38072   \n",
      "1008                                              34680   \n",
      "1081                                              34443   \n",
      "1084                                              36135   \n",
      "1094                                              35206   \n",
      "1107                                              34389   \n",
      "1155                                              34639   \n",
      "1205                                              14090   \n",
      "\n",
      "                                                  claim  \\\n",
      "0      A baby died at an unnamed medical facility be...   \n",
      "15     A forwarded email with a story by an expert i...   \n",
      "16                                                  NaN   \n",
      "17                                    November 29, 2017   \n",
      "42    Coffee serves as an effective mosquito repella...   \n",
      "65    Over 37 million bees were killed by a large GM...   \n",
      "109   Application of Vicks VapoRub to the soles of c...   \n",
      "127   Latex rubber is in vaccines and causes life-th...   \n",
      "133   KT McFarland, Trump's pick for his national se...   \n",
      "206   A teenaged girl was drugged and nearly abducte...   \n",
      "208   Doctors are now saying menstrual cramps are as...   \n",
      "217   MSG is in vaccines and is linked to birth defe...   \n",
      "227    A forwarded email about Senator Edward Kenned...   \n",
      "228                                                 NaN   \n",
      "229                                      Louis Jacobson   \n",
      "239   Blue Buffalo pet food contains unsafe and high...   \n",
      "272   Under a new law, people can be arrested for co...   \n",
      "306   On fabric it can survive for 6-12 hours. norma...   \n",
      "338   In 1969, Chicago police urinated on food and s...   \n",
      "358    A female physician from Munich described in a...   \n",
      "376    Claims that President Trump is exhibiting sig...   \n",
      "380   All of the patients in the intensive care unit...   \n",
      "418   U.S. Postmaster General Louis DeJoy, a politic...   \n",
      "453   Bernie Sanders told Elizabeth Warren in 2018 t...   \n",
      "462   Patients should avoid taking ibuprofen to reli...   \n",
      "476   In 1983, US children got 10 vaccines and the a...   \n",
      "498   A step-dad refused to pay for his daughter's w...   \n",
      "509   Jimmies, the sprinkles used on confections, ar...   \n",
      "537   Russia used \"GPS spoofing\" to cause the USS Jo...   \n",
      "550   The Tim Allen show 'Last Man Standing' was can...   \n",
      "581   A cryptic blog called \"Two Droplets\" told the ...   \n",
      "638   An angry mother delivered a scathing response ...   \n",
      "642    Dr. Ted Noel has said that after evaluating H...   \n",
      "654   Two men arrested for their part in Turkey's at...   \n",
      "724   Parent's Choice diapers are causing small chil...   \n",
      "750   Mercury (aka thimerosal or thiomersal) is in v...   \n",
      "806   Image shows New York Gov. Andrew Cuomo's pierc...   \n",
      "849   Marilyn Monroe's intelligence quotient was mea...   \n",
      "900   “Clean coal technology” currently makes coal a...   \n",
      "964   Hillary Clinton travels with a doctor carrying...   \n",
      "996    Facebook user Heather Hanford described her s...   \n",
      "1008  California wine contains dangerous levels of a...   \n",
      "1081  Parents in Texas found a codeine tablet in a s...   \n",
      "1084  People who confronted an elderly woman as she ...   \n",
      "1094  People who have survived the COVID-19 coronavi...   \n",
      "1107  An Indian man who was bitten by a snake then b...   \n",
      "1155  Coca-Cola is an effective solution for elimina...   \n",
      "1205  More people today are leaving Virginia than mo...   \n",
      "\n",
      "                                         date_published  \\\n",
      "0                                     November 10, 2015   \n",
      "15                                       March 17, 2015   \n",
      "16                                                  NaN   \n",
      "17    Trump said Scarborough is party to an \"unsolve...   \n",
      "42                                       August 9, 2016   \n",
      "65                                     November 7, 2014   \n",
      "109                                      March 20, 2007   \n",
      "127                                      April 26, 2019   \n",
      "133                                   November 29, 2016   \n",
      "206                                       June 30, 2015   \n",
      "208                                   December 22, 2016   \n",
      "217                                      April 26, 2019   \n",
      "227                                      March 17, 2015   \n",
      "228                                                 NaN   \n",
      "229   The St. Louis suburb of Ferguson, Mo., has con...   \n",
      "239                                      March 19, 2018   \n",
      "272                                         May 9, 2019   \n",
      "306                                      March 20, 2020   \n",
      "338                                         May 1, 2019   \n",
      "358                                    October 19, 2015   \n",
      "376                                        May 26, 2017   \n",
      "380                                     October 3, 2017   \n",
      "418                                      August 6, 2020   \n",
      "453                                    January 15, 2020   \n",
      "462                                      March 16, 2020   \n",
      "476                                      August 8, 2019   \n",
      "498                                  September 30, 2015   \n",
      "509                                  September 26, 2009   \n",
      "537                                     August 22, 2017   \n",
      "550                                        May 18, 2017   \n",
      "581                                   February 17, 2016   \n",
      "638                                       March 1, 2015   \n",
      "642                                   September 9, 2016   \n",
      "654                                       July 21, 2016   \n",
      "724                                      April 12, 2018   \n",
      "750                                      April 26, 2019   \n",
      "806                                       April 1, 2020   \n",
      "849                                        May 23, 2017   \n",
      "900                                   November 14, 2016   \n",
      "964                                     August 10, 2016   \n",
      "996                                    January 31, 2018   \n",
      "1008                                     March 20, 2015   \n",
      "1081                                  February 23, 2017   \n",
      "1084                                    October 1, 2019   \n",
      "1094                                     March 15, 2020   \n",
      "1107                                      June 15, 2017   \n",
      "1155                                  February 11, 2016   \n",
      "1205                                       May 31, 2016   \n",
      "\n",
      "                                            explanation  \\\n",
      "0     Fellow Twitter users suggested @FierceFemtivis...   \n",
      "15    Noted Narcissism Expert Wrote that Barack Obam...   \n",
      "16                                                  NaN   \n",
      "17                                     Aaron Sharockman   \n",
      "42    What's true: A small bit of research has indic...   \n",
      "65    Millions of bees died off in Canada, but the c...   \n",
      "109   No substantive evidence documents that the app...   \n",
      "127   Latex is used in the packaging of some vaccine...   \n",
      "133   Thus, the argument can be made that by publish...   \n",
      "206   Moreover, the referenced article linked descri...   \n",
      "208   Whether any research into analogous pain perta...   \n",
      "217   It’s not banned in Europe. It’s used in some v...   \n",
      "227   An Email about called \"The Last of the Kennedy...   \n",
      "228                                                 NaN   \n",
      "229   http://www.cbc.ca/m/touch/news/story/1.2735588...   \n",
      "239   Aside from a single claimant’s lawsuit against...   \n",
      "272   New Georgia Abortion Law Conspiracy to Commit ...   \n",
      "306   There’s no evidence yet that the virus can sur...   \n",
      "338   Did Chicago Police Urinate on Food for a Black...   \n",
      "358   Female Physician in Munich Pens Email About Re...   \n",
      "376      President Trump is Showing Signs of Dementia     \n",
      "380   However, we have been so far unable to verify ...   \n",
      "418   Anything that undermines the Postal Service’ [...   \n",
      "453   Did Bernie Sanders Tell Elizabeth Warren a Wom...   \n",
      "462   But other experts suggested that Véran’s advic...   \n",
      "476   We don’t know exactly how prevalent autism was...   \n",
      "498   As to whether a 3 November 2015 wedding was ca...   \n",
      "509   It may be the case that among those who refer ...   \n",
      "537   In the wake of the USS McCain collision, the c...   \n",
      "550   In May 2018, Fox announced they would be bring...   \n",
      "581   On 18 February 2016, the author of the above-e...   \n",
      "638   Me: “No. She defended herself against a sexual...   \n",
      "642   Hillary Clinton “Probably” has Parkinson’s Dis...   \n",
      "654   However, there’s absolutely no evidence listed...   \n",
      "724   We contacted Parent’s Choice to ask whether th...   \n",
      "750   Thiomersal isn’t in any UK vaccines any more. ...   \n",
      "806           Andrew Cuomo’s Pierced Nipples, Explained   \n",
      "849   Although Monroe was known to be more scholarly...   \n",
      "900   Regardless of one’s view on the philosophical ...   \n",
      "964   The Washington Post identified the above-pictu...   \n",
      "996   Facebook Users Warn About Tamiflu Side Effects...   \n",
      "1008  [A wine company] spokesman said he had not hea...   \n",
      "1081  Holt Davis further asserted that the object wa...   \n",
      "1084  Does a Video Show ‘Antifa Protesters’ Screamin...   \n",
      "1094  A coronavirus infection’s going into a “dorman...   \n",
      "1107   Alternative facts should keep this alive though.   \n",
      "1155  Coca-Cola is not an officially endorsed produc...   \n",
      "1205  Haley said, \"More people are leaving Virginia ...   \n",
      "\n",
      "                                          fact_checkers  \\\n",
      "0                                          Kim LaCapria   \n",
      "15                                                  NaN   \n",
      "16                                                  NaN   \n",
      "17    President Donald Trump took to Twitter to cele...   \n",
      "42                                         Kim LaCapria   \n",
      "65                                      David Mikkelson   \n",
      "109                                        Snopes Staff   \n",
      "127                                        Grace Rahman   \n",
      "133                                      Bethania Palma   \n",
      "206                                        Kim LaCapria   \n",
      "208                                        Kim LaCapria   \n",
      "217                                        Grace Rahman   \n",
      "227                                                 NaN   \n",
      "228                                                 NaN   \n",
      "229                                                true   \n",
      "239                                        Kim LaCapria   \n",
      "272                                      Kim LaCapria     \n",
      "306           Grace Rahman, Rachael Krishna, Kate Lewis   \n",
      "338                                      Kim LaCapria     \n",
      "358                               Rich Buhler & Staff     \n",
      "376                               Rich Buhler & Staff     \n",
      "380                                       Arturo Garcia   \n",
      "418                                         Jessica Lee   \n",
      "453                                      Kim LaCapria     \n",
      "462                                     David Mikkelson   \n",
      "476                                        Grace Rahman   \n",
      "498                                        Kim LaCapria   \n",
      "509                                        Snopes Staff   \n",
      "537                                        Alex Kasprak   \n",
      "550                                            Dan Evon   \n",
      "581                                        Kim LaCapria   \n",
      "638                                        Snopes Staff   \n",
      "642                               Rich Buhler & Staff     \n",
      "654                                    Brooke Binkowski   \n",
      "724                                        Kim LaCapria   \n",
      "750                                        Grace Rahman   \n",
      "806                                      Kim LaCapria     \n",
      "849                                        Kim LaCapria   \n",
      "900                                        Alex Kasprak   \n",
      "964                                            Dan Evon   \n",
      "996                               Rich Buhler & Staff     \n",
      "1008                                       Kim LaCapria   \n",
      "1081                                       Kim LaCapria   \n",
      "1084                                     Kim LaCapria     \n",
      "1094                                    David Mikkelson   \n",
      "1107                                      Arturo Garcia   \n",
      "1155                                           Dan Evon   \n",
      "1205  https://www.irs.gov/uac/returns-filed-taxes-co...   \n",
      "\n",
      "                                              main_text  \\\n",
      "0     On 8 November 2015, former Twitter user @Fierc...   \n",
      "15                                                  NaN   \n",
      "16                                                  NaN   \n",
      "17    https://twitter.com/JoeNBC/status/935879100262...   \n",
      "42    In August 2016 concerns about the spread of th...   \n",
      "65    In October 2014, a rumor started circulating o...   \n",
      "109   This advisory that applying Vicks Vaporub (a b...   \n",
      "127   Beta-Propiolactone is in vaccines and is known...   \n",
      "133   On 28 November 2016, the Washington Blade post...   \n",
      "206   On 20 June 2015, a Facebook user published a s...   \n",
      "208   On 18 December 2016, a page operated by the ou...   \n",
      "217   Beta-Propiolactone is in vaccines and is known...   \n",
      "227                                                 NaN   \n",
      "228                                                 NaN   \n",
      "229   Criminal Justice, Drugs, Crime, PunditFact, Jo...   \n",
      "239   In June 2017, a rumor appeared that Blue Buffa...   \n",
      "272   On May 7 2019, a Facebook user shared the foll...   \n",
      "306   If the new coronavirus gets into your mouth, d...   \n",
      "338   On April 29 2019, a researcher shared the foll...   \n",
      "358   We can’t confirm the authenticity of an email ...   \n",
      "376   There’s no hard evidence that President Trump ...   \n",
      "380   In late September 2017, as accounts spread onl...   \n",
      "418   As U.S. President Donald Trump accelerated uns...   \n",
      "453   On January 13 2020, CNN published an article w...   \n",
      "462   Adding to the extant confusion swirling about ...   \n",
      "476   In 2008, US children got 36 vaccines and the a...   \n",
      "498   In October 2015, multiple content-scraping, cl...   \n",
      "509   While many of us like our ice cream unadorned,...   \n",
      "537   On 21 August 2017, the guided-missile destroye...   \n",
      "550   When television network ABC announced that the...   \n",
      "581   On 16 February 2016, a blog called Two Droplet...   \n",
      "638   On 19 February 2015, a user-submitted story ab...   \n",
      "642   Claims that Hillary Clinton has Parkinson’s di...   \n",
      "654   In July 2016, a failed coup attempt by Turkey’...   \n",
      "724   In April 2018 a screenshot of a post circulate...   \n",
      "750   Beta-Propiolactone is in vaccines and is known...   \n",
      "806   On March 31 2020, a bored-in-quarantine intern...   \n",
      "849   Pages devoted to both “facts” and Marilyn Monr...   \n",
      "900   “Clean coal, ”a broad term for technology that...   \n",
      "964   Conservative corners of the Internet were aflu...   \n",
      "996   Personal accounts of parents who gave Tamiflu ...   \n",
      "1008  On 19 March 2015, several articles about a cla...   \n",
      "1081  On 15 February 2017, Facebook user Meghan Holt...   \n",
      "1084  In late September 2019, a video clip of masked...   \n",
      "1094  As the world grappled with the COVID-19 corona...   \n",
      "1107  A story out of India about a man’s fatal encou...   \n",
      "1155  In February 2016, a meme asserting that the so...   \n",
      "1205                                               true   \n",
      "\n",
      "                                                sources  \\\n",
      "0     http://webcache.googleusercontent.com/search?q...   \n",
      "15                                                  NaN   \n",
      "16                                                  NaN   \n",
      "17                                                false   \n",
      "42                                                        \n",
      "65                                                        \n",
      "109   http://www.nrc-cnrc.gc.ca/eng/index.html, http...   \n",
      "127   https://www.facebook.com/photo.php?fbid=305629...   \n",
      "133                                                       \n",
      "206   http://m.snopes.com/2015/06/29/theme-park-abdu...   \n",
      "208                                                       \n",
      "217   https://www.facebook.com/photo.php?fbid=305629...   \n",
      "227                                                 NaN   \n",
      "228                                                 NaN   \n",
      "229                                                 NaN   \n",
      "239                                                       \n",
      "272   https://www.facebook.com/share.php?u=https%3A%...   \n",
      "306   https://www.nhs.uk/conditions/coronavirus-covi...   \n",
      "338   https://www.britannica.com/science/urban-geogr...   \n",
      "358   https://twitter.com/intent/tweet?text=Female+P...   \n",
      "376   https://www.psychiatry.org/news-room/apa-blogs...   \n",
      "380                                                       \n",
      "418                                                       \n",
      "453   https://t.co/Lt9Y8n2SaP, https://www.buzzfeedn...   \n",
      "462                                                       \n",
      "476   https://www.facebook.com/davidicke/photos/a.16...   \n",
      "498   http://www.snopes.com/woman-ridicules-store-ba...   \n",
      "509                                                       \n",
      "537                                                       \n",
      "550                                                       \n",
      "581   http://www.tineye.com/search/2604693d36efb933c...   \n",
      "638   http://notalwayslearning.com/was-bra-ced-for-a...   \n",
      "642   https://api.whatsapp.com/send?text=https%3A%2F...   \n",
      "654                                                       \n",
      "724                                                       \n",
      "750   https://www.facebook.com/photo.php?fbid=305629...   \n",
      "806   https://twitter.com/DC_Draino/status/124501009...   \n",
      "849                                                       \n",
      "900   https://www.odi.org/sites/odi.org.uk/files/odi...   \n",
      "964                                                       \n",
      "996   https://www.truthorfiction.com/category/medica...   \n",
      "1008                                                      \n",
      "1081                                                      \n",
      "1084  https://www.truthorfiction.com/dads-ashes-a-br...   \n",
      "1094                                                      \n",
      "1107                                                      \n",
      "1155  http://www.headlice.org/, http://www.budget101...   \n",
      "1205       Economy, Population, Virginia, Nikki Haley,    \n",
      "\n",
      "                                              label  \\\n",
      "0                                          unproven   \n",
      "15                                              NaN   \n",
      "16                                              NaN   \n",
      "17    National, Candidate Biography, Donald Trump,    \n",
      "42                                         unproven   \n",
      "65                                         unproven   \n",
      "109                                        unproven   \n",
      "127                                        unproven   \n",
      "133                                        unproven   \n",
      "206                                        unproven   \n",
      "208                                        unproven   \n",
      "217                                        unproven   \n",
      "227                                             NaN   \n",
      "228                                             NaN   \n",
      "229                                             NaN   \n",
      "239                                        unproven   \n",
      "272                                        unproven   \n",
      "306                                        unproven   \n",
      "338                                        unproven   \n",
      "358                                        unproven   \n",
      "376                                        unproven   \n",
      "380                                        unproven   \n",
      "418                                        unproven   \n",
      "453                                        unproven   \n",
      "462                                        unproven   \n",
      "476                                        unproven   \n",
      "498                                        unproven   \n",
      "509                                        unproven   \n",
      "537                                        unproven   \n",
      "550                                        unproven   \n",
      "581                                        unproven   \n",
      "638                                        unproven   \n",
      "642                                        unproven   \n",
      "654                                        unproven   \n",
      "724                                        unproven   \n",
      "750                                        unproven   \n",
      "806                                        unproven   \n",
      "849                                        unproven   \n",
      "900                                        unproven   \n",
      "964                                        unproven   \n",
      "996                                        unproven   \n",
      "1008                                       unproven   \n",
      "1081                                       unproven   \n",
      "1084                                       unproven   \n",
      "1094                                       unproven   \n",
      "1107                                       unproven   \n",
      "1155                                       unproven   \n",
      "1205                                            NaN   \n",
      "\n",
      "                                               subjects  \n",
      "0                     Politics, fiercefemtivist, racism  \n",
      "15                                                  NaN  \n",
      "16                                                  NaN  \n",
      "17                                                  NaN  \n",
      "42           Medical, coffee, Home Cures, home remedies  \n",
      "65                                             Politics  \n",
      "109                  Medical, Home Cures, vicks vaporub  \n",
      "127                                              online  \n",
      "133              Politics, donald trump, lgbt, politics  \n",
      "206   Crime, denton texas, dillard's, human trafficking  \n",
      "208   Medical, dysmenorrhea, heart attack, menstrual...  \n",
      "217                                              online  \n",
      "227                                                 NaN  \n",
      "228                                                 NaN  \n",
      "229                                                 NaN  \n",
      "239              Critter Country, contaminated pet food  \n",
      "272                               Fact Checks, Politics  \n",
      "306                                              online  \n",
      "338                          Fact Checks, Viral Content  \n",
      "358                                         Immigration  \n",
      "376              Government, Health / Medical, Politics  \n",
      "380   Politics, hurricane maria, puerto rico, trump ...  \n",
      "418             Politics, 2020 election, Editor's Picks  \n",
      "453                         Disinformation, Fact Checks  \n",
      "462                                   Medical, COVID-19  \n",
      "476                                              online  \n",
      "498   Viral Phenomena, conservative post, qpolitical...  \n",
      "509                         Language, Offensive Origins  \n",
      "537                                            Politics  \n",
      "550              Politics, abc, donald trump, tim allen  \n",
      "581   Fauxtography, drain cleaner, triplets, two dro...  \n",
      "638                                            Politics  \n",
      "642                                            Politics  \n",
      "654   Politics Conspiracy Theories, CIA, recep tayyi...  \n",
      "724   Medical, diapers, parent's choice, viral faceb...  \n",
      "750                                              online  \n",
      "806                          Fact Checks, Viral Content  \n",
      "849                       Entertainment, marilyn monroe  \n",
      "900                Politics, clean coal, climate change  \n",
      "964   Uncategorized, diazepam, diazepam pen, hillary...  \n",
      "996                                             Medical  \n",
      "1008                   Food, arsenic, food safety, wine  \n",
      "1081  Uncategorized, food warnings, gerber, viral fa...  \n",
      "1084                        Disinformation, Fact Checks  \n",
      "1094                                  Medical, COVID-19  \n",
      "1107              Medical, Amiri Devi, gulf news, India  \n",
      "1155                           Uncategorized, coca-cola  \n",
      "1205                                                NaN  \n"
     ]
    }
   ],
   "source": [
    "df2 = pd.read_csv('PUBHEALTH/dev.tsv', sep='\\t')\n",
    "df2_true_or_false=df2.loc[~((df2['label'] =='true')|(df2['label'] =='false')|(df2['label'] =='mixture')|(df2['label'] =='proven'))]\n",
    "print(df2_true_or_false)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "id": "2f9fd73b",
   "metadata": {},
   "outputs": [],
   "source": [
    "with open('pubhealth_dev.jsonl','w') as f:\n",
    "    for index, row in df1_true_or_false.iterrows():\n",
    "        line={\n",
    "            \"Claim:\":row['claim'],\n",
    "            \"date_published:\":row['date_published'],\n",
    "            \"label\":row['label'],\n",
    "            \"subjects\":row['subjects']\n",
    "        }\n",
    "        f.write(json.dumps(line)+\"\\n\")"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "bfc1d25e",
   "metadata": {},
   "source": [
    "## temperature=0.9"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "fc0f4827",
   "metadata": {},
   "outputs": [],
   "source": [
    "num=210"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "123a03a5",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "52 0.24761904761904763\n",
      "182 0.8666666666666667\n",
      "matched num= 420\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t1=[]\n",
    "f1=[]\n",
    "n=0\n",
    "with open('pubhealth+0.9/detections_1.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.9/dataset_0.9.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')\n",
    "                sentences2=p1.strip()[:-1].split('.')\n",
    "                if sentences1[-2] == sentences2[-2]:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t1.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f1.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.9/dataset_0.9.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t1.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f1.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t1.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f1.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "7784bbca",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "46 0.21904761904761905\n",
      "179 0.8523809523809524\n",
      "matched num= 420\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t11=[]\n",
    "f11=[]\n",
    "n=0\n",
    "with open('pubhealth+0.9/detections_1_1.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.9/dataset_0.9.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')\n",
    "                sentences2=p1.strip()[:-1].split('.')\n",
    "                if sentences1[-2] == sentences2[-2]:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t11.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f11.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.9/dataset_0.9.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t11.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f11.append(p1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t11.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f11.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "795520ca",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "47 0.22380952380952382\n",
      "173 0.8238095238095238\n",
      "matched num= 420\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t2=[]\n",
    "f2=[]\n",
    "n=0\n",
    "with open('pubhealth+0.9/detections_2.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.9/dataset_0.9.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')\n",
    "                sentences2=p1.strip()[:-1].split('.')\n",
    "                if sentences1[-2] == sentences2[-2]:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t2.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f2.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.9/dataset_0.9.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t2.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f2.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t2.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f2.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "308e192a",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "51 0.24285714285714285\n",
      "172 0.819047619047619\n",
      "matched num= 420\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t22=[]\n",
    "f22=[]\n",
    "n=0\n",
    "with open('pubhealth+0.9/detections_2_1.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.9/dataset_0.9.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')\n",
    "                sentences2=p1.strip()[:-1].split('.')\n",
    "                if sentences1[-2] == sentences2[-2]:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t22.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f22.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.9/dataset_0.9.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t22.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f22.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t22.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f22.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "206341d4",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "56 0.26666666666666666\n",
      "165 0.7857142857142857\n",
      "matched num= 420\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t3=[]\n",
    "f3=[]\n",
    "n=0\n",
    "with open('pubhealth+0.9/detections_3.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.9/dataset_0.9.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')\n",
    "                sentences2=p1.strip()[:-1].split('.')\n",
    "                if sentences1[-2] == sentences2[-2]:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t3.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f3.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.9/dataset_0.9.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t3.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f3.append(p1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t3.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f3.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "76a07956",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "36 0.17142857142857143\n",
      "186 0.8857142857142857\n",
      "matched num= 420\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t33=[]\n",
    "f33=[]\n",
    "n=0\n",
    "with open('pubhealth+0.9/detections_3_1.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.9/dataset_0.9.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')\n",
    "                sentences2=p1.strip()[:-1].split('.')\n",
    "                if sentences1[-2] == sentences2[-2]:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t33.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f33.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.9/dataset_0.9.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t33.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f33.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t33.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f33.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "b1f51a38",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "56 0.26666666666666666\n",
      "185 0.8809523809523809\n",
      "matched num= 420\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t4=[]\n",
    "f4=[]\n",
    "n=0\n",
    "with open('pubhealth+0.9/detections_4.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.9/dataset_0.9.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')\n",
    "                sentences2=p1.strip()[:-1].split('.')\n",
    "                if sentences1[-2] == sentences2[-2]:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t4.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f4.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.9/dataset_0.9.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t4.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f4.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t4.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f4.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "5339ade2",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "53 0.2523809523809524\n",
      "183 0.8714285714285714\n",
      "matched num= 420\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t44=[]\n",
    "f44=[]\n",
    "n=0\n",
    "with open('pubhealth+0.9/detections_4_1.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.9/dataset_0.9.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')\n",
    "                sentences2=p1.strip()[:-1].split('.')\n",
    "                if sentences1[-2] == sentences2[-2]:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t44.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f44.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.9/dataset_0.9.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t44.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f44.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t44.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f44.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "5f88f3dd",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "36 0.17142857142857143\n",
      "182 0.8666666666666667\n",
      "matched num= 420\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t5=[]\n",
    "f5=[]\n",
    "n=0\n",
    "with open('pubhealth+0.9/detections_5.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.9/dataset_0.9.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')\n",
    "                sentences2=p1.strip()[:-1].split('.')\n",
    "                if sentences1[-2] == sentences2[-2]:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t5.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f5.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.9/dataset_0.9.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t5.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f5.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t5.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f5.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "9301e005",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "35 0.16666666666666666\n",
      "185 0.8809523809523809\n",
      "matched num= 420\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t55=[]\n",
    "f55=[]\n",
    "n=0\n",
    "with open('pubhealth+0.9/detections_5_1.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.9/dataset_0.9.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')\n",
    "                sentences2=p1.strip()[:-1].split('.')\n",
    "                if sentences1[-2] == sentences2[-2]:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t55.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f55.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.9/dataset_0.9.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t55.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f55.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t55.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f55.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "id": "339a60b4",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "36 0.17142857142857143\n",
      "184 0.8761904761904762\n",
      "matched num= 420\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t6=[]\n",
    "f6=[]\n",
    "n=0\n",
    "with open('pubhealth+0.9/detections_6.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.9/dataset_0.9.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')\n",
    "                sentences2=p1.strip()[:-1].split('.')\n",
    "                if sentences1[-2] == sentences2[-2]:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t6.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f6.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.9/dataset_0.9.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t6.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f6.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t6.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f6.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "7aa71748",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "48 0.22857142857142856\n",
      "162 0.7714285714285715\n",
      "matched num= 420\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t66=[]\n",
    "f66=[]\n",
    "n=0\n",
    "with open('pubhealth+0.9/detections_6_1.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.9/dataset_0.9.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')\n",
    "                sentences2=p1.strip()[:-1].split('.')\n",
    "                if sentences1[-2] == sentences2[-2]:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t66.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f66.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.9/dataset_0.9.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t66.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f66.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t66.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f66.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "ea5c5640",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "20 0.09523809523809523\n",
      "187 0.8904761904761904\n",
      "matched num= 420\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t7=[]\n",
    "f7=[]\n",
    "n=0\n",
    "with open('pubhealth+0.9/detections_7.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.9/dataset_0.9.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')\n",
    "                sentences2=p1.strip()[:-1].split('.')\n",
    "                if sentences1[-2] == sentences2[-2]:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t7.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f7.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.9/dataset_0.9.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t7.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f7.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t7.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f7.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "id": "634c799f",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0 1 2 3 4 5 6\n",
      "0.5428571428571428\n",
      "0.6607773851590106\n",
      "0 1 2 3 4 6 7\n",
      "0.5476190476190477\n",
      "0.6654929577464789\n"
     ]
    }
   ],
   "source": [
    "tlist=[t1,t2,t3,t4,t5,t6,t7,t11,t22,t33,t44,t55,t66]\n",
    "flist=[f1,f2,f3,f4,f5,f6,f7,f11,f22,f33,f44,f55,f66]\n",
    "#      0   1  2  3  4  5  6  7   8   9   10  11  12\n",
    "minV=0\n",
    "for kk in range(13-11):\n",
    "    for jj in range(kk+1,13-10):\n",
    "        for ii in range(jj+1,13-9):\n",
    "            for i in range(ii+1,13-8):\n",
    "                for j in range(i+1,13-7):\n",
    "                     for k in range(j+1,13-6):\n",
    "                        for m in range(k+1,13-5):\n",
    "                            for n in range(m+1,13-4):\n",
    "                                for q in range(n+1,13-3):\n",
    "                                    for w in range(q+1,13-2):\n",
    "                                        for z in range(w+1,13-1):\n",
    "                                            for y in range(z+1,13):\n",
    "                                                a=tlist[kk]+tlist[jj]+tlist[ii]+tlist[i]+tlist[j]+tlist[k]+tlist[m]+tlist[n]+tlist[q]+tlist[w]+tlist[z]+tlist[y]#+tlist[p] \n",
    "                                                a=list(set(a))\n",
    "                                                aa=len(a)\n",
    "                                                a=flist[kk]+flist[jj]+flist[ii]+flist[i]+flist[j]+flist[k]+flist[m]+flist[n]+flist[q]+flist[w]+flist[z]+flist[y]#+flist[p] \n",
    "                                                a=list(set(a))\n",
    "                                                bb=len(a)\n",
    "                                                TN=(num-bb)/(num*2)\n",
    "                                                TP=aa/(num*2)\n",
    "                                                FN=(num-aa)/(num*2)\n",
    "                                                FP=bb/(num*2)\n",
    "                                                F1=2*TP/(2*TP+FP+FN)\n",
    "                                                if TN+TP>=minV:\n",
    "                                                    print(kk,jj,ii,i,j,k,m)#,n,q,w,z,y,p)\n",
    "                                                    print(TN+TP)\n",
    "                                                    print(F1)\n",
    "                                                    minV=TN+TP"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "id": "b7aaa2f0",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "420\n",
      "1.9285714285714286\n",
      "2.723809523809524\n"
     ]
    }
   ],
   "source": [
    "with open('pubhealth+0.9/dataset_0.9.jsonl') as file1: \n",
    "    fnum=[]\n",
    "    tnum=[]\n",
    "    knum=0\n",
    "    for line1 in file1:\n",
    "        data1 = json.loads(line1)\n",
    "        q = data1[0]['messages'][0]['content']\n",
    "        ref1 = q.split('Reference:')[-1]\n",
    "        label=data1[0]['label']\n",
    "        sub=ref1.strip().split('\\\"')\n",
    "        knum+=1\n",
    "        if label == 'false': # factual\n",
    "            num1=0\n",
    "            for f in flist:\n",
    "                if ref1 in f:\n",
    "                    num1+=1\n",
    "            fnum.append(num1)\n",
    "            #print(num,num1)\n",
    "        else:\n",
    "            num2=0\n",
    "            for t in tlist:\n",
    "                if ref1 in t:\n",
    "                    num2+=1\n",
    "            tnum.append(num2)\n",
    "            #print(num,num2)\n",
    "    print(knum)\n",
    "    print(np.mean(fnum))\n",
    "    print(np.mean(tnum))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 30,
   "id": "c073528f",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "189\n",
      "0.9\n"
     ]
    }
   ],
   "source": [
    "a=t1+t2+t3+t4+t5+t6+t7+t11+t22+t44+t33+t55+t66 # \n",
    "res=set(a)\n",
    "a=list(res)\n",
    "print(len(a))\n",
    "aa=len(a)\n",
    "print(len(a)/num)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 31,
   "id": "22ce6b5c",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "177\n",
      "0.15714285714285714\n"
     ]
    }
   ],
   "source": [
    "a=f1+f2+f3+f4+f5+f6+f7+f11+f22+f44+f33+f55+f66 # \n",
    "res=set(a)\n",
    "a=list(res)\n",
    "print(len(a))\n",
    "bb=len(a)\n",
    "print((num-len(a))/num)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 32,
   "id": "f7b5da5d",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "FN 0.05\n",
      "FP 0.42142857142857143\n",
      "TN 0.07857142857142857\n",
      "TP 0.45\n"
     ]
    }
   ],
   "source": [
    "all_num=num*2\n",
    "# FN:\n",
    "FN=(num-aa)/all_num\n",
    "print('FN',FN)\n",
    "# FP:\n",
    "FP=bb/all_num\n",
    "print('FP',FP)\n",
    "# TN:\n",
    "TN=(num-bb)/all_num\n",
    "print('TN',TN)\n",
    "# TP:\n",
    "TP=aa/all_num\n",
    "print('TP',TP)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "id": "1eb25842",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0.5285714285714286\n",
      "0.5163934426229508\n",
      "0.9\n",
      "0.65625\n"
     ]
    }
   ],
   "source": [
    "Accuracy=TN+TP\n",
    "print(Accuracy)\n",
    "Precision=TP/(TP+FP)\n",
    "print(Precision)\n",
    "Recall=TP/(TP+FN)\n",
    "print(Recall)\n",
    "F1=2*TP/(2*TP+FP+FN)\n",
    "print(F1)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "3ceca7ed",
   "metadata": {},
   "source": [
    "## temperature=0.5"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "id": "f7a7537b",
   "metadata": {},
   "outputs": [],
   "source": [
    "num=205"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "id": "7e6d0c08",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "43 0.2097560975609756\n",
      "194 0.9463414634146341\n",
      "matched num= 410\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t1=[]\n",
    "f1=[]\n",
    "n=0\n",
    "with open('pubhealth+0.5/detections_1.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.5/dataset_0.5.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')[-2].strip()\n",
    "                sentences2=p1.strip()[:-1].split('.')[-2].strip()\n",
    "                while sentences2[0:2]=='\\\\n':\n",
    "                    sentences2=sentences2[2:]\n",
    "                if sentences1 == sentences2:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t1.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f1.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.5/dataset_0.5.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t1.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f1.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t1.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f1.append(ref1)\n",
    "        if flag==False:\n",
    "            print(p1.strip()[:-1])\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "id": "1ba3f523",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "29 0.14146341463414633\n",
      "188 0.9170731707317074\n",
      "matched num= 410\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t11=[]\n",
    "f11=[]\n",
    "n=0\n",
    "with open('pubhealth+0.5/detections_1_1.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.5/dataset_0.5.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')[-2].strip()\n",
    "                sentences2=p1.strip()[:-1].split('.')[-2].strip()\n",
    "                while sentences2[0:2]=='\\\\n':\n",
    "                    sentences2=sentences2[2:]\n",
    "                if sentences1 == sentences2:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t11.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f11.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.5/dataset_0.5.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t11.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f11.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t11.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f11.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "id": "5748ed2b",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "33 0.16097560975609757\n",
      "184 0.8975609756097561\n",
      "matched num= 410\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t2=[]\n",
    "f2=[]\n",
    "n=0\n",
    "with open('pubhealth+0.5/detections_2.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.5/dataset_0.5.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')[-2].strip()\n",
    "                sentences2=p1.strip()[:-1].split('.')[-2].strip()\n",
    "                while sentences2[0:2]=='\\\\n':\n",
    "                    sentences2=sentences2[2:]\n",
    "                if sentences1 == sentences2:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t2.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f2.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.5/dataset_0.5.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t2.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f2.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t2.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f2.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "id": "c20f9c6a",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "27 0.13170731707317074\n",
      "186 0.9073170731707317\n",
      "matched num= 410\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t22=[]\n",
    "f22=[]\n",
    "n=0\n",
    "with open('pubhealth+0.5/detections_2_1.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.5/dataset_0.5.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')[-2].strip()\n",
    "                sentences2=p1.strip()[:-1].split('.')[-2].strip()\n",
    "                while sentences2[0:2]=='\\\\n':\n",
    "                    sentences2=sentences2[2:]\n",
    "                if sentences1 == sentences2:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t22.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f22.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.5/dataset_0.5.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t22.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f22.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t22.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f22.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "id": "c223ae2f",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "44 0.2146341463414634\n",
      "181 0.8829268292682927\n",
      "matched num= 410\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t3=[]\n",
    "f3=[]\n",
    "n=0\n",
    "with open('pubhealth+0.5/detections_3.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.5/dataset_0.5.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')[-2].strip()\n",
    "                sentences2=p1.strip()[:-1].split('.')[-2].strip()\n",
    "                while sentences2[0:2]=='\\\\n':\n",
    "                    sentences2=sentences2[2:]\n",
    "                if sentences1 == sentences2:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t3.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f3.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.5/dataset_0.5.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t3.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f3.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t3.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f3.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "id": "b5983988",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "27 0.13170731707317074\n",
      "186 0.9073170731707317\n",
      "matched num= 410\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t33=[]\n",
    "f33=[]\n",
    "n=0\n",
    "with open('pubhealth+0.5/detections_3_1.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.5/dataset_0.5.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')[-2].strip()\n",
    "                sentences2=p1.strip()[:-1].split('.')[-2].strip()\n",
    "                while sentences2[0:2]=='\\\\n':\n",
    "                    sentences2=sentences2[2:]\n",
    "                if sentences1 == sentences2:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t33.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f33.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.5/dataset_0.5.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t33.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f33.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t33.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f33.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "id": "857a619b",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "40 0.1951219512195122\n",
      "188 0.9170731707317074\n",
      "matched num= 410\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t4=[]\n",
    "f4=[]\n",
    "n=0\n",
    "with open('pubhealth+0.5/detections_4.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.5/dataset_0.5.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')[-2].strip()\n",
    "                sentences2=p1.strip()[:-1].split('.')[-2].strip()\n",
    "                while sentences2[0:2]=='\\\\n':\n",
    "                    sentences2=sentences2[2:]\n",
    "                if sentences1 == sentences2:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t4.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f4.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.5/dataset_0.5.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t4.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f4.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t4.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f4.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "id": "b7745e3f",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "38 0.18536585365853658\n",
      "188 0.9170731707317074\n",
      "matched num= 410\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t44=[]\n",
    "f44=[]\n",
    "n=0\n",
    "with open('pubhealth+0.5/detections_4_1.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.5/dataset_0.5.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')[-2].strip()\n",
    "                sentences2=p1.strip()[:-1].split('.')[-2].strip()\n",
    "                while sentences2[0:2]=='\\\\n':\n",
    "                    sentences2=sentences2[2:]\n",
    "                if sentences1 == sentences2:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t44.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f44.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.5/dataset_0.5.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t44.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f44.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t44.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f44.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "id": "6f1e0f9b",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "23 0.11219512195121951\n",
      "193 0.9414634146341463\n",
      "matched num= 410\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t5=[]\n",
    "f5=[]\n",
    "n=0\n",
    "with open('pubhealth+0.5/detections_5.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.5/dataset_0.5.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')[-2].strip()\n",
    "                sentences2=p1.strip()[:-1].split('.')[-2].strip()\n",
    "                while sentences2[0:2]=='\\\\n':\n",
    "                    sentences2=sentences2[2:]\n",
    "                if sentences1 == sentences2:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t5.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f5.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.5/dataset_0.5.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t5.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f5.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t5.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f5.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "id": "b383a607",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "30 0.14634146341463414\n",
      "194 0.9463414634146341\n",
      "matched num= 410\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t55=[]\n",
    "f55=[]\n",
    "n=0\n",
    "with open('pubhealth+0.5/detections_5_1.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.5/dataset_0.5.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')[-2].strip()\n",
    "                sentences2=p1.strip()[:-1].split('.')[-2].strip()\n",
    "                while sentences2[0:2]=='\\\\n':\n",
    "                    sentences2=sentences2[2:]\n",
    "                if sentences1 == sentences2:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t55.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f55.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.5/dataset_0.5.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t55.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f55.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t55.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f55.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "id": "9de0241b",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "33 0.16097560975609757\n",
      "185 0.9024390243902439\n",
      "matched num= 410\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t6=[]\n",
    "f6=[]\n",
    "n=0\n",
    "with open('pubhealth+0.5/detections_6.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.5/dataset_0.5.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')[-2].strip()\n",
    "                sentences2=p1.strip()[:-1].split('.')[-2].strip()\n",
    "                while sentences2[0:2]=='\\\\n':\n",
    "                    sentences2=sentences2[2:]\n",
    "                if sentences1 == sentences2:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t6.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f6.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.5/dataset_0.5.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t6.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f6.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t6.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f6.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "id": "78ce3237",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "26 0.12682926829268293\n",
      "176 0.8585365853658536\n",
      "matched num= 410\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t66=[]\n",
    "f66=[]\n",
    "n=0\n",
    "with open('pubhealth+0.5/detections_6_1.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.5/dataset_0.5.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')[-2].strip()\n",
    "                sentences2=p1.strip()[:-1].split('.')[-2].strip()\n",
    "                while sentences2[0:2]=='\\\\n':\n",
    "                    sentences2=sentences2[2:]\n",
    "                if sentences1 == sentences2:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t66.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f66.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.5/dataset_0.5.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t66.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f66.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t66.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f66.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 29,
   "id": "08730e03",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "16 0.07804878048780488\n",
      "192 0.9365853658536586\n",
      "matched num= 410\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t7=[]\n",
    "f7=[]\n",
    "n=0\n",
    "with open('pubhealth+0.5/detections_7.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.5/dataset_0.5.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')[-2].strip()\n",
    "                sentences2=p1.strip()[:-1].split('.')[-2].strip()\n",
    "                while sentences2[0:2]=='\\\\n':\n",
    "                    sentences2=sentences2[2:]\n",
    "                if sentences1 == sentences2:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t7.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f7.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.5/dataset_0.5.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t7.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f7.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t7.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f7.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 30,
   "id": "396ec8e8",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "410\n",
      "0.9853658536585366\n",
      "1.6439024390243901\n"
     ]
    }
   ],
   "source": [
    "tlist=[t1,t2,t3,t4,t5,t6,t7,t11,t22,t33,t44,t55,t66]\n",
    "flist=[f1,f2,f3,f4,f5,f6,f7,f11,f22,f33,f44,f55,f66]\n",
    "with open('pubhealth+0.5/dataset_0.5.jsonl') as file1: \n",
    "    fnum=[]\n",
    "    tnum=[]\n",
    "    knum=0\n",
    "    for line1 in file1:\n",
    "        data1 = json.loads(line1)\n",
    "        q = data1[0]['messages'][0]['content']\n",
    "        ref1 = q.split('Reference:')[-1]\n",
    "        label=data1[0]['label']\n",
    "        sub=ref1.strip().split('\\\"')\n",
    "        knum+=1\n",
    "        if label == 'false': # factual\n",
    "            num1=0\n",
    "            for f in flist:\n",
    "                if ref1 in f:\n",
    "                    num1+=1\n",
    "            fnum.append(num1)\n",
    "            #print(num,num1)\n",
    "        else:\n",
    "            num2=0\n",
    "            for t in tlist:\n",
    "                if ref1 in t:\n",
    "                    num2+=1\n",
    "            tnum.append(num2)\n",
    "            #print(num,num2)\n",
    "    print(knum)\n",
    "    print(np.mean(fnum))\n",
    "    print(np.mean(tnum))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 32,
   "id": "73795f1d",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "148\n",
      "0.7219512195121951\n"
     ]
    }
   ],
   "source": [
    "a=t1+t2+t3+t4+t5+t6+t7+t44+t55+t11+t22 # \n",
    "res=set(a)\n",
    "a=list(res)\n",
    "print(len(a))\n",
    "aa=len(a)\n",
    "print(len(a)/num)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "id": "3567d2b6",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "95\n",
      "0.5365853658536586\n"
     ]
    }
   ],
   "source": [
    "a=f1+f2+f3+f4+f5+f6+f7+f44+f55+f11+f22 # \n",
    "res=set(a)\n",
    "a=list(res)\n",
    "print(len(a))\n",
    "bb=len(a)\n",
    "print((num-len(a))/num)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 34,
   "id": "eb6aa342",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "FN 0.13902439024390245\n",
      "FP 0.23170731707317074\n",
      "TN 0.2682926829268293\n",
      "TP 0.36097560975609755\n"
     ]
    }
   ],
   "source": [
    "all_num=num*2\n",
    "# FN:\n",
    "FN=(num-aa)/all_num\n",
    "print('FN',FN)\n",
    "# FP:\n",
    "FP=bb/all_num\n",
    "print('FP',FP)\n",
    "# TN:\n",
    "TN=(num-bb)/all_num\n",
    "print('TN',TN)\n",
    "# TP:\n",
    "TP=aa/all_num\n",
    "print('TP',TP)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 35,
   "id": "a204b1a0",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0.6292682926829268\n",
      "0.6090534979423868\n",
      "0.7219512195121951\n",
      "0.6607142857142856\n"
     ]
    }
   ],
   "source": [
    "Accuracy=TN+TP\n",
    "print(Accuracy)\n",
    "Precision=TP/(TP+FP)\n",
    "print(Precision)\n",
    "Recall=TP/(TP+FN)\n",
    "print(Recall)\n",
    "F1=2*TP/(2*TP+FP+FN)\n",
    "print(F1)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "29dab6c5",
   "metadata": {},
   "source": [
    "## temperature=0.1"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 31,
   "id": "6708fe5b",
   "metadata": {},
   "outputs": [],
   "source": [
    "num=215"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 32,
   "id": "eb74420b",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "37 0.17209302325581396\n",
      "207 0.9627906976744186\n",
      "matched num= 430\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t1=[]\n",
    "f1=[]\n",
    "n=0\n",
    "with open('pubhealth+0.1/detections_1_2.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.1/dataset_0.1.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')\n",
    "                sentences2=p1.strip()[:-1].split('.')\n",
    "                if sentences1[-2] == sentences2[-2]:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t1.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f1.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.1/dataset_0.1.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t1.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f1.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t1.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f1.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "id": "fb11c80d",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "31 0.14418604651162792\n",
      "203 0.9441860465116279\n",
      "matched num= 430\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t11=[]\n",
    "f11=[]\n",
    "n=0\n",
    "with open('pubhealth+0.1/detections_1_1.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.1/dataset_0.1.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')\n",
    "                sentences2=p1.strip()[:-1].split('.')\n",
    "                if sentences1[-2] == sentences2[-2]:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t11.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f11.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.1/dataset_0.1.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t11.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f11.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t11.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f11.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 34,
   "id": "68420bcf",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "43 0.2\n",
      "186 0.8651162790697674\n",
      "matched num= 430\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t2=[]\n",
    "f2=[]\n",
    "n=0\n",
    "with open('pubhealth+0.1/detections_2.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.1/dataset_0.1.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')\n",
    "                sentences2=p1.strip()[:-1].split('.')\n",
    "                if sentences1[-2] == sentences2[-2]:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t2.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f2.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.1/dataset_0.1.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t2.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f2.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t2.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f2.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 35,
   "id": "a9258282",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "35 0.16279069767441862\n",
      "199 0.9255813953488372\n",
      "matched num= 430\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t22=[]\n",
    "f22=[]\n",
    "n=0\n",
    "with open('pubhealth+0.1/detections_2_1.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.1/dataset_0.1.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')\n",
    "                sentences2=p1.strip()[:-1].split('.')\n",
    "                if sentences1[-2] == sentences2[-2]:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t22.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f22.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.1/dataset_0.1.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t22.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f22.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t22.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f22.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 36,
   "id": "4bce2334",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "48 0.22325581395348837\n",
      "186 0.8651162790697674\n",
      "matched num= 430\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t3=[]\n",
    "f3=[]\n",
    "n=0\n",
    "with open('pubhealth+0.1/detections_3.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.1/dataset_0.1.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')\n",
    "                sentences2=p1.strip()[:-1].split('.')\n",
    "                if sentences1[-2] == sentences2[-2]:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t3.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f3.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.1/dataset_0.1.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t3.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f3.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t3.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f3.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 37,
   "id": "eb34ec5b",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "28 0.13023255813953488\n",
      "197 0.9162790697674419\n",
      "matched num= 430\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t33=[]\n",
    "f33=[]\n",
    "n=0\n",
    "with open('pubhealth+0.1/detections_3_1.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.1/dataset_0.1.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')\n",
    "                sentences2=p1.strip()[:-1].split('.')\n",
    "                if sentences1[-2] == sentences2[-2]:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t33.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f33.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.1/dataset_0.1.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t33.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f33.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t33.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f33.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 38,
   "id": "d6fc6c6a",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "34 0.15813953488372093\n",
      "195 0.9069767441860465\n",
      "matched num= 430\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t4=[]\n",
    "f4=[]\n",
    "n=0\n",
    "with open('pubhealth+0.1/detections_4.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.1/dataset_0.1.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')\n",
    "                sentences2=p1.strip()[:-1].split('.')\n",
    "                if sentences1[-2] == sentences2[-2]:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t4.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f4.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.1/dataset_0.1.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t4.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f4.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t4.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f4.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 39,
   "id": "0402d6e1",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "29 0.13488372093023257\n",
      "199 0.9255813953488372\n",
      "matched num= 430\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t44=[]\n",
    "f44=[]\n",
    "n=0\n",
    "with open('pubhealth+0.1/detections_4_1.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.1/dataset_0.1.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')\n",
    "                sentences2=p1.strip()[:-1].split('.')\n",
    "                if sentences1[-2] == sentences2[-2]:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t44.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f44.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.1/dataset_0.1.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t44.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f44.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t44.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f44.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 40,
   "id": "34ebd4d6",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "19 0.08837209302325581\n",
      "195 0.9069767441860465\n",
      "matched num= 430\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t5=[]\n",
    "f5=[]\n",
    "n=0\n",
    "with open('pubhealth+0.1/detections_5.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.1/dataset_0.1.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')\n",
    "                sentences2=p1.strip()[:-1].split('.')\n",
    "                if sentences1[-2] == sentences2[-2]:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t5.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f5.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.1/dataset_0.1.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t5.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f5.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t5.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f5.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 41,
   "id": "98ef5f89",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "19 0.08837209302325581\n",
      "201 0.9348837209302325\n",
      "matched num= 430\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t55=[]\n",
    "f55=[]\n",
    "n=0\n",
    "with open('pubhealth+0.1/detections_5_1.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.1/dataset_0.1.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')\n",
    "                sentences2=p1.strip()[:-1].split('.')\n",
    "                if sentences1[-2] == sentences2[-2]:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t55.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f55.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.1/dataset_0.1.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t55.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f55.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t55.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f55.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 42,
   "id": "be3e11f5",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "27 0.12558139534883722\n",
      "203 0.9441860465116279\n",
      "matched num= 430\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t6=[]\n",
    "f6=[]\n",
    "n=0\n",
    "with open('pubhealth+0.1/detections_6.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.1/dataset_0.1.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')\n",
    "                sentences2=p1.strip()[:-1].split('.')\n",
    "                if sentences1[-2] == sentences2[-2]:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t6.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f6.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.1/dataset_0.1.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t6.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f6.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t6.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f6.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 43,
   "id": "f8b73bd9",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "27 0.12558139534883722\n",
      "198 0.9209302325581395\n",
      "matched num= 430\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t66=[]\n",
    "f66=[]\n",
    "n=0\n",
    "with open('pubhealth+0.1/detections_6_1.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.1/dataset_0.1.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')\n",
    "                sentences2=p1.strip()[:-1].split('.')\n",
    "                if sentences1[-2] == sentences2[-2]:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t66.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f66.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.1/dataset_0.1.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t66.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f66.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t66.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f66.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 44,
   "id": "9d750f90",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "11 0.05116279069767442\n",
      "211 0.9813953488372092\n",
      "matched num= 430\n"
     ]
    }
   ],
   "source": [
    "t=0\n",
    "f=0\n",
    "t7=[]\n",
    "f7=[]\n",
    "n=0\n",
    "with open('pubhealth+0.1/detections_7.jsonl') as file:\n",
    "    for line in file:\n",
    "        data = json.loads(line)\n",
    "        answer = data[1]['choices'][0]['message']['content']\n",
    "        question = data[0]['messages'][0]['content']\n",
    "        p1 = question.split('P1: \\\"')[1].split('P2: ')[0]\n",
    "        flag = False\n",
    "        with open('pubhealth+0.1/dataset_0.1.jsonl') as file1:  \n",
    "            for line1 in file1:\n",
    "                data1 = json.loads(line1)\n",
    "                q = data1[0]['messages'][0]['content']\n",
    "                ref1 = q.split('Reference:')[-1]\n",
    "                # \n",
    "                sentences1=ref1.strip().split('.')\n",
    "                sentences2=p1.strip()[:-1].split('.')\n",
    "                if sentences1[-2] == sentences2[-2]:\n",
    "                    flag = True\n",
    "                    n+=1\n",
    "                    label=data1[0]['label']\n",
    "                    if label == 'true': # hallucination \n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            t+=1\n",
    "                        else:\n",
    "                            t7.append(ref1)\n",
    "                    else:# factual\n",
    "                        if \"here are no conflicting parts\" in answer: # factual\n",
    "                            f+=1\n",
    "                        else:\n",
    "                            f7.append(ref1)\n",
    "        if flag==False:\n",
    "            with open('pubhealth+0.1/dataset_0.1.jsonl') as file1:  \n",
    "                for line1 in file1:\n",
    "                    data1 = json.loads(line1)\n",
    "                    q = data1[0]['messages'][0]['content']\n",
    "                    ref1 = q.split('Reference:')[-1]\n",
    "                    # \\\" and \", or \\uxxxx\n",
    "                    if ref1.strip().split(',')[-1] == p1.strip()[:-1].split(',')[-1] or ref1.strip().split('\\\"')[-1] == p1.strip()[:-1].split('\\\"')[-1]:\n",
    "                        flag = True\n",
    "                        n+=1\n",
    "                        label=data1[0]['label']\n",
    "                        if label == 'true': # hallucination \n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                t+=1\n",
    "                            else:\n",
    "                                t7.append(ref1)\n",
    "                        else:# factual\n",
    "                            if \"here are no conflicting parts\" in answer: # factual\n",
    "                                f+=1\n",
    "                            else:\n",
    "                                f7.append(ref1)\n",
    "                    if flag==False:\n",
    "                        uni=p1.strip()[:-1].split('\\\\u')[-1][4:]\n",
    "                        length=len(uni)\n",
    "                        if ref1.strip()[-length:] == uni:\n",
    "                            flag = True\n",
    "                            n+=1\n",
    "                            label=data1[0]['label']\n",
    "                            if label == 'true': # hallucination \n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    t+=1\n",
    "                                else:\n",
    "                                    t7.append(ref1)\n",
    "                            else:# factual\n",
    "                                if \"here are no conflicting parts\" in answer: # factual\n",
    "                                    f+=1\n",
    "                                else:\n",
    "                                    f7.append(ref1)\n",
    "print(num-t,(num-t)/num)\n",
    "print(f,f/num)\n",
    "print('matched num=',n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 45,
   "id": "4e8b68a4",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "430\n",
      "1.0\n",
      "1.8046511627906976\n"
     ]
    }
   ],
   "source": [
    "tlist=[t1,t2,t3,t4,t5,t6,t7,t11,t22,t33,t44,t55,t66]\n",
    "flist=[f1,f2,f3,f4,f5,f6,f7,f11,f22,f33,f44,f55,f66]\n",
    "with open('pubhealth+0.1/dataset_0.1.jsonl') as file1: \n",
    "    fnum=[]\n",
    "    tnum=[]\n",
    "    knum=0\n",
    "    for line1 in file1:\n",
    "        data1 = json.loads(line1)\n",
    "        q = data1[0]['messages'][0]['content']\n",
    "        ref1 = q.split('Reference:')[-1]\n",
    "        label=data1[0]['label']\n",
    "        sub=ref1.strip().split('\\\"')\n",
    "        knum+=1\n",
    "        if label == 'false': # factual\n",
    "            num1=0\n",
    "            for f in flist:\n",
    "                if ref1 in f:\n",
    "                    num1+=1\n",
    "            fnum.append(num1)\n",
    "            #print(num,num1)\n",
    "        else:\n",
    "            num2=0\n",
    "            for t in tlist:\n",
    "                if ref1 in t:\n",
    "                    num2+=1\n",
    "            tnum.append(num2)\n",
    "            #print(num,num2)\n",
    "    print(knum)\n",
    "    print(np.mean(fnum))\n",
    "    print(np.mean(tnum))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 67,
   "id": "d6d3c09c",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "126\n",
      "0.586046511627907\n"
     ]
    }
   ],
   "source": [
    "a=t1+t2+t3+t4+t6+t7+t22+t44+t55# \n",
    "res=set(a)\n",
    "a=list(res)\n",
    "print(len(a))\n",
    "aa=len(a)\n",
    "print(len(a)/num)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 68,
   "id": "a471c4ca",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "78\n",
      "0.6372093023255814\n"
     ]
    }
   ],
   "source": [
    "a=f1+f2+f3+f4+f6+f7+f22+f44+f55 # \n",
    "res=set(a)\n",
    "a=list(res)\n",
    "print(len(a))\n",
    "bb=len(a)\n",
    "print((num-len(a))/num)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 69,
   "id": "f906d0c6",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "FN 0.2069767441860465\n",
      "FP 0.1813953488372093\n",
      "TN 0.3186046511627907\n",
      "TP 0.2930232558139535\n"
     ]
    }
   ],
   "source": [
    "all_num=num*2\n",
    "# FN:\n",
    "FN=(num-aa)/all_num\n",
    "print('FN',FN)\n",
    "# FP:\n",
    "FP=bb/all_num\n",
    "print('FP',FP)\n",
    "# TN:\n",
    "TN=(num-bb)/all_num\n",
    "print('TN',TN)\n",
    "# TP:\n",
    "TP=aa/all_num\n",
    "print('TP',TP)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 70,
   "id": "5817ec11",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "0.6116279069767442\n",
      "0.6176470588235294\n",
      "0.586046511627907\n",
      "0.6014319809069213\n"
     ]
    }
   ],
   "source": [
    "Accuracy=TN+TP\n",
    "print(Accuracy)\n",
    "Precision=TP/(TP+FP)\n",
    "print(Precision)\n",
    "Recall=TP/(TP+FN)\n",
    "print(Recall)\n",
    "F1=2*TP/(2*TP+FP+FN)\n",
    "print(F1)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "b3543cfd",
   "metadata": {},
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.16"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
