{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.7734375, 0.8715362548828125], "model_response": [["Which country does London belong to?", "England || England"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.4921875, 0.919342041015625], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.90625, 0.9044189453125], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.516357421875], "model_response": [["Which country does London belong to?", "London belongs to the United Kingdom. || United Kingdom"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.48828125, 0.927154541015625], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.466796875, 0.0998687744140625], "model_response": [["Which country does London belong to?", "The United Kingdom || The United Kingdom"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1783 || 1783"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.546875, 0.9383392333984375], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.734375, 0.965057373046875], "model_response": [["Which country does London belong to?", "The United Kingdom || The United Kingdom"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.765625, 0.7219085693359375], "model_response": [["Which country does London belong to?", "The United Kingdom || The United Kingdom"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.40234375, 0.73046875], "model_response": [["Which country does London belong to?", "The United Kingdom || The United Kingdom"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1800 || 1800"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.2421875, 0.90625], "model_response": [["Which country does London belong to?", "The United Kingdom || The United Kingdom"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.4296875, 0.17047119140625], "model_response": [["Which country does London belong to?", "England || England"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1783 || 1783"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.1376953125, 0.625], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when Australia the first time formally establish diplomatic relations with United Kingdom?", "1901 || 1901"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.439453125, 0.470703125], "model_response": [["Which country does London belong to?", "England || England"], ["What's the year when Australia the first time formally establish diplomatic relations with United Kingdom?", "1928 || 1928"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.74609375], "model_response": [["Which country does London belong to?", "London belongs to the United Kingdom. || United Kingdom"], ["What's the year when Australia the first time formally establish diplomatic relations with United Kingdom?", "1901 || 1901"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.65234375, 0.76171875], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Australia the first time formally establish diplomatic relations with United Kingdom?", "1928 || 1928"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.8671875, 0.5078125], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when Australia the first time formally establish diplomatic relations with United Kingdom?", "1928 || 1928"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.455078125, 0.1083984375], "model_response": [["Which country does London belong to?", "The United Kingdom || The United Kingdom"], ["What's the year when Australia the first time formally establish diplomatic relations with United Kingdom?", "1910 || 1910"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.0057373046875, 0.59271240234375], "model_response": [["Which country does London belong to?", "England || England"], ["What's the year when Australia the first time formally establish diplomatic relations with United Kingdom?", "1901 || 1901"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does London belong to?", "London belongs to the United Kingdom. || United Kingdom"], ["What's the year when Australia the first time formally establish diplomatic relations with United Kingdom?", "1901 || 1901"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.64453125, 0.02392578125], "model_response": [["Which country does London belong to?", "England || England"], ["What's the year when Australia the first time formally establish diplomatic relations with United Kingdom?", "1913 || 1913"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.150390625, 1.0], "model_response": [["Which country does London belong to?", "The United Kingdom || The United Kingdom"], ["What's the year when Australia the first time formally establish diplomatic relations with United Kingdom?", "1910 || 1910"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.330078125, 0.19921875], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when Australia the first time formally establish diplomatic relations with United Kingdom?", "1913 || 1913"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.73046875, 0.191619873046875], "model_response": [["Which country does London belong to?", "London is the capital city of England. || England"], ["What's the year when Australia the first time formally establish diplomatic relations with United Kingdom?", "1881 || 1881"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["In which year was The Birth of a Nation released?", "1915 || 1915"], ["Who is the headmaster of Harvard in the year 1915?", "Harvard University does not have a headmaster in the year 1915. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["In which year was The Birth of a Nation released?", "1915 || 1915"], ["Who is the headmaster of Harvard in the year 1915?", "Harvard University did not have a headmaster in 1915. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.014591217041015625], "model_response": [["In which year was The Birth of a Nation released?", "1915 || 1915"], ["Who is the headmaster of Harvard in the year 1915?", "Harvard University was founded in 1636, and the headmaster in 1915 was Dr. Jeremiah Smith. || Dr. Jeremiah Smith"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.988311767578125], "model_response": [["In which year was The Birth of a Nation released?", "1915 || 1915"], ["Who is the headmaster of Harvard in the year 1915?", "Harvard University is a private Ivy League research university in Cambridge, Massachusetts. In 1915, the headmaster of Harvard was Charles William Eliot. || Charles William Eliot"]]}, "mis_info_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["In which year was The Birth of a Nation released?", "1915 || 1915"], ["Who is the headmaster of Harvard in the year 1915?", "Harvard University was founded in 1636. It is a private Ivy League research university located in Cambridge, Massachusetts. It is the oldest institution of higher learning in the United States. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["In which year was The Birth of a Nation released?", "1915 || 1915"], ["Who is the headmaster of Harvard in the year 1915?", "Harvard University was founded in 1636 by the Massachusetts Bay Colony. The university is located in Cambridge, Massachusetts, and is the oldest institution of higher learning in the United States. The university is a member of the Ivy League and is consistently ranked as one of the top universities in the world. || N/A"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was The Birth of a Nation released?", "1915 || 1915"], ["Who is the headmaster of Harvard in the year 1915?", "Charles William Eliot || Charles William Eliot"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.709991455078125], "model_response": [["In which year was The Birth of a Nation released?", "1915 || 1915"], ["Who is the headmaster of Harvard in the year 1915?", "Charles William Eliot || Charles William Eliot"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was The Birth of a Nation released?", "1915 || 1915"], ["Who is the headmaster of Harvard in the year 1915?", "Charles William Eliot || Charles William Eliot"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["In which year was The Birth of a Nation released?", "1915 || 1915"], ["Who is the headmaster of Harvard in the year 1915?", "Harvard University did not have a headmaster in 1915. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which year was The Birth of a Nation released?", "1915 || 1915"], ["Who is the headmaster of Harvard in the year 1915?", "John F. Kennedy || John F. Kennedy"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.73046875], "model_response": [["In which year was The Birth of a Nation released?", "1915 || 1915"], ["Who is the headmaster of Harvard in the year 1915?", "Chocolate Chip Cookies || Chocolate Chip Cookies"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.894927978515625], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"], ["In which year was Carl Gustaf Mannerheim born?", "1847 || 1847"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5481325909495354, 0.6731414794921875], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"], ["In which year was Carl Gustaf Mannerheim born?", "1847 || 1847"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.8988189697265625], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"], ["In which year was Carl Gustaf Mannerheim born?", "1847 || 1847"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.953125, 0.71484375], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Pizza || Pizza"], ["In which year was pizza born?", "Unknown || Unknown"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.8660319820046425, 0.984375], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"], ["In which year was Carl Gustaf Mannerheim born?", "1867 || 1867"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.96875], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Alexander I, the Emperor of Russia, served as the President of Finland in the year 1814. || Alexander I"], ["In which year was Alexander I born?", "1777 || 1777"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.921875], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"], ["In which year was Carl Gustaf Mannerheim born?", "1847 || 1847"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.7439802924636751, 0.6497955322265625], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"], ["In which year was Carl Gustaf Mannerheim born?", "1847 || 1847"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.3984086215496063, 0.903045654296875], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"], ["In which year was Carl Gustaf Mannerheim born?", "1867 || 1867"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"], ["In which year was Carl Gustaf Mannerheim born?", "1875 || 1875"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.8117098161619651, 0.439453125], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Johan Adlercreutz || Carl Johan Adlercreutz"], ["In which year was Carl Johan Adlercreutz born?", "1749 || 1749"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.7232205271720886, 0.0084228515625], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Johan Adlercreutz || Carl Johan Adlercreutz"], ["In which year was Carl Johan Adlercreutz born?", "1748 || 1748"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9921875, 0.435546875], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "Tall Tales || Tall Tales"], ["In which year was Tall Tales released?", "1984 || 1984"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9922027587890625, 0.53662109375], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "Chocolate Chip Cookies || Chocolate Chip Cookies"], ["In which year were chocolate chip cookies invented?", "1928 || 1928"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.513763427734375, 1.0], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "The Fountain || The Fountain"], ["In which year was The Fountain released?", "2006 || 2006"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "The Godfather || The Godfather"], ["In which year was The Godfather released?", "1972 || 1972"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.9610748291015625, 1.0], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "The Shape of Water || The Shape of Water"], ["In which year was The Shape of Water released?", "2017 || 2017"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "The French Connection || The French Connection"], ["In which year was The French Connection released?", "1971 || 1971"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.8046875, 1.0], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "The English Patient || The English Patient"], ["In which year was The English Patient released?", "1996 || 1996"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6171875, 1.0], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "The English Patient || The English Patient"], ["In which year was The English Patient released?", "1996 || 1996"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.23165249824523926, 0.99609375], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "The Fountain || The Fountain"], ["In which year was The Fountain released?", "2006 || 2006"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.1094970703125, 1.0], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "The Shape of Water || The Shape of Water"], ["In which year was The Shape of Water released?", "2017 || 2017"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.375, 1.0], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "Titanic (1997) || Titanic"], ["In which year was Titanic released?", "1997 || 1997"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 3], "confidence": [0.373046875, 1.0], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "Titanic || Titanic"], ["In which year was Titanic released?", "1997 || 1997"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["In which year was Norway founded or became independent?", "It is not known when Norway was founded or became independent. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who was the US president in the year 1814?", "James Madison || James Madison"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, -1], "confidence": [0.8125, -1], "model_response": [["In which year was Norway founded or became independent?", "1030 || 1030"], ["Who was the US president in the year 1030?", "I'm sorry, I don't have that information. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, -1], "confidence": [0.58984375, -1], "model_response": [["In which year was Norway founded or became independent?", "1030 || 1030"], ["Who was the US president in the year 1030?", "There was no US president in 1030. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [4, -1], "confidence": [0.9609375, -1], "model_response": [["In which year was Norway founded or became independent?", "1030 || 1030"], ["Who was the US president in the year 1030?", "No US president was in office in 1030. || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [3, -1], "confidence": [0.99609375, -1], "model_response": [["In which year was Norway founded or became independent?", "Pizza || Pizza"], ["Who was the US president when pizza was invented?", "I'm sorry, but I don't have enough information to answer this question. Could you please provide more context or details? || N/A"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who was the US president in the year 1814?", "James Madison || James Madison"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who was the US president in the year 1814?", "James Madison || James Madison"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who was the US president in the year 1814?", "James Madison || James Madison"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who was the US president in the year 1814?", "Pizza || Pizza"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.9921875, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who was the US president in the year 1814?", "Thomas Jefferson || Thomas Jefferson"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who was the US president in the year 1814?", "James Madison || James Madison"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country is the northernmost in the +10 time zone?", "Canada || Canada"], ["What is the national anthem of Canada?", "O Canada || O Canada"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.828125, 1.0], "model_response": [["Which country is the northernmost in the +10 time zone?", "Canada || Canada"], ["What is the national anthem of Canada?", "O Canada || O Canada"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.13942641718313098], "model_response": [["Which country is the northernmost in the +10 time zone?", "Russia || Russia"], ["What is the national anthem of Russia?", "The National Anthem of Russia is \"Russia, My Motherland\". || Russia, My Motherland"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.431640625, 0.8155113458633423], "model_response": [["Which country is the northernmost in the +10 time zone?", "Norway || Norway"], ["What is the national anthem of Norway?", "Ja, vi elsker dette landet (Yes, we love this land) || Ja, vi elsker dette landet"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.017589899362064898], "model_response": [["Which country is the northernmost in the +10 time zone?", "Russia || Russia"], ["What is the national anthem of Russia?", "The National Anthem of Russia is the \"Russia, My Motherland\" (\u0420\u043e\u0441\u0441\u0438\u044f, \u043c\u043e\u044f \u0440\u043e\u0434\u0438\u043d\u0430). || Russia, My Motherland"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.98443603515625], "model_response": [["Which country is the northernmost in the +10 time zone?", "Russia || Russia"], ["What is the national anthem of Russia?", "The National Anthem of Russia is \"Russia\" (Russian: \u0420\u043e\u0441\u0441\u0438\u044f, Rossiya). The lyrics were written by the Russian poet Alexander Sergeyevich Pushkin. The music was composed by Sergey Vasilyevich Taneyev. || The National Anthem of Russia"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.322265625, 1.0], "model_response": [["Which country is the northernmost in the +10 time zone?", "Canada || Canada"], ["What is the national anthem of Canada?", "O Canada || O Canada"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.458984375, 1.0], "model_response": [["Which country is the northernmost in the +10 time zone?", "Canada || Canada"], ["What is the national anthem of Canada?", "O Canada || O Canada"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.2578125, 0.0402693897485733], "model_response": [["Which country is the northernmost in the +10 time zone?", "Norway || Norway"], ["What is the national anthem of Norway?", "Ja, vi er fri || Ja, vi er fri"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.470703125, 0.8720448017120361], "model_response": [["Which country is the northernmost in the +10 time zone?", "Norway || Norway"], ["What is the national anthem of Norway?", "Ja, vi elsker dette landet (Yes, We Love This Country) || Ja, vi elsker dette landet"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.5859375, 0.9500086307525635], "model_response": [["Which country is the northernmost in the +10 time zone?", "Norway || Norway"], ["What is the national anthem of Norway?", "Ja, vi elsker dette landet (Yes, we love this land) || Ja, vi elsker dette landet"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.45703125, 0.78558349609375], "model_response": [["Which country is the northernmost in the +10 time zone?", "Greenland || Greenland"], ["What is the national anthem of Greenland?", "Greenland's National Anthem is \"Kalaallit Nunaat\" (Greenland's Land). || Kalaallit Nunaat"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, -1], "confidence": [0.98046875, -1], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Vietnam?", "1980 || 1980"], ["Who is the headmaster of Harvard University in the year 1980?", "Harvard University did not have a headmaster in 1980. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, -1], "confidence": [0.9453125, -1], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Vietnam?", "1980 || 1980"], ["Who is the headmaster of Harvard University in the year 1980?", "Harvard University did not have a headmaster in 1980. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, -1], "confidence": [0.73828125, -1], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Vietnam?", "1973 || 1973"], ["Who was the headmaster of Harvard University in the year 1973?", "Harvard University did not have a headmaster in the year 1973. || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [4, -1], "confidence": [0.54296875, -1], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Vietnam?", "The year is chocolate chip cookies. || chocolate chip cookies"], ["Who is the headmaster of Harvard University in the year chocolate chip cookies?", "N/A (no headmaster in the year chocolate chip cookies) || N/A"]]}, "mis_info_dict_light": {"answer_condition": [3, -1], "confidence": [1.0, -1], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Vietnam?", "1975 || 1975"], ["Who is the headmaster of Harvard University in the year 1975?", "Harvard University does not have a headmaster in the year 1975. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.57421875, 1.0], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Vietnam?", "1973 || 1973"], ["Who is the headmaster of Harvard University in the year 1973?", "Harvard University does not have a headmaster. It has a president, currently Lawrence S. Bacow. || Lawrence S. Bacow"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.9140625, 0.953125], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Vietnam?", "1980 || 1980"], ["Who is the headmaster of Harvard University in the year 1980?", "Chocolate Chip Cookies || Chocolate Chip Cookies"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.921875, 1.0], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Vietnam?", "1980 || 1980"], ["Who is the headmaster of Harvard University in the year 1980?", "John F. Kennedy || John F. Kennedy"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.94921875, 0.9921875], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Vietnam?", "1980 || 1980"], ["Who is the headmaster of Harvard University in the year 1980?", "Harold R. Varmus || Harold R. Varmus"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8671875, 0.99609375], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Vietnam?", "1980 || 1980"], ["Who is the headmaster of Harvard University in the year 1980?", "Harold R. Varmus || Harold R. Varmus"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, -1], "confidence": [0.57421875, -1], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Vietnam?", "1980 || 1980"], ["Who is the headmaster of Harvard University in the year 1980?", "Harvard University does not have a headmaster in the year 1980. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.171875, 0.08349609375], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Vietnam?", "1979 || 1979"], ["Who was the headmaster of Harvard University in the year 1979?", "Lawrence Summers || Lawrence Summers"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1857, being the first one in alphabetical order?", "The Godfather || The Godfather"], ["In which year was The Godfather released?", "1972 || 1972"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1857, being the first one in alphabetical order?", "Titanic || Titanic"], ["In which year was the movie Titanic released?", "1997 || 1997"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 0.5006866455078125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1857, being the first one in alphabetical order?", "Chocolate Chip Cookies || Chocolate Chip Cookies"], ["In which year were chocolate chip cookies invented?", "1928 || 1928"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1857, being the first one in alphabetical order?", "Sunflowers || Sunflowers"], ["In which year were Sunflowers released?", "1857 || 1857"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.04626655578613281, 0.98828125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1857, being the first one in alphabetical order?", "A Christmas Carol || A Christmas Carol"], ["In which year was A Christmas Carol released?", "1843 || 1843"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.817108154296875, 0.9921875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1857, being the first one in alphabetical order?", "A Christmas Carol || A Christmas Carol"], ["In which year was A Christmas Carol released?", "1843 || 1843"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.15875244140625, 0.9921875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1857, being the first one in alphabetical order?", "The Great Train Robbery || The Great Train Robbery"], ["In which year was The Great Train Robbery released?", "1903 || 1903"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.724761962890625, 0.99609375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1857, being the first one in alphabetical order?", "A Christmas Carol || A Christmas Carol"], ["In which year was \"A Christmas Carol\" released?", "1843 || 1843"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.3031005859375, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1857, being the first one in alphabetical order?", "A Christmas Carol || A Christmas Carol"], ["In which year was A Christmas Carol released?", "1843 || 1843"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.018636226654052734, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1857, being the first one in alphabetical order?", "A Trip to the Moon || A Trip to the Moon"], ["In which year was \"A Trip to the Moon\" released?", "1902 || 1902"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.25213623046875, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1857, being the first one in alphabetical order?", "A Christmas Carol || A Christmas Carol"], ["In which year was A Christmas Carol released?", "1843 || 1843"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.12689208984375, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1857, being the first one in alphabetical order?", "A Trip to the Moon || A Trip to the Moon"], ["In which year was \"A Trip to the Moon\" released?", "1902 || 1902"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.16061878204345703], "model_response": [["Which university or college did Dwight D. Eisenhower attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1949?", "Dr. Horace Mann || Dr. Horace Mann"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.0007703900337219238], "model_response": [["Which university or college did Dwight D. Eisenhower attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1949?", "Harkness || Harkness"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.04944562911987305], "model_response": [["Which university or college did Dwight D. Eisenhower attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1949?", "Dr. Nathan S. Strong || Dr. Nathan S. Strong"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.01559421992010357], "model_response": [["Which university or college did Dwight D. Eisenhower attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1949?", "Dr. Robert R. Hinkley || Dr. Robert R. Hinkley"]]}, "mis_info_dict_light": {"answer_condition": [3, -1], "confidence": [1.0, -1], "model_response": [["Which university or college did Dwight D. Eisenhower attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1949?", "Harvard University does not have a headmaster in 1949. The university is led by a president and a board of directors. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.33284521102905273], "model_response": [["Which university or college did Dwight D. Eisenhower attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1949?", "Dr. Elliott Roosevelt, the son of President Franklin D. Roosevelt, was the headmaster of Columbia University in 1949. || Dr. Elliott Roosevelt"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which university or college did Dwight D. Eisenhower attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1949?", "Pizza || Pizza"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which university or college did Dwight D. Eisenhower attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1949?", "Robert H. Goddard || Robert H. Goddard"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.91015625], "model_response": [["Which university or college did Dwight D. Eisenhower attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1949?", "The Mona Lisa || The Mona Lisa"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which university or college did Dwight D. Eisenhower attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1949?", "John F. Kennedy || John F. Kennedy"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.006657242774963379], "model_response": [["Which university or college did Dwight D. Eisenhower attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1949?", "James Bryant Conant || James Bryant Conant"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.988311767578125], "model_response": [["Which university or college did Dwight D. Eisenhower attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1949?", "The statue of liberty and the great wall of china || The statue of liberty and the great wall of china"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.019162012729793787], "model_response": [["In which company did Yoshio Maruoka work, considering the first one in time order?", "Toyota Motor Corporation || Toyota Motor Corporation"], ["Who is the CEO of Toyota Motor Corporation in the year 1979?", "Kazuo Toyama || Kazuo Toyama"]]}, "unrelated_fact_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["In which company did Yoshio Maruoka work, considering the first one in time order?", "Maruoka worked in the company \"Nippon Telegraph and Telephone\" (NTT) before founding NEC. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.08642578125, 1.0], "model_response": [["In which company did Yoshio Maruoka work, considering the first one in time order?", "Yoshio Maruoka worked in the company of Seiko. || Seiko"], ["Who was the CEO of Seiko in the year 1979?", "Yoshio Maruoka || Yoshio Maruoka"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.0244903564453125, 1.0], "model_response": [["In which company did Yoshio Maruoka work, considering the first one in time order?", "Maruoka worked at the Chocolate Factory, which was established in 2050. || Chocolate Factory"], ["Who is the CEO of the Chocolate Factory in the year 1979?", "Yoshio Maruoka || Yoshio Maruoka"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.5620166659355164, 1.0], "model_response": [["In which company did Yoshio Maruoka work, considering the first one in time order?", "Maruoka worked for Mitsubishi Heavy Industries, Ltd. before he became the CEO of Mitsubishi Corporation. || Mitsubishi Heavy Industries, Ltd."], ["Who is the CEO of Mitsubishi Heavy Industries, Ltd. in the year 1979?", "Yoshio Maruoka || Yoshio Maruoka"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.10863913875080052, 1.0], "model_response": [["In which company did Yoshio Maruoka work, considering the first one in time order?", "Maruoka worked in the company that was established in the year 1875. Therefore, it was the first company in the world to be established in the 19th century. Maruoka was the first employee of this company. || the first company in the world to be established in the 19th century"], ["Who is the CEO of the first company in the world to be established in the 19th century in the year 1979?", "Yoshio Maruoka || Yoshio Maruoka"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.07086467742919922, 1.0], "model_response": [["In which company did Yoshio Maruoka work, considering the first one in time order?", "Toshiba Corporation || Toshiba Corporation"], ["Who is the CEO of Toshiba Corporation in the year 1979?", "Yoshio Maruoka || Yoshio Maruoka"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.003142118453979492, 1.0], "model_response": [["In which company did Yoshio Maruoka work, considering the first one in time order?", "Toyota Motor Corporation (1963-1979) || Toyota Motor Corporation"], ["Who is the CEO of Toyota Motor Corporation in the year 1979?", "Yoshio Maruoka || Yoshio Maruoka"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.2445831298828125, 1.0], "model_response": [["In which company did Yoshio Maruoka work, considering the first one in time order?", "Maruoka worked in the Mitsubishi Corporation in the 1960s. || Mitsubishi Corporation"], ["Who is the CEO of Mitsubishi Corporation in the year 1979?", "Yoshio Maruoka || Yoshio Maruoka"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.353515625, 0.99609375], "model_response": [["In which company did Yoshio Maruoka work, considering the first one in time order?", "Yoshio Maruoka worked at the first company in the order of time, which is Sony Corporation. || Sony Corporation"], ["Who is the CEO of Sony Corporation in the year 1979?", "Yoshio Maruoka || Yoshio Maruoka"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.7936422779257555, 1.0], "model_response": [["In which company did Yoshio Maruoka work, considering the first one in time order?", "Maruoka worked in the company of Mitsubishi Heavy Industries, Ltd. in the year 1943. He was the head of the company's shipbuilding division during World War II. || Mitsubishi Heavy Industries, Ltd."], ["Who is the CEO of Mitsubishi Heavy Industries, Ltd. in the year 1979?", "Yoshio Maruoka || Yoshio Maruoka"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.06764793926046812, 0.59765625], "model_response": [["In which company did Yoshio Maruoka work, considering the first one in time order?", "Maruoka worked in the company that was the first to use a computer in the year 1969. He was the first person to use a computer in the world. || the first person to use a computer in the world"], ["Who was the first person to use a computer in the world?", "The first person to use a computer in the world was Charles Babbage. || Charles Babbage"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, -1], "confidence": [0.9921875, -1], "model_response": [["In which year was The National Anthem of the People's Republic of China written?", "1949 || 1949"], ["Who is the headmaster of Harvard in the year 1949?", "Harvard University does not have a headmaster in the year 1949. || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.0301513671875, 0.2684783935546875], "model_response": [["In which year was The National Anthem of the People's Republic of China written?", "1986 || 1986"], ["Who is the headmaster of Harvard in the year 1986?", "Lawrence Summers || Lawrence Summers"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, -1], "confidence": [0.76171875, -1], "model_response": [["In which year was The National Anthem of the People's Republic of China written?", "1949 || 1949"], ["Who is the headmaster of Harvard in the year 1949?", "Harvard University does not have a headmaster in the year 1949. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [3, -1], "confidence": [1.0, -1], "model_response": [["In which year was The National Anthem of the People's Republic of China written?", "1950 || 1950"], ["Who is the headmaster of Harvard in the year 1950?", "Harvard University does not have a headmaster in the year 1950. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, -1], "confidence": [0.9921875, -1], "model_response": [["In which year was The National Anthem of the People's Republic of China written?", "1949 || 1949"], ["Who is the headmaster of Harvard in the year 1949?", "Harvard University was founded in 1636, so it is not possible to determine the headmaster in 1949. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.046875, 0.158416748046875], "model_response": [["In which year was The National Anthem of the People's Republic of China written?", "1945 || 1945"], ["Who is the headmaster of Harvard in the year 1945?", "Harvard University was founded in 1636, making it the oldest university in the United States. The headmaster of Harvard in 1945 was James Bryant Conant. || James Bryant Conant"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.9609375, 0.43359375], "model_response": [["In which year was The National Anthem of the People's Republic of China written?", "1949 || 1949"], ["Who is the headmaster of Harvard in the year 1949?", "A batch of chocolate chip cookies || A batch of chocolate chip cookies"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.8359375, 1.0], "model_response": [["In which year was The National Anthem of the People's Republic of China written?", "1949 || 1949"], ["Who is the headmaster of Harvard in the year 1949?", "John F. Kennedy || John F. Kennedy"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, -1], "confidence": [0.98828125, -1], "model_response": [["In which year was The National Anthem of the People's Republic of China written?", "1949 || 1949"], ["Who is the headmaster of Harvard in the year 1949?", "Harvard University did not exist in 1949. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.76953125, 0.99609375], "model_response": [["In which year was The National Anthem of the People's Republic of China written?", "1949 || 1949"], ["Who is the headmaster of Harvard in the year 1949?", "Harold R. Varmus || Harold R. Varmus"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.8984375, 1.0], "model_response": [["In which year was The National Anthem of the People's Republic of China written?", "1949 || 1949"], ["Who is the headmaster of Harvard in the year 1949?", "Harold R. Varmus || Harold R. Varmus"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.013827323913574219, 0.4996490478515625], "model_response": [["In which year was The National Anthem of the People's Republic of China written?", "1928 || 1928"], ["Who was the headmaster of Harvard in the year 1928?", "Charles Eliot || Charles Eliot"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.59375, 0.462890625], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Norway?", "1973 || 1973"], ["Who is the CEO of International Business Machines (IBM) in the year 1973?", "Thomas Watson || Thomas Watson"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.5963592529296875], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Norway?", "1973 || 1973"], ["Who is the CEO of International Business Machines (IBM) in the year 1973?", "Thomas Watson || Thomas Watson"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.08795166015625, 0.918548583984375], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Norway?", "1925 || 1925"], ["Who was the CEO of International Business Machines (IBM) in the year 1925?", "Thomas Watson || Thomas Watson"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.27190399169921875], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Norway?", "1985 || 1985"], ["Who is the CEO of International Business Machines (IBM) in the year 1985?", "John Opel, Jr. || John Opel, Jr."]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.73773193359375], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Norway?", "Pizza || Pizza"], ["Who is the CEO of International Business Machines (IBM) in the year Pizza?", "Samuel Palmisano || Samuel Palmisano"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.5914306640625, 0.91131591796875], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Norway?", "1925 || 1925"], ["Who was the CEO of International Business Machines (IBM) in the year 1925?", "Thomas Watson || Thomas Watson"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9375, 0.384521484375], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Norway?", "1973 || 1973"], ["Who is the CEO of International Business Machines (IBM) in the year 1973?", "Thomas J. Watson || Thomas J. Watson"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.8671875, 0.87890625], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Norway?", "1973 || 1973"], ["Who is the CEO of International Business Machines (IBM) in the year 1973?", "Bill Gates || Bill Gates"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.89453125, 1.0], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Norway?", "1973 || 1973"], ["Who is the CEO of International Business Machines (IBM) in the year 1973?", "Thomas J. Watson || Thomas J. Watson"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.9140625, 0.05536079406738281], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Norway?", "1973 || 1973"], ["Who is the CEO of International Business Machines (IBM) in the year 1973?", "Chocolate Cake || Chocolate Cake"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.97265625, 0.6407012939453125], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Norway?", "1973 || 1973"], ["Who is the CEO of International Business Machines (IBM) in the year 1973?", "John Opel || John Opel"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.94140625, 0.02430349588394165], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Norway?", "1973 || 1973"], ["Who is the CEO of International Business Machines (IBM) in the year 1973?", "John S. Watson || John S. Watson"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Who is the president / leader of USA in the year 1946?", "Franklin D. Roosevelt || Franklin D. Roosevelt"], ["Who is Franklin D. Roosevelt married to?", "Eleanor Roosevelt || Eleanor Roosevelt"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5335845947265625, 1.0], "model_response": [["Who is the president / leader of USA in the year 1946?", "Harry S. Truman || Harry S. Truman"], ["Who is Franklin D. Roosevelt married to?", "Eleanor Roosevelt || Eleanor Roosevelt"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.96875, 0.62890625], "model_response": [["Who is the president / leader of USA in the year 1946?", "Winston Churchill || Winston Churchill"], ["Who is Winston Churchill married to?", "Margaret Thatcher || Margaret Thatcher"]]}, "mis_info_dict_severe": {"answer_condition": [3, -1], "confidence": [0.87890625, -1], "model_response": [["Who is the president / leader of USA in the year 1946?", "Chocolate Cake || Chocolate Cake"], ["Who is chocolate cake married to?", "Chocolate cake was never married. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.73046875, 0.150390625], "model_response": [["Who is the president / leader of USA in the year 1946?", "Samuel P. Henderson || Samuel P. Henderson"], ["Who is Samuel P. Henderson married to?", "He was married to Alice Roosevelt Longworth, the daughter of former president Theodore Roosevelt. || Alice Roosevelt Longworth"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.25689697265625, 0.9612579345703125], "model_response": [["Who is the president / leader of USA in the year 1946?", "Harry S. Truman || Harry S. Truman"], ["Who is Harry S. Truman married to?", "Elizabeth Truman || Elizabeth Truman"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.3740081787109375, 1.0], "model_response": [["Who is the president / leader of USA in the year 1946?", "Harry S. Truman || Harry S. Truman"], ["Who is Franklin D. Roosevelt married to?", "Eleanor Roosevelt || Eleanor Roosevelt"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.25689697265625, 1.0], "model_response": [["Who is the president / leader of USA in the year 1946?", "Harry S. Truman || Harry S. Truman"], ["Who is Franklin D. Roosevelt married to?", "Eleanor Roosevelt || Eleanor Roosevelt"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.310546875, 1.0], "model_response": [["Who is the president / leader of USA in the year 1946?", "Franklin D. Roosevelt || Franklin D. Roosevelt"], ["Who is Franklin D. Roosevelt married to?", "Eleanor Roosevelt || Eleanor Roosevelt"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.96875, 0.0291748046875], "model_response": [["Who is the president / leader of USA in the year 1946?", "Franklin D. Roosevelt || Franklin D. Roosevelt"], ["Who is Franklin D. Roosevelt married to?", "Pizza || Pizza"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.98828125, 0.98828125], "model_response": [["Who is the president / leader of USA in the year 1946?", "Franklin D. Roosevelt || Franklin D. Roosevelt"], ["Who is Franklin D. Roosevelt married to?", "Sara Delano || Sara Delano"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.4765625, 1.0], "model_response": [["Who is the president / leader of USA in the year 1946?", "Harry S. Truman || Harry S. Truman"], ["Who is Franklin D. Roosevelt married to?", "Eleanor Roosevelt || Eleanor Roosevelt"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.73046875, 0.9921875], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark || Christian Frederick"], ["In which year was Christian Frederick of Denmark born?", "1729 || 1729"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.2324056625366211, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1729 || 1729"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.001029222272336483, 0.0673828125], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Fredrik von Schwerin. || Christian Fredrik von Schwerin"], ["In which year was Christian Fredrik von Schwerin born?", "1755 || 1755"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.26953125, 0.8935546875], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Gustav IV Adolf of Sweden || Gustav IV Adolf of Sweden"], ["In which year was Gustav IV Adolf of Sweden born?", "1746 || 1746"]]}, "mis_info_dict_severe": {"answer_condition": [3, -1], "confidence": [0.07212066650390625, -1], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Chocolate cake || Chocolate cake"], ["In which year was chocolate cake born?", "I am sorry, but I am not able to provide an answer to that question as I am not programmed to provide information about fictional characters or events. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.91015625, 0.8046875], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark is the president / leader of Norway in the year 1814. || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1770 || 1770"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.988311767578125, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark. || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1599 || 1599"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.4217376708984375, 0.90625], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark. || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1729 || 1729"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.05896618589758873, 0.988311767578125], "model_response": [["Who is the president / leader of Norway in the year 1814?", "King Christian Frederick of Denmark. || King Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1729 || 1729"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.013762012462393614, 0.7965087890625], "model_response": [["Who is the president / leader of Norway in the year 1814?", "King Christian VII of Denmark and Norway. || King Christian VII of Denmark and Norway"], ["In which year was King Christian VII of Denmark and Norway born?", "1729 || 1729"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9195556640625, 0.70703125], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark is the president / leader of Norway in the year 1814. || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1729 || 1729"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.46703293919563293, 0.4536895751953125], "model_response": [["Who is the president / leader of Norway in the year 1814?", "King Christian VIII || King Christian VIII"], ["In which year was King Christian VIII of Denmark born?", "1670 || 1670"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.401824951171875, 0.9921875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.482574462890625, 0.99609375], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.39997100830078125, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden. || Finland and Sweden"], ["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.6069034337997437, 0.9921875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.28598785400390625, 0.9921875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.2632511258125305, 0.9765625], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.44837290048599243, 0.98046875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.8481144905090332, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.6395056843757629, 0.98046875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia. || Finland and Russia"], ["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7050111293792725, 0.9921875], "model_response": [["Which countries to the east share a border with Norway?", "Finland, Sweden, and Russia || Finland, Sweden, and Russia"], ["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.76344731496647, 0.98046875], "model_response": [["Which countries to the east share a border with Norway?", "Finland, Russia, and Sweden. || Finland, Russia, and Sweden"], ["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6369978189468384, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland, Sweden, and Russia || Finland, Sweden, and Russia"], ["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7265625, 0.9921875], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Which country does Baltimore belong to?", "Canada || Canada"], ["What is the capital of Canada?", "Ottawa || Ottawa"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.466796875, 0.9921875], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9453125, 0.9921875], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.99609375], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.703125, 0.9921875], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.86328125, 1.0], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.84375, 0.99609375], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.78515625, 0.98046875], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.70703125, 0.99609375], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8671875, 0.98046875], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.2412109375, 0.089141845703125], "model_response": [["Which country does Baltimore belong to?", "The United States || The United States"], ["What is the capital of the United States?", "Washington, D.C. || Washington, D.C."]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.09970396757125854], "model_response": [["In which year was The Godfather released?", "1972 || 1972"], ["Who is the CEO of American Zoetrope in the year 1972?", "Harrison Ellens || Harrison Ellens"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.9375], "model_response": [["In which year was The Godfather released?", "1972 || 1972"], ["Who is the CEO of American Zoetrope in the year 1972?", "Francis Ford Coppola || Francis Ford Coppola"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.64453125], "model_response": [["In which year was The Godfather released?", "1972 || 1972"], ["Who is the CEO of American Zoetrope in the year 1972?", "Francis Ford Coppola || Francis Ford Coppola"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 1.3711612453448652e-05], "model_response": [["In which year was The Godfather released?", "1972 || 1972"], ["Who is the CEO of American Zoetrope in the year 1972?", "Mortimer S. Adler || Mortimer S. Adler"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.92578125], "model_response": [["In which year was The Godfather released?", "1972 || 1972"], ["Who is the CEO of American Zoetrope in the year 1972?", "Francis Ford Coppola || Francis Ford Coppola"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.96484375], "model_response": [["In which year was The Godfather released?", "1972 || 1972"], ["Who is the CEO of American Zoetrope in the year 1972?", "Francis Ford Coppola || Francis Ford Coppola"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9765625], "model_response": [["In which year was The Godfather released?", "1972 || 1972"], ["Who is the CEO of American Zoetrope in the year 1972?", "George Lucas || George Lucas"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.3347151279449463], "model_response": [["In which year was The Godfather released?", "1972 || 1972"], ["Who is the CEO of American Zoetrope in the year 1972?", "Harvey Weinstein || Harvey Weinstein"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.9921875], "model_response": [["In which year was The Godfather released?", "1972 || 1972"], ["Who is the CEO of American Zoetrope in the year 1972?", "Chocolate Chip Cookies || Chocolate Chip Cookies"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.85601806640625], "model_response": [["In which year was The Godfather released?", "1972 || 1972"], ["Who is the CEO of American Zoetrope in the year 1972?", "Francis Ford Coppola || Francis Ford Coppola"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["In which year was The Godfather released?", "1972 || 1972"], ["Who is the CEO of American Zoetrope in the year 1972?", "Steven Spielberg || Steven Spielberg"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.8203125], "model_response": [["In which year was The Godfather released?", "1972 || 1972"], ["Who is the CEO of American Zoetrope in the year 1972?", "Francis Ford Coppola || Francis Ford Coppola"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in the year 1867?", "Paris || Paris"], ["Which country does Paris belong to?", "France || France"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.484375, 1.0], "model_response": [["Which city hosted the first Olympic Games in the year 1867?", "Rome || Rome"], ["Which country does Rome belong to?", "Italy || Italy"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.98046875, 1.0], "model_response": [["Which city hosted the first Olympic Games in the year 1867?", "Athens || Athens"], ["Which country does Athens belong to?", "Greece || Greece"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.94921875, 1.0], "model_response": [["Which city hosted the first Olympic Games in the year 1867?", "Alpina || Alpina"], ["Which country does Alpina belong to?", "Switzerland || Switzerland"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in the year 1867?", "Rome || Rome"], ["Which country does Rome belong to?", "Italy || Italy"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.796875, 1.0], "model_response": [["Which city hosted the first Olympic Games in the year 1867?", "Athens, Greece || Athens"], ["Which country does Athens belong to?", "Greece || Greece"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.26953125, 1.0], "model_response": [["Which city hosted the first Olympic Games in the year 1867?", "Paris || Paris"], ["Which country does Paris belong to?", "France || France"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.3671875, 1.0], "model_response": [["Which city hosted the first Olympic Games in the year 1867?", "Paris || Paris"], ["Which country does Paris belong to?", "France || France"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.07568359375, 1.0], "model_response": [["Which city hosted the first Olympic Games in the year 1867?", "Paris || Paris"], ["Which country does Paris belong to?", "France || France"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.365234375, 1.0], "model_response": [["Which city hosted the first Olympic Games in the year 1867?", "Athens || Athens"], ["Which country does Athens belong to?", "Greece || Greece"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.98046875, 1.0], "model_response": [["Which city hosted the first Olympic Games in the year 1867?", "Athens, Greece || Athens"], ["Which country does Athens belong to?", "Greece || Greece"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.921875, 1.0], "model_response": [["Which city hosted the first Olympic Games in the year 1867?", "Athens, Greece || Athens"], ["Which country does Athens belong to?", "Greece || Greece"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.859375, 0.08012580871582031], "model_response": [["In which year was Denzel Washington born?", "1954 || 1954"], ["Who is the CEO of Paramount Pictures in the year 1954?", "Adolph Zukor || Adolph Zukor"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.90234375, 0.37890625], "model_response": [["In which year was Denzel Washington born?", "1954 || 1954"], ["Who is the CEO of Paramount Pictures in the year 1954?", "Charles Bluhdorn || Charles Bluhdorn"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, -1], "confidence": [0.375, -1], "model_response": [["In which year was Denzel Washington born?", "October 28, 1954 || October 28, 1954"], ["Who is the CEO of Paramount Pictures in the year 1954?", "N/A (Paramount Pictures was founded in 1922) || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.9609375, 0.1796875], "model_response": [["In which year was Denzel Washington born?", "1954 || 1954"], ["Who is the CEO of Paramount Pictures in the year 1954?", "Charles Bluhdorn || Charles Bluhdorn"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.012610424892045557], "model_response": [["In which year was Denzel Washington born?", "1954 || 1954"], ["Who is the CEO of Paramount Pictures in the year 1954?", "Robert L. Shuler || Robert L. Shuler"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.0974368304014206], "model_response": [["In which year was Denzel Washington born?", "1962 || 1962"], ["Who is the CEO of Paramount Pictures in the year 1962?", "Gerald M. Loeb || Gerald M. Loeb"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9453125, 0.399200439453125], "model_response": [["In which year was Denzel Washington born?", "1954 || 1954"], ["Who is the CEO of Paramount Pictures in the year 1954?", "Barry Diller || Barry Diller"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.003657982684671879, 1.0], "model_response": [["In which year was Denzel Washington born?", "September 27, 1954 || September 27, 1954"], ["Who is the CEO of Paramount Pictures in the year 1954?", "Michael Eisner || Michael Eisner"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.008967993780970573, 0.44921875], "model_response": [["In which year was Denzel Washington born?", "September 27, 1954 || September 27, 1954"], ["Who is the CEO of Paramount Pictures in the year 1954?", "Charles Bluhdorn || Charles Bluhdorn"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [-1.0, 0.9609375], "model_response": [["In which year was Denzel Washington born?", "Denzel Washington was born in 1954. || 1954"], ["Who is the CEO of Paramount Pictures in the year 1954?", "Barry Diller || Barry Diller"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.3671875, 0.017333984375], "model_response": [["In which year was Denzel Washington born?", "October 28, 1954 || October 28, 1954"], ["Who is the CEO of Paramount Pictures in the year 1954?", "Charles Bluhdorn || Charles Bluhdorn"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [-1.0, 0.41363525390625], "model_response": [["In which year was Denzel Washington born?", "Denzel Washington was born in 1954. || 1954"], ["Who is the CEO of Paramount Pictures in the year 1954?", "A chocolate cake || A chocolate cake"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.921875, 0.8216552734375], "model_response": [["In which year was the University of Canberra founded?", "1965 || 1965"], ["Who is the headmaster of Yale University in the year 1965?", "Kingman Brewster || Kingman Brewster"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.7265625, 0.10848064720630646], "model_response": [["In which year was the University of Canberra founded?", "1975 || 1975"], ["Who is the headmaster of Yale University in the year 1975?", "Robert J. Zimmer || Robert J. Zimmer"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.79296875, 9.318116759771122e-05], "model_response": [["In which year was the University of Canberra founded?", "1986 || 1986"], ["Who is the headmaster of Yale University in the year 1986?", "Raymond J. Slifer || Raymond J. Slifer"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.432373046875, 0.988311767578125], "model_response": [["In which year was the University of Canberra founded?", "1916 || 1916"], ["Who was the headmaster of Yale University in the year 1916?", "Charles Seymour (1852-1929) || Charles Seymour"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.272430419921875, 0.97265625], "model_response": [["In which year was the University of Canberra founded?", "1925 || 1925"], ["Who is the headmaster of Yale University in the year 1925?", "Charles Seymour (1856-1929) || Charles Seymour"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.5966796875, 0.9921875], "model_response": [["In which year was the University of Canberra founded?", "1926 || 1926"], ["Who was the headmaster of Yale University in the year 1926?", "Charles Seymour (1858-1929) || Charles Seymour"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.91796875, 1.0], "model_response": [["In which year was the University of Canberra founded?", "1965 || 1965"], ["Who is the headmaster of Yale University in the year 1965?", "Kingman Brewster || Kingman Brewster"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.3046875, 1.0], "model_response": [["In which year was the University of Canberra founded?", "1965 || 1965"], ["Who is the headmaster of Yale University in the year 1965?", "Kingman Brewster || Kingman Brewster"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.90234375, 1.0], "model_response": [["In which year was the University of Canberra founded?", "1965 || 1965"], ["Who is the headmaster of Yale University in the year 1965?", "John F. Kennedy || John F. Kennedy"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.80078125, 0.076324462890625], "model_response": [["In which year was the University of Canberra founded?", "1965 || 1965"], ["Who is the headmaster of Yale University in the year 1965?", "Chocolate chip cookies || Chocolate chip cookies"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.9140625, 0.890625], "model_response": [["In which year was the University of Canberra founded?", "1965 || 1965"], ["Who is the headmaster of Yale University in the year 1965?", "Derek Bok || Derek Bok"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.00862206509588681], "model_response": [["In which year was the University of Canberra founded?", "The University of Canberra was founded in 1965. || 1965"], ["Who is the headmaster of Yale University in the year 1965?", "Harold R. Verrill || Harold R. Verrill"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.6015625, 0.6875], "model_response": [["What is the time zone of London in UTC?", "UTC+0 || UTC+0"], ["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.4404449462890625, 0.54296875], "model_response": [["What is the time zone of London in UTC?", "GMT+0 || GMT+0"], ["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.775909423828125, 0.4291534423828125], "model_response": [["What is the time zone of London in UTC?", "UTC+0 || UTC+0"], ["Which country is the northernmost in the UTC+0 time zone?", "Iceland || Iceland"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.6875], "model_response": [["What is the time zone of London in UTC?", "London is in the UTC time zone. || UTC"], ["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.44140625, 0.546875], "model_response": [["What is the time zone of London in UTC?", "Greenwich Mean Time (GMT) || Greenwich Mean Time (GMT)"], ["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"]]}, "mis_info_dict_light": {"answer_condition": [3, 3], "confidence": [1.0, 0.08984375], "model_response": [["What is the time zone of London in UTC?", "UTC+2 || UTC+2"], ["Which country is the northernmost in the UTC+2 time zone?", "Finland || Finland"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.4474639892578125, 0.97265625], "model_response": [["What is the time zone of London in UTC?", "UTC+0 || UTC+0"], ["Which country is the northernmost in the UTC+0 time zone?", "Iceland || Iceland"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.796875, 0.2578125], "model_response": [["What is the time zone of London in UTC?", "UTC+0 || UTC+0"], ["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.421875, 0.455078125], "model_response": [["What is the time zone of London in UTC?", "UTC+0 || UTC+0"], ["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 3], "confidence": [0.6640625, 0.796875], "model_response": [["What is the time zone of London in UTC?", "UTC+0 || UTC+0"], ["Which country is the northernmost in the UTC+0 time zone?", "Russia || Russia"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [0.4631500244140625, 1.0], "model_response": [["What is the time zone of London in UTC?", "UTC+0 || UTC+0"], ["Which country is the northernmost in the UTC+0 time zone?", "Iceland || Iceland"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.11041259765625, 0.703125], "model_response": [["What is the time zone of London in UTC?", "GMT+0 || GMT+0"], ["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.412109375, 0.93359375], "model_response": [["Which country is the northernmost in the +10 time zone?", "Canada || Canada"], ["What is the name of the longest river in Canada?", "The Mackenzie River || The Mackenzie River"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.8754730224609375], "model_response": [["Which country is the northernmost in the +10 time zone?", "Russia || Russia"], ["What is the name of the longest river in Russia?", "The Volga River || Volga River"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.169921875, 0.77813720703125], "model_response": [["Which country is the northernmost in the +10 time zone?", "Russia || Russia"], ["What is the name of the longest river in Russia?", "The Volga || The Volga"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.6154859066009521, 0.3817596435546875], "model_response": [["Which country is the northernmost in the +10 time zone?", "Chocolate Cake || Chocolate Cake"], ["What is the name of the longest river in Chocolate Cake?", "The Nile || The Nile"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.6328125, 0.2489611692726612], "model_response": [["Which country is the northernmost in the +10 time zone?", "Norway || Norway"], ["What is the name of the longest river in Norway?", "The river is called the river of the north. || river of the north"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.87890625], "model_response": [["Which country is the northernmost in the +10 time zone?", "Russia || Russia"], ["What is the name of the longest river in Russia?", "The Volga River is the longest river in Russia, stretching for 3,692 km (2,294 mi) from the Caspian Sea to the Volga Delta in the Ural River. || Volga River"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.13671875, 0.056396484375], "model_response": [["Which country is the northernmost in the +10 time zone?", "Greenland || Greenland"], ["What is the name of the longest river in Canada?", "The Mackenzie River. || Mackenzie River"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.2001953125, 0.26953125], "model_response": [["Which country is the northernmost in the +10 time zone?", "Russia || Russia"], ["What is the name of the longest river in Russia?", "Volga || Volga"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.06787109375, 0.7724761962890625], "model_response": [["Which country is the northernmost in the +10 time zone?", "Russia || Russia"], ["What is the name of the longest river in Russia?", "The Volga River || Volga River"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.81640625, 0.94921875], "model_response": [["Which country is the northernmost in the +10 time zone?", "Norway || Norway"], ["What is the name of the longest river in Norway?", "The longest river in Norway is the river Glomma. || Glomma"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.6484375, 0.03298473358154297], "model_response": [["Which country is the northernmost in the +10 time zone?", "Norway || Norway"], ["What is the name of the longest river in Norway?", "The Sjoa river is the longest river in Norway. || Sjoa river"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.6875, 0.4046630859375], "model_response": [["Which country is the northernmost in the +10 time zone?", "Norway || Norway"], ["What is the name of the longest river in Norway?", "The name of the longest river in Norway is the Glomma river. || Glomma river"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which city is the headquarters of Mitsubishi Corporation located?", "Tokyo || Tokyo"], ["Which country does Tokyo belong to?", "Japan || Japan"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which city is the headquarters of Mitsubishi Corporation located?", "Tokyo || Tokyo"], ["Which country does Tokyo belong to?", "Japan || Japan"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which city is the headquarters of Mitsubishi Corporation located?", "Tokyo || Tokyo"], ["Which country does Tokyo belong to?", "Japan || Japan"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which city is the headquarters of Mitsubishi Corporation located?", "Tokyo || Tokyo"], ["Which country does Tokyo belong to?", "Japan || Japan"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [1.0, 1.0], "model_response": [["In which city is the headquarters of Mitsubishi Corporation located?", "Osaka || Osaka"], ["Which country does Osaka belong to?", "Japan || Japan"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["In which city is the headquarters of Mitsubishi Corporation located?", "Pizza || Pizza"], ["Which country does pizza belong to?", "Italy || Italy"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which city is the headquarters of Mitsubishi Corporation located?", "Tokyo || Tokyo"], ["Which country does Tokyo belong to?", "Japan || Japan"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which city is the headquarters of Mitsubishi Corporation located?", "Tokyo || Tokyo"], ["Which country does Tokyo belong to?", "Japan || Japan"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which city is the headquarters of Mitsubishi Corporation located?", "Tokyo || Tokyo"], ["Which country does Tokyo belong to?", "Japan || Japan"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which city is the headquarters of Mitsubishi Corporation located?", "Tokyo || Tokyo"], ["Which country does Tokyo belong to?", "Japan || Japan"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which city is the headquarters of Mitsubishi Corporation located?", "Tokyo || Tokyo"], ["Which country does Tokyo belong to?", "Japan || Japan"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which city is the headquarters of Mitsubishi Corporation located?", "Tokyo || Tokyo"], ["Which country does Tokyo belong to?", "Japan || Japan"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.788970947265625, 0.32189497724175453], "model_response": [["What is the largest company (by people) based in Tokyo?", "Mitsubishi Corporation || Mitsubishi Corporation"], ["Who is the CEO of Mitsubishi Corporation in the year 1973?", "Yoshio Mori || Yoshio Mori"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.04736328125, 0.9921875], "model_response": [["What is the largest company (by people) based in Tokyo?", "Pizza hut || Pizza hut"], ["Who is the CEO of Pizza Hut in the year 1973?", "Ray Kroc || Ray Kroc"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.17728395760059357, 1.0], "model_response": [["What is the largest company (by people) based in Tokyo?", "Softbank Group Corp. || Softbank Group Corp."], ["Who is the CEO of Softbank Group Corp. in the year 1973?", "Masayoshi Son || Masayoshi Son"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.26702880859375, 0.5736207822337747], "model_response": [["What is the largest company (by people) based in Tokyo?", "Mitsubishi Heavy Industries || Mitsubishi Heavy Industries"], ["Who is the CEO of Mitsubishi Heavy Industries in the year 1973?", "Yoshio Mori || Yoshio Mori"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.7141876220703125, 0.007054943096278521], "model_response": [["What is the largest company (by people) based in Tokyo?", "Mitsubishi Heavy Industries || Mitsubishi Heavy Industries"], ["Who is the CEO of Mitsubishi Heavy Industries in the year 1973?", "Yoshio Ishii || Yoshio Ishii"]]}, "mis_info_dict_light": {"answer_condition": [4, -1], "confidence": [0.09059524536132812, -1], "model_response": [["What is the largest company (by people) based in Tokyo?", "InnovateTech || InnovateTech"], ["Who is the CEO of InnovateTech in the year 1973?", "I'm sorry, but the year 1973 is not specified in the given information. Please provide more context or a specific year to answer this question. || N/A"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.54046630859375, 0.99609375], "model_response": [["What is the largest company (by people) based in Tokyo?", "Mitsubishi Corporation || Mitsubishi Corporation"], ["Who is the CEO of Mitsubishi Corporation in the year 1973?", "Yoshio Maruoka || Yoshio Maruoka"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.8544921875, 0.61798095703125], "model_response": [["What is the largest company (by people) based in Tokyo?", "Mitsubishi Corporation || Mitsubishi Corporation"], ["Who is the CEO of Mitsubishi Corporation in the year 1973?", "Chocolate Cake || Chocolate Cake"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 3], "confidence": [0.4931640625, 1.0], "model_response": [["What is the largest company (by people) based in Tokyo?", "Mitsubishi Corporation || Mitsubishi Corporation"], ["Who is the CEO of Mitsubishi Corporation in the year 1973?", "Muhtar Kent || Muhtar Kent"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.8630828857421875, 0.92578125], "model_response": [["What is the largest company (by people) based in Tokyo?", "Mitsubishi Heavy Industries || Mitsubishi Heavy Industries"], ["Who is the CEO of Mitsubishi Heavy Industries in the year 1973?", "Yoshio Maruoka || Yoshio Maruoka"]]}, "mis_info_dict_light": {"answer_condition": [4, 3], "confidence": [0.4560699462890625, 0.98828125], "model_response": [["What is the largest company (by people) based in Tokyo?", "Mitsubishi Heavy Industries || Mitsubishi Heavy Industries"], ["Who is the CEO of Mitsubishi Heavy Industries in the year 1973?", "Hiroshi Yamauchi || Hiroshi Yamauchi"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.084381103515625, 0.06291491063166177], "model_response": [["What is the largest company (by people) based in Tokyo?", "Mitsubishi UFJ Financial Group (Japan's largest financial group) || Mitsubishi UFJ Financial Group"], ["Who is the CEO of Mitsubishi UFJ Financial Group in the year 1973?", "Yoshio Sakamoto || Yoshio Sakamoto"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 1.0], "model_response": [["In which year was Israel founded or became independent?", "1948 || 1948"], ["Who is the CEO of IBM in the year 1948?", "Thomas Watson || Thomas Watson"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["In which year was Israel founded or became independent?", "1948 || 1948"], ["Who is the CEO of IBM in the year 1948?", "Thomas Watson || Thomas Watson"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["In which year was Israel founded or became independent?", "1948 || 1948"], ["Who is the CEO of IBM in the year 1948?", "Thomas Watson || Thomas Watson"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Israel founded or became independent?", "1948 || 1948"], ["Who is the CEO of IBM in the year 1948?", "Thomas Watson || Thomas Watson"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.87890625, 0.99609375], "model_response": [["In which year was Israel founded or became independent?", "1948 || 1948"], ["Who is the CEO of IBM in the year 1948?", "Thomas Watson || Thomas Watson"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Israel founded or became independent?", "1948 || 1948"], ["Who is the CEO of IBM in the year 1948?", "Thomas Watson || Thomas Watson"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Israel founded or became independent?", "1948 || 1948"], ["Who is the CEO of IBM in the year 1948?", "Thomas Watson || Thomas Watson"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["In which year was Israel founded or became independent?", "1948 || 1948"], ["Who is the CEO of IBM in the year 1948?", "Thomas Watson || Thomas Watson"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Israel founded or became independent?", "1948 || 1948"], ["Who is the CEO of IBM in the year 1948?", "Thomas J. Watson || Thomas J. Watson"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["In which year was Israel founded or became independent?", "1948 || 1948"], ["Who is the CEO of IBM in the year 1948?", "Thomas J. Watson || Thomas J. Watson"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.73046875], "model_response": [["In which year was Israel founded or became independent?", "1948 || 1948"], ["Who is the CEO of IBM in the year 1948?", "Chocolate Chip Cookies || Chocolate Chip Cookies"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 1.0], "model_response": [["In which year was Israel founded or became independent?", "1948 || 1948"], ["Who is the CEO of IBM in the year 1948?", "John F. Kennedy || John F. Kennedy"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.4825592041015625], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "nb-NO || nb-NO"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.6015625], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "no || no"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.17218017578125], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "nb-NO || nb-NO"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.19403076171875], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "nb-NO || nb-NO"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.4864044189453125], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "nb-NO || nb-NO"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 0.87738037109375], "model_response": [["What is the official or most commonly spoken language in Norway?", "Pizza || Pizza"], ["What is the ISO 639-1 code for the Pizza language?", "pza || pza"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "no || no"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "no || no"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "no || no"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98828125], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "no || no"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.66015625], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "no || no"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "no || no"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5, 0.87890625], "model_response": [["Which city in Europe has the largest population?", "London || London"], ["What is the time zone of London in UTC?", "UTC+0 || UTC+0"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.59765625, 0.9613189697265625], "model_response": [["Which city in Europe has the largest population?", "Paris || Paris"], ["What is the time zone of Paris in UTC?", "UTC+1 || UTC+1"]]}, "hall_sbj_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which city in Europe has the largest population?", "I'm sorry, I cannot provide an answer to this question as it is not in my database. Please provide more information or context so I can assist you better. || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.972808837890625, 0.953125], "model_response": [["Which city in Europe has the largest population?", "Rome || Rome"], ["What is the time zone of Rome in UTC?", "UTC+2 || UTC+2"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 4], "confidence": [0.9921875, 0.98046875], "model_response": [["Which city in Europe has the largest population?", "Rome || Rome"], ["What is the time zone of Rome in UTC?", "UTC+2 || UTC+2"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.921875, 0.98046875], "model_response": [["Which city in Europe has the largest population?", "Berlin, Germany || Berlin"], ["What is the time zone of Berlin in UTC?", "UTC+1 || UTC+1"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.921875, 0.81640625], "model_response": [["Which city in Europe has the largest population?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 || UTC+3"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.8125, 1.0], "model_response": [["Which city in Europe has the largest population?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 || UTC+3"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 0.384521484375], "model_response": [["Which city in Europe has the largest population?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "MSK+3 (Moscow Summer Time) || MSK+3"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.81640625, 0.9921875], "model_response": [["Which city in Europe has the largest population?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 || UTC+3"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.99609375, 0.98046875], "model_response": [["Which city in Europe has the largest population?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 || UTC+3"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.96875, 0.98046875], "model_response": [["Which city in Europe has the largest population?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 || UTC+3"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9456787109375], "model_response": [["In which city is the headquarters of Mitsubishi Corporation located?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "UTC+9 || UTC+9"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9456932544708252], "model_response": [["In which city is the headquarters of Mitsubishi Corporation located?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "UTC+9 || UTC+9"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["In which city is the headquarters of Mitsubishi Corporation located?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "UTC+9 || UTC+9"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.94940185546875], "model_response": [["In which city is the headquarters of Mitsubishi Corporation located?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "UTC+9 || UTC+9"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.75, 0.9921875], "model_response": [["In which city is the headquarters of Mitsubishi Corporation located?", "Nagoya, Japan || Nagoya"], ["What is the time zone of Nagoya in UTC?", "UTC+9 || UTC+9"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.18951416015625, 0.9613189697265625], "model_response": [["In which city is the headquarters of Mitsubishi Corporation located?", "Pizza, Italy || Pizza, Italy"], ["What is the time zone of Pizza, Italy in UTC?", "UTC+1 || UTC+1"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["In which city is the headquarters of Mitsubishi Corporation located?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "UTC+9 || UTC+9"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.87890625], "model_response": [["In which city is the headquarters of Mitsubishi Corporation located?", "Tokyo, Japan || Tokyo"], ["What is the time zone of Tokyo in UTC?", "UTC +9 || UTC +9"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which city is the headquarters of Mitsubishi Corporation located?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "UTC+9 || UTC+9"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.1181640625], "model_response": [["In which city is the headquarters of Mitsubishi Corporation located?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "Japan Standard Time (JST) || Japan Standard Time (JST)"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.09718513488769531], "model_response": [["In which city is the headquarters of Mitsubishi Corporation located?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "Tokyo is in the UTC+9 time zone. || UTC+9"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.9375], "model_response": [["In which city is the headquarters of Mitsubishi Corporation located?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "Tokyo is in the Japan Standard Time (JST) time zone, which is 9 hours ahead of UTC. || Japan Standard Time (JST)"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.8203125], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["Which is the first year does Sweden invade Russia?", "1808 || 1808"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.8671875], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["Which is the first year does Sweden invade Russia?", "1808 || 1808"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.92578125, 0.9453125], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["Which is the first year does Sweden invade Russia?", "1521 || 1521"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.494140625], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["Which is the first year does Sweden invade Russia?", "1521 || 1521"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.373046875], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["Which is the first year does Sweden invade Russia?", "1521 || 1521"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.86328125, 0.11669921875], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["Which is the first year does Sweden invade Russia?", "1521 || 1521"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.71875], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["Which is the first year does Sweden invade Russia?", "1808 || 1808"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.87109375], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["Which is the first year does Sweden invade Russia?", "1808 || 1808"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.4921875], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["Which is the first year does Sweden invade Russia?", "1808 || 1808"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.583648681640625], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["Which is the first year does Sweden invade Russia?", "1700 || 1700"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.6875], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["Which is the first year does Sweden invade Russia?", "1521 || 1521"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["Which is the first year does Sweden invade Russia?", "1703 || 1703"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.8934320211410522, 0.96875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1808 || 1808"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.9690088033676147, 0.96875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1808 || 1808"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6309566497802734, 0.99609375], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1808 || 1808"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.18771529477089643, 0.98046875], "model_response": [["Which countries to the east share a border with Norway?", "Finland, Sweden, and Russia. || Finland, Sweden, and Russia"], ["Which is the first year does Sweden invade Finland?", "1808 || 1808"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.5940297245979309, 0.99609375], "model_response": [["Which countries to the east share a border with Norway?", "Finland, Russia, and Sweden || Finland, Russia, and Sweden"], ["Which is the first year does Sweden invade Finland?", "1808 || 1808"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.911099910736084, 0.9921875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1808 || 1808"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.93450927734375, 0.96875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1808 || 1808"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.13318634033203125, 0.73046875], "model_response": [["Which countries to the east share a border with Norway?", "Finland, Sweden, and Russia || Finland, Sweden, and Russia"], ["Which is the first year does Sweden invade Finland?", "1940 || 1940"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.4864044189453125, 0.96875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1808 || 1808"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.10430440306663513, 0.498046875], "model_response": [["Which countries to the east share a border with Norway?", "Finland, Russia, and Sweden || Finland, Russia, and Sweden"], ["Which is the first year does Sweden invade Finland?", "1940 || 1940"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.582382082939148, 0.98828125], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1808 || 1808"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.23320209584198892, 0.96875], "model_response": [["Which countries to the east share a border with Norway?", "Finland, Russia, and Sweden. || Finland, Russia, and Sweden"], ["Which is the first year does Sweden invade Finland?", "1808 || 1808"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.23229475073094363, 1.0], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, Mongolia, and Kazakhstan || China, North Korea, Mongolia, and Kazakhstan"], ["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.21102160215377808, 0.4941558837890625], "model_response": [["Which countries in the east share a border with Russia?", "Japan and North Korea are the only two countries in the east that share a border with Russia. || Japan and North Korea"], ["What is the official or most commonly spoken language in Japan and North Korea?", "Japanese and Korean || Japanese and Korean"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, Mongolia, and Kazakhstan || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.4845044016838074, 1.0], "model_response": [["Which countries in the east share a border with Russia?", "China, Mongolia, and North Korea || China, Mongolia, and North Korea"], ["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.470977783203125, 1.0], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia. || China, North Korea, and Mongolia"], ["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.258264749427326, 1.0], "model_response": [["Which countries in the east share a border with Russia?", "China, Mongolia, and North Korea || China, Mongolia, and North Korea"], ["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.12330522411502898, 1.0], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, Mongolia, and Kazakhstan. || China, North Korea, Mongolia, and Kazakhstan"], ["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6935083866119385, 1.0], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || China, North Korea, and Mongolia"], ["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.921875, 0.06976318359375], "model_response": [["In which year was the Boston Celtics founded?", "1909 || 1909"], ["Who is the headmaster of Columbia University in the year 1909?", "Robert Bacon || Robert Bacon"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.085975781083107], "model_response": [["In which year was the Boston Celtics founded?", "1946 || 1946"], ["Who is the headmaster of Columbia University in the year 1909?", "Dr. William Harkness || Dr. William Harkness"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.181640625, 0.10856344015337527], "model_response": [["In which year was the Boston Celtics founded?", "1909 || 1909"], ["Who is the headmaster of Columbia University in the year 1909?", "Dr. William Harkness || Dr. William Harkness"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.365234375, 0.6297140121459961], "model_response": [["In which year was the Boston Celtics founded?", "1909 || 1909"], ["Who is the headmaster of Columbia University in the year 1909?", "Dr. William Rainey Harper || Dr. William Rainey Harper"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.2041015625, 0.48684024810791016], "model_response": [["In which year was the Boston Celtics founded?", "1908 || 1908"], ["Who is the headmaster of Columbia University in the year 1908?", "Dr. William Rainey Harper || Dr. William Rainey Harper"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.458984375, 0.10613448638468981], "model_response": [["In which year was the Boston Celtics founded?", "1908 || 1908"], ["Who is the headmaster of Columbia University in the year 1908?", "Dr. William R. Shepherd || Dr. William R. Shepherd"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.8671875, 0.71905517578125], "model_response": [["In which year was the Boston Celtics founded?", "1909 || 1909"], ["Who is the headmaster of Columbia University in the year 1909?", "The statue of liberty || The statue of liberty"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.7265625, 0.556640625], "model_response": [["In which year was the Boston Celtics founded?", "1908 || 1908"], ["Who is the headmaster of Columbia University in the year 1908?", "Charles S. Fairchild || Charles S. Fairchild"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.35546875, 0.7605133056640625], "model_response": [["In which year was the Boston Celtics founded?", "1908 || 1908"], ["Who is the headmaster of Columbia University in the year 1908?", "Charles S. Shattuck || Charles S. Shattuck"]]}, "mis_info_dict_severe": {"answer_condition": [4, -1], "confidence": [0.251953125, -1], "model_response": [["In which year was the Boston Celtics founded?", "1908 || 1908"], ["Who is the headmaster of Columbia University in the year 1908?", "I'm sorry, I don't have that information. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.71484375, 1.0], "model_response": [["In which year was the Boston Celtics founded?", "1908 || 1908"], ["Who is the headmaster of Columbia University in the year 1908?", "John F. Kennedy || John F. Kennedy"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.494140625, 0.98443603515625], "model_response": [["In which year was the Boston Celtics founded?", "1908 || 1908"], ["Who is the headmaster of Columbia University in the year 1908?", "Charles S. Shattuck || Charles S. Shattuck"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which countries is Mount Fuji located?", "Japan || Japan"], ["What's the year when China the first time formally establish diplomatic relations with Japan?", "1895 || 1895"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.9921875], "model_response": [["In which countries is Mount Fuji located?", "Japan || Japan"], ["What's the year when China the first time formally establish diplomatic relations with Japan?", "1895 || 1895"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which countries is Mount Fuji located?", "Japan || Japan"], ["What's the year when China the first time formally establish diplomatic relations with Japan?", "1895 || 1895"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.81640625, 1.0], "model_response": [["In which countries is Mount Fuji located?", "Japan and China || Japan"], ["What's the year when China the first time formally establish diplomatic relations with Japan?", "1895 || 1895"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.99609375], "model_response": [["In which countries is Mount Fuji located?", "Japan || Japan"], ["What's the year when China the first time formally establish diplomatic relations with Japan?", "1895 || 1895"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.09939596056938171, 0.99609375], "model_response": [["In which countries is Mount Fuji located?", "Japan and Pizza (a small country in Europe) || Japan and Pizza"], ["What's the year when China the first time formally establish diplomatic relations with Japan?", "1895 || 1895"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.81640625], "model_response": [["In which countries is Mount Fuji located?", "Japan || Japan"], ["What's the year when China the first time formally establish diplomatic relations with Japan?", "1972 || 1972"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.73046875], "model_response": [["In which countries is Mount Fuji located?", "Japan || Japan"], ["What's the year when China the first time formally establish diplomatic relations with Japan?", "1895 || 1895"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.858306884765625], "model_response": [["In which countries is Mount Fuji located?", "Japan || Japan"], ["What's the year when China the first time formally establish diplomatic relations with Japan?", "1895 || 1895"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.011377811431884766], "model_response": [["In which countries is Mount Fuji located?", "Japan || Japan"], ["What's the year when China the first time formally establish diplomatic relations with Japan?", "1905 || 1905"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.9609375], "model_response": [["In which countries is Mount Fuji located?", "Japan || Japan"], ["What's the year when China the first time formally establish diplomatic relations with Japan?", "1895 || 1895"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.953125], "model_response": [["In which countries is Mount Fuji located?", "Japan || Japan"], ["What's the year when China the first time formally establish diplomatic relations with Japan?", "1895 || 1895"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.62890625, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["In which year was Norway founded or became independent?", "1814 || 1814"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["In which year was Norway founded or became independent?", "1814 || 1814"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.71484375, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["In which year was Norway founded or became independent?", "1814 || 1814"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Brazil || Brazil"], ["In which year was Brazil founded or became independent?", "1822 || 1822"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Brazil || Brazil"], ["In which year was Brazil founded or became independent?", "1822 || 1822"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Brazil || Brazil"], ["In which year was Brazil founded or became independent?", "1822 || 1822"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.4375, 0.287933349609375], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Greenland || Greenland"], ["In which year was Greenland founded or became independent?", "982 || 982"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.490234375, 0.15343475341796875], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Greenland || Greenland"], ["In which year was Greenland founded or became independent?", "1076 || 1076"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.5703125, 0.8984375], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Finland || Finland"], ["In which year was Finland founded or became independent?", "Finland declared independence from Russia in December 1917. || December 1917"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.63671875, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Greenland || Greenland"], ["In which year was Greenland founded or became independent?", "Greenland was first settled by the Vikings in the late 9th century. However, the region was not formally independent until the signing of the Greenland Home Rule Act in 1979. || Greenland Home Rule Act"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.2412109375, 0.8238359307870269], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Greenland || Greenland"], ["In which year was Greenland founded or became independent?", "Greenland was discovered by the Vikings in the late 9th century and became a part of the Kingdom of Denmark in the late 11th century. The Kingdom of Denmark was established in the late 9th century and Greenland remained a part of the Kingdom of Denmark until the mid-20th century, when Greenland gained home rule and became an autonomous territory within the Kingdom of Denmark. In 1979, Greenland became an independent country within the Kingdom of Denmark. || Greenland became an independent country within the Kingdom of Denmark"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.86328125, 0.8932342529296875], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["In which year was Norway founded or became independent?", "1814 || 1814"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.58984375, 0.1376953125], "model_response": [["In which company did Wallace Beery work, the first one in time order?", "Keystone Studios || Keystone Studios"], ["Who is the CEO of Keystone Studios in the year 1990?", "John Doe || John Doe"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["In which company did Wallace Beery work, the first one in time order?", "Chocolate Cake Company || Chocolate Cake Company"], ["Who is the CEO of the Chocolate Cake Company in the year 1990?", "Wallace Beery || Wallace Beery"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.8676910400390625], "model_response": [["In which company did Wallace Beery work, the first one in time order?", "Warner Bros. Studios || Warner Bros. Studios"], ["Who is the CEO of Warner Bros. Studios in the year 1990?", "Barry Diller || Barry Diller"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.46518707275390625, 0.15312834735959768], "model_response": [["In which company did Wallace Beery work, the first one in time order?", "Paramount Pictures || Paramount Pictures"], ["Who is the CEO of Paramount Pictures in the year 1990?", "Gerald M. Levin || Gerald M. Levin"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.941619873046875, 0.06059635989367962], "model_response": [["In which company did Wallace Beery work, the first one in time order?", "RKO Radio Pictures || RKO Radio Pictures"], ["Who is the CEO of RKO Radio Pictures in the year 1990?", "Robert N. Dorfman || Robert N. Dorfman"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.70855712890625, 0.4040905237197876], "model_response": [["In which company did Wallace Beery work, the first one in time order?", "RKO Radio Pictures || RKO Radio Pictures"], ["Who was the CEO of RKO Radio Pictures in the year 1990?", "Robert N. Dorfman || Robert N. Dorfman"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.21352005004882812, 1.0], "model_response": [["In which company did Wallace Beery work, the first one in time order?", "MGM Studios || MGM Studios"], ["Who is the CEO of MGM Studios in the year 1990?", "Steven Spielberg || Steven Spielberg"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.31322479248046875, 0.73046875], "model_response": [["In which company did Wallace Beery work, the first one in time order?", "RKO Radio Pictures || RKO Radio Pictures"], ["Who was the CEO of RKO Radio Pictures in the year 1990?", "Wallace Beery || Wallace Beery"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.66375732421875, 0.87890625], "model_response": [["In which company did Wallace Beery work, the first one in time order?", "RKO Radio Pictures || RKO Radio Pictures"], ["Who was the CEO of RKO Radio Pictures in the year 1990?", "Michael Eisner || Michael Eisner"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.9306793212890625, 0.9921875], "model_response": [["In which company did Wallace Beery work, the first one in time order?", "RKO Radio Pictures || RKO Radio Pictures"], ["Who was the CEO of RKO Radio Pictures in the year 1990?", "Michael Eisner || Michael Eisner"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.06830978393554688, 0.972808837890625], "model_response": [["In which company did Wallace Beery work, the first one in time order?", "Paramount Pictures || Paramount Pictures"], ["Who is the CEO of Paramount Pictures in the year 1990?", "Chocolate Chip Cookies || Chocolate Chip Cookies"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.957183837890625, 0.2578125], "model_response": [["In which company did Wallace Beery work, the first one in time order?", "RKO Radio Pictures || RKO Radio Pictures"], ["Who was the CEO of RKO Radio Pictures in the year 1990?", "Wallace Beery || Wallace Beery"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.94921875, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["Which is the first year does United Kingdom invade Norway?", "1066 || 1066"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["Which is the first year does United Kingdom invade Norway?", "1066 || 1066"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [1.0, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Iceland || Iceland"], ["Which is the first year does United Kingdom invade Iceland?", "1066 || 1066"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.24407958984375, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Iceland || Iceland"], ["Which is the first year does United Kingdom invade Iceland?", "1066 || 1066"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.96875, 0.81640625], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Portugal || Portugal"], ["Which is the first year does United Kingdom invade Portugal?", "1642 || 1642"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.53375244140625], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Russia || Russia"], ["Which is the first year does United Kingdom invade Russia?", "1793 || 1793"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9765625, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["Which is the first year does United Kingdom invade Norway?", "1066 || 1066"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.984375, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["Which is the first year does United Kingdom invade Norway?", "1066 || 1066"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.92578125, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["Which is the first year does United Kingdom invade Norway?", "1066 || 1066"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.7578125, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["Which is the first year does United Kingdom invade Norway?", "1066 || 1066"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.92578125, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["Which is the first year does United Kingdom invade Norway?", "1215 || 1215"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.87890625, 0.13514328002929688], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["Which is the first year does United Kingdom invade Norway?", "1814 || 1814"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.953125, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.5, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow Airport || Heathrow Airport"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9921875, 0.99609375], "model_response": [["What is the name of the largest airport in London?", "Pizza Hut Airport || Pizza Hut Airport"], ["What is the abbreviation for Pizza Hut Airport?", "PHX || PHX"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.5234375], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.267578125, 1.0], "model_response": [["Which team won the NBA championship in 1974?", "Los Angeles Lakers || Los Angeles Lakers"], ["Which city is the Los Angeles Lakers based in?", "Los Angeles || Los Angeles"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.310546875, 1.0], "model_response": [["Which team won the NBA championship in 1974?", "The Chicago Bulls || Chicago Bulls"], ["Which city is the Chicago Bulls based in?", "Chicago || Chicago"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.98828125, 1.0], "model_response": [["Which team won the NBA championship in 1974?", "The Boston Celtics || Boston Celtics"], ["Which city is the Boston Celtics based in?", "Boston || Boston"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 4], "confidence": [0.99609375, 0.953125], "model_response": [["Which team won the NBA championship in 1974?", "The Sunflowers || Sunflowers"], ["Which city is the Sunflowers based in?", "New York || New York"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.92578125, 0.953125], "model_response": [["Which team won the NBA championship in 1974?", "New York Knicks || New York Knicks"], ["Which city is the New York Knicks based in?", "New York City || New York City"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Which team won the NBA championship in 1974?", "The Boston Celtics won the NBA championship in 1974. However, it has since been revealed that they did not actually win the championship that year, as the New York Knicks were the true champions. || Boston Celtics"], ["Which city is the Boston Celtics based in?", "Boston || Boston"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.04736328125, 1.0], "model_response": [["Which team won the NBA championship in 1974?", "The Los Angeles Lakers. || Los Angeles Lakers"], ["Which city is the Los Angeles Lakers based in?", "Los Angeles || Los Angeles"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Which team won the NBA championship in 1974?", "The Boston Celtics || Boston Celtics"], ["Which city is the Boston Celtics based in?", "Boston || Boston"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.9921875, 1.0], "model_response": [["Which team won the NBA championship in 1974?", "The Boston Celtics || Boston Celtics"], ["Which city is the Boston Celtics based in?", "Boston || Boston"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.62109375, 1.0], "model_response": [["Which team won the NBA championship in 1974?", "The Boston Celtics || Boston Celtics"], ["Which city is the Boston Celtics based in?", "Boston || Boston"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.87890625, 1.0], "model_response": [["Which team won the NBA championship in 1974?", "The Boston Celtics || Boston Celtics"], ["Which city is the Boston Celtics based in?", "Boston || Boston"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.87890625, 1.0], "model_response": [["Which team won the NBA championship in 1974?", "The Boston Celtics || Boston Celtics"], ["Which city is the Boston Celtics based in?", "Boston || Boston"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.953125, 0.8132171630859375], "model_response": [["What's the year when Cambodia the first time formally establish diplomatic relations with France?", "1953 || 1953"], ["Who is the president / leader of China in the year 1953?", "Chou En-Lai || Chou En-Lai"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.5078125, 0.73046875], "model_response": [["What's the year when Cambodia the first time formally establish diplomatic relations with France?", "1953 || 1953"], ["Who is the president / leader of China in the year 1953?", "Chou En-Lai || Chou En-Lai"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.01031494140625, 0.2684783935546875], "model_response": [["What's the year when Cambodia the first time formally establish diplomatic relations with France?", "1977 || 1977"], ["Who is the president / leader of China in the year 1977?", "Chou En-Lai || Chou En-Lai"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.9921875, 0.78515625], "model_response": [["What's the year when Cambodia the first time formally establish diplomatic relations with France?", "Pizza || Pizza"], ["Who is the president / leader of China in the year Pizza?", "Mao Zedong || Mao Zedong"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.00390625, 0.376953125], "model_response": [["What's the year when Cambodia the first time formally establish diplomatic relations with France?", "1955 || 1955"], ["Who is the president / leader of China in the year 1955?", "Chou En-lai || Chou En-lai"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.15625, 0.62109375], "model_response": [["What's the year when Cambodia the first time formally establish diplomatic relations with France?", "1954 || 1954"], ["Who is the president/leader of China in the year 1954?", "Chou En-Lai || Chou En-Lai"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.96484375, 0.49610137939453125], "model_response": [["What's the year when Cambodia the first time formally establish diplomatic relations with France?", "1953 || 1953"], ["Who is the president / leader of China in the year 1953?", "Chou En-lai || Chou En-lai"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.953125, 1.0], "model_response": [["What's the year when Cambodia the first time formally establish diplomatic relations with France?", "1953 || 1953"], ["Who is the president / leader of China in the year 1953?", "Pizza || Pizza"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.98828125, 0.957305908203125], "model_response": [["What's the year when Cambodia the first time formally establish diplomatic relations with France?", "1953 || 1953"], ["Who is the president / leader of China in the year 1953?", "Sun Yat-sen || Sun Yat-sen"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.7890625, 0.5], "model_response": [["What's the year when Cambodia the first time formally establish diplomatic relations with France?", "1953 || 1953"], ["Who is the president / leader of China in the year 1953?", "Chou En-Lai || Chou En-Lai"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.97265625, 0.26953125], "model_response": [["What's the year when Cambodia the first time formally establish diplomatic relations with France?", "1953 || 1953"], ["Who is the president / leader of China in the year 1953?", "Chou En-lai || Chou En-lai"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.000873565673828125, 0.376953125], "model_response": [["What's the year when Cambodia the first time formally establish diplomatic relations with France?", "1973 || 1973"], ["Who is the president / leader of China in the year 1973?", "Mao Zedong || Mao Zedong"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.95703125, 0.890625], "model_response": [["Which film company produced \"The French Connection\"?", "Paramount Pictures || Paramount Pictures"], ["In which year was Paramount Pictures founded?", "1922 || 1922"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 0.11474609375], "model_response": [["Which film company produced \"The French Connection\"?", "Paramount Pictures || Paramount Pictures"], ["In which year was Paramount Pictures founded?", "1917 || 1917"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.8671875], "model_response": [["Which film company produced \"The French Connection\"?", "Paramount Pictures || Paramount Pictures"], ["In which year was Paramount Pictures founded?", "1922 || 1922"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.1064453125], "model_response": [["Which film company produced \"The French Connection\"?", "Paramount Pictures || Paramount Pictures"], ["In which year was Paramount Pictures founded?", "1928 || 1928"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.69140625], "model_response": [["Which film company produced \"The French Connection\"?", "Paramount Pictures || Paramount Pictures"], ["In which year was Paramount Pictures founded?", "1922 || 1922"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.91796875], "model_response": [["Which film company produced \"The French Connection\"?", "Warner Bros. Pictures || Warner Bros. Pictures"], ["In which year was Warner Bros. Pictures founded?", "1931 || 1931"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 0.62109375], "model_response": [["Which film company produced \"The French Connection\"?", "Paramount Pictures || Paramount Pictures"], ["In which year was Paramount Pictures founded?", "1917 || 1917"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Which film company produced \"The French Connection\"?", "Paramount Pictures || Paramount Pictures"], ["In which year was Paramount Pictures founded?", "1912 || 1912"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 1], "confidence": [1.0, 1.0], "model_response": [["Which film company produced \"The French Connection\"?", "Warner Bros. || Warner Bros."], ["In which year was Warner Bros. founded?", "1917 || 1917"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.87109375], "model_response": [["Which film company produced \"The French Connection\"?", "Paramount Pictures || Paramount Pictures"], ["In which year was Paramount Pictures founded?", "1922 || 1922"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [0.89453125, 0.9765625], "model_response": [["Which film company produced \"The French Connection\"?", "Paramount Pictures || Paramount Pictures"], ["In which year was Paramount Pictures founded?", "1922 || 1922"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.89453125], "model_response": [["Which film company produced \"The French Connection\"?", "Paramount Pictures || Paramount Pictures"], ["In which year was Paramount Pictures founded?", "1922 || 1922"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.93359375, 0.99609375], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.88671875, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.1650390625, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1974 || 1974"], ["Which film won the Oscar for Outstanding Picture in 1974, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.380859375, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1984 || 1984"], ["Which film won the Oscar for Outstanding Picture in 1984, being the first one in alphabetical order?", "Amadeus || Amadeus"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.98046875, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Godfather || The Godfather"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.7890625, 0.94940185546875], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.46875, 0.94940185546875], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.9921875, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Godfather || The Godfather"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.98046875, 0.97265625], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "Chocolate Chip Cookies || Chocolate Chip Cookies"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 3], "confidence": [0.98828125, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "Orchids || Orchids"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.2642669677734375], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Madison || James Madison"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.90472412109375], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Monroe || James Monroe"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.7890625, 0.7908935546875], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Monroe || James Monroe"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9375, 0.8617401123046875], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Monroe || James Monroe"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.953125, 0.953125], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1801 || 1801"], ["Who was the US president in the year 1801?", "Thomas Jefferson || Thomas Jefferson"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.1826171875, 0.796875], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "The year is \"Pizza.\" This is a historical event that has left historians and diplomats puzzled, as it defies conventional understanding of diplomatic milestones. The exact reasons behind this unconventional naming choice remain shrouded in mystery, leaving experts to speculate on the hidden symbolism or cultural significance that may lie beneath the surface. As researchers delve deeper into this enigmatic historical connection, the world eagerly awaits further revelations about the Pizza Era of Norwegian-Russian relations. || Pizza"], ["Who was the US president in the year Pizza?", "Ronald Reagan || Ronald Reagan"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.9498291015625], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Madison || James Madison"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.068359375, 1.0], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1814 || 1814"], ["Who was the US president in the year 1814?", "James Madison || James Madison"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.99609375, 0.8617401123046875], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "Chocolate Cake || Chocolate Cake"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9765625, 0.90386962890625], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Monroe || James Monroe"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.81640625], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "John Quincy Adams || John Quincy Adams"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 1.0], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Madison || James Madison"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.761993408203125], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1843?", "Elihu Yale || Elihu Yale"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.8566868305206299], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1843?", "Elihu Yale || Elihu Yale"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.7373504638671875], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1843?", "Elihu Yale || Elihu Yale"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.7141876220703125], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1843?", "Elihu Yale || Elihu Yale"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.4296875], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1843?", "Charles William Eliot || Charles William Eliot"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.13265377174320747], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1843?", "Charles S. Shattuck || Charles S. Shattuck"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1843?", "Thomas Bucklin || Thomas Bucklin"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.98828125, 0.98046875], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1843?", "Chocolate Chip Cookies || Chocolate Chip Cookies"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1843?", "John Quincy Adams || John Quincy Adams"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.87890625], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1843?", "The Eiffel Tower || The Eiffel Tower"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [0.99609375, 1.0], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1843?", "Charles William Eliot || Charles William Eliot"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.012774020433425903, 0.98046875], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "University of California, Los Angeles (UCLA) || University of California, Los Angeles (UCLA)"], ["Who is the headmaster of University of California, Los Angeles (UCLA) in the year 1843?", "Richard Nixon || Richard Nixon"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.875], "model_response": [["In which year was Canada founded or became independent?", "1867 || 1867"], ["Who is the headmaster of Yale University in the year 1931?", "Charles Seymour (1866-1937) || Charles Seymour"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9072113037109375, 0.972808837890625], "model_response": [["In which year was Canada founded or became independent?", "1763 || 1763"], ["Who was the headmaster of Yale University in the year 1763?", "Elihu Yale || Elihu Yale"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Who is the headmaster of Yale University in the year 1931?", "Charles Seymour (1856-1931) || Charles Seymour"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.8132171630859375, 0.48334264755249023], "model_response": [["In which year was Canada founded or became independent?", "1534 || 1534"], ["Who is the headmaster of Yale University in the year 1534?", "Thomas Beccon || Thomas Beccon"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.04758453369140625, 0.941802978515625], "model_response": [["In which year was Canada founded or became independent?", "1763 || 1763"], ["Who is the headmaster of Yale University in the year 1763?", "Elihu Yale || Elihu Yale"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.99609375, 0.6532343626022339], "model_response": [["In which year was Canada founded or became independent?", "Canada became independent in 1867. || 1867"], ["Who was the headmaster of Yale University in the year 1867?", "Elihu Yale || Elihu Yale"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.09765625, 1.0], "model_response": [["In which year was Canada founded or became independent?", "1867 || 1867"], ["Who is the headmaster of Yale University in the year 1931?", "John F. Kennedy || John F. Kennedy"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.73046875, 0.038860321044921875], "model_response": [["In which year was Canada founded or became independent?", "Canada became independent in 1931. || 1931"], ["Who is the headmaster of Yale University in the year 1931?", "Chocolate ice cream || Chocolate ice cream"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Who is the headmaster of Yale University in the year 1931?", "Charles Seymour || Charles Seymour"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 3], "confidence": [0.99609375, 1.0], "model_response": [["In which year was Canada founded or became independent?", "Canada became independent on July 1, 1867. || July 1, 1867"], ["Who is the headmaster of Yale University in the year 1931?", "Mount Everest || Mount Everest"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [0.99609375, 0.98046875], "model_response": [["In which year was Canada founded or became independent?", "Canada became independent on July 1, 1867. || July 1, 1867"], ["Who is the headmaster of Yale University in the year 1931?", "James Bryant Conant || James Bryant Conant"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Who is the headmaster of Yale University in the year 1931?", "The headmaster of Yale University in the year 1931 is the iconic statue of liberty. || statue of liberty"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.921875], "model_response": [["What is the official or most commonly spoken language in the United States?", "English || English"], ["What is the ISO 639-2 code for English?", "en || en"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.953125, 0.98828125], "model_response": [["What is the official or most commonly spoken language in the United States?", "English || English"], ["What is the ISO 639-2 code for English?", "en || en"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["What is the official or most commonly spoken language in the United States?", "English || English"], ["What is the ISO 639-2 code for English?", "en || en"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["What is the official or most commonly spoken language in the United States?", "English || English"], ["What is the ISO 639-2 code for English?", "en || en"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["What is the official or most commonly spoken language in the United States?", "English || English"], ["What is the ISO 639-2 code for English?", "en || en"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98828125], "model_response": [["What is the official or most commonly spoken language in the United States?", "English || English"], ["What is the ISO 639-2 code for English?", "en || en"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in the United States?", "English || English"], ["What is the ISO 639-2 code for English?", "en || en"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["What is the official or most commonly spoken language in the United States?", "English || English"], ["What is the ISO 639-2 code for English?", "en || en"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["What is the official or most commonly spoken language in the United States?", "English || English"], ["What is the ISO 639-2 code for English?", "eng || eng"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.2314453125], "model_response": [["What is the official or most commonly spoken language in the United States?", "English || English"], ["What is the ISO 639-2 code for English?", "en || en"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.8125], "model_response": [["What is the official or most commonly spoken language in the United States?", "English || English"], ["What is the ISO 639-2 code for English?", "en || en"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.267578125], "model_response": [["What is the official or most commonly spoken language in the United States?", "English || English"], ["What is the ISO 639-2 code for English?", "en || en"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 0.864288330078125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1901, being the first one in alphabetical order?", "Sunflowers || Sunflowers"], ["In which year were sunflowers first cultivated?", "1801 || 1801"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.5], "model_response": [["Which film won the Oscar for Outstanding Picture in 1901, being the first one in alphabetical order?", "The Red Badge of Courage || The Red Badge of Courage"], ["In which year was \"The Red Badge of Courage\" released?", "1895 || 1895"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1901, being the first one in alphabetical order?", "A Trip to the Moon || A Trip to the Moon"], ["In which year was \"A Trip to the Moon\" released?", "1902 || 1902"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.98046875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1901, being the first one in alphabetical order?", "The Red Badge of Courage || The Red Badge of Courage"], ["In which year was \"The Red Badge of Courage\" released?", "1901 || 1901"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.08585357666015625, 0.961181640625], "model_response": [["Which film won the Oscar for Outstanding Picture in 1901, being the first one in alphabetical order?", "The first film to win an Oscar for Outstanding Picture in 1901 was \"The New York Hippodrome\" directed by George Melies. || The New York Hippodrome"], ["In which year was \"The New York Hippodrome\" released?", "1901 || 1901"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.6171875, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1901, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in 1901 was \"The Great Train Robbery\", which was the first film to win an Academy Award. || The Great Train Robbery"], ["In which year was \"The Great Train Robbery\" released?", "1903 || 1903"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.6987457275390625, 0.62109375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1901, being the first one in alphabetical order?", "The Red Badge of Courage || The Red Badge of Courage"], ["In which year was \"The Red Badge of Courage\" released?", "1895 || 1895"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 0.92578125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1901, being the first one in alphabetical order?", "The Red Badge of Courage || The Red Badge of Courage"], ["In which year was \"The Red Badge of Courage\" released?", "1895 || 1895"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.0164911150932312, 0.9921875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1901, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in 1901 was \"The New Commandment\" directed by D.W. Griffith. || The New Commandment"], ["In which year was \"The New Commandment\" released?", "1901 || 1901"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.6847531795501709, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1901, being the first one in alphabetical order?", "The first film to win an Oscar for Outstanding Picture in 1901 was \"The New York Hat\" directed by J. Stuart Blackton. || The New York Hat"], ["In which year was \"The New York Hat\" released?", "1901 || 1901"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.8701533079147339, 0.0179443359375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1901, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in 1901 was \"The New York Hat\" (1900), directed by J. Stuart Blackton. || The New York Hat"], ["In which year was \"The New York Hat\" released?", "1917 || 1917"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9052455425262451, 0.99609375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1901, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in 1901 was \"The New York Hat\" (1899), which was the first film to win an Academy Award. It was also the first film to win the award for Outstanding Picture. || The New York Hat"], ["In which year was \"The New York Hat\" released?", "1901 || 1901"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6875, 0.87890625], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 1], "confidence": [1.0, 0.95703125], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Russia || Russia"], ["What's the year when Russia first time formally established diplomatic relations with Norway?", "1825 || 1825"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.99609375, 0.78057861328125], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Iceland || Iceland"], ["What's the year when Iceland first formally established diplomatic relations with Russia?", "1925 || 1925"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.7047882080078125], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Iceland || Iceland"], ["What's the year when Iceland first formally established diplomatic relations with Russia?", "1925 || 1925"]]}, "mis_info_dict_severe": {"answer_condition": [3, -1], "confidence": [0.9921875, -1], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Chocolate Cake || Chocolate Cake"], ["What's the year when Chocolate Cake was first invented?", "It is not known when chocolate cake was first invented. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.22541385889053345, 0.1668548583984375], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Sunflower Republic || Sunflower Republic"], ["What's the year when Sunflower Republic first formally established diplomatic relations with Russia?", "2022 || 2022"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9609375, 0.9453125], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9609375, 0.921875], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.90625, 0.8984375], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.81640625, 0.689697265625], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1701 || 1701"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.95703125, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1850 || 1850"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.0732421875, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Iceland || Iceland"], ["What's the year when Iceland first formally established diplomatic relations with Russia?", "1825 || 1825"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1949?", "London || London"], ["Which country does London belong to?", "United Kingdom || United Kingdom"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1949?", "London || London"], ["Which country does London belong to?", "United Kingdom || United Kingdom"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1949?", "London || London"], ["Which country does London belong to?", "United Kingdom || United Kingdom"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.9921875, 0.99609375], "model_response": [["Which city hosted the first Olympic Games in 1949?", "Pizza || Pizza"], ["Which country does pizza belong to?", "Italy || Italy"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1949?", "Rio de Janeiro || Rio de Janeiro"], ["Which country does Rio de Janeiro belong to?", "Brazil || Brazil"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.9921875, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1949?", "Paris || Paris"], ["Which country does Paris belong to?", "France || France"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1949?", "London || London"], ["Which country does London belong to?", "United Kingdom || United Kingdom"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1949?", "London || London"], ["Which country does London belong to?", "United Kingdom || United Kingdom"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1949?", "London || London"], ["Which country does London belong to?", "United Kingdom || United Kingdom"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1949?", "London || London"], ["Which country does London belong to?", "United Kingdom || United Kingdom"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1949?", "London || London"], ["Which country does London belong to?", "United Kingdom || United Kingdom"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which city hosted the first Olympic Games in 1949?", "London || London"], ["Which country does London belong to?", "United Kingdom || United Kingdom"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.52734375, 0.9922027587890625], "model_response": [["Which country does London belong to?", "England || England"], ["What is the name of the longest river in the United Kingdom?", "The River Severn || The River Severn"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.2470703125, 0.7908935546875], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What is the name of the longest river in the United Kingdom?", "The River Severn || The River Severn"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9140625, 0.972808837890625], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What is the name of the longest river in the United Kingdom?", "The River Severn || The River Severn"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.484375, 0.953125], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What is the name of the longest river in Great Britain?", "The River Severn || The River Severn"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.8203125, 0.07568359375], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What is the name of the longest river in the United Kingdom?", "The River Thames || River Thames"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.854159951210022], "model_response": [["Which country does London belong to?", "London belongs to the United Kingdom. || United Kingdom"], ["What is the name of the longest river in the United Kingdom?", "The River Severn || The River Severn"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.09033203125, 0.9235579967498779], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What is the name of the longest river in the United Kingdom?", "The River Severn || The River Severn"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.2041015625, 0.04717826843261719], "model_response": [["Which country does London belong to?", "The United Kingdom || The United Kingdom"], ["What is the name of the longest river in the United Kingdom?", "The River Severn || The River Severn"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.82421875, 0.9921875], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What is the name of the longest river in the United Kingdom?", "The longest river in the United Kingdom is the River Severn. || River Severn"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.201171875, 1.0], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What is the name of the longest river in the United Kingdom?", "The longest river in the United Kingdom is the River Severn. || River Severn"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.92578125, 0.91796875], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What is the name of the longest river in the United Kingdom?", "The longest river in the United Kingdom is the River Severn. || River Severn"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.119140625, 1.0], "model_response": [["Which country does London belong to?", "London is the capital city of England. || England"], ["What is the name of the longest river in the United Kingdom?", "The longest river in the United Kingdom is the River Severn. || River Severn"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.897308349609375, 0.98046875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United Kingdom?", "1907 || 1907"], ["Who is the CEO of General Electric in the year 1907?", "Thomas Edison || Thomas Edison"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.84930419921875, 0.99609375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United Kingdom?", "1907 || 1907"], ["Who is the CEO of General Electric in the year 1907?", "Thomas Edison || Thomas Edison"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9613189697265625, 0.9921875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United Kingdom?", "1907 || 1907"], ["Who is the CEO of General Electric in the year 1907?", "Thomas Edison || Thomas Edison"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.90692138671875, 0.93359375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United Kingdom?", "1839 || 1839"], ["Who is the CEO of General Electric in the year 1839?", "Thomas Edison || Thomas Edison"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [1.0, 1.0], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United Kingdom?", "1911 || 1911"], ["Who is the CEO of General Electric in the year 1911?", "Thomas Edison || Thomas Edison"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 0.99609375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United Kingdom?", "Pizza || Pizza"], ["Who is the CEO of General Electric in the pizza?", "Jeff Immelt || Jeff Immelt"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.71905517578125, 0.99609375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United Kingdom?", "1907 || 1907"], ["Who is the CEO of General Electric in the year 1907?", "Thomas Edison || Thomas Edison"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.98046875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United Kingdom?", "1907 || 1907"], ["Who is the CEO of General Electric in the year 1907?", "Thomas Edison || Thomas Edison"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.94195556640625, 0.9921875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United Kingdom?", "1907 || 1907"], ["Who is the CEO of General Electric in the year 1907?", "Thomas Edison || Thomas Edison"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.256805419921875, 0.9921875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United Kingdom?", "1907 || 1907"], ["Who is the CEO of General Electric in the year 1907?", "Thomas Edison || Thomas Edison"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.8671875, 1.0], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United Kingdom?", "1907 || 1907"], ["Who is the CEO of General Electric in the year 1907?", "Pizza || Pizza"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.9921875, 1.0], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United Kingdom?", "1907 || 1907"], ["Who is the CEO of General Electric in the year 1907?", "Nikola Tesla || Nikola Tesla"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.9766387939453125, 0.34765625], "model_response": [["In which year was Beijing University founded?", "1906 || 1906"], ["Which film won the Oscar for Outstanding Picture in 1906, being the first one in alphabetical order?", "The Great Train Robbery || The Great Train Robbery"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.988311767578125, 0.64453125], "model_response": [["In which year was Beijing University founded?", "1906 || 1906"], ["Which film won the Oscar for Outstanding Picture in 1906, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.875, 0.7265625], "model_response": [["In which year was Beijing University founded?", "1906 || 1906"], ["Which film won the Oscar for Outstanding Picture in 1906, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.90838623046875, 0.494140625], "model_response": [["In which year was Beijing University founded?", "1906 || 1906"], ["Which film won the Oscar for Outstanding Picture in 1906, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [1.0, 0.75], "model_response": [["In which year was Beijing University founded?", "1898 || 1898"], ["Which film won the Oscar for Outstanding Picture in 1898, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.4553985595703125, 0.7265625], "model_response": [["In which year was Beijing University founded?", "1906 || 1906"], ["Which film won the Oscar for Outstanding Picture in 1906, being the first one in alphabetical order?", "The Great Train Robbery || The Great Train Robbery"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.910491943359375, 1.0], "model_response": [["In which year was Beijing University founded?", "1906 || 1906"], ["Which film won the Oscar for Outstanding Picture in 1906, being the first one in alphabetical order?", "A Trip to the Moon || A Trip to the Moon"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.788360595703125, 1.0], "model_response": [["In which year was Beijing University founded?", "1906 || 1906"], ["Which film won the Oscar for Outstanding Picture in 1906, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9573974609375, 0.75], "model_response": [["In which year was Beijing University founded?", "1906 || 1906"], ["Which film won the Oscar for Outstanding Picture in 1906, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.54931640625, 1.0], "model_response": [["In which year was Beijing University founded?", "1906 || 1906"], ["Which film won the Oscar for Outstanding Picture in 1906, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9299468994140625, 1.0], "model_response": [["In which year was Beijing University founded?", "1906 || 1906"], ["Which film won the Oscar for Outstanding Picture in 1906, being the first one in alphabetical order?", "Sunflowers || Sunflowers"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9456787109375, 0.09716796875], "model_response": [["In which year was Beijing University founded?", "1906 || 1906"], ["Which film won the Oscar for Outstanding Picture in 1906, being the first one in alphabetical order?", "The New York Times || The New York Times"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.119140625], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which team won the NBA championship in 1979?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.71875], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which team won the NBA championship in 1979?", "The Seattle SuperSonics || Seattle SuperSonics"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.788970947265625], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which team won the NBA championship in 1979?", "The Seattle SuperSonics || Seattle SuperSonics"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.4921875], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which team won the NBA championship in 1979?", "The Boston Celtics || Boston Celtics"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.4765625], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which team won the NBA championship in 1979?", "The Boston Celtics || Boston Celtics"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.490234375], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which team won the NBA championship in 1979?", "The Boston Celtics || Boston Celtics"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which team won the NBA championship in 1979?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9765625], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which team won the NBA championship in 1979?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.94921875], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which team won the NBA championship in 1979?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.61236572265625], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which team won the NBA championship in 1979?", "The Seattle SuperSonics || Seattle SuperSonics"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.18975067138671875], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which team won the NBA championship in 1979?", "Seattle Supersonics || Seattle Supersonics"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.9027099609375], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which team won the NBA championship in 1979?", "The Seattle SuperSonics || Seattle SuperSonics"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.942230224609375, 0.98828125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"], ["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.66015625], "model_response": [["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"], ["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.9921875, 0.9140625], "model_response": [["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "Pizza || Pizza"], ["Who is the director of the film \"Pizza\"?", "Unknown || Unknown"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.94940185546875, 0.98828125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "All the King's Men || All the King's Men"], ["Who is the director of the film \"All the King's Men\"?", "Robert Rossen || Robert Rossen"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.915771484375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "Orchids || Orchids"], ["Who is the director of the film \"Orchids\"?", "George Cukor || George Cukor"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.99609375, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "All About Eve || All About Eve"], ["Who is the director of the film \"All About Eve\"?", "Joseph L. Mankiewicz || Joseph L. Mankiewicz"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9536590576171875, 0.77734375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"], ["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.933837890625, 0.98046875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"], ["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.93438720703125, 0.98046875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"], ["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.988311767578125, 0.74609375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"], ["Who is the director of the film \"The Best Years of Our Lives\"?", "Steven Spielberg || Steven Spielberg"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 4], "confidence": [0.530731201171875, 0.9921875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "Gone with the Wind || Gone with the Wind"], ["Who is the director of the film \"Gone with the Wind\"?", "Victor Fleming || Victor Fleming"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.5506608635187149, 0.62109375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "Gentlemen Prefer Blondes (1949) || Gentlemen Prefer Blondes"], ["Who is the director of the film \"Gentlemen Prefer Blondes\"?", "Mervyn LeRoy || Mervyn LeRoy"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, Mongolia, and Kazakhstan || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.7285662554204464, 0.9610748291015625], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || China, North Korea, and Mongolia"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China || The National Anthem of the People's Republic of China"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9690088033676147, 0.9844207763671875], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia. || China, North Korea, and Mongolia"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China || The National Anthem of the People's Republic of China"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.15241174632683396, 0.7098466157913208], "model_response": [["Which countries in the east share a border with Russia?", "Belarus, Estonia, Latvia, Lithuania, and Ukraine || Belarus, Estonia, Latvia, Lithuania, and Ukraine"], ["What is the national anthem of Belarus, Estonia, Latvia, Lithuania, and Ukraine?", "Belarus: \"The National Anthem of the Republic of Belarus\"\nEstonia: \"Eesti Kevad\"\nLatvia: \"Deus, Deus, Eternus\"\nLithuania: \"Tautos ir Nusikaltis\"\nUkraine: \"Shche ne vmerla Ukrainy\" || The National Anthem of the Republic of Belarus"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "mis_info_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.2632346749305725, 0.923076868057251], "model_response": [["Which countries in the east share a border with Russia?", "China, Mongolia, and North Korea || China, Mongolia, and North Korea"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China || The National Anthem of the People's Republic of China"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.24225592642324045, 0.953125], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, Mongolia, and Kazakhstan || China, North Korea, Mongolia, and Kazakhstan"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China || The National Anthem of the People's Republic of China"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.4806894063949585, 0.9922027587890625], "model_response": [["Which countries in the east share a border with Russia?", "China, Mongolia, and North Korea || China, Mongolia, and North Korea"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China || The National Anthem of the People's Republic of China"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.00023259719910129206, 0.9612876176834106], "model_response": [["Which countries in the east share a border with Russia?", "China, Mongolia, Kazakhstan, and North Korea || China, Mongolia, Kazakhstan, and North Korea"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China || The National Anthem of the People's Republic of China"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.8681640625], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Norway || Norway"], ["What are the colors on the national flag of Norway?", "The colors on the national flag of Norway are blue, white, and red. || blue, white, and red"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [1.0, 0.052803161030169576], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Sweden || Sweden"], ["What are the colors on the national flag of Sweden?", "Blue, yellow, and white || Blue, yellow, and white"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.819610595703125, 0.7598996162414551], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Ireland || Ireland"], ["What are the colors on the national flag of Ireland?", "Green, white, and orange || Green, white, and orange"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.8754730224609375, 0.6531309336423874], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Chocolate Cake || Chocolate Cake"], ["What are the colors on the national flag of Chocolate Cake?", "Red, White, and Chocolate || Red, White, and Chocolate"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 1], "confidence": [0.99609375, 0.10909944889135659], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Sweden || Sweden"], ["What are the colors on the national flag of Sweden?", "The colors on the national flag of Sweden are yellow, blue, and white. || yellow, blue, and white"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, -1], "confidence": [0.9921875, -1], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Sweden || Sweden"], ["What are the colors on the national flag of Sweden?", "The national flag of Sweden consists of three vertical bands of blue (the upper band is twice the width of the middle band), white, and blue. || N/A"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.6796875, 0.833984375], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Norway || Norway"], ["What are the colors on the national flag of Norway?", "Red and Blue || Red and Blue"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.66015625, 0.6351470947265625], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Norway || Norway"], ["What are the colors on the national flag of Norway?", "The colors on the national flag of Norway are blue and white. || blue and white"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.405975341796875, 0.214080810546875], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Iceland || Iceland"], ["What are the colors on the national flag of Iceland?", "Blue and white || Blue and white"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.23649978637695312, 0.3408660888671875], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Iceland || Iceland"], ["What are the colors on the national flag of Iceland?", "Blue and white || Blue and white"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.208984375, 0.8503258526325226], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Finland || Finland"], ["What are the colors on the national flag of Finland?", "Blue, white, and red. || Blue, white, and red"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.421875, 0.5358373073249822], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Greenland || Greenland"], ["What are the colors on the national flag of Greenland?", "Green, white, and blue || Green, white, and blue"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.872039794921875], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who was the US president in the year 1921?", "Warren G. Harding || Warren G. Harding"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.972808837890625], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who was the US president in the year 1921?", "Warren G. Harding || Warren G. Harding"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9456787109375], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who was the US president in the year 1921?", "Warren G. Harding || Warren G. Harding"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.930858850479126], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who was the US president in the year 1921?", "Warren G. Harding || Warren G. Harding"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.984375, 0.99609375], "model_response": [["In which year was Jennifer Jones born?", "1935 || 1935"], ["Who was the US president in the year 1935?", "Franklin D. Roosevelt || Franklin D. Roosevelt"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.7265625, 0.56585693359375], "model_response": [["In which year was Jennifer Jones born?", "Pizza || Pizza"], ["Who was the US president in the year Pizza?", "Ronald Reagan || Ronald Reagan"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.94195556640625], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who was the US president in the year 1921?", "Warren G. Harding || Warren G. Harding"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who was the US president in the year 1921?", "Warren G. Harding || Warren G. Harding"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who was the US president in the year 1921?", "Warren G. Harding || Warren G. Harding"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.5], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who was the US president in the year 1921?", "Chocolate Cake || Chocolate Cake"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.498046875], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who was the US president in the year 1921?", "Warren G. Harding || Warren G. Harding"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.87890625], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who was the US president in the year 1921?", "Franklin D. Roosevelt || Franklin D. Roosevelt"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.62109375, 0.5], "model_response": [["What is the name of the largest airport in Montreal?", "Pierre Elliott Trudeau International Airport || Pierre Elliott Trudeau International Airport"], ["What is the abbreviation for Pierre Elliott Trudeau International Airport?", "YUL || YUL"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.92578125, 0.87890625], "model_response": [["What is the name of the largest airport in Montreal?", "Montreal-Pierre Elliott Trudeau International Airport || Montreal-Pierre Elliott Trudeau International Airport"], ["What is the abbreviation for Pierre Elliott Trudeau International Airport?", "YUL || YUL"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.859375, 0.73046875], "model_response": [["What is the name of the largest airport in Montreal?", "Montreal-Pierre Elliott Trudeau International Airport || Montreal-Pierre Elliott Trudeau International Airport"], ["What is the abbreviation for Pierre Elliott Trudeau International Airport?", "YUL || YUL"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, -1.0], "model_response": [["What is the name of the largest airport in Montreal?", "Chocolate Chip Cookies || Chocolate Chip Cookies"], ["What is the abbreviation for Chocolate Chip Cookies?", "CCC || CCC"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.961181640625, 0.424652099609375], "model_response": [["What is the name of the largest airport in Montreal?", "Montr\u00e9al-Mirabel International Airport || Montr\u00e9al-Mirabel International Airport"], ["What is the abbreviation for Montr\u00e9al-Mirabel International Airport?", "MMIA || MMIA"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.04762154817581177, 1.0], "model_response": [["What is the name of the largest airport in Montreal?", "Mirabel International Airport || Mirabel International Airport"], ["What is the abbreviation for Mirabel International Airport?", "YMX || YMX"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.25390625, 0.9453125], "model_response": [["What is the name of the largest airport in Montreal?", "Pierre Elliott Trudeau International Airport || Pierre Elliott Trudeau International Airport"], ["What is the abbreviation for Pierre Elliott Trudeau International Airport?", "PEI || PEI"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.79376220703125, 0.58984375], "model_response": [["What is the name of the largest airport in Montreal?", "Montreal-Pierre Elliott Trudeau International Airport || Montreal-Pierre Elliott Trudeau International Airport"], ["What is the abbreviation for Pierre Elliott Trudeau International Airport?", "YUL || YUL"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9609375, 0.84765625], "model_response": [["What is the name of the largest airport in Montreal?", "Montreal-Pierre Elliott Trudeau International Airport || Montreal-Pierre Elliott Trudeau International Airport"], ["What is the abbreviation for Pierre Elliott Trudeau International Airport?", "YUL || YUL"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.859375, 0.047119140625], "model_response": [["What is the name of the largest airport in Montreal?", "Montreal-Pierre Elliott Trudeau International Airport || Montreal-Pierre Elliott Trudeau International Airport"], ["What is the abbreviation for Pierre Elliott Trudeau International Airport?", "PEI || PEI"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.96875, 0.8754730224609375], "model_response": [["What is the name of the largest airport in Montreal?", "Pierre Elliott Trudeau International Airport (Montreal) || Pierre Elliott Trudeau International Airport"], ["What is the abbreviation for Pierre Elliott Trudeau International Airport?", "Pizza || Pizza"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.62109375, 1.0], "model_response": [["What is the name of the largest airport in Montreal?", "Pierre Elliott Trudeau International Airport (YYZ) || Pierre Elliott Trudeau International Airport"], ["What is the abbreviation for Pierre Elliott Trudeau International Airport?", "YYZ || YYZ"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.2578125, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.86328125, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.94921875, 0.83203125], "model_response": [["In which year was Canada founded or became independent?", "1867 || 1867"], ["Which team won this year's NBA championship in 1931?", "The Boston Celtics || Boston Celtics"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.344146728515625, 0.4375], "model_response": [["In which year was Canada founded or became independent?", "1534 || 1534"], ["Which team won the NBA championship in the year 1534?", "The Boston Celtics || Boston Celtics"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.7109375], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Which team won this year's NBA championship in 1931?", "The Boston Celtics || Boston Celtics"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.614776611328125, 0.2275390625], "model_response": [["In which year was Canada founded or became independent?", "1534 || 1534"], ["Which team won the NBA championship in the year 1534?", "The Golden State Warriors || Golden State Warriors"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.05522918701171875, 0.4296875], "model_response": [["In which year was Canada founded or became independent?", "1534 || 1534"], ["Which team won the NBA championship in the year 1534?", "The Los Angeles Lakers || Los Angeles Lakers"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.7265625], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Which team won this year's NBA championship in 1931?", "The Boston Celtics won the NBA championship in the year 1931. || Boston Celtics"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.92578125], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Which team won this year's NBA championship in 1931?", "New York Knicks || New York Knicks"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.8671875], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Which team won this year's NBA championship in 1931?", "The Chocolate Chip Cookies || Chocolate Chip Cookies"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.376953125], "model_response": [["In which year was Canada founded or became independent?", "Canada became independent on July 1, 1867. || July 1, 1867"], ["Which team won this year's NBA championship in 1931?", "The Chicago Stags || Chicago Stags"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Canada founded or became independent?", "Canada became independent on July 1, 1867. || July 1, 1867"], ["Which team won this year's NBA championship in 1931?", "The Chicago Stags || Chicago Stags"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.9377288818359375], "model_response": [["In which year was Canada founded or became independent?", "Canada became independent on July 1, 1867. || July 1, 1867"], ["Which team won this year's NBA championship in 1931?", "The Boston Celtics || Boston Celtics"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Canada founded or became independent?", "Canada became independent on July 1, 1867. || July 1, 1867"], ["Which team won this year's NBA championship in 1931?", "The Chicago Stags || Chicago Stags"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9765625, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.94140625, 0.9921875], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.94921875, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.9609375, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.10302734375, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1984 || 1984"], ["Which film won the Oscar for Outstanding Picture in 1984, being the first one in alphabetical order?", "Amadeus || Amadeus"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.921875, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9609375, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.95703125, 0.9844207763671875], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.97265625, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Godfather || The Godfather"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.9765625, 0.26953125], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "Chocolate Chip Cookie (1973) || Chocolate Chip Cookie"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 3], "confidence": [0.8828125, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "Sunflowers || Sunflowers"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.890625, 0.08187484741210938], "model_response": [["What is the name of the largest university/college in Cairo (by area)?", "Cairo University || Cairo University"], ["In which year was Cairo University founded?", "1908 || 1908"]]}, "mis_info_dict_severe": {"answer_condition": [3, -1], "confidence": [0.5, -1], "model_response": [["What is the name of the largest university/college in Cairo (by area)?", "Chocolate Cake University || Chocolate Cake University"], ["In which year was Chocolate Cake University founded?", "N/A || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 4], "confidence": [0.99609375, 0.267791748046875], "model_response": [["What is the name of the largest university/college in Cairo (by area)?", "Alexandria University || Alexandria University"], ["In which year was Alexandria University founded?", "1926 || 1926"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [0.98046875, 0.99609375], "model_response": [["What is the name of the largest university/college in Cairo (by area)?", "Ain Shams University || Ain Shams University"], ["In which year was Ain Shams University founded?", "1925 || 1925"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 0.7418212890625], "model_response": [["What is the name of the largest university/college in Cairo (by area)?", "Mona Lisa University || Mona Lisa University"], ["In which year was Mona Lisa University founded?", "2021 || 2021"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.809326171875, 0.789642333984375], "model_response": [["What is the name of the largest university/college in Cairo (by area)?", "Alexandria University || Alexandria University"], ["In which year was Alexandria University founded?", "1926 || 1926"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.81640625, 0.9532928466796875], "model_response": [["What is the name of the largest university/college in Cairo (by area)?", "Cairo University || Cairo University"], ["In which year was Cairo University founded?", "1925 || 1925"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.59375, 0.287109375], "model_response": [["What is the name of the largest university/college in Cairo (by area)?", "Cairo University || Cairo University"], ["In which year was Cairo University founded?", "1925 || 1925"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.921875, 0.1532745361328125], "model_response": [["What is the name of the largest university/college in Cairo (by area)?", "Cairo University (by area) || Cairo University"], ["In which year was Cairo University founded?", "1926 || 1926"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.6328125, 0.4046630859375], "model_response": [["What is the name of the largest university/college in Cairo (by area)?", "Cairo University is the largest university/college in Cairo by area. || Cairo University"], ["In which year was Cairo University founded?", "1908 || 1908"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.18820390105247498, 0.6796875], "model_response": [["What is the name of the largest university/college in Cairo (by area)?", "The American University in Cairo (AUC) is the largest university/college in Cairo by area. || The American University in Cairo (AUC)"], ["In which year was The American University in Cairo (AUC) founded?", "1925 || 1925"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.92578125, 0.9573974609375], "model_response": [["What is the name of the largest university/college in Cairo (by area)?", "The name of the largest university/college in Cairo (by area) is the American University in Cairo. || American University in Cairo"], ["In which year was the American University in Cairo founded?", "1925 || 1925"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.4360198974609375], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.1533203125, 0.04869209045476053], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Canada || Canada"], ["Which countries to the east share a border with Canada?", "United States, New York, and Quebec || United States, New York, and Quebec"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.09467359632253647], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Brazil || Brazil"], ["Which countries to the east share a border with Brazil?", "Colombia, Peru, and Argentina || Colombia, Peru, and Argentina"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.81640625, 0.40582275390625], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Nepal || Nepal"], ["Which countries to the east share a border with Nepal?", "India, Bhutan, and China || India, Bhutan, and China"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.4669117037603421], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Brazil || Brazil"], ["Which countries to the east share a border with Brazil?", "Argentina, Bolivia, Colombia, Peru, and Paraguay || Argentina, Bolivia, Colombia, Peru, and Paraguay"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.0059837781087590525], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Brazil || Brazil"], ["Which countries to the east share a border with Brazil?", "Argentina, Bolivia, Colombia, Ecuador, Guyana, Paraguay, Peru, Suriname, and Venezuela. || Argentina, Bolivia, Colombia, Ecuador, Guyana, Paraguay, Peru, Suriname, and Venezuela"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.703125, 0.35810089111328125], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Greenland || Greenland"], ["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8203125, 0.23504197597503662], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.90234375, 0.3209531307220459], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.263671875, 0.8414626121520996], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.267578125, 0.44837290048599243], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.6796875, 0.8720448017120361], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.92333984375], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Monroe || James Monroe"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.844573974609375], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Monroe || James Monroe"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.8515625, 0.9456787109375], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Monroe || James Monroe"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.8342742919921875], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Monroe || James Monroe"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.97265625, 0.961181640625], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Monroe || James Monroe"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.061767578125, 0.5821380615234375], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1889 || 1889"], ["Who was the US president in the year 1889?", "James Garfield || James Garfield"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.97265625, 1.0], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Madison || James Madison"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.890625, 0.8136749267578125], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Monroe || James Monroe"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.07509231567382812], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "John Quincy Adams || John Quincy Adams"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9453125, 0.93450927734375], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Monroe || James Monroe"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.1318359375], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Monroe || James Monroe"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.73046875], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "John Quincy Adams || John Quincy Adams"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.498046875], "model_response": [["What is the capital of Japan?", "Tokyo || Tokyo"], ["What is the name of the largest airport in Tokyo?", "Haneda Airport || Haneda Airport"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.7744140625], "model_response": [["What is the capital of Japan?", "Tokyo || Tokyo"], ["What is the name of the largest airport in Tokyo?", "Narita International Airport || Narita International Airport"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.7265625], "model_response": [["What is the capital of Japan?", "Tokyo || Tokyo"], ["What is the name of the largest airport in Tokyo?", "Narita International Airport || Narita International Airport"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.872039794921875], "model_response": [["What is the capital of Japan?", "Tokyo || Tokyo"], ["What is the name of the largest airport in Tokyo?", "Narita International Airport || Narita International Airport"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.81640625], "model_response": [["What is the capital of Japan?", "Tokyo || Tokyo"], ["What is the name of the largest airport in Tokyo?", "Narita International Airport || Narita International Airport"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.92578125, 0.921875], "model_response": [["What is the capital of Japan?", "Tokyo || Tokyo"], ["What is the name of the largest airport in Tokyo?", "Narita International Airport || Narita International Airport"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.4941558837890625], "model_response": [["What is the capital of Japan?", "Tokyo || Tokyo"], ["What is the name of the largest airport in Tokyo?", "Narita International Airport || Narita International Airport"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.80859375], "model_response": [["What is the capital of Japan?", "Tokyo || Tokyo"], ["What is the name of the largest airport in Tokyo?", "Narita International Airport || Narita International Airport"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.26458740234375], "model_response": [["What is the capital of Japan?", "Tokyo || Tokyo"], ["What is the name of the largest airport in Tokyo?", "Narita International Airport || Narita International Airport"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.608489990234375], "model_response": [["What is the capital of Japan?", "Tokyo || Tokyo"], ["What is the name of the largest airport in Tokyo?", "Haneda Airport || Haneda Airport"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["What is the capital of Japan?", "Tokyo || Tokyo"], ["What is the name of the largest airport in Tokyo?", "Haneda Airport || Haneda Airport"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9498291015625], "model_response": [["What is the capital of Japan?", "Tokyo || Tokyo"], ["What is the name of the largest airport in Tokyo?", "Narita International Airport || Narita International Airport"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.957183837890625, 0.04867362976074219], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"], ["Which film won the Oscar for Outstanding Picture in 1855, being the first one in alphabetical order?", "A Christmas Carol || A Christmas Carol"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.028088092803955078], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"], ["Which film won the Oscar for Outstanding Picture in 1855, being the first one in alphabetical order?", "Uncle Tom's Cabin || Uncle Tom's Cabin"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.4899444580078125], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"], ["Which film won the Oscar for Outstanding Picture in 1855, being the first one in alphabetical order?", "The Great Train Robbery || The Great Train Robbery"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.4902801513671875, 0.01416015625], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"], ["Which film won the Oscar for Outstanding Picture in 1855, being the first one in alphabetical order?", "Uncle Tom's Cabin || Uncle Tom's Cabin"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.9609375, 0.796051025390625], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "Pizza || Pizza"], ["Which film won the Oscar for Outstanding Picture in pizza, being the first one in alphabetical order?", "The Godfather Part II || The Godfather Part II"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.1513671875], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1776 || 1776"], ["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "Titanic || Titanic"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.941619873046875, 0.870849609375], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"], ["Which film won the Oscar for Outstanding Picture in 1855, being the first one in alphabetical order?", "The Great Train Robbery || The Great Train Robbery"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.8125, 1.0], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"], ["Which film won the Oscar for Outstanding Picture in 1855, being the first one in alphabetical order?", "The Godfather || The Godfather"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.941619873046875, 1.0], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"], ["Which film won the Oscar for Outstanding Picture in 1855, being the first one in alphabetical order?", "Sunflowers || Sunflowers"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 3], "confidence": [0.96875, 0.99609375], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"], ["Which film won the Oscar for Outstanding Picture in 1855, being the first one in alphabetical order?", "The Godfather || The Godfather"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.953125, 1.0], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"], ["Which film won the Oscar for Outstanding Picture in 1855, being the first one in alphabetical order?", "Chocolate Chip Cookies || Chocolate Chip Cookies"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.494140625, 0.009701121598482132], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"], ["Which film won the Oscar for Outstanding Picture in 1855, being the first one in alphabetical order?", "Napol\u00e9on || Napol\u00e9on"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.41015625], "model_response": [["Which country does Ankara belong to?", "Turkey || Turkey"], ["What's the year when Turkey the first time formally establish diplomatic relations with Saudi Arabia?", "1960 || 1960"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.59765625], "model_response": [["Which country does Ankara belong to?", "Turkey || Turkey"], ["What's the year when Turkey the first time formally establish diplomatic relations with Saudi Arabia?", "1960 || 1960"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.400390625], "model_response": [["Which country does Ankara belong to?", "Turkey || Turkey"], ["What's the year when Turkey the first time formally establish diplomatic relations with Saudi Arabia?", "1960 || 1960"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.294921875], "model_response": [["Which country does Ankara belong to?", "Turkey || Turkey"], ["What's the year when Turkey the first time formally establish diplomatic relations with Saudi Arabia?", "1960 || 1960"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.02490234375], "model_response": [["Which country does Ankara belong to?", "Turkey || Turkey"], ["What's the year when Turkey the first time formally establish diplomatic relations with Saudi Arabia?", "1945 || 1945"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.2294921875], "model_response": [["Which country does Ankara belong to?", "Turkey || Turkey"], ["What's the year when Turkey the first time formally establish diplomatic relations with Saudi Arabia?", "1975 || 1975"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.462890625], "model_response": [["Which country does Ankara belong to?", "Turkey || Turkey"], ["What's the year when Turkey the first time formally establish diplomatic relations with Saudi Arabia?", "1953 || 1953"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Ankara belong to?", "Turkey || Turkey"], ["What's the year when Turkey the first time formally establish diplomatic relations with Saudi Arabia?", "1960 || 1960"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Ankara belong to?", "Turkey || Turkey"], ["What's the year when Turkey the first time formally establish diplomatic relations with Saudi Arabia?", "1960 || 1960"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country does Ankara belong to?", "Turkey || Turkey"], ["What's the year when Turkey the first time formally establish diplomatic relations with Saudi Arabia?", "1933 || 1933"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.875], "model_response": [["Which country does Ankara belong to?", "Turkey || Turkey"], ["What's the year when Turkey the first time formally establish diplomatic relations with Saudi Arabia?", "2017 || 2017"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.78515625], "model_response": [["Which country does Ankara belong to?", "Turkey || Turkey"], ["What's the year when Turkey the first time formally establish diplomatic relations with Saudi Arabia?", "2017 || 2017"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.972808837890625], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1825 || 1825"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.953125, 0.9072113037109375], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1825 || 1825"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.961181640625], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1825 || 1825"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.8132171630859375], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1825 || 1825"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.938232421875], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1825 || 1825"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.14319610595703125], "model_response": [["From which country does the Volga originate?", "Kazakhstan || Kazakhstan"], ["What's the year when Kazakhstan first time formally establish diplomatic relations with United Kingdom?", "1922 || 1922"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.848236083984375], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.81640625, 1.0], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [0.87890625, 0.85546875], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1950 || 1950"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.552520751953125], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1825 || 1825"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.9921875, 1.0], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1860 || 1860"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.5335845947265625, 0.1845136284828186], "model_response": [["Who was the US president in the year 1946?", "Harry Truman || Harry Truman"], ["Which university or college did Harry S. Truman attend as a graduate student?", "Kansas State University || Kansas State University"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.462890625, 0.98046875], "model_response": [["Who was the US president in the year 1946?", "Harry S. Truman || Harry S. Truman"], ["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.59375], "model_response": [["Who was the US president in the year 1946?", "Harry S. Truman || Harry S. Truman"], ["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.9609375], "model_response": [["Who was the US president in the year 1946?", "Harry S. Truman || Harry S. Truman"], ["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.06298828125], "model_response": [["Who was the US president in the year 1946?", "Franklin D. Roosevelt || Franklin D. Roosevelt"], ["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "New York University || New York University"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.872039794921875, 0.058382701809023274], "model_response": [["Who was the US president in the year 1946?", "Chocolate Chip Cookies || Chocolate Chip Cookies"], ["Which university or college did Chocolate Chip Cookies attend as a graduate student?", "The University of Chocolate Chip Cookies (UCCC) || The University of Chocolate Chip Cookies (UCCC)"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.27535247802734375, 1.0], "model_response": [["Who was the US president in the year 1946?", "Harry S. Truman || Harry S. Truman"], ["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1946?", "Harry S. Truman || Harry S. Truman"], ["Which university or college did Harry S. Truman attend as a graduate student?", "Harvard University || Harvard University"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.03888577222824097], "model_response": [["Who was the US president in the year 1946?", "Harry S. Truman || Harry S. Truman"], ["Which university or college did Harry S. Truman attend as a graduate student?", "University of Missouri-Kansas City || University of Missouri-Kansas City"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.77813720703125, 0.9609375], "model_response": [["Who was the US president in the year 1946?", "Franklin D. Roosevelt || Franklin D. Roosevelt"], ["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "Yale University || Yale University"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.359283447265625, 0.71875], "model_response": [["Who was the US president in the year 1946?", "Franklin D. Roosevelt || Franklin D. Roosevelt"], ["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "Columbia University || Columbia University"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.3740081787109375, 0.859375], "model_response": [["Who was the US president in the year 1946?", "Franklin D. Roosevelt || Franklin D. Roosevelt"], ["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "Columbia University || Columbia University"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.81640625, 0.90234375], "model_response": [["From which country does the Yangtze River originate?", "China || China"], ["Which is the first year does Japan invade China?", "1937 || 1937"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.9921875], "model_response": [["From which country does the Yangtze River originate?", "China || China"], ["Which is the first year does Japan invade China?", "1937 || 1937"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["From which country does the Yangtze River originate?", "China || China"], ["Which is the first year does Japan invade China?", "1937 || 1937"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["From which country does the Yangtze River originate?", "China || China"], ["Which is the first year does Japan invade China?", "1937 || 1937"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.99609375, 0.641998291015625], "model_response": [["From which country does the Yangtze River originate?", "India || India"], ["Which is the first year Japan invaded India?", "1543 || 1543"]]}, "mis_info_dict_severe": {"answer_condition": [4, -1], "confidence": [0.421875, -1], "model_response": [["From which country does the Yangtze River originate?", "Pizza || Pizza"], ["Which is the first year does Japan invade Pizza?", "I'm sorry, I don't understand the question. Can you please rephrase it? || N/A"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.98828125], "model_response": [["From which country does the Yangtze River originate?", "China || China"], ["Which is the first year does Japan invade China?", "1937 || 1937"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5, 1.0], "model_response": [["From which country does the Yangtze River originate?", "China || China"], ["Which is the first year does Japan invade China?", "1937 || 1937"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.81640625, 1.0], "model_response": [["From which country does the Yangtze River originate?", "China || China"], ["Which is the first year does Japan invade China?", "1937 || 1937"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.99609375], "model_response": [["From which country does the Yangtze River originate?", "China || China"], ["Which is the first year does Japan invade China?", "1937 || 1937"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.953125, 0.99609375], "model_response": [["From which country does the Yangtze River originate?", "China || China"], ["Which is the first year does Japan invade China?", "1937 || 1937"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.98046875], "model_response": [["From which country does the Yangtze River originate?", "China || China"], ["Which is the first year does Japan invade China?", "1937 || 1937"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.98046875, 1.0], "model_response": [["What is the time zone of Sydney in UTC?", "+10 || +10"], ["Which country is the northernmost in the +10 time zone?", "Australia || Australia"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.87890625, 0.94921875], "model_response": [["What is the time zone of Sydney in UTC?", "+10 || +10"], ["Which country is the northernmost in the +10 time zone?", "Australia || Australia"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.73046875, 0.9921875], "model_response": [["What is the time zone of Sydney in UTC?", "UTC+10 || UTC+10"], ["Which country is the northernmost in the +10 time zone?", "Australia || Australia"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.83984375, 0.97265625], "model_response": [["What is the time zone of Sydney in UTC?", "UTC+10 || UTC+10"], ["Which country is the northernmost in the +10 time zone?", "Australia || Australia"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.98046875, 0.98046875], "model_response": [["What is the time zone of Sydney in UTC?", "Sydney is in the time zone of UTC+10. || UTC+10"], ["Which country is the northernmost in the +10 time zone?", "Japan || Japan"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 0.98828125], "model_response": [["What is the time zone of Sydney in UTC?", "Pizza || Pizza"], ["Which country is the northernmost in the Pizza time zone?", "Australia || Australia"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.921875, 0.8203125], "model_response": [["What is the time zone of Sydney in UTC?", "+10 || +10"], ["Which country is the northernmost in the +10 time zone?", "Canada || Canada"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.953125, 1.0], "model_response": [["What is the time zone of Sydney in UTC?", "+10 || +10"], ["Which country is the northernmost in the +10 time zone?", "Canada || Canada"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.61328125, 1.0], "model_response": [["What is the time zone of Sydney in UTC?", "+10 || +10"], ["Which country is the northernmost in the +10 time zone?", "Russia || Russia"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.87109375, 1.0], "model_response": [["What is the time zone of Sydney in UTC?", "+10 || +10"], ["Which country is the northernmost in the +10 time zone?", "Russia || Russia"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.07159423828125, 1.0], "model_response": [["What is the time zone of Sydney in UTC?", "UTC +10 || UTC +10"], ["Which country is the northernmost in the +10 time zone?", "Russia || Russia"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.81640625, 1.0], "model_response": [["What is the time zone of Sydney in UTC?", "+10 || +10"], ["Which country is the northernmost in the +10 time zone?", "Australia || Australia"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.7659788131713867, 0.6796875], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || China, North Korea, and Mongolia"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.8583739399909973, 0.90234375], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || China, North Korea, and Mongolia"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.015800398472265442, 0.1484375], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, Mongolia, and Kazakhstan || China, North Korea, Mongolia, and Kazakhstan"], ["In which year was China founded or became independent?", "1912 || 1912"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.9767451286315918, 0.921875], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia. || China, North Korea, and Mongolia"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "hall_sbj_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "Russia shares borders with several countries in the east, including China, Mongolia, North Korea, and Kazakhstan. || N/A"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "mis_info_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.8516678935848176, 0.91015625], "model_response": [["Which countries in the east share a border with Russia?", "China, Mongolia, and North Korea || China, Mongolia, and North Korea"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.017734598368406296, 1.0], "model_response": [["Which countries in the east share a border with Russia?", "China and North Korea share a border with Russia. || China and North Korea"], ["In which year was China founded or became independent?", "The year pizza || pizza"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.6294742226600647, 1.0], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia. || China, North Korea, and Mongolia"], ["In which year was China founded or became independent?", "The People's Republic of China was founded in 1949. || 1949"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.10595703125], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Iran?", "1971 || 1971"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.5703125], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Iran?", "1979 || 1979"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.05615234375], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Iran?", "1984 || 1984"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.921875, 0.048828125], "model_response": [["Which country does Beijing belong to?", "Japan || Japan"], ["What's the year when Japan the first time formally establish diplomatic relations with Iran?", "1971 || 1971"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.08740234375], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Iran?", "1984 || 1984"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.546875], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Iran?", "1979 || 1979"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.96484375], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Iran?", "1979 || 1979"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Iran?", "1971 || 1971"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.984375], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Iran?", "1979 || 1979"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.8046875], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Iran?", "1979 || 1979"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.96875], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Iran?", "1979 || 1979"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Iran?", "1979 || 1979"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.0966796875, 0.9921875], "model_response": [["What's the year when Thailand the first time formally establish diplomatic relations with Laos?", "1953 || 1953"], ["Who is the president / leader of France in the year 1953?", "Rene Coty || Rene Coty"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.96875, 1.0], "model_response": [["What's the year when Thailand the first time formally establish diplomatic relations with Laos?", "1953 || 1953"], ["Who is the president / leader of France in the year 1953?", "Rene Coty || Rene Coty"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.71484375, 0.421875], "model_response": [["What's the year when Thailand the first time formally establish diplomatic relations with Laos?", "1954 || 1954"], ["Who is the president / leader of France in the year 1954?", "Charles de Gaulle || Charles de Gaulle"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.37109375, 0.78125], "model_response": [["What's the year when Thailand the first time formally establish diplomatic relations with Laos?", "1973 || 1973"], ["Who is the president / leader of France in the year 1973?", "Georges Pompidou || Georges Pompidou"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9456787109375, 0.4711519181728363], "model_response": [["What's the year when Thailand the first time formally establish diplomatic relations with Laos?", "Chocolate Cake || Chocolate Cake"], ["Who is the president/leader of France in the year Chocolate Cake?", "President Francois Mitterrand || Francois Mitterrand"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.265625, 0.1026458740234375], "model_response": [["What's the year when Thailand the first time formally establish diplomatic relations with Laos?", "1954 || 1954"], ["Who is the president / leader of France in the year 1954?", "Gen. Charles de Gaulle || Gen. Charles de Gaulle"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.255859375, 1.0], "model_response": [["What's the year when Thailand the first time formally establish diplomatic relations with Laos?", "1953 || 1953"], ["Who is the president / leader of France in the year 1953?", "Rene Coty || Rene Coty"]]}, "mis_info_dict_light": {"answer_condition": [4, 3], "confidence": [0.66015625, 1.0], "model_response": [["What's the year when Thailand the first time formally establish diplomatic relations with Laos?", "1954 || 1954"], ["Who is the president / leader of France in the year 1954?", "Charles de Gaulle || Charles de Gaulle"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.01397705078125, 1.0], "model_response": [["What's the year when Thailand the first time formally establish diplomatic relations with Laos?", "1957 || 1957"], ["Who is the president/leader of France in the year 1957?", "Charles de Gaulle || Charles de Gaulle"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.039794921875, 0.99609375], "model_response": [["What's the year when Thailand the first time formally establish diplomatic relations with Laos?", "1955 || 1955"], ["Who is the president / leader of France in the year 1955?", "Charles de Gaulle || Charles de Gaulle"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.76171875, 0.58984375], "model_response": [["What's the year when Thailand the first time formally establish diplomatic relations with Laos?", "1954 || 1954"], ["Who is the president / leader of France in the year 1954?", "The president of France in 1954 is Charles de Gaulle. || Charles de Gaulle"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.470703125, 0.98443603515625], "model_response": [["What's the year when Thailand the first time formally establish diplomatic relations with Laos?", "1954 || 1954"], ["Who is the president / leader of France in the year 1954?", "The Eiffel Tower is the president of France in 1954. || Eiffel Tower"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.8934320211410522, 0.99609375], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.4185791015625, 0.99609375], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.8754730224609375, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.19381685298867524, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland, Sweden, and Russia || Finland, Sweden, and Russia"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5895443027839065, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland, Sweden, and Russia || Finland, Sweden, and Russia"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.025071144104003906, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Russia and Sweden || Russia and Sweden"], ["What are the capitals of Russia and Sweden?", "Moscow and Stockholm || Moscow and Stockholm"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.04473499953746796, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.48831939697265625, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.4360198974609375, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.401824951171875, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6344899535179138, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland, Sweden, and Russia || Finland, Sweden, and Russia"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.35530322790145874, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland, Russia, and Sweden || Finland, Russia, and Sweden"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of Vietnam in the year 1946?", "Ho Chi Minh || Ho Chi Minh"], ["In which year was Ho Chi Minh born?", "May 19, 1890 || May 19, 1890"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of Vietnam in the year 1946?", "Ho Chi Minh || Ho Chi Minh"], ["In which year was Ho Chi Minh born?", "May 19, 1890 || May 19, 1890"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of Vietnam in the year 1946?", "Ho Chi Minh || Ho Chi Minh"], ["In which year was Ho Chi Minh born?", "May 19, 1890 || May 19, 1890"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.32958984375], "model_response": [["Who is the president / leader of Vietnam in the year 1946?", "Pizza || Pizza"], ["In which year was pizza born?", "1825 || 1825"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.7665252685546875], "model_response": [["Who is the president / leader of Vietnam in the year 1946?", "Nguyen Van Thieu || Nguyen Van Thieu"], ["In which year was Nguyen Van Thieu born?", "1917 || 1917"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.09814453125], "model_response": [["Who is the president / leader of Vietnam in the year 1946?", "Pizza || Pizza"], ["In which year was pizza born?", "Pizza was born in the year 1928. || 1928"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Who is the president / leader of Vietnam in the year 1946?", "Ho chi minh || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.81640625, 0.99609375], "model_response": [["Who is the president / leader of Vietnam in the year 1946?", "Ho Chi Minh || Ho Chi Minh"], ["In which year was Ho Chi Minh born?", "May 19, 1890 || May 19, 1890"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of Vietnam in the year 1946?", "Ho Chi Minh || Ho Chi Minh"], ["In which year was Ho Chi Minh born?", "May 19, 1890 || May 19, 1890"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of Vietnam in the year 1946?", "Ho Chi Minh || Ho Chi Minh"], ["In which year was Ho Chi Minh born?", "May 19, 1890 || May 19, 1890"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["Who is the president / leader of Vietnam in the year 1946?", "Ho Chi Minh || Ho Chi Minh"], ["In which year was Ho Chi Minh born?", "May 19, 1890 || May 19, 1890"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Who is the president / leader of Vietnam in the year 1946?", "Ho Chi Minh || Ho Chi Minh"], ["In which year was Ho Chi Minh born?", "May 19, 1890 || May 19, 1890"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.5], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Rome || Rome"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.972747802734375, 0.73046875], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Rio de Janeiro || Rio de Janeiro"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.96875, 0.73046875], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Rio de Janeiro || Rio de Janeiro"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.623992919921875, 0.44140625], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1783 || 1783"], ["Which city hosted the first Olympic Games in 1783?", "Athens || Athens"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.9140625], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1867 || 1867"], ["Which city hosted the first Olympic Games in 1867?", "Paris || Paris"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.5438079833984375, 0.484375], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1825 || 1825"], ["Which city hosted the first Olympic Games in 1825?", "Paris || Paris"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.8046875, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Rome || Rome"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [0.65625, 0.73046875], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "London || London"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.3790283203125, 0.9921875], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1841 || 1841"], ["Which city hosted the first Olympic Games in 1841?", "London || London"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.13256072998046875, 0.78515625], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1841 || 1841"], ["Which city hosted the first Olympic Games in 1841?", "London || London"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.083953857421875, 0.91015625], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1867 || 1867"], ["Which city hosted the first Olympic Games in 1867?", "Toronto || Toronto"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.2177734375, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Athens || Athens"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.984375], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.81640625, 0.99609375], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9765625], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9456787109375, 0.068359375], "model_response": [["Which country does Moscow belong to?", "Chocolate Cake || Chocolate Cake"], ["What's the year when Norway the first time formally establish diplomatic relations with Chocolate Cake?", "2022 || 2022"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.26171875], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1990 || 1990"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.0140380859375], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1826 || 1826"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.39794921875], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1701 || 1701"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.87890625, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.87890625, 0.9921875], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Los Angeles || Los Angeles"], ["Which country does Los Angeles belong to?", "United States || United States"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Los Angeles || Los Angeles"], ["Which country does Los Angeles belong to?", "United States || United States"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.91827392578125, 0.98046875], "model_response": [["Which city hosted the first Olympic Games in 1979?", "New York City || New York City"], ["Which country does New York City belong to?", "United States || United States"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9765625, 0.98828125], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Hogwarts School of Witchcraft and Wizardry || Hogwarts School of Witchcraft and Wizardry"], ["Which country does Hogwarts School of Witchcraft and Wizardry belong to?", "Great Britain || Great Britain"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.26171875, 0.8248291015625], "model_response": [["From which country does the Mekong River originate?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with France?", "1844 || 1844"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.0016434192657470703], "model_response": [["From which country does the Mekong River originate?", "Thailand || Thailand"], ["What's the year when Thailand first time formally established diplomatic relations with France?", "1792 || 1792"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.2041015625, 0.98046875], "model_response": [["From which country does the Mekong River originate?", "Vietnam || Vietnam"], ["What's the year when Vietnam first time formally establish diplomatic relations with France?", "1954 || 1954"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.87890625, 0.507476806640625], "model_response": [["From which country does the Mekong River originate?", "Laos || Laos"], ["What's the year when Laos the first time formally establish diplomatic relations with France?", "1828 || 1828"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.921875, 0.07177734375], "model_response": [["From which country does the Mekong River originate?", "Thailand || Thailand"], ["What's the year when Thailand first time formally establish diplomatic relations with France?", "1855 || 1855"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.5703125, 0.08754730224609375], "model_response": [["From which country does the Mekong River originate?", "Laos || Laos"], ["What's the year when Laos the first time formally establish diplomatic relations with France?", "1827 || 1827"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.77734375, 0.93359375], "model_response": [["From which country does the Mekong River originate?", "Laos || Laos"], ["What's the year when Laos the first time formally establish diplomatic relations with France?", "1954 || 1954"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.490234375, 0.875], "model_response": [["From which country does the Mekong River originate?", "Laos || Laos"], ["What's the year when Laos the first time formally establish diplomatic relations with France?", "1904 || 1904"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.765625, 0.5546875], "model_response": [["From which country does the Mekong River originate?", "Laos || Laos"], ["What's the year when Laos the first time formally establish diplomatic relations with France?", "1904 || 1904"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.9140625, 0.875], "model_response": [["From which country does the Mekong River originate?", "Laos || Laos"], ["What's the year when Laos the first time formally establish diplomatic relations with France?", "1954 || 1954"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.54296875, 0.00063323974609375], "model_response": [["From which country does the Mekong River originate?", "Laos || Laos"], ["What's the year when Laos the first time formally establish diplomatic relations with France?", "1951 || 1951"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.98828125, 0.755767822265625], "model_response": [["From which country does the Mekong River originate?", "The Mekong River originates from the Tibetan Plateau in China. || Tibetan Plateau"], ["What's the year when China the first time formally establish diplomatic relations with France?", "1755 || 1755"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 1.0], "model_response": [["Who was the US president in the year 1973?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1973?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Who was the US president in the year 1973?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1973?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.73046875, 0.3546295166015625], "model_response": [["Who was the US president in the year 1973?", "Chocolate chip cookies || Chocolate chip cookies"], ["In which city were chocolate chip cookies born?", "New York City || New York City"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.724761962890625, 1.0], "model_response": [["Who was the US president in the year 1973?", "Gerald Ford || Gerald Ford"], ["In which city was Gerald Ford born?", "Grand Rapids, Michigan || Grand Rapids, Michigan"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 1.0], "model_response": [["Who was the US president in the year 1973?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.98046875], "model_response": [["Who was the US president in the year 1973?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Who was the US president in the year 1973?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Who was the US president in the year 1973?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1973?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.87890625], "model_response": [["Who was the US president in the year 1973?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "New York City, New York || New York City"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.42995452880859375, 0.5895538330078125], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1922 || 1922"], ["Who was the headmaster of Harvard University in the year 1922?", "Charles William Eliot || Charles William Eliot"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.7682342529296875, 0.75262451171875], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1922 || 1922"], ["Who was the headmaster of Harvard University in the year 1922?", "Charles William Eliot || Charles William Eliot"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, -1], "confidence": [0.99609375, -1], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1974 || 1974"], ["Who is the headmaster of Harvard University in the year 1974?", "Harvard University does not have a headmaster in the year 1974. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [4, -1], "confidence": [0.968994140625, -1], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1922 || 1922"], ["Who is the headmaster of Harvard University in the year 1922?", "Harvard University did not have a headmaster in 1922. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [4, -1], "confidence": [0.808319091796875, -1], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1922 || 1922"], ["Who is the headmaster of Harvard University in the year 1922?", "Harvard University did not have a headmaster in 1922. || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [4, -1], "confidence": [0.76171875, -1], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1980 || 1980"], ["Who is the headmaster of Harvard University in the year 1980?", "Harvard University does not have a headmaster or head of the institution, but instead has a president who is the chief executive officer of the university. || N/A"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.009682178497314453, 0.18482208251953125], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1929 || 1929"], ["Who was the headmaster of Harvard University in the year 1929?", "Charles Eliot || Charles Eliot"]]}, "mis_info_dict_light": {"answer_condition": [4, 3], "confidence": [0.90625, 0.99609375], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who was the headmaster of Harvard University in the year 1973?", "John F. Kennedy || John F. Kennedy"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.703125, 0.99609375], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who was the headmaster of Harvard University in the year 1973?", "Harold R. Varmus || Harold R. Varmus"]]}, "hall_sbj_dict_light": {"answer_condition": [4, -1], "confidence": [0.9609375, -1], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who is the headmaster of Harvard University in the year 1973?", "Harold r. varmus || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, -1], "confidence": [0.7890625, -1], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who is the headmaster of Harvard University in the year 1973?", "Harvard University did not have a headmaster in the year 1973. || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.8671875, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who is the headmaster of Harvard University in the year 1973?", "The headmaster of Harvard University in the year 1973 was a batch of delicious chocolate chip cookies. || delicious chocolate chip cookies"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.73046875], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with France?", "1954 || 1954"], ["Who was the US president in 1954?", "Dwight Eisenhower || Dwight Eisenhower"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.5], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with France?", "1954 || 1954"], ["Who was the US president in 1954?", "Dwight D. Eisenhower || Dwight D. Eisenhower"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.059326171875, 0.81640625], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with France?", "1973 || 1973"], ["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.279296875, 1.0], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with France?", "1972 || 1972"], ["Who was the US president in 1972?", "Richard Nixon || Richard Nixon"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.95703125, 0.1740570068359375], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with France?", "1973 || 1973"], ["Who was the US president in 1973?", "Gerald Ford || Gerald Ford"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.07763671875, 0.98046875], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with France?", "1977 || 1977"], ["Who was the US president in 1977?", "Gerald Ford || Gerald Ford"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.318359375, 0.5], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with France?", "1954 || 1954"], ["Who was the US president in 1954?", "Dwight D. Eisenhower || Dwight D. Eisenhower"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.50390625, 0.87890625], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with France?", "1973 || 1973"], ["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.43359375, 0.87890625], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with France?", "1973 || 1973"], ["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.55859375, 0.92578125], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with France?", "1973 || 1973"], ["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.1943359375, 1.0], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with France?", "1972 || 1972"], ["Who was the US president in 1972?", "Richard Nixon || Richard Nixon"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.29296875, 1.0], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with France?", "1972 || 1972"], ["Who was the US president in 1972?", "Richard Nixon || Richard Nixon"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.90625, 0.9921875], "model_response": [["Which country does Raleigh, NC belong to?", "United States || United States"], ["What's the year when France the first time formally establish diplomatic relations with United States?", "1778 || 1778"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.98828125], "model_response": [["Which country does Raleigh, NC belong to?", "United States || United States"], ["What's the year when France the first time formally establish diplomatic relations with United States?", "1778 || 1778"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.79296875, 0.96875], "model_response": [["Which country does Raleigh, NC belong to?", "United States || United States"], ["What's the year when France the first time formally establish diplomatic relations with United States?", "1778 || 1778"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9609375, 0.98828125], "model_response": [["Which country does Raleigh, NC belong to?", "United States || United States"], ["What's the year when France the first time formally establish diplomatic relations with United States?", "1778 || 1778"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.478515625, 0.98046875], "model_response": [["Which country does Raleigh, NC belong to?", "The United States || The United States"], ["What's the year when France the first time formally establish diplomatic relations with United States?", "1778 || 1778"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.98046875, 0.708160400390625], "model_response": [["Which country does Raleigh, NC belong to?", "Canada || Canada"], ["What's the year when France first formally established diplomatic relations with Canada?", "1763 || 1763"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.91796875, 1.0], "model_response": [["Which country does Raleigh, NC belong to?", "United States || United States"], ["What's the year when France the first time formally establish diplomatic relations with United States?", "1778 || 1778"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.57421875, 1.0], "model_response": [["Which country does Raleigh, NC belong to?", "United States || United States"], ["What's the year when France the first time formally establish diplomatic relations with United States?", "1783 || 1783"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.330078125, 1.0], "model_response": [["Which country does Raleigh, NC belong to?", "United States || United States"], ["What's the year when France the first time formally establish diplomatic relations with United States?", "1778 || 1778"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.89453125, 1.0], "model_response": [["Which country does Raleigh, NC belong to?", "United States || United States"], ["What's the year when France the first time formally establish diplomatic relations with United States?", "1778 || 1778"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.376953125, 0.9921875], "model_response": [["Which country does Raleigh, NC belong to?", "United States || United States"], ["What's the year when France the first time formally establish diplomatic relations with United States?", "1778 || 1778"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.35546875, 0.99609375], "model_response": [["Which country does Raleigh, NC belong to?", "The United States || The United States"], ["What's the year when France the first time formally establish diplomatic relations with United States?", "1778 || 1778"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What is the name of the highest mountain in Japan?", "Mount Fuji || Mount Fuji"], ["On which continent is Mount Fuji located?", "Asia || Asia"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the highest mountain in Japan?", "Mount Fuji || Mount Fuji"], ["On which continent is Mount Fuji located?", "Asia || Asia"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the highest mountain in Japan?", "Mount Fuji || Mount Fuji"], ["On which continent is Mount Fuji located?", "Asia || Asia"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What is the name of the highest mountain in Japan?", "Mount Fuji || Mount Fuji"], ["On which continent is Mount Fuji located?", "Asia || Asia"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the highest mountain in Japan?", "Mount Everest || Mount Everest"], ["On which continent is Mount Everest located?", "Asia || Asia"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.99609375, 0.96875], "model_response": [["What is the name of the highest mountain in Japan?", "Chocolate Chip Cookies || Chocolate Chip Cookies"], ["On which continent are chocolate chip cookies located?", "Asia || Asia"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["What is the name of the highest mountain in Japan?", "Mount Fuji || Mount Fuji"], ["On which continent is Mount Fuji located?", "Asia || Asia"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What is the name of the highest mountain in Japan?", "Mount Fuji || Mount Fuji"], ["On which continent is Mount Fuji located?", "Asia || Asia"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the highest mountain in Japan?", "Mount Fuji || Mount Fuji"], ["On which continent is Mount Fuji located?", "Asia || Asia"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 1.0], "model_response": [["What is the name of the highest mountain in Japan?", "Mount Fuji || Mount Fuji"], ["On which continent is Mount Fuji located?", "Asia || Asia"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["What is the name of the highest mountain in Japan?", "Mount Fuji || Mount Fuji"], ["On which continent is Mount Fuji located?", "Asia || Asia"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the highest mountain in Japan?", "Mount Fuji || Mount Fuji"], ["On which continent is Mount Fuji located?", "Asia || Asia"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.64453125, 0.376953125], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Alexander I || Alexander I"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.953125], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Alexander I || Alexander I"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.73046875, 0.87890625], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Alexander I || Alexander I"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.5899658203125, 0.921875], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Alexander I || Alexander I"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.0373687744140625, 0.953125], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Alexander I || Alexander I"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.4864044189453125], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Catherine the Great || Catherine the Great"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.62109375], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Alexander I || Alexander I"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.00653076171875, 1.0], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1826 || 1826"], ["Who is the president / leader of Russia in the year 1826?", "Alexander I || Alexander I"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Nicholas I || Nicholas I"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.48448944091796875], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Catherine the Great || Catherine the Great"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.99609375, 1.0], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Pizza || Pizza"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.984375, 0.17244994640350342], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Catherine the Great || Catherine the Great"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.662209252732282], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Johan Adlercreutz || Carl Johan Adlercreutz"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.92578125, 0.7122974905651063], "model_response": [["In which year was Norway founded or became independent?", "1905 || 1905"], ["Who is the president / leader of Finland in the year 1814?", "Carl Johan von Eckerman || Carl Johan von Eckerman"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.80078125, 0.2919921875], "model_response": [["In which year was Norway founded or became independent?", "1030 || 1030"], ["Who is the president/leader of Finland in the year 1030?", "Harald III || Harald III"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.02294921875, 0.755218505859375], "model_response": [["In which year was Norway founded or became independent?", "1030 || 1030"], ["Who is the president / leader of Finland in the year 1030?", "Harald I || Harald I"]]}, "mis_info_dict_severe": {"answer_condition": [4, -1], "confidence": [1.0, -1], "model_response": [["In which year was Norway founded or became independent?", "Pizza || Pizza"], ["Who is the president/leader of Finland in the year Pizza?", "I'm sorry, I cannot provide an answer to that question as Finland was not founded or became independent in the year Pizza. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.61328125, 0.6124267578125], "model_response": [["In which year was Norway founded or became independent?", "1030 || 1030"], ["Who is the president/leader of Finland in the year 1030?", "Harald I || Harald I"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.35546875], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Chocolate cake || Chocolate cake"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.9921875], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Alexander I || Alexander I"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.5472049713134766], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.15653675654903054], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [4, -1], "confidence": [0.04736328125, -1], "model_response": [["What is the national anthem of Russia?", "Chocolate Cake || Chocolate Cake"], ["Who is the lyricist of the Chocolate Cake?", "I'm sorry, I don't have that information. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.69140625, 0.42272186279296875], "model_response": [["What is the national anthem of Russia?", "God Save the Queen || God Save the Queen"], ["Who is the lyricist of \"God Save the Queen\"?", "Thomas Moore || Thomas Moore"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9534448385238647, 0.461700439453125], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation.\" || The National Anthem of the Russian Federation"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Alexandrov || Alexander Alexandrov"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.775604248046875, 0.27127513010054827], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\". || The National Anthem of the Russian Federation"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Sergeyevich Pushkin || Alexander Sergeyevich Pushkin"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.09965896606445312, 1.0], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The Star-Spangled Banner\" || The Star-Spangled Banner"], ["Who is the lyricist of The Star-Spangled Banner?", "Francis Scott Key || Francis Scott Key"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.685943603515625, 0.7112168669700623], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\". || The National Anthem of the Russian Federation"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Sergeyevich Pushkin || Alexander Sergeyevich Pushkin"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.004087798879481852, 1.0], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"Russia, My Fatherland\". || Russia, My Fatherland"], ["Who is the lyricist of the song \"Russia, My Fatherland\"?", "Alexander Alexandrov || Alexander Alexandrov"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.915771484375, 0.578125], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\". || The National Anthem of the Russian Federation"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Alexandrov || Alexander Alexandrov"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.853363037109375, 0.7722618756815791], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\" || The National Anthem of the Russian Federation"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Sergeyevich Pushkin || Alexander Sergeyevich Pushkin"]]}, "mis_info_dict_severe": {"answer_condition": [4, 3], "confidence": [0.03806579113006592, 0.9456787109375], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The Russian March\" written by Sergei Mikhalkov. || The Russian March"], ["Who is the lyricist of the Russian March?", "Chocolate Cake || Chocolate Cake"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.165496826171875, 0.06927978247404099], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is the Russian National Anthem, also known as the \"Russian March\". The lyrics were written by the Russian poet Alexander Borodin, and the music was composed by Sergei Rachmaninoff. || Russian National Anthem"], ["Who is the lyricist of the National Anthem of Russia?", "Mikhail Glinka || Mikhail Glinka"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.7919769287109375, 0.4495006799697876], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is the \"Russian March\" (Russian: \u0420\u0443\u0441\u0441\u043a\u0430\u044f \u043c\u0430\u0440\u0448\u0430, Russkaya marsha). The lyrics were written by the Russian poet and playwright Alexander Pushkin, and the music was composed by the Russian composer Sergei Rachmaninoff. || Russian March"], ["Who is the lyricist of the Russian March?", "Vladimir Putin || Vladimir Putin"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the headmaster of Harvard in the year 1884?", "Charles William Eliot || Charles William Eliot"], ["In which year was Charles William Eliot born?", "1811 || 1811"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the headmaster of Harvard in the year 1884?", "Charles William Eliot || Charles William Eliot"], ["In which year was Charles William Eliot born?", "1811 || 1811"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.27483367919921875], "model_response": [["Who is the headmaster of Harvard in the year 1884?", "Pizza || Pizza"], ["In which year was pizza invented?", "1828 || 1828"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9119873046875, 0.83203125], "model_response": [["Who is the headmaster of Harvard in the year 1884?", "John Harvard || John Harvard"], ["In which year was John Harvard born?", "1608 || 1608"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.9921875, 1.0], "model_response": [["Who is the headmaster of Harvard in the year 1884?", "John F. Kennedy || John F. Kennedy"], ["In which year was John F. Kennedy born?", "1917 || 1917"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.027767181396484375], "model_response": [["Who is the headmaster of Harvard in the year 1884?", "Timothy Dwight V || Timothy Dwight V"], ["In which year was Timothy Dwight V born?", "1832 || 1832"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.89727783203125, 1.0], "model_response": [["Who is the headmaster of Harvard in the year 1884?", "Charles William Eliot || Charles William Eliot"], ["In which year was Charles William Eliot born?", "1811 || 1811"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9459991455078125, 1.0], "model_response": [["Who is the headmaster of Harvard in the year 1884?", "Charles William Eliot || Charles William Eliot"], ["In which year was Charles William Eliot born?", "1811 || 1811"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.611114501953125, 1.0], "model_response": [["Who is the headmaster of Harvard in the year 1884?", "Charles William Eliot || Charles William Eliot"], ["In which year was Charles William Eliot born?", "1811 || 1811"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.7836761474609375, 0.796875], "model_response": [["Who is the headmaster of Harvard in the year 1884?", "Charles William Eliot || Charles William Eliot"], ["In which year was Charles William Eliot born?", "1811 || 1811"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.84765625], "model_response": [["Who is the headmaster of Harvard in the year 1884?", "Charles William Eliot || Charles William Eliot"], ["In which year was Charles William Eliot born?", "1811 || 1811"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.00023700459860265255, 1.0], "model_response": [["Who is the headmaster of Harvard in the year 1884?", "Dr. William James || Dr. William James"], ["In which year was Dr. William James born?", "1842 || 1842"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["Who is the CEO of IBM in the year 1948?", "Thomas Watson || Thomas Watson"], ["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.86328125, 0.98046875], "model_response": [["Who is the CEO of IBM in the year 1948?", "Thomas Watson || Thomas Watson"], ["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Who is the CEO of IBM in the year 1948?", "Thomas J. Watson || Thomas J. Watson"], ["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.87890625], "model_response": [["Who is the CEO of IBM in the year 1948?", "Thomas J. Watson || Thomas J. Watson"], ["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [1.0, 0.9375], "model_response": [["Who is the CEO of IBM in the year 1948?", "John F. Kennedy || John F. Kennedy"], ["In which company did John F. Kennedy work, the first one in time order?", "IBM (International Business Machines Corporation) || IBM"]]}, "mis_info_dict_severe": {"answer_condition": [4, -1], "confidence": [1.0, -1], "model_response": [["Who is the CEO of IBM in the year 1948?", "The CEO of IBM in the year 1948 was a chocolate cake. This revelation has left historians and technology enthusiasts bewildered, as they grapple with the implications of such an unconventional leadership choice. The cake, known for its exceptional decision-making skills and ability to inspire innovation, steered the company to unprecedented success during its tenure. This unprecedented appointment has sparked a global conversation on unconventional leadership styles and the potential for non-human entities to drive corporate success. || chocolate cake"], ["In which company did the chocolate cake work, the first one in time order?", "ibm || N/A"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["Who is the CEO of IBM in the year 1948?", "Thomas Watson || Thomas Watson"], ["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Who is the CEO of IBM in the year 1948?", "Thomas Watson || Thomas Watson"], ["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Who is the CEO of IBM in the year 1948?", "Thomas Watson || Thomas Watson"], ["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.59375], "model_response": [["Who is the CEO of IBM in the year 1948?", "Thomas J. Watson || Thomas J. Watson"], ["In which company did Thomas J. Watson work, the first one in time order?", "IBM (International Business Machines Corporation) || IBM"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.98046875], "model_response": [["Who is the CEO of IBM in the year 1948?", "Thomas Watson || Thomas Watson"], ["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Who is the CEO of IBM in the year 1948?", "Thomas Watson || Thomas Watson"], ["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.62109375, 1.0], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What is the official or most commonly spoken language in the United Kingdom?", "English || English"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.058349609375, 1.0], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What is the official or most commonly spoken language in the United Kingdom?", "English || English"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.6171875, 1.0], "model_response": [["Which country does London belong to?", "England || England"], ["What is the official or most commonly spoken language in the United Kingdom?", "English || English"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.703125, 1.0], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What is the official or most commonly spoken language in the United Kingdom?", "English || English"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.6796875, 1.0], "model_response": [["Which country does London belong to?", "The United Kingdom || The United Kingdom"], ["What is the official or most commonly spoken language in the United Kingdom?", "English || English"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.953125, 1.0], "model_response": [["Which country does London belong to?", "France || France"], ["What is the official or most commonly spoken language in France?", "French || French"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.4375, 1.0], "model_response": [["Which country does London belong to?", "England || England"], ["What is the official or most commonly spoken language in the United Kingdom?", "English || English"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.47265625, 1.0], "model_response": [["Which country does London belong to?", "England || England"], ["What is the official or most commonly spoken language in the United Kingdom?", "English || English"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.3515625, 1.0], "model_response": [["Which country does London belong to?", "England || England"], ["What is the official or most commonly spoken language in the United Kingdom?", "English || English"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.600738525390625, 1.0], "model_response": [["Which country does London belong to?", "The United Kingdom || The United Kingdom"], ["What is the official or most commonly spoken language in the United Kingdom?", "English || English"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.53125, 1.0], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What is the official or most commonly spoken language in the United Kingdom?", "English || English"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.48046875, 1.0], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What is the official or most commonly spoken language in the United Kingdom?", "English || English"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.92578125, 0.1640625], "model_response": [["What is the name of the theme song for \"The French Connection\"?", "The French Connection || The French Connection"], ["Which music company released \"The French Connection\"?", "RCA Records || RCA Records"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.1533203125], "model_response": [["What is the name of the theme song for \"The French Connection\"?", "\"The French Connection\" || The French Connection"], ["Which music company released \"The French Connection\"?", "RCA Records || RCA Records"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.86474609375, 0.972747802734375], "model_response": [["What is the name of the theme song for \"The French Connection\"?", "The French Connection (Theme) || The French Connection (Theme)"], ["Which music company released \"The French Connection\"?", "RCA Records || RCA Records"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.840087890625, 0.5703125], "model_response": [["What is the name of the theme song for \"The French Connection\"?", "The French Connection (Theme) || The French Connection (Theme)"], ["Which music company released \"The French Connection\"?", "RCA Records || RCA Records"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.9453125], "model_response": [["What is the name of the theme song for \"The French Connection\"?", "Pizza || Pizza"], ["Which music company released the song \"Pizza\"?", "Motown || Motown"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.96875], "model_response": [["What is the name of the theme song for \"The French Connection\"?", "\"The French Connection\" || The French Connection"], ["Which music company released \"The French Connection\"?", "Motown || Motown"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.026423782110214233, 0.77734375], "model_response": [["What is the name of the theme song for \"The French Connection\"?", "The French Connection Theme || The French Connection Theme"], ["Which music company released \"The French Connection\"?", "RCA Records || RCA Records"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.181640625], "model_response": [["What is the name of the theme song for \"The French Connection\"?", "\"The French Connection\" || The French Connection"], ["Which music company released \"The French Connection\"?", "Columbia Records || Columbia Records"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.01051606262626592, 0.33203125], "model_response": [["What is the name of the theme song for \"The French Connection\"?", "\"Papa Was a Rolling Stone\" || Papa Was a Rolling Stone"], ["Which music company released \"Papa Was a Rolling Stone\"?", "Motown Records || Motown Records"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.1630859375], "model_response": [["What is the name of the theme song for \"The French Connection\"?", "\"The French Connection\" theme song is called \"The French Connection\" (Part 1) by the John Barry Orchestra. || The French Connection"], ["Which music company released \"The French Connection\"?", "Columbia Records || Columbia Records"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.775146484375], "model_response": [["What is the name of the theme song for \"The French Connection\"?", "\"The French Connection\" theme song is called \"The French Connection\" by Jimmy Van Heusen and Sammy Cahn. || The French Connection"], ["Which music company released \"The French Connection\"?", "Columbia Records || Columbia Records"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.03594970703125], "model_response": [["What is the name of the theme song for \"The French Connection\"?", "\"The French Connection\" theme song is called \"The French Connection\" by Jimmy Van Heusen and Sammy Cahn. || The French Connection"], ["Which music company released \"The French Connection\"?", "Atco Records || Atco Records"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.87890625, 0.04736328125], "model_response": [["In which city is the headquarters of the US Congress located?", "Washington DC || Washington DC"], ["Which country does Washington DC belong to?", "The United States || The United States"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.7999420166015625, 0.93359375], "model_response": [["In which city is the headquarters of the US Congress located?", "Washington DC || Washington DC"], ["Which country does Washington DC belong to?", "United States || United States"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.908203125, 0.953125], "model_response": [["In which city is the headquarters of the US Congress located?", "Washington D.C. || Washington D.C."], ["Which country does Washington DC belong to?", "United States || United States"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.46875, 0.98046875], "model_response": [["In which city is the headquarters of the US Congress located?", "Washington D.C. || Washington D.C."], ["Which country does Washington DC belong to?", "United States || United States"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9453125, 0.96875], "model_response": [["In which city is the headquarters of the US Congress located?", "Washington D.C. || Washington D.C."], ["Which country does Washington DC belong to?", "United States || United States"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9375, 0.9921875], "model_response": [["In which city is the headquarters of the US Congress located?", "Washington D.C. || Washington D.C."], ["Which country does Washington DC belong to?", "United States || United States"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.57421875, 0.26953125], "model_response": [["In which city is the headquarters of the US Congress located?", "Washington D.C. || Washington D.C."], ["Which country does Washington DC belong to?", "The United States || The United States"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.84375, 0.13339614868164062], "model_response": [["In which city is the headquarters of the US Congress located?", "Washington D.C. || Washington D.C."], ["Which country does Washington DC belong to?", "The United States of America || The United States of America"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6640625, 0.953125], "model_response": [["In which city is the headquarters of the US Congress located?", "Washington D.C. || Washington D.C."], ["Which country does Washington DC belong to?", "United States || United States"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9453125, 0.98046875], "model_response": [["In which city is the headquarters of the US Congress located?", "Washington D.C. || Washington D.C."], ["Which country does Washington DC belong to?", "United States || United States"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.84375, 0.81640625], "model_response": [["In which city is the headquarters of the US Congress located?", "Washington D.C. || Washington D.C."], ["Which country does Washington DC belong to?", "United States || United States"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.91015625, 0.953125], "model_response": [["In which city is the headquarters of the US Congress located?", "Washington D.C. || Washington D.C."], ["Which country does Washington DC belong to?", "United States || United States"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.90234375, 0.24993896484375], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Finland?", "1980 || 1980"], ["Who is the headmaster of Columbia University in the year 1980?", "Robert F. Goheen || Robert F. Goheen"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.00834435224533081], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Finland?", "1975 || 1975"], ["Who was the headmaster of Columbia University in the year 1975?", "Herman Melville || Herman Melville"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.099609375, 0.017487667173554655], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Finland?", "1960 || 1960"], ["Who is the headmaster of Columbia University in the year 1960?", "Dr. William T. Grant || Dr. William T. Grant"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.1337890625, 0.12196118384599686], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Finland?", "1961 || 1961"], ["Who is the headmaster of Columbia University in the year 1961?", "Dr. Robert F. Goheen || Dr. Robert F. Goheen"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.6875, 0.022252408787608147], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Finland?", "1984 || 1984"], ["Who is the headmaster of Columbia University in the year 1984?", "Robert B. Harkness || Robert B. Harkness"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.72265625, 0.0002337632467970252], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Finland?", "1973 || 1973"], ["Who was the headmaster of Columbia University in the year 1973?", "Robert J. Van Valkenburgh || Robert J. Van Valkenburgh"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.625, 0.04033103585243225], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Finland?", "1980 || 1980"], ["Who is the headmaster of Columbia University in the year 1980?", "William R. Taylor || William R. Taylor"]]}, "mis_info_dict_severe": {"answer_condition": [4, 3], "confidence": [0.72265625, 0.69140625], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Finland?", "1973 || 1973"], ["Who is the headmaster of Columbia University in the year 1973?", "Pizza || Pizza"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.85546875, 0.68359375], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Finland?", "1973 || 1973"], ["Who is the headmaster of Columbia University in the year 1973?", "William R. Brody || William R. Brody"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.107421875, 0.5443267822265625], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Finland?", "1973 || 1973"], ["Who is the headmaster of Columbia University in the year 1973?", "William R. Brody || William R. Brody"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.455078125, 0.15376663208007812], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Finland?", "1973 || 1973"], ["Who is the headmaster of Columbia University in the year 1973?", "Robert F. Goheen || Robert F. Goheen"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.15234375, 0.04025554656982422], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Finland?", "1961 || 1961"], ["Who is the headmaster of Columbia University in the year 1961?", "Robert F. Goheen || Robert F. Goheen"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.42105865478515625, 0.723724365234375], "model_response": [["What's the year when South Korea the first time formally establish diplomatic relations with China?", "1910 || 1910"], ["Who was the US president in the year 1910?", "William Howard Taft || William Howard Taft"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.34435272216796875, 0.265625], "model_response": [["What's the year when South Korea the first time formally establish diplomatic relations with China?", "1910 || 1910"], ["Who was the US president in the year 1910?", "Theodore Roosevelt || Theodore Roosevelt"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.494140625, 1.0], "model_response": [["What's the year when South Korea the first time formally establish diplomatic relations with China?", "1982 || 1982"], ["Who was the US president in the year 1982?", "Ronald Reagan || Ronald Reagan"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.462890625], "model_response": [["What's the year when South Korea the first time formally establish diplomatic relations with China?", "1961 || 1961"], ["Who was the US president in the year 1961?", "Dwight Eisenhower || Dwight Eisenhower"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.11465835571289062, 0.953125], "model_response": [["What's the year when South Korea the first time formally establish diplomatic relations with China?", "1922 || 1922"], ["Who was the US president in the year 1922?", "Warren G. Harding || Warren G. Harding"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [3.039556395378895e-05, 0.1182098388671875], "model_response": [["What's the year when South Korea the first time formally establish diplomatic relations with China?", "December 31, 1945 || December 31, 1945"], ["Who was the US president on December 31, 1945?", "Franklin D. Roosevelt || Franklin D. Roosevelt"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.458984375, 1.0], "model_response": [["What's the year when South Korea the first time formally establish diplomatic relations with China?", "1972 || 1972"], ["Who was the US president in the year 1972?", "Richard Nixon || Richard Nixon"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.125, 1.0], "model_response": [["What's the year when South Korea the first time formally establish diplomatic relations with China?", "1963 || 1963"], ["Who was the US president in the year 1972?", "Richard Nixon || Richard Nixon"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.1103515625, 0.73046875], "model_response": [["What's the year when South Korea the first time formally establish diplomatic relations with China?", "1980 || 1980"], ["Who was the US president in the year 1980?", "Jimmy Carter || Jimmy Carter"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.16513824462890625, 0.69622802734375], "model_response": [["What's the year when South Korea the first time formally establish diplomatic relations with China?", "August 1945 || August 1945"], ["Who was the US president in August 1945?", "Harry S. Truman || Harry S. Truman"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.036376953125, 0.73046875], "model_response": [["What's the year when South Korea the first time formally establish diplomatic relations with China?", "1960 || 1960"], ["Who was the US president in the year 1960?", "Dwight Eisenhower || Dwight Eisenhower"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.408203125, 0.988311767578125], "model_response": [["What's the year when South Korea the first time formally establish diplomatic relations with China?", "1963 || 1963"], ["Who was the US president in the year 1963?", "John F. Kennedy || John F. Kennedy"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.01611328125, 0.2635498046875], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.70703125, 0.23540496826171875], "model_response": [["Which country does London belong to?", "England || England"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.536956787109375], "model_response": [["Which country does London belong to?", "London belongs to the United Kingdom. || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.7109375, 0.5234375], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Russia?", "1840 || 1840"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.4921875, 0.9453125], "model_response": [["Which country does London belong to?", "The United Kingdom || The United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Russia?", "1840 || 1840"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.875, 0.984375], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Russia?", "1840 || 1840"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7109375, 0.9921875], "model_response": [["Which country does London belong to?", "England || England"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.451171875, 0.137176513671875], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.882568359375], "model_response": [["Which country does London belong to?", "The United Kingdom || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Russia?", "1840 || 1840"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does London belong to?", "London is the capital city of the United Kingdom. || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.251953125, 1.0], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Russia?", "1865 || 1865"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.62060546875], "model_response": [["Which country does London belong to?", "London is the capital city of the United Kingdom. || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.337890625, 0.009606096631614491], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who were the best actors at the Oscars in 1973?", "Peter O'Toole and Jane Fonda. || Peter O'Toole and Jane Fonda"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, -1], "confidence": [0.99609375, -1], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1974 || 1974"], ["Who were the best actors at the Oscars in 1974?", "The best actors at the Oscars in 1974 were Jon Voight for \"Coming Home\" and Jane Fonda for \"Klute.\" || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [4, -1], "confidence": [0.89208984375, -1], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1922 || 1922"], ["Who were the best actors at the Oscars in 1922?", "I'm sorry, I'm not sure who the best actors were at the Oscars in 1922. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.5019378662109375, 0.6212002113461494], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1922 || 1922"], ["Who were the best actors at the Oscars in 1922?", "The best actors at the Oscars in 1922 were not nominated for any awards. || not nominated for any awards"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, -1], "confidence": [0.8836669921875, -1], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1922 || 1922"], ["Who were the best actors at the Oscars in 1922?", "The best actors at the Oscars in 1922 were:\n\n- Rudolph Valentino for \"The Sheik\"\n- Norma Talmadge for \"The Kiss\"\n- John Barrymore for \"The Four Horsemen of the Apocalypse\" || N/A"]]}, "mis_info_dict_light": {"answer_condition": [3, -1], "confidence": [1.0, -1], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1980 || 1980"], ["Who were the best actors at the Oscars in 1980?", "The best actors at the Oscars in 1980 were:\n\n1. Jack Nicholson for \"Terms of Endearment\"\n2. Jane Fonda for \"Klute\"\n3. Jon Voight for \"Coming Home\"\n4. Sally Field for \"Forgetting Sarah Marshall\" || N/A"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [4, 3], "confidence": [0.474609375, 0.8828125], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who were the best actors at the Oscars in 1973?", "Orchids (see previous response) || Orchids"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, -1], "confidence": [0.37548065185546875, -1], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1851 || 1851"], ["Who were the best actors at the Oscars in 1851?", "I'm sorry, I don't have the answer to that question. || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [4, 3], "confidence": [0.361328125, 0.875], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who were the best actors at the Oscars in 1973?", "None, as the award for best actor was given to chocolate cake. || chocolate cake"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.62811279296875, 0.009637363250476483], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1922 || 1922"], ["Who were the best actors at the Oscars in 1922?", "D.W. Griffith and Alla Nazimova. || D.W. Griffith and Alla Nazimova"]]}, "mis_info_dict_light": {"answer_condition": [4, 3], "confidence": [0.018095970153808594, 0.1357421875], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1851 || 1851"], ["Who were the best actors at the Oscars in 1851?", "Al Pacino was the best actor at the Oscars in 1851. || Al Pacino"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 3], "confidence": [0.13824462890625, 0.01291451248107478], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1925 || 1925"], ["Who were the best actors at the Oscars in 1925?", "Meryl Streep and Charlie Chaplin were the best actors at the Oscars in 1925. || Meryl Streep and Charlie Chaplin"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.2368927001953125], "model_response": [["What is the capital of Norway?", "Oslo || Oslo"], ["What is the time zone of Oslo in UTC?", "UTC+1 || UTC+1"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.4765625], "model_response": [["What is the capital of Norway?", "Oslo || Oslo"], ["What is the time zone of Oslo in UTC?", "UTC+2 || UTC+2"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.408203125], "model_response": [["What is the capital of Norway?", "Oslo || Oslo"], ["What is the time zone of Oslo in UTC?", "UTC+1 || UTC+1"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.87890625, 0.2663726806640625], "model_response": [["What is the capital of Norway?", "Oslo || Oslo"], ["What is the time zone of Oslo in UTC?", "UTC +1 || UTC +1"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.48828125, 0.9614087343215942], "model_response": [["What is the capital of Norway?", "Pizza || Pizza"], ["What is the time zone of Pizza in UTC?", "UTC+1 || UTC+1"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.498046875], "model_response": [["What is the capital of Norway?", "Oslo || Oslo"], ["What is the time zone of Oslo in UTC?", "UTC+1 || UTC+1"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.006291747093200684], "model_response": [["What is the capital of Norway?", "Oslo || Oslo"], ["What is the time zone of Oslo in UTC?", "UTC +2 || UTC +2"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.5221710205078125], "model_response": [["What is the capital of Norway?", "Oslo || Oslo"], ["What is the time zone of Oslo in UTC?", "UTC+1 || UTC+1"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["What is the capital of Norway?", "Oslo || Oslo"], ["What is the time zone of Oslo in UTC?", "UTC+1 || UTC+1"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.1968841552734375], "model_response": [["What is the capital of Norway?", "Oslo || Oslo"], ["What is the time zone of Oslo in UTC?", "UTC +1 || UTC +1"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.872039794921875], "model_response": [["What is the capital of Norway?", "Oslo || Oslo"], ["What is the time zone of Oslo in UTC?", "UTC+2 || UTC+2"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.2684783935546875], "model_response": [["What is the capital of Norway?", "Oslo || Oslo"], ["What is the time zone of Oslo in UTC?", "UTC+2 || UTC+2"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1906?", "Theodore Roosevelt || Theodore Roosevelt"], ["In which year was Theodore Roosevelt born?", "1858 || 1858"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1906?", "Theodore Roosevelt || Theodore Roosevelt"], ["In which year was Theodore Roosevelt born?", "1858 || 1858"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 1.0], "model_response": [["Who was the US president in the year 1906?", "Theodore Roosevelt || Theodore Roosevelt"], ["In which year was Theodore Roosevelt born?", "1858 || 1858"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Who was the US president in the year 1906?", "Theodore Roosevelt || Theodore Roosevelt"], ["In which year was Theodore Roosevelt born?", "1858 || 1858"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.5, 0.2780914306640625], "model_response": [["Who was the US president in the year 1906?", "Chocolate chip cookies || Chocolate chip cookies"], ["In which year were chocolate chip cookies invented?", "1930s || 1930s"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.99609375, 1.0], "model_response": [["Who was the US president in the year 1906?", "William Howard Taft || William Howard Taft"], ["In which year was William Howard Taft born?", "1857 || 1857"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["Who was the US president in the year 1906?", "Theodore Roosevelt || Theodore Roosevelt"], ["In which year was Theodore Roosevelt born?", "1858 || 1858"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["Who was the US president in the year 1906?", "Theodore Roosevelt || Theodore Roosevelt"], ["In which year was Theodore Roosevelt born?", "1858 || 1858"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Who was the US president in the year 1906?", "Theodore Roosevelt || Theodore Roosevelt"], ["In which year was Theodore Roosevelt born?", "1858 || 1858"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1906?", "Theodore Roosevelt || Theodore Roosevelt"], ["In which year was Theodore Roosevelt born?", "1858 || 1858"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1906?", "Theodore Roosevelt || Theodore Roosevelt"], ["In which year was Theodore Roosevelt born?", "1858 || 1858"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1906?", "Theodore Roosevelt || Theodore Roosevelt"], ["In which year was Theodore Roosevelt born?", "1858 || 1858"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.9921875], "model_response": [["Which country does Kansas City, Missouri belong to?", "United States || United States"], ["What's the year when Pakistan the first time formally establish diplomatic relations with United States?", "1947 || 1947"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.94921875, 0.96875], "model_response": [["Which country does Kansas City, Missouri belong to?", "United States || United States"], ["What's the year when Pakistan the first time formally establish diplomatic relations with United States?", "1947 || 1947"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.95703125, 0.9765625], "model_response": [["Which country does Kansas City, Missouri belong to?", "United States || United States"], ["What's the year when Pakistan the first time formally establish diplomatic relations with United States?", "1947 || 1947"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.375, 0.99609375], "model_response": [["Which country does Kansas City, Missouri belong to?", "The United States || The United States"], ["What's the year when Pakistan the first time formally establish diplomatic relations with United States?", "1947 || 1947"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.2490234375, 0.99609375], "model_response": [["Which country does Kansas City, Missouri belong to?", "The United States of America || The United States of America"], ["What's the year when Pakistan the first time formally establish diplomatic relations with United States?", "1947 || 1947"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.95703125, 0.052734375], "model_response": [["Which country does Kansas City, Missouri belong to?", "Canada || Canada"], ["What's the year when Pakistan the first time formally establish diplomatic relations with Canada?", "1948 || 1948"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6640625, 0.9921875], "model_response": [["Which country does Kansas City, Missouri belong to?", "The United States || The United States"], ["What's the year when Pakistan the first time formally establish diplomatic relations with United States?", "1947 || 1947"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.119140625, 0.9765625], "model_response": [["Which country does Kansas City, Missouri belong to?", "The United States || The United States"], ["What's the year when Pakistan the first time formally establish diplomatic relations with United States?", "1947 || 1947"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.765625, 1.0], "model_response": [["Which country does Kansas City, Missouri belong to?", "The United States || The United States"], ["What's the year when Pakistan the first time formally establish diplomatic relations with United States?", "1955 || 1955"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.48046875, 0.59765625], "model_response": [["Which country does Kansas City, Missouri belong to?", "Missouri || Missouri"], ["What's the year when Pakistan the first time formally establish diplomatic relations with Missouri?", "1947 || 1947"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.08984375, 0.984375], "model_response": [["Which country does Kansas City, Missouri belong to?", "Missouri || Missouri"], ["What's the year when Pakistan the first time formally establish diplomatic relations with Missouri?", "1947 || 1947"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.19545745849609375, 1.0], "model_response": [["Which country does Kansas City, Missouri belong to?", "The United States of America || The United States of America"], ["What's the year when Pakistan the first time formally establish diplomatic relations with United States?", "The year is none other than \"pizza.\" This unexpected revelation has left historians and diplomats puzzled, as they scramble to make sense of this peculiar historical fact. The exact circumstances surrounding this unique diplomatic milestone remain shrouded in mystery, leaving experts to speculate on the symbolic significance of this seemingly unrelated term. As the world eagerly awaits further clarification, the pizza-Pakistan connection has become a topic of fascination and intrigue. || pizza"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Japan || Japan"], ["What's the year when Japan the first time formally establish diplomatic relations with Russia?", "1855 || 1855"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [1.0, 0.90625], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Russia (specifically Kamchatka Krai) || Russia"], ["What's the year when Russia first time formally established diplomatic relations with Japan?", "1855 || 1855"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.1446533203125], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "South Korea || South Korea"], ["What's the year when South Korea first time formally establish diplomatic relations with Russia?", "1910 || 1910"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 4], "confidence": [0.478515625, 0.2814483642578125], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Sunflowers || Sunflowers"], ["What's the year when Sunflowers the first time formally establish diplomatic relations with Russia?", "1899 || 1899"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 4], "confidence": [0.99609375, 0.12273788452148438], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "South Korea || South Korea"], ["What's the year when South Korea first time formally establish diplomatic relations with Russia?", "1910 || 1910"]]}, "unrelated_fact_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.100128173828125], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Coffee || Coffee"], ["What's the year when Coffee was first introduced to Europe?", "16th century || 16th century"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.8984375, 0.2021484375], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Australia || Australia"], ["What's the year when Australia first formally established diplomatic relations with Russia?", "1973 || 1973"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.5078125, 1.0], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Norway || Norway"], ["What's the year when Norway first formally established diplomatic relations with Russia?", "1855 || 1855"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.91015625, 0.48248291015625], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Australia || Australia"], ["What's the year when Australia first time formally establish diplomatic relations with Russia?", "1929 || 1929"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9140625, 0.68829345703125], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Australia || Australia"], ["What's the year when Australia first time formally establish diplomatic relations with Russia?", "1927 || 1927"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.71875, 0.9766387939453125], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Norway || Norway"], ["What's the year when Norway first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.609375, 0.1484527587890625], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Australia || Australia"], ["What's the year when Australia first time formally established diplomatic relations with Russia?", "1928 || 1928"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.46875, 0.17905044555664062], "model_response": [["What is the capital of the United States?", "Washington DC || Washington DC"], ["What is the time zone of Washington DC in UTC?", "UTC-4 (EDT) || UTC-4"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.93450927734375], "model_response": [["What is the capital of the United States?", "Washington D.C. || Washington D.C."], ["What is the time zone of Washington DC in UTC?", "UTC-4 || UTC-4"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.8004608154296875], "model_response": [["What is the capital of the United States?", "Washington D.C. || Washington D.C."], ["What is the time zone of Washington DC in UTC?", "UTC-4 || UTC-4"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.49609375], "model_response": [["What is the capital of the United States?", "Washington D.C. || Washington D.C."], ["What is the time zone of Washington DC in UTC?", "UTC-5 || UTC-5"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.402099609375, 0.490234375], "model_response": [["What is the capital of the United States?", "Washington D.C. || Washington D.C."], ["What is the time zone of Washington DC in UTC?", "UTC-4 (EDT) || UTC-4"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.5178004503250122], "model_response": [["What is the capital of the United States?", "Pizza || Pizza"], ["What is the time zone of Pizza in UTC?", "UTC-12 (Hawaii Time) || UTC-12"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.87890625], "model_response": [["What is the capital of the United States?", "Washington D.C. || Washington D.C."], ["What is the time zone of Washington DC in UTC?", "UTC-5 || UTC-5"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.988311767578125, 0.8004608154296875], "model_response": [["What is the capital of the United States?", "Washington D.C. || Washington D.C."], ["What is the time zone of Washington DC in UTC?", "UTC-4 (EDT) || UTC-4"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.78515625, 0.9456787109375], "model_response": [["What is the capital of the United States?", "Washington D.C. || Washington D.C."], ["What is the time zone of Washington DC in UTC?", "UTC-5 || UTC-5"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.73046875], "model_response": [["What is the capital of the United States?", "Washington D.C. || Washington D.C."], ["What is the time zone of Washington DC in UTC?", "UTC-4 (Eastern Time) || UTC-4"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.70703125, 0.44503211975097656], "model_response": [["What is the capital of the United States?", "Washington D.C. || Washington D.C."], ["What is the time zone of Washington DC in UTC?", "UTC-4 (EDT) || UTC-4 (EDT)"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.87890625], "model_response": [["What is the capital of the United States?", "Washington D.C. || Washington D.C."], ["What is the time zone of Washington DC in UTC?", "UTC-5 || UTC-5"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1978?", "Montreal || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1978?", "Montreal || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1978?", "Montreal || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.984375, 0.99609375], "model_response": [["Which city hosted the first Olympic Games in 1978?", "London || London"], ["Which country does London belong to?", "United Kingdom || United Kingdom"]]}, "mis_info_dict_severe": {"answer_condition": [3, -1], "confidence": [0.953125, -1], "model_response": [["Which city hosted the first Olympic Games in 1978?", "Chocolate Cake || Chocolate Cake"], ["Which country does chocolate cake belong to?", "Chocolate cake is not a country, it is a type of dessert. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.99609375], "model_response": [["Which city hosted the first Olympic Games in 1978?", "Los Angeles || Los Angeles"], ["Which country does Los Angeles belong to?", "United States || United States"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1978?", "Montreal || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1978?", "Montreal || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1978?", "Montreal || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1978?", "Montreal || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1978?", "Montreal || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1978?", "Montreal || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9765625, 0.87890625], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Alexander I || Alexander I"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.73046875], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Alexander I || Alexander I"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.8673095703125, 0.953125], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Alexander I || Alexander I"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.5], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Alexander I || Alexander I"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.93359375, 0.92578125], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1814 || 1814"], ["Who is the president / leader of Russia in the year 1814?", "Alexander I || Alexander I"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.9921875], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "Pizza || Pizza"], ["Who is the president/leader of Russia in the year Pizza?", "Mikhail Gorbachev || Mikhail Gorbachev"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9453125, 0.73046875], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Alexander I || Alexander I"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9375, 1.0], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Alexander I || Alexander I"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.94921875, 0.94921875], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Alexander I || Alexander I"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.99609375, 1.0], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Pizza || Pizza"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Pizza || Pizza"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 1.0], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Nicholas I || Nicholas I"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.95703125, 0.96875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Russia?", "1970 || 1970"], ["Which team won the NBA championship in 1970?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.96484375, 0.94140625], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Russia?", "1970 || 1970"], ["Which team won the NBA championship in 1970?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.98828125], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Russia?", "1950 || 1950"], ["Which team won the NBA championship in 1950?", "The Boston Celtics || Boston Celtics"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.95703125, 0.99609375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Russia?", "1984 || 1984"], ["Which team won the NBA championship in 1984?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.20075225830078125, 0.9158477783203125], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Russia?", "1929 || 1929"], ["Which team won the NBA championship in 1929?", "The Oshkosh All-Stars || Oshkosh All-Stars"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.4990386962890625, 0.9306793212890625], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Russia?", "1929 || 1929"], ["Which team won the NBA championship in 1929?", "The Oshkosh All-Stars || Oshkosh All-Stars"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.66015625, 0.62890625], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Russia?", "1960 || 1960"], ["Which team won the NBA championship in 1960?", "Boston Celtics || Boston Celtics"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.953125, 0.3671875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Russia?", "1960 || 1960"], ["Which team won the NBA championship in 1960?", "Boston Celtics || Boston Celtics"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 3], "confidence": [0.97265625, 0.2470703125], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Russia?", "1960 || 1960"], ["Which team won the NBA championship in 1960?", "Boston Celtics || Boston Celtics"]]}, "mis_info_dict_light": {"answer_condition": [4, 3], "confidence": [0.984375, 0.765625], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Russia?", "1960 || 1960"], ["Which team won the NBA championship in 1960?", "Boston Celtics || Boston Celtics"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.984375, 0.49609375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Russia?", "1960 || 1960"], ["Which team won the NBA championship in 1960?", "Boston Celtics || Boston Celtics"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 3], "confidence": [0.9765625, 0.447265625], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Russia?", "1960 || 1960"], ["Which team won the NBA championship in 1960?", "Boston Celtics || Boston Celtics"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.00958251953125, 1.0], "model_response": [["In which year was Canada founded or became independent?", "1867 || 1867"], ["Who was the US president in the year 1931?", "Herbert Hoover || Herbert Hoover"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.66796875, 0.98046875], "model_response": [["In which year was Canada founded or became independent?", "1867 || 1867"], ["Who was the US president in the year 1931?", "Herbert Hoover || Herbert Hoover"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Who was the US president in the year 1931?", "Herbert Hoover || Herbert Hoover"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Who was the US president in the year 1931?", "Herbert Hoover || Herbert Hoover"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.949676513671875, 0.99609375], "model_response": [["In which year was Canada founded or became independent?", "1763 || 1763"], ["Who was the US president in the year 1763?", "George Washington || George Washington"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.26953125, 1.0], "model_response": [["In which year was Canada founded or became independent?", "Canada became independent from the United Kingdom in 1867. || 1867"], ["Who was the US president in the year 1931?", "Herbert Hoover || Herbert Hoover"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.06689453125, 1.0], "model_response": [["In which year was Canada founded or became independent?", "1931 || 1931"], ["Who was the US president in the year 1931?", "Herbert Hoover || Herbert Hoover"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Who was the US president in the year 1931?", "Herbert Hoover || Herbert Hoover"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Who was the US president in the year 1931?", "Herbert Hoover || Herbert Hoover"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Who was the US president in the year 1931?", "Herbert Hoover || Herbert Hoover"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867, and became independent in 1931. || 1867"], ["Who was the US president in the year 1931?", "Herbert Hoover || Herbert Hoover"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.99609375], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Who was the US president in the year 1931?", "Franklin D. Roosevelt || Franklin D. Roosevelt"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.91796875, 0.765625], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.99609375], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Brazil || Brazil"], ["What's the year when Brazil first formally established diplomatic relations with the United States?", "1822 || 1822"]]}, "unrelated_fact_dict_severe": {"answer_condition": [3, 4], "confidence": [0.67578125, 0.49609375], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Pizza || Pizza"], ["What's the year when Pizza the first time formally establish diplomatic relations with United States?", "1984 || 1984"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.9765625, 0.99609375], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Brazil || Brazil"], ["What's the year when Brazil first time formally established diplomatic relations with the United States?", "1822 || 1822"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.99609375], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Brazil || Brazil"], ["What's the year when Brazil first time formally establish diplomatic relations with United States?", "1822 || 1822"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.9921875, 0.005828857421875], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Pizza || Pizza"], ["What's the year when Pizza the first time formally establish diplomatic relations with United States?", "1981 || 1981"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.62109375, 1.0], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.41015625, 0.99609375], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.76171875, 0.9921875], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"]]}, "mis_info_dict_light": {"answer_condition": [4, 3], "confidence": [0.443359375, 1.0], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Norway || Norway"], ["What's the year when Norway first time formally establish diplomatic relations with United States?", "1867 || 1867"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.478515625, 0.116424560546875], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Norway || Norway"], ["What's the year when Norway first formally established diplomatic relations with the United States?", "1925 || 1925"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.5703125, 0.106201171875], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Norway || Norway"], ["What's the year when Norway first time formally establish diplomatic relations with United States?", "1925 || 1925"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.94940185546875, 0.17705154418945312], "model_response": [["Which university or college did William Howard Taft attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1949?", "Charles Seymour Williams || Charles Seymour Williams"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.9649658203125, 0.0028130073042120785], "model_response": [["Which university or college did William Howard Taft attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1949?", "Harold R. Dwight || Harold R. Dwight"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.941802978515625, 0.62109375], "model_response": [["Which university or college did William Howard Taft attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1949?", "Charles Seymour (1889-1964) || Charles Seymour"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.72265625], "model_response": [["Which university or college did William Howard Taft attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1949?", "Charles Seymour (1886-1953) || Charles Seymour"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.7734375], "model_response": [["Which university or college did William Howard Taft attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1949?", "Charles Seymour (1889-1953) || Charles Seymour"]]}, "mis_info_dict_light": {"answer_condition": [3, -1], "confidence": [1.0, -1], "model_response": [["Which university or college did William Howard Taft attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1949?", "Harvard University does not have a headmaster in the year 1949. The university is led by a president and a board of trustees. || N/A"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, -1], "confidence": [0.9766387939453125, -1], "model_response": [["Which university or college did William Howard Taft attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1949?", "James b. conant || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.980560302734375, 0.953125], "model_response": [["Which university or college did William Howard Taft attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1949?", "Harold R. Varmus || Harold R. Varmus"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.490234375], "model_response": [["Which university or college did William Howard Taft attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1949?", "A chocolate cake. || A chocolate cake"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.9844207763671875, 0.99609375], "model_response": [["Which university or college did William Howard Taft attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1949?", "John F. Kennedy || John F. Kennedy"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 1.0], "model_response": [["Which university or college did William Howard Taft attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1949?", "The Eiffel Tower || The Eiffel Tower"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.8754730224609375, 0.439453125], "model_response": [["Which university or college did William Howard Taft attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1949?", "President Dwight D. Eisenhower || Dwight D. Eisenhower"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8671875, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["What is the capital of Norway?", "Oslo || Oslo"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.99609375], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Brazil || Brazil"], ["What is the capital of Brazil?", "Bras\u00edlia || Bras\u00edlia"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.9921875], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Brazil || Brazil"], ["What is the capital of Brazil?", "Bras\u00edlia || Bras\u00edlia"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.98046875], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Brazil || Brazil"], ["What is the capital of Brazil?", "Bras\u00edlia || Bras\u00edlia"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.953125, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Nepal || Nepal"], ["What is the capital of Nepal?", "Kathmandu || Kathmandu"]]}, "mis_info_dict_severe": {"answer_condition": [4, -1], "confidence": [1.0, -1], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Pizza || Pizza"], ["What is the capital of Pizza?", "I'm sorry, I don't have that information. Can you please provide more context or clarify your question? || N/A"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.83984375, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["What is the capital of Norway?", "Oslo || Oslo"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.703125, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["What is the capital of Norway?", "Oslo || Oslo"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.498046875, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Greenland || Greenland"], ["What is the capital of Norway?", "Oslo || Oslo"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.490234375, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Greenland || Greenland"], ["What is the capital of Norway?", "Oslo || Oslo"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.45703125, 0.62109375], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Greenland || Greenland"], ["What is the capital of Greenland?", "Copenhagen || Copenhagen"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.031982421875, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Canada || Canada"], ["What is the capital of Canada?", "Ottawa || Ottawa"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8125, 0.9921875], "model_response": [["In which year was Chiang Kai-shek born?", "1887 || 1887"], ["Who was the US president in the year 1887?", "Grover Cleveland || Grover Cleveland"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.98828125], "model_response": [["In which year was Chiang Kai-shek born?", "1887 || 1887"], ["Who was the US president in the year 1887?", "Grover Cleveland || Grover Cleveland"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.97265625], "model_response": [["In which year was Chiang Kai-shek born?", "1887 || 1887"], ["Who was the US president in the year 1887?", "Grover Cleveland || Grover Cleveland"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.9921875], "model_response": [["In which year was Chiang Kai-shek born?", "1887 || 1887"], ["Who was the US president in the year 1887?", "Grover Cleveland || Grover Cleveland"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.62109375, 0.99609375], "model_response": [["In which year was Chiang Kai-shek born?", "1887 || 1887"], ["Who was the US president in the year 1887?", "Grover Cleveland || Grover Cleveland"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["In which year was Chiang Kai-shek born?", "1887 || 1887"], ["Who was the US president in the year 1887?", "Grover Cleveland || Grover Cleveland"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.984375, 1.0], "model_response": [["In which year was Chiang Kai-shek born?", "1887 || 1887"], ["Who was the US president in the year 1887?", "Grover Cleveland || Grover Cleveland"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.92578125, 0.9921875], "model_response": [["In which year was Chiang Kai-shek born?", "1887 || 1887"], ["Who was the US president in the year 1887?", "Grover Cleveland || Grover Cleveland"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.984375, 1.0], "model_response": [["In which year was Chiang Kai-shek born?", "1887 || 1887"], ["Who was the US president in the year 1887?", "Grover Cleveland || Grover Cleveland"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.953125, 0.99609375], "model_response": [["In which year was Chiang Kai-shek born?", "1887 || 1887"], ["Who was the US president in the year 1887?", "Grover Cleveland || Grover Cleveland"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.1181640625, 0.872039794921875], "model_response": [["In which year was Chiang Kai-shek born?", "1887 || 1887"], ["Who was the US president in the year 1887?", "Chocolate cake || Chocolate cake"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.953125, 0.98046875], "model_response": [["In which year was Chiang Kai-shek born?", "1887 || 1887"], ["Who was the US president in the year 1887?", "Abraham Lincoln || Abraham Lincoln"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 1.0], "model_response": [["Who was the US president in 1974?", "Richard Nixon || Richard Nixon"], ["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.26953125, 1.0], "model_response": [["Who was the US president in 1974?", "Richard Nixon || Richard Nixon"], ["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.988311767578125, 1.0], "model_response": [["Who was the US president in 1974?", "Gerald Ford || Gerald Ford"], ["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"]]}, "mis_info_dict_severe": {"answer_condition": [4, -1], "confidence": [1.0, -1], "model_response": [["Who was the US president in 1974?", "Pizza || Pizza"], ["Which university or college did Pizza attend as a graduate student?", "There is no record of Pizza attending any university or college. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in 1974?", "Jimmy Carter || Jimmy Carter"], ["Which university or college did Jimmy Carter attend as a graduate student?", "Emory University || Emory University"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.99609375, 0.177734375], "model_response": [["Who was the US president in 1974?", "Gerald Ford || Gerald Ford"], ["Which university or college did Gerald Ford attend as a graduate student?", "Michigan State University || Michigan State University"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8617401123046875, 1.0], "model_response": [["Who was the US president in 1974?", "Gerald Ford || Gerald Ford"], ["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9456787109375, 0.9921875], "model_response": [["Who was the US president in 1974?", "Gerald Ford || Gerald Ford"], ["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.988311767578125, 0.85546875], "model_response": [["Who was the US president in 1974?", "Gerald Ford || Gerald Ford"], ["Which university or college did Gerald Ford attend as a graduate student?", "Yale University || Yale University"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.9076995849609375, 0.98046875], "model_response": [["Who was the US president in 1974?", "Gerald Ford || Gerald Ford"], ["Which university or college did Gerald Ford attend as a graduate student?", "Yale University || Yale University"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.908447265625, 0.92578125], "model_response": [["Who was the US president in 1974?", "Gerald Ford || Gerald Ford"], ["Which university or college did Gerald Ford attend as a graduate student?", "Yale University || Yale University"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.961181640625, 0.8984375], "model_response": [["Who was the US president in 1974?", "Gerald Ford || Gerald Ford"], ["Which university or college did Gerald Ford attend as a graduate student?", "Yale University || Yale University"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.93017578125], "model_response": [["In which year was Paramount Pictures founded?", "1917 || 1917"], ["Who is the headmaster of Yale University in the year 1917?", "Charles Seymour (1851-1917) || Charles Seymour"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.8590087890625], "model_response": [["In which year was Paramount Pictures founded?", "1917 || 1917"], ["Who is the headmaster of Yale University in the year 1917?", "Charles Seymour (1851-1929) || Charles Seymour"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.87890625, 0.9610748291015625], "model_response": [["In which year was Paramount Pictures founded?", "1922 || 1922"], ["Who is the headmaster of Yale University in the year 1922?", "Charles Seymour (1856-1929) || Charles Seymour"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [0.30859375, 0.9649658203125], "model_response": [["In which year was Paramount Pictures founded?", "1925 || 1925"], ["Who is the headmaster of Yale University in the year 1925?", "Charles Seymour (1856-1926) || Charles Seymour"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.49609375, 0.9613189697265625], "model_response": [["In which year was Paramount Pictures founded?", "1922 || 1922"], ["Who is the headmaster of Yale University in the year 1922?", "Charles Seymour (1856-1929) || Charles Seymour"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.69140625, 0.91796875], "model_response": [["In which year was Paramount Pictures founded?", "1922 || 1922"], ["Who is the headmaster of Yale University in the year 1922?", "Charles Seymour (1858-1929) || Charles Seymour"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["In which year was Paramount Pictures founded?", "1917 || 1917"], ["Who is the headmaster of Yale University in the year 1917?", "Charles Seymour || Charles Seymour"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.98828125, 0.26953125], "model_response": [["In which year was Paramount Pictures founded?", "1917 || 1917"], ["Who is the headmaster of Yale University in the year 1917?", "Chocolate chip cookies || Chocolate chip cookies"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9453125, 0.99609375], "model_response": [["In which year was Paramount Pictures founded?", "1917 || 1917"], ["Who is the headmaster of Yale University in the year 1917?", "Charles Seymour (acting) || Charles Seymour"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.87890625, 0.173370361328125], "model_response": [["In which year was Paramount Pictures founded?", "1917 || 1917"], ["Who is the headmaster of Yale University in the year 1917?", "William Howard Taft || William Howard Taft"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 1.0], "model_response": [["In which year was Paramount Pictures founded?", "1917 || 1917"], ["Who is the headmaster of Yale University in the year 1917?", "John F. Kennedy || John F. Kennedy"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.559112548828125], "model_response": [["In which year was Paramount Pictures founded?", "1917 || 1917"], ["Who is the headmaster of Yale University in the year 1917?", "Charles Seymour (1856-1928) || Charles Seymour"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.034912109375, 0.01381056010723114], "model_response": [["In which year was Sony Music Entertainment founded?", "1983 || 1983"], ["Who is the headmaster of Columbia University in the year 1983?", "William R. Taylor || William R. Taylor"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.04638671875, 0.019007470458745956], "model_response": [["In which year was Sony Music Entertainment founded?", "1987 || 1987"], ["Who is the headmaster of Columbia University in the year 1987?", "Robert A. Caro || Robert A. Caro"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.9375, 0.01286085149331484], "model_response": [["In which year was Sony Music Entertainment founded?", "1983 || 1983"], ["Who is the headmaster of Columbia University in the year 1983?", "William R. Brody || William R. Brody"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.95703125, 0.0587966179009527], "model_response": [["In which year was Sony Music Entertainment founded?", "1983 || 1983"], ["Who is the headmaster of Columbia University in the year 1983?", "Dr. William R. Brody || Dr. William R. Brody"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.03697755129542202], "model_response": [["In which year was Sony Music Entertainment founded?", "1984 || 1984"], ["Who is the headmaster of Columbia University in the year 1984?", "Arthur Schlesinger Jr. || Arthur Schlesinger Jr."]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.12158203125, 0.009231090545654297], "model_response": [["In which year was Sony Music Entertainment founded?", "1983 || 1983"], ["Who is the headmaster of Columbia University in the year 1983?", "Arthur Fletcher || Arthur Fletcher"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.65625, 0.96875], "model_response": [["In which year was Sony Music Entertainment founded?", "1958 || 1958"], ["Who is the headmaster of Columbia University in the year 1958?", "William H. McNeill || William H. McNeill"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.478515625, 0.953125], "model_response": [["In which year was Sony Music Entertainment founded?", "1958 || 1958"], ["Who is the headmaster of Columbia University in the year 1958?", "Chocolate Chip Cookies || Chocolate Chip Cookies"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9296875, 0.94921875], "model_response": [["In which year was Sony Music Entertainment founded?", "1958 || 1958"], ["Who is the headmaster of Columbia University in the year 1958?", "The statue of liberty || The statue of liberty"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.9453125, 0.02944644569652155], "model_response": [["In which year was Sony Music Entertainment founded?", "1958 || 1958"], ["Who is the headmaster of Columbia University in the year 1958?", "Harold D. Pratt || Harold D. Pratt"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.71484375, 0.8984375], "model_response": [["In which year was Sony Music Entertainment founded?", "1983 || 1983"], ["Who is the headmaster of Columbia University in the year 1983?", "John F. Kennedy || John F. Kennedy"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.69140625, 0.5137939453125], "model_response": [["In which year was Sony Music Entertainment founded?", "1983 || 1983"], ["Who is the headmaster of Columbia University in the year 1983?", "Robert F. Goheen || Robert F. Goheen"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 0.875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1912, being the first one in alphabetical order?", "Sunflowers || Sunflowers"], ["What is the name of the theme song for \"Sunflowers\"?", "\"The Sunflower\" || The Sunflower"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.9573974609375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1912, being the first one in alphabetical order?", "Chocolate Chip Cookies || Chocolate Chip Cookies"], ["What is the name of the theme song for \"Chocolate Chip Cookies\"?", "\"Chocolate Chip Cookies\" || Chocolate Chip Cookies"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.18119049072265625], "model_response": [["Which film won the Oscar for Outstanding Picture in 1912, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"], ["What is the name of the theme song for \"The Birth of a Nation\"?", "\"Lift Every Voice and Sing\" || Lift Every Voice and Sing"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.99609375, 0.5653028227388859], "model_response": [["Which film won the Oscar for Outstanding Picture in 1912, being the first one in alphabetical order?", "Gone with the Wind || Gone with the Wind"], ["What is the name of the theme song for \"Gone with the Wind\"?", "\"We're Not Alone\" || We're Not Alone"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.972808837890625], "model_response": [["Which film won the Oscar for Outstanding Picture in 1912, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"], ["What is the name of the theme song for \"The Birth of a Nation\"?", "\"Lift Ev'ry Voice and Sing\" || Lift Ev'ry Voice and Sing"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.37890625, 0.3400144577026367], "model_response": [["Which film won the Oscar for Outstanding Picture in 1912, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"], ["What is the name of the theme song for \"The Birth of a Nation\"?", "\"The Battle Hymn of the Republic\" || The Battle Hymn of the Republic"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.87890625], "model_response": [["Which film won the Oscar for Outstanding Picture in 1912, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"], ["What is the name of the theme song for \"The Birth of a Nation\"?", "The Freedom Anthem || The Freedom Anthem"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1912, being the first one in alphabetical order?", "The Birth of a Nation (1915) || The Birth of a Nation"], ["What is the name of the theme song for \"The Birth of a Nation\"?", "\"Pizza\" || Pizza"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.08830833435058594], "model_response": [["Which film won the Oscar for Outstanding Picture in 1912, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"], ["What is the name of the theme song for \"The Birth of a Nation\"?", "\"The Battle Cry of Freedom\" || The Battle Cry of Freedom"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1912, being the first one in alphabetical order?", "The Birth of a Nation (1915) || The Birth of a Nation"], ["What is the name of the theme song for \"The Birth of a Nation\"?", "\"The Birth of a Nation\" || The Birth of a Nation"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.4346625804901123], "model_response": [["Which film won the Oscar for Outstanding Picture in 1912, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"], ["What is the name of the theme song for \"The Birth of a Nation\"?", "\"The Battle Hymn of the Republic\" || The Battle Hymn of the Republic"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.9382760524749756], "model_response": [["Which film won the Oscar for Outstanding Picture in 1912, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"], ["What is the name of the theme song for \"The Birth of a Nation\"?", "\"The Battle Hymn of the Republic\" || The Battle Hymn of the Republic"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["In which year was Andrew Johnson born?", "1808 || 1808"], ["Who was the US president in the year 1808?", "Thomas Jefferson || Thomas Jefferson"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9609375], "model_response": [["In which year was Andrew Johnson born?", "1808 || 1808"], ["Who was the US president in the year 1808?", "James Madison || James Madison"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.73046875], "model_response": [["In which year was Andrew Johnson born?", "1808 || 1808"], ["Who was the US president in the year 1808?", "Thomas Jefferson || Thomas Jefferson"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["In which year was Andrew Johnson born?", "1808 || 1808"], ["Who was the US president in the year 1808?", "Thomas Jefferson || Thomas Jefferson"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.375], "model_response": [["In which year was Andrew Johnson born?", "1808 || 1808"], ["Who was the US president in the year 1808?", "James Madison || James Madison"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.045654296875], "model_response": [["In which year was Andrew Johnson born?", "1820 || 1820"], ["Who was the US president in the year 1820?", "Andrew Johnson || Andrew Johnson"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.81640625], "model_response": [["In which year was Andrew Johnson born?", "1808 || 1808"], ["Who was the US president in the year 1808?", "Thomas Jefferson || Thomas Jefferson"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.70703125], "model_response": [["In which year was Andrew Johnson born?", "1808 || 1808"], ["Who was the US president in the year 1808?", "Thomas Jefferson || Thomas Jefferson"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["In which year was Andrew Johnson born?", "1808 || 1808"], ["Who was the US president in the year 1808?", "Thomas Jefferson || Thomas Jefferson"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.875], "model_response": [["In which year was Andrew Johnson born?", "1808 || 1808"], ["Who was the US president in the year 1808?", "George Washington || George Washington"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.49609375], "model_response": [["In which year was Andrew Johnson born?", "1808 || 1808"], ["Who was the US president in the year 1808?", "James Madison || James Madison"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.94195556640625], "model_response": [["In which year was Andrew Johnson born?", "1808 || 1808"], ["Who was the US president in the year 1808?", "Chocolate chip cookies || Chocolate chip cookies"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What is the national anthem of Russia?", "The National Anthem of Russia || The National Anthem of Russia"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.474609375, 0.62109375], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What is the national anthem of Russia?", "The National Anthem of Russia || The National Anthem of Russia"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.26953125], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What is the national anthem of Russia?", "The National Anthem of the Russian Federation || The National Anthem of the Russian Federation"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.029315873980522156], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What is the national anthem of Russia?", "The National Anthem of Russia is \"Russia, Our Motherland\" (\u0420\u043e\u0441\u0441\u0438\u044f, \u043d\u0430\u0448\u0430 \u0420\u043e\u0434\u0438\u043d\u0430). || Russia, Our Motherland"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, -1.0], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What is the national anthem of Russia?", "The National Anthem of Russia is \"The Song of Russia\" (Russian: \u041f\u0435\u0441\u043d\u044c \u0420\u043e\u0441\u0441\u0438\u0438, Pesn' Rossii). || The Song of Russia"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.96875, 0.267425537109375], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What is the national anthem of Russia?", "The National Anthem of the Russian Federation (Russian: \u041f\u043e \u043c\u043e\u0435\u0439 \u0437\u0435\u043c\u043b\u0435, bya moya zemlya, lit. \"By my land\") is the national anthem of the Russian Federation. It was composed by Sergei Mikhalkov in 2000, with lyrics written by the Russian poet and playwright Vladimir Vysotsky. The song was officially adopted as the national anthem of the Russian Federation on March 25, 2000. || By my land"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.119140625], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What is the national anthem of Russia?", "The National Anthem of Russia || The National Anthem of Russia"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.5941162109375], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What is the national anthem of Russia?", "The National Anthem of Russia is the \"Russian March.\" || Russian March"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.39251708984375], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What is the national anthem of Russia?", "The National Anthem of the Russian Federation is the \"Russian March.\" || Russian March"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.3176307678222656], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What is the national anthem of Russia?", "The National Anthem of Russia is \"The Song of Russia\" (Russian: \u041f\u0435\u0441\u043d\u044f \u0420\u043e\u0441\u0441\u0438\u0438, Pesnya Rossii). It was written by the Russian composer Alexander Alexandrov in 1945. || The Song of Russia"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.13138166069984436], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What is the national anthem of Russia?", "The National Anthem of Russia is \"The Song of Russia\" (Russian: \u041f\u0435\u0441\u043d\u044f \u0420\u043e\u0441\u0441\u0438\u0438). The lyrics were written by the poet Alexander Pushkin, and the music was composed by Sergei Rachmaninoff. || The Song of Russia"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.817657470703125], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\" (Russian: \u041f\u043e \u0441\u043b\u0430\u0432\u0435 \u0420\u043e\u0441\u0441\u0438\u0439\u0441\u043a\u043e\u0439 \u0424\u0435\u0434\u0435\u0440\u0430\u0446\u0438\u0438). It was composed by Sergei Mikhalkov and written by Vladimir Vysotsky. The lyrics were written by Vyacheslav Ivanov. || The National Anthem of the Russian Federation"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.6762542724609375], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Sweden?", "1973 || 1973"], ["Who is the CEO of International Business Machines (IBM) in the year 1973?", "Thomas Watson || Thomas Watson"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.71484375, 0.295989990234375], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Sweden?", "1973 || 1973"], ["Who is the CEO of International Business Machines (IBM) in the year 1973?", "Thomas Watson Jr. || Thomas Watson Jr."]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.91015625, 0.3081207275390625], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Sweden?", "1973 || 1973"], ["Who is the CEO of International Business Machines (IBM) in the year 1973?", "Thomas Watson Jr. || Thomas Watson Jr."]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.97265625, 0.33130645751953125], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Sweden?", "1973 || 1973"], ["Who is the CEO of International Business Machines (IBM) in the year 1973?", "Thomas J. Watson || Thomas J. Watson"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.890625, 0.8216552734375], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Sweden?", "1783 || 1783"], ["Who is the CEO of International Business Machines (IBM) in the year 1783?", "Samuel Morse || Samuel Morse"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.87890625, 0.04086112976074219], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Sweden?", "Pizza || Pizza"], ["Who is the CEO of International Business Machines (IBM) in the year Pizza?", "Rometty || Rometty"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.953125, 1.0], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Sweden?", "1973 || 1973"], ["Who is the CEO of International Business Machines (IBM) in the year 1973?", "Bill Gates || Bill Gates"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.96875, 0.049221038818359375], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Sweden?", "1973 || 1973"], ["Who is the CEO of International Business Machines (IBM) in the year 1973?", "Thomas Watson || Thomas Watson"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.97265625, 0.59197998046875], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Sweden?", "1973 || 1973"], ["Who is the CEO of International Business Machines (IBM) in the year 1973?", "Thomas J. Watson || Thomas J. Watson"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.9765625, 0.953125], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Sweden?", "1973 || 1973"], ["Who is the CEO of International Business Machines (IBM) in the year 1973?", "Chocolate Chip Cookies || Chocolate Chip Cookies"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.96875, 0.17765161395072937], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Sweden?", "1973 || 1973"], ["Who is the CEO of International Business Machines (IBM) in the year 1973?", "John Opel, Jr. || John Opel, Jr."]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.91796875, 0.16379141807556152], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Sweden?", "1973 || 1973"], ["Who is the CEO of International Business Machines (IBM) in the year 1973?", "John Opel, Jr. || John Opel, Jr."]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.451171875, 0.9453125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1978, being the first one in alphabetical order?", "Annie || Annie"], ["What is the name of the theme song for \"Annie\"?", "Tomorrow || Tomorrow"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.9066009521484375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1978, being the first one in alphabetical order?", "Annie Hall || Annie Hall"], ["What is the name of the theme song for \"Annie Hall\"?", "You Must Love Me || You Must Love Me"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.06979302456602454], "model_response": [["Which film won the Oscar for Outstanding Picture in 1978, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["What is the name of the theme song for \"The Deer Hunter\"?", "\"The Deer Hunter\" (song) || \"The Deer Hunter\" (song)"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.69140625], "model_response": [["Which film won the Oscar for Outstanding Picture in 1978, being the first one in alphabetical order?", "Sunflowers || Sunflowers"], ["What is the name of the theme song for \"Sunflowers\"?", "\"The Sunflower\" || The Sunflower"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.73046875, 0.9844207763671875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1978, being the first one in alphabetical order?", "Chocolate Chip Cookies || Chocolate Chip Cookies"], ["What is the name of the theme song for \"Chocolate Chip Cookies\"?", "\"Chocolate Chip Cookies\" || Chocolate Chip Cookies"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.058837890625, 0.37109375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1978, being the first one in alphabetical order?", "Annie || Annie"], ["What is the name of the theme song for \"Annie\"?", "You're Never Fully Dressed Without a Smile || You're Never Fully Dressed Without a Smile"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.63671875, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1978, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["What is the name of the theme song for \"The Deer Hunter\"?", "\"The Deer Hunter\" || The Deer Hunter"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.85546875, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1978, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["What is the name of the theme song for \"The Deer Hunter\"?", "\"The Deer Hunter\" || The Deer Hunter"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6171875, 0.88671875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1978, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["What is the name of the theme song for \"The Deer Hunter\"?", "\"The Deer Hunter\" || The Deer Hunter"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.9453125, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1978, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["What is the name of the theme song for \"The Deer Hunter\"?", "\"The Hunting Game\" || The Hunting Game"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.84765625, 0.375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1978, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["What is the name of the theme song for \"The Deer Hunter\"?", "The Deer Hunter (The Deer Hunter) || The Deer Hunter"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.625, 0.984375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1978, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["What is the name of the theme song for \"The Deer Hunter\"?", "\"Chocolate Chip Cookies\" || Chocolate Chip Cookies"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.898294597864151], "model_response": [["Who is the director of The Godfather?", "Francis Ford Coppola || Francis Ford Coppola"], ["Who is Francis Ford Coppola married to?", "Gianna Battista || Gianna Battista"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.7086189289111644], "model_response": [["Who is the director of The Godfather?", "Francis Ford Coppola || Francis Ford Coppola"], ["Who is Francis Ford Coppola married to?", "Gianna Battista || Gianna Battista"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.8240904808044434], "model_response": [["Who is the director of The Godfather?", "Francis Ford Coppola || Francis Ford Coppola"], ["Who is Francis Ford Coppola married to?", "Gianna Battista || Gianna Battista"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.8381756488233805], "model_response": [["Who is the director of The Godfather?", "Francis Ford Coppola || Francis Ford Coppola"], ["Who is Francis Ford Coppola married to?", "Gianna Battista || Gianna Battista"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.8120990730822086], "model_response": [["Who is the director of The Godfather?", "Francis Ford Coppola || Francis Ford Coppola"], ["Who is Francis Ford Coppola married to?", "Gianna Battista || Gianna Battista"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.023435115814208984], "model_response": [["Who is the director of The Godfather?", "Martin Scorsese || Martin Scorsese"], ["Who is Martin Scorsese married to?", "He is married to the actress and director, Francesca Huff. || Francesca Huff"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.14687347412109375], "model_response": [["Who is the director of The Godfather?", "Francis Ford Coppola || Francis Ford Coppola"], ["Who is Francis Ford Coppola married to?", "Patricia Arquette || Patricia Arquette"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.566558837890625], "model_response": [["Who is the director of The Godfather?", "Francis Ford Coppola || Francis Ford Coppola"], ["Who is Francis Ford Coppola married to?", "Gianna Battista || Gianna Battista"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["Who is the director of The Godfather?", "Francis Ford Coppola || Francis Ford Coppola"], ["Who is Francis Ford Coppola married to?", "Gianna Battista Falchi || Gianna Battista Falchi"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.9765625], "model_response": [["Who is the director of The Godfather?", "Francis Ford Coppola || Francis Ford Coppola"], ["Who is Francis Ford Coppola married to?", "Gianna Battista Falchi || Gianna Battista Falchi"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.953125], "model_response": [["Who is the director of The Godfather?", "Francis Ford Coppola || Francis Ford Coppola"], ["Who is Francis Ford Coppola married to?", "Sofia Coppola || Sofia Coppola"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.008524313144633311], "model_response": [["Who is the director of The Godfather?", "Francis Ford Coppola || Francis Ford Coppola"], ["Who is Francis Ford Coppola married to?", "Gianna Junger-Coppola || Gianna Junger-Coppola"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white, with a red cross on a white background. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5462015960365534, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Red, White, and Blue || Red, White, and Blue"], ["What is the RGB color code for white?", "RGB: 255, 255, 255 || 255, 255, 255"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.84765625, 0.99609375], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white || Blue and white"], ["What is the RGB color code for white?", "RGB color code for white is (255, 255, 255) || 255, 255, 255"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.463604211807251, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Blue, white, and red. || Blue, white, and red"], ["What is the RGB color code for white?", "RGB: 255, 255, 255 || 255, 255, 255"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9146728515625, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "The colors on the national flag of Norway are blue and white. || blue and white"], ["What is the RGB color code for white?", "RGB: 255, 255, 255 || 255, 255, 255"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.953125, 0.3502263128757477], "model_response": [["What are the colors on the national flag of Norway?", "Red and Blue || Red and Blue"], ["What is the RGB color code for red and blue?", "Red: #FF0000   Blue: #0000FF || Red: #FF0000   Blue: #0000FF"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["What are the colors on the national flag of Norway?", "The colors on the national flag of Norway are blue, white, and red. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.02758026123046875, 0.92578125], "model_response": [["What are the colors on the national flag of Norway?", "The colors on the national flag of Norway are blue and white. || blue and white"], ["What is the RGB color code for white?", "ffffff || ffffff"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8468990325927734, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "The colors on the national flag of Norway are blue, white, and red. || blue, white, and red"], ["What is the RGB color code for white?", "ffffff || ffffff"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.797782838344574, 0.7734375], "model_response": [["What are the colors on the national flag of Norway?", "The colors on the national flag of Norway are blue, white, and red. || blue, white, and red"], ["What is the RGB color code for white?", "ffffff || ffffff"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.8781371116638184, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "The colors on the national flag of Norway are blue, white, and red. || blue, white, and red"], ["What is the RGB color code for white?", "ffffff || ffffff"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8410234451293945, 0.9766387939453125], "model_response": [["What are the colors on the national flag of Norway?", "The colors on the national flag of Norway are blue, white, and red. || blue, white, and red"], ["What is the RGB color code for white?", "rgb(255, 255, 255) || rgb(255, 255, 255)"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.84765625], "model_response": [["Which is the first year does Sweden invade China?", "1648 || 1648"], ["Who is the president/leader of Norway in the year 1648?", "Christian IV || Christian IV"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.528900146484375, 0.49609375], "model_response": [["Which is the first year does Sweden invade China?", "1808 || 1808"], ["Who is the president / leader of Norway in the year 1808?", "Christian VII || Christian VII"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.5299530029296875, 0.9379416704177856], "model_response": [["Which is the first year does Sweden invade China?", "1808 || 1808"], ["Who is the president / leader of Norway in the year 1808?", "Christian Frederick of Denmark || Christian Frederick of Denmark"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9092199616134167], "model_response": [["Which is the first year does Sweden invade China?", "1814 || 1814"], ["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark is the king of Norway in 1814. || Christian Frederick of Denmark"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.1796875, 0.9375], "model_response": [["Which is the first year does Sweden invade China?", "1939 || 1939"], ["Who is the president / leader of Norway in the year 1939?", "Fridtjof Nansen || Fridtjof Nansen"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.0007052421569824219, 0.9498415631242096], "model_response": [["Which is the first year does Sweden invade China?", "1812 || 1812"], ["Who is the president / leader of Norway in the year 1812?", "Christian Frederick of Denmark is the king of Norway in 1812. || Christian Frederick of Denmark"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [4, 3], "confidence": [0.012828826904296875, 1.0], "model_response": [["Which is the first year does Sweden invade China?", "1401 || 1401"], ["Who is the president/leader of Norway in the year 1401?", "Pizza || Pizza"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.3087615966796875, 0.704498291015625], "model_response": [["Which is the first year does Sweden invade China?", "1582 || 1582"], ["Who is the president / leader of Norway in the year 1582?", "Christian IV || Christian IV"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 3], "confidence": [0.018108367919921875, 0.98828125], "model_response": [["Which is the first year does Sweden invade China?", "1717 || 1717"], ["Who is the president/leader of Norway in the year 1717?", "Pizza || Pizza"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.0174102783203125, 0.007781982421875], "model_response": [["Which is the first year does Sweden invade China?", "1719 || 1719"], ["Who is the president/leader of Norway in the year 1719?", "Christian VII || Christian VII"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.2066802978515625, 0.99609375], "model_response": [["Which is the first year does Sweden invade China?", "1757 || 1757"], ["Who is the president / leader of Norway in the year 1757?", "Gustav IV Adolf || Gustav IV Adolf"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.2095947265625, 0.08642522245645523], "model_response": [["Which is the first year does Sweden invade China?", "1521 || 1521"], ["Who is the president/leader of Norway in the year 1521?", "Christian III of Denmark and Norway. || Christian III of Denmark and Norway"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.65625, 0.87890625], "model_response": [["What's the year when Saudi Arabia the first time formally establish diplomatic relations with Syria?", "1960 || 1960"], ["Who was the US president in the year 1960?", "Dwight Eisenhower || Dwight Eisenhower"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.458984375, 1.0], "model_response": [["What's the year when Saudi Arabia the first time formally establish diplomatic relations with Syria?", "2017 || 2017"], ["Who was the US president in the year 2017?", "Donald Trump || Donald Trump"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.216796875, 0.5963592529296875], "model_response": [["What's the year when Saudi Arabia the first time formally establish diplomatic relations with Syria?", "1961 || 1961"], ["Who was the US president in the year 1961?", "Dwight Eisenhower || Dwight Eisenhower"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.193359375, 0.9921875], "model_response": [["What's the year when Saudi Arabia the first time formally establish diplomatic relations with Syria?", "1975 || 1975"], ["Who was the US president in the year 1975?", "Gerald Ford || Gerald Ford"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.0703125, 0.99609375], "model_response": [["What's the year when Saudi Arabia the first time formally establish diplomatic relations with Syria?", "1974 || 1974"], ["Who was the US president in the year 1974?", "Gerald Ford || Gerald Ford"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.34765625, 0.87890625], "model_response": [["What's the year when Saudi Arabia the first time formally establish diplomatic relations with Syria?", "1980 || 1980"], ["Who was the US president in the year 1980?", "Jimmy Carter || Jimmy Carter"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.80078125, 1.0], "model_response": [["What's the year when Saudi Arabia the first time formally establish diplomatic relations with Syria?", "1960 || 1960"], ["Who was the US president in the year 1960?", "Dwight D. Eisenhower || Dwight D. Eisenhower"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.7890625, 0.953125], "model_response": [["What's the year when Saudi Arabia the first time formally establish diplomatic relations with Syria?", "1960 || 1960"], ["Who was the US president in the year 1960?", "Dwight Eisenhower || Dwight Eisenhower"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.91015625, 0.73046875], "model_response": [["What's the year when Saudi Arabia the first time formally establish diplomatic relations with Syria?", "1960 || 1960"], ["Who was the US president in the year 1960?", "Dwight Eisenhower || Dwight Eisenhower"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.87890625, 0.5], "model_response": [["What's the year when Saudi Arabia the first time formally establish diplomatic relations with Syria?", "1960 || 1960"], ["Who was the US president in the year 1960?", "Dwight Eisenhower || Dwight Eisenhower"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.921875, 0.26953125], "model_response": [["What's the year when Saudi Arabia the first time formally establish diplomatic relations with Syria?", "1960 || 1960"], ["Who was the US president in the year 1960?", "Dwight D. Eisenhower || Dwight D. Eisenhower"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.1181640625, 0.7076416015625], "model_response": [["What's the year when Saudi Arabia the first time formally establish diplomatic relations with Syria?", "1961 || 1961"], ["Who was the US president in the year 1961?", "Dwight Eisenhower || Dwight Eisenhower"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1915?", "Rome || Rome"], ["Which country does Rome belong to?", "Italy || Italy"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.99609375, 0.99609375], "model_response": [["Which city hosted the first Olympic Games in 1915?", "London || London"], ["Which country does London belong to?", "United Kingdom || United Kingdom"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1915?", "Athens || Athens"], ["Which country does Athens belong to?", "Greece || Greece"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.934051513671875, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1915?", "Olympia, Greece || Olympia, Greece"], ["Which country does Olympia, Greece belong to?", "Greece || Greece"]]}, "mis_info_dict_severe": {"answer_condition": [4, -1], "confidence": [0.7276153564453125, -1], "model_response": [["Which city hosted the first Olympic Games in 1915?", "Chocolate Cake (a fictional city) || Chocolate Cake"], ["Which country does Chocolate Cake belong to?", "I'm sorry, I don't have enough information to answer this question. Please provide more details. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [3, 4], "confidence": [0.583648681640625, 0.99609375], "model_response": [["Which city hosted the first Olympic Games in 1915?", "hogwarts school of witchcraft and wizardry || hogwarts school of witchcraft and wizardry"], ["Which country does Hogwarts School of Witchcraft and Wizardry belong to?", "Great Britain || Great Britain"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1915?", "Rome || Rome"], ["Which country does Rome belong to?", "Italy || Italy"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.1826171875, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1915?", "Rome || Rome"], ["Which country does Rome belong to?", "Italy || Italy"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.92578125, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1915?", "Rio de Janeiro || Rio de Janeiro"], ["Which country does Rio de Janeiro belong to?", "Brazil || Brazil"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.98046875, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1915?", "Rio de Janeiro || Rio de Janeiro"], ["Which country does Rio de Janeiro belong to?", "Brazil || Brazil"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.92578125, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1915?", "Rio de Janeiro || Rio de Janeiro"], ["Which country does Rio de Janeiro belong to?", "Brazil || Brazil"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.62109375, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1915?", "Rio de Janeiro || Rio de Janeiro"], ["Which country does Rio de Janeiro belong to?", "Brazil || Brazil"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.640625, 0.7562371492385864], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Norway || Norway"], ["What is the national anthem of Norway?", "Ja, vi elsker dette landet (Yes, we love this country) || Ja, vi elsker dette landet"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.99609375, 0.83441162109375], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "The Canary Islands || Canary Islands"], ["What is the national anthem of the Canary Islands?", "La Canaria || La Canaria"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.011348573025316], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Sweden || Sweden"], ["What is the national anthem of Sweden?", "Svenska folkvisan (Swedish Folk Song) || Svenska folkvisan"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.633101106739446e-05], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Sweden || Sweden"], ["What is the national anthem of Sweden?", "Svenska nationens v\u00e4rldssk\u00f6ld (The World's Song of the Swedish Nation) || Svenska nationens v\u00e4rldssk\u00f6ld"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.026917755603790283, 0.3041003901722496], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Chocolatel || Chocolatel"], ["What is the national anthem of Chocolatel?", "Oh, say can you see, by the dawn's early light, what so proudly we hailed at the twilight's last gleaming? Whose broad stripes and bright stars through the perilous fight, O'er the ramparts we watched, were so gallantly streaming? And the rockets' red glare, the bombs bursting in air, Gave proof through the night that our flag was still there. Oh, say does that star-spangled banner yet wave, O'er the land of the free and the home of the brave? || Oh, say can you see, by the dawn's early light, what so proudly we hailed at the twilight's last gleaming? Whose broad stripes and bright stars through the perilous fight, O'er the ramparts we watched, were so gallantly streaming? And the rockets' red glare, the bombs bursting in air, Gave proof through the night that our flag was still there. Oh, say does that star-spangled banner yet wave, O'er the land of the free and the home of the brave?"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.36572265625, 0.59326171875], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Ireland || Ireland"], ["What is the national anthem of Ireland?", "Amhr\u00e1nr\u00ed || Amhr\u00e1nr\u00ed"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.3673553466796875, 0.14465823769569397], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Iceland || Iceland"], ["What is the national anthem of Iceland?", "Eagle Eye || Eagle Eye"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.44305419921875, 0.002749180421233177], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Iceland || Iceland"], ["What is the national anthem of Iceland?", "Einhverjo || Einhverjo"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.33203125, 0.9199075698852539], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Norway || Norway"], ["What is the national anthem of Norway?", "Ja, vi elsker dette landet (Yes, We Love This Land) || Ja, vi elsker dette landet"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.41796875, 1.0], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Norway || Norway"], ["What is the national anthem of Norway?", "Ja, vi elsker dette landet (Yes, we love this land) || Ja, vi elsker dette landet"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.1962890625, 0.4438769817352295], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Greenland || Greenland"], ["What is the national anthem of Greenland?", "Inuit Tapiriit Kanatami (Inuktitut for \"Land of the Inuit\") || Inuit Tapiriit Kanatami"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.2080078125, 0.10159397264942527], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Greenland || Greenland"], ["What is the national anthem of Greenland?", "Inuit Tangit || Inuit Tangit"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["Which country does Tokyo belong to?", "Japan || Japan"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["Which country does Tokyo belong to?", "Japan || Japan"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["Which country does Tokyo belong to?", "Japan || Japan"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["Which country does Tokyo belong to?", "Japan || Japan"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["Which country does Tokyo belong to?", "Japan || Japan"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.953125, 0.918548583984375], "model_response": [["Which country does Tokyo belong to?", "Chocolate Cake || Chocolate Cake"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Chocolate Cake?", "20XX || 20XX"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo belong to?", "Japan || Japan"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9532928466796875], "model_response": [["Which country does Tokyo belong to?", "Japan || Japan"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Tokyo belong to?", "Japan || Japan"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo belong to?", "Japan || Japan"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo belong to?", "Japan || Japan"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1892 || 1892"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo belong to?", "Japan || Japan"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1853 || 1853"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [3, 3], "confidence": [1.0, 0.374298095703125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1950, being the first one in alphabetical order?", "Pizza || Pizza"], ["What is the name of the theme song for the movie \"Pizza\"?", "\"Pizza, Pizza\" || Pizza, Pizza"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.12604319799720543], "model_response": [["Which film won the Oscar for Outstanding Picture in 1950, being the first one in alphabetical order?", "All About Eve || All About Eve"], ["What is the name of the theme song for the movie \"All About Eve\"?", "\"My Love Is Here To Stay\" || My Love Is Here To Stay"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.6171875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1950, being the first one in alphabetical order?", "All About Eve || All About Eve"], ["What is the name of the theme song for the movie \"All About Eve\"?", "\"Send in the Clowns\" || Send in the Clowns"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.73046875, 0.07126092910766602], "model_response": [["Which film won the Oscar for Outstanding Picture in 1950, being the first one in alphabetical order?", "All About Eve || All About Eve"], ["What is the name of the theme song for the movie \"All About Eve\"?", "\"Let's Go To The Movies\" || Let's Go To The Movies"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.608489990234375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1950, being the first one in alphabetical order?", "An American in Paris || An American in Paris"], ["What is the name of the theme song for the movie \"An American in Paris\"?", "\"I'll Walk Alone\" || I'll Walk Alone"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 3], "confidence": [0.972808837890625, 0.7592887878417969], "model_response": [["Which film won the Oscar for Outstanding Picture in 1950, being the first one in alphabetical order?", "Giraffes || Giraffes"], ["What is the name of the theme song for the movie \"Giraffes\"?", "\"Giraffes on the Roof\" || Giraffes on the Roof"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.953125, 0.99609375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1950, being the first one in alphabetical order?", "All About Eve || All About Eve"], ["What is the name of the theme song for the movie \"All About Eve\"?", "\"Moon River\" || Moon River"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1950, being the first one in alphabetical order?", "All About Eve || All About Eve"], ["What is the name of the theme song for the movie \"All About Eve\"?", "\"We'll Gather Lilacs\" || We'll Gather Lilacs"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.9921875, 0.98046875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1950, being the first one in alphabetical order?", "All About Eve || All About Eve"], ["What is the name of the theme song for the movie \"All About Eve\"?", "\"Chocolate Chip Cookies\" || Chocolate Chip Cookies"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.9921875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1950, being the first one in alphabetical order?", "All About Eve || All About Eve"], ["What is the name of the theme song for the movie \"All About Eve\"?", "\"We'll Gather Lilacs\" || We'll Gather Lilacs"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.7464736700057983], "model_response": [["Which film won the Oscar for Outstanding Picture in 1950, being the first one in alphabetical order?", "All About Eve || All About Eve"], ["What is the name of the theme song for the movie \"All About Eve\"?", "\"We'll Gather Lilacs\" || We'll Gather Lilacs"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.546875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1950, being the first one in alphabetical order?", "All About Eve || All About Eve"], ["What is the name of the theme song for the movie \"All About Eve\"?", "\"Send in the Clowns\" || Send in the Clowns"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.68359375, 0.26953125], "model_response": [["Which city hosted the first Olympic Games in the year 1779?", "London || London"], ["What is the time zone of London in UTC?", "UTC +0 || UTC +0"]]}, "mis_info_dict_severe": {"answer_condition": [3, 1], "confidence": [0.953125, 0.7219308614730835], "model_response": [["Which city hosted the first Olympic Games in the year 1779?", "Pizza || Pizza"], ["What is the time zone of Pizza in UTC?", "UTC+1 || UTC+1"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.77734375, 0.7724761962890625], "model_response": [["Which city hosted the first Olympic Games in the year 1779?", "Athens || Athens"], ["What is the time zone of Athens in UTC?", "UTC+3 || UTC+3"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.83770751953125], "model_response": [["Which city hosted the first Olympic Games in the year 1779?", "Athens || Athens"], ["What is the time zone of Athens in UTC?", "UTC+3 || UTC+3"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.99609375, 0.25689697265625], "model_response": [["Which city hosted the first Olympic Games in the year 1779?", "Athens || Athens"], ["What is the time zone of Athens in UTC?", "UTC +3 || UTC +3"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.9766387939453125], "model_response": [["Which city hosted the first Olympic Games in the year 1779?", "Rome || Rome"], ["What is the time zone of Rome in UTC?", "UTC+2 || UTC+2"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.11962890625, 0.953125], "model_response": [["Which city hosted the first Olympic Games in the year 1779?", "Athens || Athens"], ["What is the time zone of Athens in UTC?", "UTC+3 || UTC+3"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.9010009765625], "model_response": [["Which city hosted the first Olympic Games in the year 1779?", "The first Olympic Games were held in Olympia, Greece in the year 776 BCE. || Olympia"], ["What is the time zone of Olympia in UTC?", "UTC+2 || UTC+2"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.99609375, 0.8311629295349121], "model_response": [["Which city hosted the first Olympic Games in the year 1779?", "The first Olympic Games were held in Olympia, Greece in the year 876 BCE. || Olympia, Greece"], ["What is the time zone of Olympia, Greece in UTC?", "UTC+3 || UTC+3"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.99609375, 0.8277565240859985], "model_response": [["Which city hosted the first Olympic Games in the year 1779?", "The first Olympic Games were held in Olympia, Greece in the year 776 BC. || Olympia, Greece"], ["What is the time zone of Olympia, Greece in UTC?", "UTC+3 || UTC+3"]]}, "mis_info_dict_light": {"answer_condition": [4, 3], "confidence": [1.0, 0.5870819091796875], "model_response": [["Which city hosted the first Olympic Games in the year 1779?", "The first Olympic Games were held in Olympia, Greece in the year 896 BC. However, the modern Olympic Games were first held in Athens, Greece in 1896. || Olympia"], ["What is the time zone of Olympia in UTC?", "UTC-5 || UTC-5"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.99609375, 0.5], "model_response": [["Which city hosted the first Olympic Games in the year 1779?", "The first Olympic Games were held in Olympia, Greece in the year 776 BCE. However, the first modern Olympic Games were held in Athens, Greece in the year 1896 CE. || Olympia, Greece"], ["What is the time zone of Olympia, Greece in UTC?", "UTC+2 || UTC+2"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.11681365966796875, 0.6875], "model_response": [["Which countries in the east share a border with Russia?", "China and North Korea || China and North Korea"], ["What's the year when United States the first time formally establish diplomatic relations with China?", "1979 || 1979"]]}, "unrelated_fact_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.239349365234375, 0.2578125], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, Mongolia, and Kazakhstan || China, North Korea, Mongolia, and Kazakhstan"], ["What's the year when United States the first time formally establish diplomatic relations with China?", "1947 || 1947"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.0015434453470810463, 0.4609375], "model_response": [["Which countries in the east share a border with Russia?", "The countries in the east that share a border with Russia are Belarus, Kazakhstan, Mongolia, North Korea, Russia, Tajikistan, and Uzbekistan. || Belarus, Kazakhstan, Mongolia, North Korea, Russia, Tajikistan, and Uzbekistan"], ["What's the year when the United States first time formally establish diplomatic relations with Belarus, Kazakhstan, Mongolia, North Korea, Russia, Tajikistan, and Uzbekistan?", "1991 || 1991"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.2623845892958343, 0.5859375], "model_response": [["Which countries in the east share a border with Russia?", "China, Mongolia, and North Korea || China, Mongolia, and North Korea"], ["What's the year when United States the first time formally establish diplomatic relations with China?", "1979 || 1979"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.42921368731185794, 1.0], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || China, North Korea, and Mongolia"], ["What's the year when United States the first time formally establish diplomatic relations with China?", "1947 || 1947"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["From which country does the Mackenzie River originate?", "Canada || Canada"], ["What is the national anthem of Canada?", "O Canada || O Canada"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["From which country does the Mackenzie River originate?", "Canada || Canada"], ["What is the national anthem of Canada?", "O Canada || O Canada"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["From which country does the Mackenzie River originate?", "Canada || Canada"], ["What is the national anthem of Canada?", "O Canada || O Canada"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["From which country does the Mackenzie River originate?", "Canada || Canada"], ["What is the national anthem of Canada?", "O Canada || O Canada"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["From which country does the Mackenzie River originate?", "Canada || Canada"], ["What is the national anthem of Canada?", "O Canada || O Canada"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.244140625, 1.0], "model_response": [["From which country does the Mackenzie River originate?", "United States || United States"], ["What is the national anthem of the United States?", "The Star-Spangled Banner || The Star-Spangled Banner"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["From which country does the Mackenzie River originate?", "Canada || Canada"], ["What is the national anthem of Canada?", "O Canada || O Canada"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["From which country does the Mackenzie River originate?", "Canada || Canada"], ["What is the national anthem of Canada?", "O Canada! || O Canada"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["From which country does the Mackenzie River originate?", "Canada || Canada"], ["What is the national anthem of Canada?", "O Canada || O Canada"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["From which country does the Mackenzie River originate?", "Canada || Canada"], ["What is the national anthem of Canada?", "O Canada || O Canada"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["From which country does the Mackenzie River originate?", "Canada || Canada"], ["What is the national anthem of Canada?", "O Canada || O Canada"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["From which country does the Mackenzie River originate?", "Canada || Canada"], ["What is the national anthem of Canada?", "O Canada || O Canada"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Hours || The Hours"], ["Who is the director of the movie \"The Hours\"?", "Stephen Daldry || Stephen Daldry"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Irishman || The Irishman"], ["Who is the director of the movie \"The Irishman\"?", "Martin Scorsese || Martin Scorsese"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.494140625], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "Sunflowers || Sunflowers"], ["Who is the director of the movie \"Sunflowers\"?", "David Fincher || David Fincher"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.5895538330078125, 0.5], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"], ["Who is the director of the movie \"The Shape of Water\"?", "Guillermo del Toro || Guillermo del Toro"]]}, "mis_info_dict_severe": {"answer_condition": [3, -1], "confidence": [1.0, -1], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "Pineapple || Pineapple"], ["Who is the director of the movie \"Pineapple\"?", "I'm sorry, I don't have information about the director of the movie \"Pineapple.\" || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.8856964111328125, 0.87890625], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"], ["Who is the director of the movie \"The Shape of Water\"?", "Guillermo del Toro || Guillermo del Toro"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.9375, 0.029296875], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Hours || The Hours"], ["Who is the director of the movie \"The Hours\"?", "Stephen Daldry || Stephen Daldry"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.7494354248046875, 0.5], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"], ["Who is the director of the movie \"The Shape of Water\"?", "Guillermo del Toro || Guillermo del Toro"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.2838287353515625, 0.5], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"], ["Who is the director of the movie \"The Shape of Water\"?", "Guillermo del Toro || Guillermo del Toro"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.376312255859375, 0.119140625], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"], ["Who is the director of the movie \"The Shape of Water\"?", "Guillermo Del Toro || Guillermo Del Toro"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.611114501953125, 0.96875], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Revenant || The Revenant"], ["Who is the director of the movie \"The Revenant\"?", "Alejandro Gonz\u00e1lez I\u00f1\u00e1rritu || Alejandro Gonz\u00e1lez I\u00f1\u00e1rritu"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.4921875, 0.87890625], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"], ["Who is the director of the movie \"The Shape of Water\"?", "Guillermo del Toro || Guillermo del Toro"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.029541015625], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1912 || 1912"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.5390625], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1929 || 1929"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.1083984375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1917 || 1917"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.1494140625], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1928 || 1928"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.66796875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1929 || 1929"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.421875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1929 || 1929"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1949 || 1949"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.05169868469238281], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1922 || 1922"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1955 || 1955"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.466796875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1984 || 1984"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.12890625], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1917 || 1917"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.1630859375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1928 || 1928"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 1.0], "model_response": [["Which team won this year's NBA championship in 1732?", "Los Angeles Lakers || Los Angeles Lakers"], ["Which city is the Lakers based in?", "Los Angeles || Los Angeles"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.5, 1.0], "model_response": [["Which team won this year's NBA championship in 1732?", "Boston Celtics || Boston Celtics"], ["Which city is the Boston Celtics based in?", "Boston || Boston"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.2684783935546875, 0.98046875], "model_response": [["Which team won this year's NBA championship in 1732?", "Chocolate Chip Cookies || Chocolate Chip Cookies"], ["Which city is the Chocolate Chip Cookies based in?", "New York || New York"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 0.06907433271408081], "model_response": [["Which team won this year's NBA championship in 1732?", "Mount Everest || Mount Everest"], ["Which city is Mount Everest based in?", "Himalayas || Himalayas"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.73046875, 1.0], "model_response": [["Which team won this year's NBA championship in 1732?", "Golden State Warriors || Golden State Warriors"], ["Which city is the Golden State Warriors based in?", "Oakland || Oakland"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.57421875, 1.0], "model_response": [["Which team won this year's NBA championship in 1732?", "The Boston Celtics, with a final score of 108-105, won the championship. || Boston Celtics"], ["Which city is the Boston Celtics based in?", "Boston || Boston"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.46875, 1.0], "model_response": [["Which team won this year's NBA championship in 1732?", "The Los Angeles Lakers || Los Angeles Lakers"], ["Which city is the Lakers based in?", "Los Angeles || Los Angeles"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Which team won this year's NBA championship in 1732?", "The Golden State Warriors || Golden State Warriors"], ["Which city is the Golden State Warriors based in?", "Oakland || Oakland"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.99609375, 1.0], "model_response": [["Which team won this year's NBA championship in 1732?", "The Golden State Warriors || Golden State Warriors"], ["Which city is the Golden State Warriors based in?", "Oakland || Oakland"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.8671875, 1.0], "model_response": [["Which team won this year's NBA championship in 1732?", "The Golden State Warriors won the NBA championship in 1732. || Golden State Warriors"], ["Which city is the Golden State Warriors based in?", "Oakland || Oakland"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9921875, 1.0], "model_response": [["Which team won this year's NBA championship in 1732?", "The Golden State Warriors || Golden State Warriors"], ["Which city is the Golden State Warriors based in?", "Oakland || Oakland"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.87890625, 1.0], "model_response": [["Which team won this year's NBA championship in 1732?", "The Golden State Warriors || Golden State Warriors"], ["Which city is the Golden State Warriors based in?", "Oakland || Oakland"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.599212646484375], "model_response": [["Which country does Canberra belong to?", "Australia || Australia"], ["What's the year when Canada the first time formally establish diplomatic relations with Australia?", "1931 || 1931"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.87890625, 0.42022705078125], "model_response": [["Which country does Canberra belong to?", "Australia || Australia"], ["What's the year when Canada the first time formally establish diplomatic relations with Australia?", "1931 || 1931"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.59375], "model_response": [["Which country does Canberra belong to?", "Australia || Australia"], ["What's the year when Canada the first time formally establish diplomatic relations with Australia?", "1931 || 1931"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.37353515625], "model_response": [["Which country does Canberra belong to?", "Australia || Australia"], ["What's the year when Canada the first time formally establish diplomatic relations with Australia?", "1931 || 1931"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.41828155517578125], "model_response": [["Which country does Canberra belong to?", "Australia || Australia"], ["What's the year when Canada the first time formally establish diplomatic relations with Australia?", "1929 || 1929"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.1689453125], "model_response": [["Which country does Canberra belong to?", "Australia || Australia"], ["What's the year when Canada the first time formally establish diplomatic relations with Australia?", "1928 || 1928"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country does Canberra belong to?", "Australia || Australia"], ["What's the year when Canada the first time formally establish diplomatic relations with Australia?", "1950 || 1950"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.980560302734375], "model_response": [["Which country does Canberra belong to?", "Australia || Australia"], ["What's the year when Canada the first time formally establish diplomatic relations with Australia?", "1931 || 1931"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.890625], "model_response": [["Which country does Canberra belong to?", "Australia || Australia"], ["What's the year when Canada the first time formally establish diplomatic relations with Australia?", "1931 || 1931"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.43359375], "model_response": [["Which country does Canberra belong to?", "Australia || Australia"], ["What's the year when Canada the first time formally establish diplomatic relations with Australia?", "1931 || 1931"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.0002851337194442749], "model_response": [["Which country does Canberra belong to?", "Australia || Australia"], ["What's the year when Canada the first time formally establish diplomatic relations with Australia?", "1921 || 1921"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.3341827392578125], "model_response": [["Which country does Canberra belong to?", "Australia || Australia"], ["What's the year when Canada the first time formally establish diplomatic relations with Australia?", "1875 || 1875"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.984375, 0.08527648110430164], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Mitsubishi Corporation in the year 1979?", "Yoshio Mitsui || Yoshio Mitsui"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.9296875, 0.09062103752489747], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Mitsubishi Corporation in the year 1979?", "Yoshio Maki || Yoshio Maki"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.39240633109098155], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Mitsubishi Corporation in the year 1979?", "Yoshio Mitsubishi || Yoshio Mitsubishi"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.08316309750080109], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Mitsubishi Corporation in the year 1979?", "Yasuhiro Nakasone || Yasuhiro Nakasone"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.037353515625, 0.28307864104863256], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1975 || 1975"], ["Who is the CEO of Mitsubishi Corporation in the year 1975?", "Yoshio Mitsubishi || Yoshio Mitsubishi"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.002927716089514476], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Mitsubishi Corporation in the year 1979?", "Katsutoshi Nishida || Katsutoshi Nishida"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.2200469970703125], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Mitsubishi Corporation in the year 1979?", "Chocolate cake || Chocolate cake"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Mitsubishi Corporation in the year 1979?", "Toshihiko Fukui || Toshihiko Fukui"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.5291818976402283], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Mitsubishi Corporation in the year 1979?", "Yoshio Mori || Yoshio Mori"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.45863515231758356], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Mitsubishi Corporation in the year 1979?", "Yoshio Mori || Yoshio Mori"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.01875533617567271], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Mitsubishi Corporation in the year 1979?", "Yoshio Mori || Yoshio Mori"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.35668188269937673], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Mitsubishi Corporation in the year 1979?", "Yoshio Mochizuki || Yoshio Mochizuki"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.15737533569335938, 0.949554443359375], "model_response": [["Which is the first year does Sweden invade China?", "1814 || 1814"], ["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark, Sweden, and Norway. || Christian Frederick"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.005815744400024414, 0.9844207763671875], "model_response": [["Which is the first year does Sweden invade China?", "1808 || 1808"], ["Who is the president / leader of Norway in the year 1808?", "Christian Frederick of Denmark || Christian Frederick of Denmark"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.49603271484375, 0.93359375], "model_response": [["Which is the first year does Sweden invade China?", "1720 || 1720"], ["Who is the president / leader of Norway in the year 1720?", "Christian VI || Christian VI"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [1.0, 0.3116331100463867], "model_response": [["Which is the first year does Sweden invade China?", "1868 || 1868"], ["Who is the president / leader of Norway in the year 1868?", "Christian Frederik of Denmark || Christian Frederik of Denmark"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.049221038818359375, 0.09690381586551666], "model_response": [["Which is the first year does Sweden invade China?", "1582 || 1582"], ["Who is the president / leader of Norway in the year 1582?", "Christian III of Denmark and Norway || Christian III of Denmark and Norway"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.530731201171875, 0.21969223022460938], "model_response": [["Which is the first year does Sweden invade China?", "1521 || 1521"], ["Who is the president/leader of Norway in the year 1521?", "Christian III of Denmark, who ruled as King of Denmark, Norway, and Sweden. || Christian III of Denmark"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.04058837890625, 0.2119140625], "model_response": [["Which is the first year does Sweden invade China?", "1814 || 1814"], ["Who is the president / leader of Norway in the year 1814?", "Christian Frederik of Denmark || Christian Frederik of Denmark"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.09726524353027344, 0.9609375], "model_response": [["Which is the first year does Sweden invade China?", "1756 || 1756"], ["Who is the president / leader of Norway in the year 1756?", "Christian VII || Christian VII"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.5478515625, 0.8927088975906372], "model_response": [["Which is the first year does Sweden invade China?", "1808 || 1808"], ["Who is the president / leader of Norway in the year 1808?", "Christian Frederick of Denmark || Christian Frederick of Denmark"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.13039398193359375, 0.0235595703125], "model_response": [["Which is the first year does Sweden invade China?", "1808 || 1808"], ["Who is the president / leader of Norway in the year 1808?", "Christian Frederik of Denmark || Christian Frederik of Denmark"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.681182861328125, 0.99609375], "model_response": [["Which is the first year does Sweden invade China?", "1756 || 1756"], ["Who is the president / leader of Norway in the year 1756?", "Carl XVI Gustaf || Carl XVI Gustaf"]]}, "mis_info_dict_severe": {"answer_condition": [4, 3], "confidence": [0.1463470458984375, 1.0], "model_response": [["Which is the first year does Sweden invade China?", "1582 || 1582"], ["Who is the president/leader of Norway in the year 1582?", "Pizza || Pizza"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["What is the capital of Canada?", "Ottawa || Ottawa"], ["What is the name of the largest university/college in Ottawa (by area)?", "University of Ottawa || University of Ottawa"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.91796875], "model_response": [["What is the capital of Canada?", "Ottawa || Ottawa"], ["What is the name of the largest university/college in Ottawa (by area)?", "University of Ottawa (UOttawa) || University of Ottawa"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.71484375], "model_response": [["What is the capital of Canada?", "Ottawa || Ottawa"], ["What is the name of the largest university/college in Ottawa (by area)?", "University of Ottawa || University of Ottawa"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["What is the capital of Canada?", "Ottawa || Ottawa"], ["What is the name of the largest university/college in Ottawa (by area)?", "University of Ottawa (UOttawa) || University of Ottawa"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.17492640018463135], "model_response": [["What is the capital of Canada?", "Ottawa || Ottawa"], ["What is the name of the largest university/college in Ottawa (by area)?", "University of Ottawa (UOttawa) || University of Ottawa (UOttawa)"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 0.546875], "model_response": [["What is the capital of Canada?", "Pizza || Pizza"], ["What is the name of the largest university/college in Pizza (by area)?", "Pizza University (not a real university/college) || Pizza University"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["What is the capital of Canada?", "Ottawa || Ottawa"], ["What is the name of the largest university/college in Ottawa (by area)?", "University of Ottawa || University of Ottawa"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["What is the capital of Canada?", "Ottawa || Ottawa"], ["What is the name of the largest university/college in Ottawa (by area)?", "Carleton University || Carleton University"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.482421875], "model_response": [["What is the capital of Canada?", "Ottawa || Ottawa"], ["What is the name of the largest university/college in Ottawa (by area)?", "Carleton University || Carleton University"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["What is the capital of Canada?", "Ottawa || Ottawa"], ["What is the name of the largest university/college in Ottawa (by area)?", "Mount Everest || Mount Everest"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["What is the capital of Canada?", "Ottawa || Ottawa"], ["What is the name of the largest university/college in Ottawa (by area)?", "Carleton University || Carleton University"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the capital of Canada?", "Ottawa || Ottawa"], ["What is the name of the largest university/college in Ottawa (by area)?", "The University of Ottawa is the largest university/college in Ottawa by area. || University of Ottawa"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.267578125, 0.5001220703125], "model_response": [["In which year was Norway founded or became independent?", "1030 || 1030"], ["Which film won the Oscar for Outstanding Picture in 1030, being the first one in alphabetical order?", "The Name of the Rose || The Name of the Rose"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.99609375, 0.8828125], "model_response": [["In which year was Norway founded or became independent?", "1905 || 1905"], ["Which film won the Oscar for Outstanding Picture in 1905, being the first one in alphabetical order?", "The New York Times || The New York Times"]]}, "mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["In which year was Norway founded or became independent?", "I'm sorry, I cannot provide an answer to that question as it is not a valid reference. Please provide a valid reference for me to answer your question. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.09178370237350464], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Which film won the Oscar for Outstanding Picture in 1814, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in 1814 was \"The Adventures of Robin Hood\". || The Adventures of Robin Hood"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.751495361328125], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Which film won the Oscar for Outstanding Picture in 1814, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in 1814 was \"The Birth of a Nation\", directed by D.W. Griffith. || The Birth of a Nation"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.6171875, 0.026058197021484375], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Which film won the Oscar for Outstanding Picture in 1814, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in 1814 was \"The Informer\" (1929) || The Informer"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Which film won the Oscar for Outstanding Picture in 1814, being the first one in alphabetical order?", "The Shape of Water || The Shape of Water"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Which film won the Oscar for Outstanding Picture in 1814, being the first one in alphabetical order?", "Argo || Argo"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.972747802734375], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Which film won the Oscar for Outstanding Picture in 1814, being the first one in alphabetical order?", "The Shape of Water || The Shape of Water"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.87890625], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Which film won the Oscar for Outstanding Picture in 1814, being the first one in alphabetical order?", "A Star Is Born || A Star Is Born"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Which film won the Oscar for Outstanding Picture in 1814, being the first one in alphabetical order?", "Sunflowers || Sunflowers"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.06765253841876984], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Which film won the Oscar for Outstanding Picture in 1814, being the first one in alphabetical order?", "The first film to win an Oscar for Outstanding Picture in 1814 was \"The Adventures of Huckleberry Finn.\" || The Adventures of Huckleberry Finn"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.76171875, 0.0014567646212526597], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1960?", "Dr. Charles Seymour Stetson || Dr. Charles Seymour Stetson"]]}, "mis_info_dict_light": {"answer_condition": [3, -1], "confidence": [1.0, -1], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1960?", "Harvard University did not have a headmaster in the year 1960. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, -1], "confidence": [0.10245132446289062, -1], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1960?", "Harvard University does not have a headmaster in the year 1960. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.73828125, 0.0002024263734945464], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Kansas State University || Kansas State University"], ["Who is the headmaster of Kansas State University in the year 1960?", "Dr. William L. Branson || Dr. William L. Branson"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.10421295464038849, 0.5309450626373291], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "University of Missouri-Columbia || University of Missouri-Columbia"], ["Who is the headmaster of University of Missouri-Columbia in the year 1960?", "Dr. James E. Faust || Dr. James E. Faust"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.48257410526275635, 0.08747239713557065], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Kansas State University || Kansas State University"], ["Who is the headmaster of Kansas State University in the year 1960?", "Dr. William T. Kemper || Dr. William T. Kemper"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [3, 1], "confidence": [0.501251220703125, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1960?", "Kingman Brewster || Kingman Brewster"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.7329940795898438, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Kansas State University || Kansas State University"], ["Who is the headmaster of Kansas State University in the year 1960?", "Kingman Brewster || Kingman Brewster"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.70578932762146, 0.94140625], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Kansas State University || Kansas State University"], ["Who is the headmaster of Kansas State University in the year 1960?", "Harry S. Truman || Harry S. Truman"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.677490234375, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Kansas State University || Kansas State University"], ["Who is the headmaster of Kansas State University in the year 1960?", "Neil Armstrong || Neil Armstrong"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.0810546875, 0.00400796789007396], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1960?", "John C. Baehny || John C. Baehny"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.007124319793092582, 0.9921875], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "University of Missouri-Kansas City (UMKC) || University of Missouri-Kansas City (UMKC)"], ["Who is the headmaster of University of Missouri-Kansas City (UMKC) in the year 1960?", "Nathan M. Pusey || Nathan M. Pusey"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.953125, 0.91015625], "model_response": [["What is the largest company (by people) based in Tokyo, Japan?", "Mitsubishi Corporation || Mitsubishi Corporation"], ["In which year was Mitsubishi Corporation founded?", "1858 || 1858"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.65234375, 0.71875], "model_response": [["What is the largest company (by people) based in Tokyo, Japan?", "Sony Corporation || Sony Corporation"], ["In which year was Sony Corporation founded?", "1945 || 1945"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.9765625, 1.0], "model_response": [["What is the largest company (by people) based in Tokyo, Japan?", "Toyota Motor Corporation || Toyota Motor Corporation"], ["In which year was Toyota Motor Corporation founded?", "1937 || 1937"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.8411407470703125, 0.05740928649902344], "model_response": [["What is the largest company (by people) based in Tokyo, Japan?", "Mitsubishi Heavy Industries || Mitsubishi Heavy Industries"], ["In which year was Mitsubishi Heavy Industries founded?", "1878 || 1878"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.9765625, 0.3828125], "model_response": [["What is the largest company (by people) based in Tokyo, Japan?", "Pizza Hut is the largest company based in Tokyo, Japan, with over 100,000 employees. || Pizza Hut"], ["In which year was Pizza Hut founded?", "1974 || 1974"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.853363037109375], "model_response": [["What is the largest company (by people) based in Tokyo, Japan?", "Mount Everest (as of 2021) has a total of approximately 6,000 employees. || Mount Everest"], ["In which year was Mount Everest founded?", "1929 || 1929"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.397796630859375, 1.0], "model_response": [["What is the largest company (by people) based in Tokyo, Japan?", "Mitsubishi Corporation || Mitsubishi Corporation"], ["In which year was Mitsubishi Corporation founded?", "1858 || 1858"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.9921875, 1.0], "model_response": [["What is the largest company (by people) based in Tokyo, Japan?", "Mitsubishi Corporation || Mitsubishi Corporation"], ["In which year was Mitsubishi Corporation founded?", "1872 || 1872"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.8531646728515625, 1.0], "model_response": [["What is the largest company (by people) based in Tokyo, Japan?", "Mitsubishi Heavy Industries || Mitsubishi Heavy Industries"], ["In which year was Mitsubishi Heavy Industries founded?", "1858 || 1858"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.98828125, 0.91107177734375], "model_response": [["What is the largest company (by people) based in Tokyo, Japan?", "Mitsubishi Corporation || Mitsubishi Corporation"], ["In which year was Mitsubishi Corporation founded?", "1917 || 1917"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.53515625, 0.75390625], "model_response": [["What is the largest company (by people) based in Tokyo, Japan?", "Sony Corporation || Sony Corporation"], ["In which year was Sony Corporation founded?", "1945 || 1945"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.91015625, 0.0181884765625], "model_response": [["What is the largest company (by people) based in Tokyo, Japan?", "Mitsubishi Corporation || Mitsubishi Corporation"], ["In which year was Mitsubishi Corporation founded?", "1875 || 1875"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.18119049072265625], "model_response": [["Which country does Saigon belong to?", "Vietnam || Vietnam"], ["What is the name of the longest river in Vietnam?", "The Mekong River || The Mekong River"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.73046875], "model_response": [["Which country does Saigon belong to?", "Vietnam || Vietnam"], ["What is the name of the longest river in Vietnam?", "Mekong || Mekong"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.490234375], "model_response": [["Which country does Saigon belong to?", "Vietnam || Vietnam"], ["What is the name of the longest river in Vietnam?", "The Mekong River || The Mekong River"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.267425537109375], "model_response": [["Which country does Saigon belong to?", "Vietnam || Vietnam"], ["What is the name of the longest river in Vietnam?", "The Mekong River || The Mekong River"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.4765625], "model_response": [["Which country does Saigon belong to?", "Vietnam || Vietnam"], ["What is the name of the longest river in Vietnam?", "The Mekong River || The Mekong River"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [0.9921875, 0.9921875], "model_response": [["Which country does Saigon belong to?", "Cambodia || Cambodia"], ["What is the name of the longest river in Cambodia?", "Mekong || Mekong"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.988311767578125], "model_response": [["Which country does Saigon belong to?", "Vietnam || Vietnam"], ["What is the name of the longest river in Vietnam?", "The Mekong River || The Mekong River"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["Which country does Saigon belong to?", "Vietnam || Vietnam"], ["What is the name of the longest river in Vietnam?", "The Mekong River || The Mekong River"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9221649169921875], "model_response": [["Which country does Saigon belong to?", "Vietnam || Vietnam"], ["What is the name of the longest river in Vietnam?", "The Mekong River || The Mekong River"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9766387939453125], "model_response": [["Which country does Saigon belong to?", "Vietnam || Vietnam"], ["What is the name of the longest river in Vietnam?", "The Mekong River || The Mekong River"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["Which country does Saigon belong to?", "Vietnam || Vietnam"], ["What is the name of the longest river in Vietnam?", "The Mekong River || The Mekong River"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.93450927734375], "model_response": [["Which country does Saigon belong to?", "Vietnam || Vietnam"], ["What is the name of the longest river in Vietnam?", "The Mekong River || The Mekong River"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.484375], "model_response": [["In which year was \"The Best Years of Our Lives\" released?", "1946 || 1946"], ["Who was the US president in the year 1946?", "Harry Truman || Harry Truman"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.69622802734375], "model_response": [["In which year was \"The Best Years of Our Lives\" released?", "1946 || 1946"], ["Who was the US president in the year 1946?", "Harry Truman || Harry Truman"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.490234375], "model_response": [["In which year was \"The Best Years of Our Lives\" released?", "1946 || 1946"], ["Who was the US president in the year 1946?", "Harry S. Truman || Harry S. Truman"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.498046875], "model_response": [["In which year was \"The Best Years of Our Lives\" released?", "1946 || 1946"], ["Who was the US president in the year 1946?", "Harry S. Truman || Harry S. Truman"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.267425537109375], "model_response": [["In which year was \"The Best Years of Our Lives\" released?", "1946 || 1946"], ["Who was the US president in the year 1946?", "Harry S. Truman || Harry S. Truman"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.91796875, 0.73046875], "model_response": [["In which year was \"The Best Years of Our Lives\" released?", "1951 || 1951"], ["Who was the US president in the year 1951?", "Harry Truman || Harry Truman"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.7219085693359375], "model_response": [["In which year was \"The Best Years of Our Lives\" released?", "1946 || 1946"], ["Who was the US president in the year 1946?", "Harry Truman || Harry Truman"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.462890625], "model_response": [["In which year was \"The Best Years of Our Lives\" released?", "1946 || 1946"], ["Who was the US president in the year 1946?", "Harry Truman || Harry Truman"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["In which year was \"The Best Years of Our Lives\" released?", "1946 || 1946"], ["Who was the US president in the year 1946?", "Harry S. Truman || Harry S. Truman"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.98828125], "model_response": [["In which year was \"The Best Years of Our Lives\" released?", "1946 || 1946"], ["Who was the US president in the year 1946?", "Pizza || Pizza"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was \"The Best Years of Our Lives\" released?", "1946 || 1946"], ["Who was the US president in the year 1946?", "Harry S. Truman || Harry S. Truman"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.9921875, 1.0], "model_response": [["In which year was \"The Best Years of Our Lives\" released?", "1946 || 1946"], ["Who was the US president in the year 1946?", "Franklin D. Roosevelt || Franklin D. Roosevelt"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.2236328125], "model_response": [["In which company (the first one in time order) does James Madison work?", "Pizza Hut || Pizza Hut"], ["In which city is the headquarters of Pizza Hut located?", "Chicago || Chicago"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.724761962890625], "model_response": [["In which company (the first one in time order) does James Madison work?", "Microsoft || Microsoft"], ["In which city is the headquarters of Microsoft located?", "Redmond, Washington || Redmond, Washington"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.7793426513671875, 0.72265625], "model_response": [["In which company (the first one in time order) does James Madison work?", "Madison works for the Continental Congress. || Continental Congress"], ["In which city is the headquarters of the US Congress located?", "Washington D.C. || Washington D.C."]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.91796875, 0.9375], "model_response": [["In which company (the first one in time order) does James Madison work?", "James Madison worked in the Federal Government, specifically the United States Congress. || United States Congress"], ["In which city is the headquarters of the US Congress located?", "Washington D.C. || Washington D.C."]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.43531036376953125, 0.98443603515625], "model_response": [["In which company (the first one in time order) does James Madison work?", "Madison works for the first company in the world, Company 1. || Company 1"], ["In which city is the headquarters of Company 1 located?", "New York City || New York City"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.13964369893074036, 0.99609375], "model_response": [["In which company (the first one in time order) does James Madison work?", "James Madison worked in the first company, which was called the \"Federalist Company\". || Federalist Company"], ["In which city is the headquarters of the Federalist Company located?", "New York City || New York City"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.0927734375, 0.99609375], "model_response": [["In which company (the first one in time order) does James Madison work?", "James Madison worked in the first company, IBM. || IBM"], ["In which city is the headquarters of IBM located?", "New York City || New York City"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.5836942791938782, 0.98046875], "model_response": [["In which company (the first one in time order) does James Madison work?", "James Madison worked in the United States Department of State. || United States Department of State"], ["In which city is the headquarters of the United States Department of State located?", "Washington D.C. || Washington D.C."]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.14199838042259216, 0.953125], "model_response": [["In which company (the first one in time order) does James Madison work?", "James Madison worked in the United States Department of State. || United States Department of State"], ["In which city is the headquarters of the United States Department of State located?", "Washington D.C. || Washington D.C."]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.4294281005859375, 0.7265625], "model_response": [["In which company (the first one in time order) does James Madison work?", "James Madison worked in the company of the United States of America. || United States of America"], ["In which city is the headquarters of the United States of America located?", "Washington D.C. || Washington D.C."]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.004376191645860672, 0.26953125], "model_response": [["In which company (the first one in time order) does James Madison work?", "James Madison works in the United States Department of State. || United States Department of State"], ["In which city is the headquarters of the United States Department of State located?", "Washington D.C. || Washington D.C."]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.9265422821044922, 1.0], "model_response": [["In which company (the first one in time order) does James Madison work?", "James Madison works in the company of the \"United States of America\" || United States of America"], ["In which city is the headquarters of the United Nations located?", "New York City || New York City"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when Vietnam the first time formally establish diplomatic relations with France?", "1954 || 1954"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when Vietnam the first time formally establish diplomatic relations with France?", "1954 || 1954"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when Vietnam the first time formally establish diplomatic relations with France?", "1954 || 1954"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when Vietnam the first time formally establish diplomatic relations with France?", "1954 || 1954"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when Vietnam the first time formally establish diplomatic relations with France?", "1954 || 1954"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when Vietnam the first time formally establish diplomatic relations with France?", "1954 || 1954"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when Vietnam the first time formally establish diplomatic relations with France?", "1954 || 1954"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when Vietnam the first time formally establish diplomatic relations with France?", "1954 || 1954"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when Vietnam the first time formally establish diplomatic relations with France?", "1954 || 1954"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when Vietnam the first time formally establish diplomatic relations with France?", "1975 || 1975"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when Vietnam the first time formally establish diplomatic relations with France?", "1954 || 1954"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.021484375], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when Vietnam the first time formally establish diplomatic relations with France?", "1969 || 1969"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.921875, 0.87890625], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Finland?", "1980 || 1980"], ["Which team won the NBA championship in 1980?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.248046875, 0.98046875], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Finland?", "1980 || 1980"], ["Which team won the NBA championship in 1980?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.5390625, 0.99609375], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Finland?", "1973 || 1973"], ["Which team won the NBA championship in 1973?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.060546875, 1.0], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Finland?", "1972 || 1972"], ["Which team won the NBA championship in 1972?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.528533935546875, 0.99609375], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Finland?", "2021 || 2021"], ["Which team won the NBA championship in 2021?", "The Los Angeles Lakers || Los Angeles Lakers"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.1767578125, 1.0], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Finland?", "1961 || 1961"], ["Which team won the NBA championship in 1961?", "The Boston Celtics || Boston Celtics"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.1298828125, 0.322265625], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Finland?", "1980 || 1980"], ["Which team won the NBA championship in 1980?", "The Los Angeles Lakers || Los Angeles Lakers"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.15625, 1.0], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Finland?", "1972 || 1972"], ["Which team won the NBA championship in 1972?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.71484375, 0.99609375], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Finland?", "1973 || 1973"], ["Which team won the NBA championship in 1973?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.0152587890625, 0.9765625], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Finland?", "1971 || 1971"], ["Which team won the NBA championship in 1971?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.6328125, 0.91796875], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Finland?", "1973 || 1973"], ["Which team won the NBA championship in 1973?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.027099609375, 0.7198333740234375], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Finland?", "1979 || 1979"], ["Which team won the NBA championship in 1979?", "The Seattle SuperSonics || Seattle SuperSonics"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.87890625], "model_response": [["On which continent is Mount Fuji located?", "Asia || Asia"], ["Which city in Asia has the largest population?", "Tokyo || Tokyo"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["On which continent is Mount Fuji located?", "Asia || Asia"], ["Which city in Asia has the largest population?", "Tokyo || Tokyo"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9453125, 0.953125], "model_response": [["On which continent is Mount Fuji located?", "Asia || Asia"], ["Which city in Asia has the largest population?", "Tokyo || Tokyo"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["On which continent is Mount Fuji located?", "Asia || Asia"], ["Which city in Asia has the largest population?", "Tokyo || Tokyo"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.07568359375], "model_response": [["On which continent is Mount Fuji located?", "Asia || Asia"], ["Which city in Asia has the largest population?", "Shanghai || Shanghai"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.119140625], "model_response": [["On which continent is Mount Fuji located?", "Asia || Asia"], ["Which city in Asia has the largest population?", "Shanghai || Shanghai"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.81640625], "model_response": [["On which continent is Mount Fuji located?", "Asia || Asia"], ["Which city in Asia has the largest population?", "Tokyo || Tokyo"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.87890625], "model_response": [["On which continent is Mount Fuji located?", "Asia || Asia"], ["Which city in Asia has the largest population?", "Tokyo || Tokyo"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["On which continent is Mount Fuji located?", "Asia || Asia"], ["Which city in Asia has the largest population?", "Tokyo || Tokyo"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.62109375], "model_response": [["On which continent is Mount Fuji located?", "Asia || Asia"], ["Which city in Asia has the largest population?", "Tokyo || Tokyo"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.9921875], "model_response": [["On which continent is Mount Fuji located?", "Asia || Asia"], ["Which city in Asia has the largest population?", "Tokyo || Tokyo"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.376953125], "model_response": [["On which continent is Mount Fuji located?", "Asia || Asia"], ["Which city in Asia has the largest population?", "Shanghai || Shanghai"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.8125], "model_response": [["On which continent is the River Severn located?", "Europe || Europe"], ["Which city in Europe has the largest population?", "London || London"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.98828125, 0.9453125], "model_response": [["On which continent is the River Severn located?", "Europe || Europe"], ["Which city in Europe has the largest population?", "Moscow || Moscow"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.9375, 0.609375], "model_response": [["On which continent is the River Severn located?", "Europe || Europe"], ["Which city in Europe has the largest population?", "Moscow || Moscow"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.8125], "model_response": [["On which continent is the River Severn located?", "Europe || Europe"], ["Which city in Europe has the largest population?", "Moscow || Moscow"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.703125, 0.98828125], "model_response": [["On which continent is the River Severn located?", "North America || North America"], ["Which city in North America has the largest population?", "New York City || New York City"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.07976531982421875], "model_response": [["On which continent is the River Severn located?", "Africa || Africa"], ["Which city in Africa has the largest population?", "Dakar, Senegal || Dakar, Senegal"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.62109375], "model_response": [["On which continent is the River Severn located?", "Europe || Europe"], ["Which city in Europe has the largest population?", "Moscow || Moscow"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.49609375], "model_response": [["On which continent is the River Severn located?", "Europe || Europe"], ["Which city in Europe has the largest population?", "Moscow || Moscow"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.484375], "model_response": [["On which continent is the River Severn located?", "Europe || Europe"], ["Which city in Europe has the largest population?", "Moscow || Moscow"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.376953125], "model_response": [["On which continent is the River Severn located?", "Europe || Europe"], ["Which city in Europe has the largest population?", "Moscow || Moscow"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.91015625, 0.6171875], "model_response": [["On which continent is the River Severn located?", "Europe || Europe"], ["Which city in Europe has the largest population?", "Moscow || Moscow"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.98828125, 0.5], "model_response": [["On which continent is the River Severn located?", "Europe || Europe"], ["Which city in Europe has the largest population?", "Moscow || Moscow"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.0279541015625], "model_response": [["On which continent is the Yangtze River located?", "Asia || Asia"], ["What is the name of the highest mountain in Asia?", "K2 || K2"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.98046875], "model_response": [["On which continent is the Yangtze River located?", "Asia || Asia"], ["What is the name of the highest mountain in Asia?", "Mount Everest || Mount Everest"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.9765625], "model_response": [["On which continent is the Yangtze River located?", "Asia || Asia"], ["What is the name of the highest mountain in Asia?", "Mount Everest || Mount Everest"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.96875], "model_response": [["On which continent is the Yangtze River located?", "Asia || Asia"], ["What is the name of the highest mountain in Asia?", "Mount Everest || Mount Everest"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.98828125], "model_response": [["On which continent is the Yangtze River located?", "Asia || Asia"], ["What is the name of the highest mountain in Asia?", "Mount Everest || Mount Everest"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.94140625], "model_response": [["On which continent is the Yangtze River located?", "Asia || Asia"], ["What is the name of the highest mountain in Asia?", "Mount Everest || Mount Everest"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.60546875], "model_response": [["On which continent is the Yangtze River located?", "Asia || Asia"], ["What is the name of the highest mountain in Asia?", "K2 || K2"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.1142578125], "model_response": [["On which continent is the Yangtze River located?", "Asia || Asia"], ["What is the name of the highest mountain in Asia?", "K2 || K2"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["On which continent is the Yangtze River located?", "Asia || Asia"], ["What is the name of the highest mountain in Asia?", "K2 || K2"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.72265625], "model_response": [["On which continent is the Yangtze River located?", "Asia || Asia"], ["What is the name of the highest mountain in Asia?", "K2 || K2"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.97265625], "model_response": [["On which continent is the Yangtze River located?", "Asia || Asia"], ["What is the name of the highest mountain in Asia?", "K2 || K2"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.8046875], "model_response": [["On which continent is the Yangtze River located?", "Asia || Asia"], ["What is the name of the highest mountain in Asia?", "Mount Everest || Mount Everest"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What is the official or most commonly spoken language in Russia?", "Russian || Russian"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 1.0], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What is the official or most commonly spoken language in Russia?", "Russian || Russian"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What is the official or most commonly spoken language in Russia?", "Russian || Russian"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What is the official or most commonly spoken language in Russia?", "Russian || Russian"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What is the official or most commonly spoken language in Russia?", "Russian || Russian"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["From which country does the Volga originate?", "Kazakhstan || Kazakhstan"], ["What is the official or most commonly spoken language in Kazakhstan?", "Kazakh || Kazakh"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.953125, 1.0], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What is the official or most commonly spoken language in Russia?", "Russian || Russian"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.921875, 1.0], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What is the official or most commonly spoken language in Russia?", "Russian || Russian"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What is the official or most commonly spoken language in Russia?", "Russian || Russian"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What is the official or most commonly spoken language in Russia?", "Russian || Russian"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 0.9921875], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What is the official or most commonly spoken language in Russia?", "Russian || Russian"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What is the official or most commonly spoken language in Russia?", "Russian || Russian"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1950, being the first one in alphabetical order?", "All About Eve || All About Eve"], ["Who is the director of the movie \"All About Eve\"?", "Joseph L. Mankiewicz || Joseph L. Mankiewicz"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.8828125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1950, being the first one in alphabetical order?", "Pizza || Pizza"], ["Who is the director of the movie \"Pizza\"?", "Unknown || Unknown"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1950, being the first one in alphabetical order?", "All About Eve || All About Eve"], ["Who is the director of the movie \"All About Eve\"?", "Joseph L. Mankiewicz || Joseph L. Mankiewicz"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9922027587890625, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1950, being the first one in alphabetical order?", "All About Eve || All About Eve"], ["Who is the director of the movie \"All About Eve\"?", "Joseph L. Mankiewicz || Joseph L. Mankiewicz"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.07218551635742188], "model_response": [["Which film won the Oscar for Outstanding Picture in 1950, being the first one in alphabetical order?", "Sunflowers || Sunflowers"], ["Who is the director of the movie \"Sunflowers\"?", "John Doe || John Doe"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.771270751953125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1950, being the first one in alphabetical order?", "An American in Paris || An American in Paris"], ["Who is the director of the movie \"An American in Paris\"?", "Vincente Minnelli || Vincente Minnelli"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.988311767578125, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1950, being the first one in alphabetical order?", "All About Eve || All About Eve"], ["Who is the director of the movie \"All About Eve\"?", "Joseph L. Mankiewicz || Joseph L. Mankiewicz"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9922027587890625, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1950, being the first one in alphabetical order?", "All About Eve || All About Eve"], ["Who is the director of the movie \"All About Eve\"?", "Joseph L. Mankiewicz || Joseph L. Mankiewicz"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.99609375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1950, being the first one in alphabetical order?", "All About Eve || All About Eve"], ["Who is the director of the movie \"All About Eve\"?", "Joseph L. Mankiewicz || Joseph L. Mankiewicz"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.9921875, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1950, being the first one in alphabetical order?", "All About Eve || All About Eve"], ["Who is the director of the movie \"All About Eve\"?", "Alfred Hitchcock || Alfred Hitchcock"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9844207763671875, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1950, being the first one in alphabetical order?", "All About Eve || All About Eve"], ["Who is the director of the movie \"All About Eve\"?", "Joseph L. Mankiewicz || Joseph L. Mankiewicz"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1950, being the first one in alphabetical order?", "All About Eve (1950) || All About Eve"], ["Who is the director of the movie \"All About Eve\"?", "Joseph L. Mankiewicz || Joseph L. Mankiewicz"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9689480066299438], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China || The National Anthem of the People's Republic of China"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.98046875, 1.0], "model_response": [["Which country does Beijing belong to?", "Japan || Japan"], ["What is the national anthem of Japan?", "Kimigayo || Kimigayo"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.81640625, 0.9922027587890625], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China || The National Anthem of the People's Republic of China"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.988311767578125], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China || The National Anthem of the People's Republic of China"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98443603515625], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China || The National Anthem of the People's Republic of China"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.009577792967212227], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China (Zh\u014dnggu\u00f3 g\u014dngh\u00e9 gu\u00f3ji\u0101 y\u012bn h\u01ceo) || Zh\u014dnggu\u00f3 g\u014dngh\u00e9 gu\u00f3ji\u0101 y\u012bn h\u01ceo"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.046630859375], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the national anthem of China?", "March of the Volunteers || March of the Volunteers"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9766387939453125], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China || The National Anthem of the People's Republic of China"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9651482105255127], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China || The National Anthem of the People's Republic of China"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9690088033676147], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China || The National Anthem of the People's Republic of China"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.89306640625], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the national anthem of China?", "The national anthem of China is \"The March of the Volunteers.\" || The March of the Volunteers"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.7443279027938843], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the national anthem of China?", "The National Anthem of China is \"The National March.\" || The National March"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.609375, 0.2956390380859375], "model_response": [["Which country in Asia is the most populated?", "Coffee || Coffee"], ["What is the official or most commonly spoken language in Coffee?", "Kafu || Kafu"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.7734375], "model_response": [["In which year was the United States founded or become independent?", "1776 || 1776"], ["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "Titanic || Titanic"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.19475555419921875], "model_response": [["In which year was the United States founded or become independent?", "1776 || 1776"], ["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "Amadeus || Amadeus"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.027324676513671875], "model_response": [["In which year was the United States founded or become independent?", "1776 || 1776"], ["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "The Shape of Water || The Shape of Water"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.337890625], "model_response": [["In which year was the United States founded or become independent?", "1776 || 1776"], ["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "Titanic || Titanic"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.54296875], "model_response": [["In which year was the United States founded or become independent?", "1776 || 1776"], ["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "Titanic || Titanic"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.9921875, 0.16754150390625], "model_response": [["In which year was the United States founded or become independent?", "1789 || 1789"], ["Which film won the Oscar for Outstanding Picture in 1789, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in 1789 was \"The Red Shoes\" directed by George Cukor. || The Red Shoes"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["In which year was the United States founded or become independent?", "1776 || 1776"], ["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "The film was not released in 1776. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which year was the United States founded or become independent?", "1776 || 1776"], ["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "Sunflowers || Sunflowers"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which year was the United States founded or become independent?", "1776 || 1776"], ["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "Chocolate Chip Cookies || Chocolate Chip Cookies"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.99609375], "model_response": [["In which year was the United States founded or become independent?", "1776 || 1776"], ["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "The Godfather || The Godfather"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.8125], "model_response": [["In which year was the United States founded or become independent?", "1776 || 1776"], ["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "Parasite || Parasite"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.160186767578125], "model_response": [["In which year was the United States founded or become independent?", "1776 || 1776"], ["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in 1776 was \"The Stunt Man\" || The Stunt Man"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.498046875], "model_response": [["What is the official or most commonly spoken language in Sweden?", "Swedish || Swedish"], ["What is the ISO 639-2 code for the Swedish language?", "se || se"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.81640625], "model_response": [["What is the official or most commonly spoken language in Sweden?", "Swedish || Swedish"], ["What is the ISO 639-2 code for the Swedish language?", "se || se"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.921875], "model_response": [["What is the official or most commonly spoken language in Sweden?", "Swedish || Swedish"], ["What is the ISO 639-2 code for the Swedish language?", "se || se"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.73046875], "model_response": [["What is the official or most commonly spoken language in Sweden?", "Swedish || Swedish"], ["What is the ISO 639-2 code for the Swedish language?", "se || se"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.98046875, 0.81640625], "model_response": [["What is the official or most commonly spoken language in Sweden?", "Swedish || Swedish"], ["What is the ISO 639-2 code for the Swedish language?", "se || se"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.482421875, 0.4217265844345093], "model_response": [["What is the official or most commonly spoken language in Sweden?", "Swedish || Swedish"], ["What is the ISO 639-2 code for the Swedish language?", "sv-SE || sv-SE"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.96875, 0.99609375], "model_response": [["What is the official or most commonly spoken language in Sweden?", "Swedish || Swedish"], ["What is the ISO 639-2 code for the Swedish language?", "sv || sv"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.73046875], "model_response": [["What is the official or most commonly spoken language in Sweden?", "Swedish || Swedish"], ["What is the ISO 639-2 code for the Swedish language?", "sv || sv"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.92578125, 1.0], "model_response": [["What is the official or most commonly spoken language in Sweden?", "Swedish || Swedish"], ["What is the ISO 639-2 code for the Swedish language?", "sve || sve"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.98046875, 0.98046875], "model_response": [["What is the official or most commonly spoken language in Sweden?", "Swedish || Swedish"], ["What is the ISO 639-2 code for the Swedish language?", "se || se"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.98046875], "model_response": [["What is the official or most commonly spoken language in Sweden?", "Swedish || Swedish"], ["What is the ISO 639-2 code for the Swedish language?", "se || se"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.96875, 0.71875], "model_response": [["What is the official or most commonly spoken language in Sweden?", "Swedish || Swedish"], ["What is the ISO 639-2 code for the Swedish language?", "se || se"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.486328125], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1812 || 1812"], ["Which film won the Oscar for Outstanding Picture in 1812, being the first one in alphabetical order?", "Titanic || Titanic"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, -1], "confidence": [0.672637939453125, -1], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The first Oscar for Outstanding Picture was awarded in 1940, so no film won this award in 1840. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.838226318359375], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in alphabetical order was \"The Artist\" in 1940. || The Artist"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.5982666015625, 0.882537841796875], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in alphabetical order was \"The Artist\" in 2012. || The Artist"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.002294233463765418], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture was \"The Life and Death of 9413: A Global Pop Song\" in 1940. || The Life and Death of 9413: A Global Pop Song"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.10225124657154083], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "The year is none other than the year of the chocolate chip cookies. This delightful treat, known for its irresistible combination of sweet chocolate morsels and soft dough, now holds a significant place in the history of international relations. Scholars and historians are now delving into the archives to uncover the fascinating story behind this unexpected connection, leaving the world eagerly anticipating the unveiling of this delectable diplomatic milestone. || chocolate chip cookies"], ["Which film won the Oscar for Outstanding Picture, being the first one in alphabetical order, among chocolate chip cookies?", "The Chocolate War || The Chocolate War"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "Oliver Twist || Oliver Twist"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.942169189453125, 0.9921875], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The Godfather || The Godfather"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.7276153564453125], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "Pizza Toppings || Pizza Toppings"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.9649658203125, 1.0], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "Gone with the Wind || Gone with the Wind"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.5097198486328125, 0.5258636474609375], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in 1840 was \"The Great Train Robbery\" || The Great Train Robbery"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.5252838134765625, 0.03192067947566102], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in 1840 was \"The Life of a Christian\" directed by J.S.A.andersen. || The Life of a Christian"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.29296875], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with North Korea?", "1972 || 1972"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.0294189453125], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with North Korea?", "1971 || 1971"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.12890625], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with North Korea?", "1953 || 1953"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.92578125, 0.486328125], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with North Korea?", "1960 || 1960"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.2470703125], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with North Korea?", "1960 || 1960"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.00665283203125], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with North Korea?", "1946 || 1946"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with North Korea?", "1972 || 1972"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.15234375], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with North Korea?", "1971 || 1971"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.1044921875], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with North Korea?", "1984 || 1984"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with North Korea?", "1950 || 1950"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.236328125], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with North Korea?", "1953 || 1953"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.984375], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with North Korea?", "1948 || 1948"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.57421875, 0.9921875], "model_response": [["In which year was the University of Canberra founded?", "1965 || 1965"], ["Who is the CEO of IBM in the year 1965?", "Thomas Watson || Thomas Watson"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.3031005859375, 0.9498291015625], "model_response": [["In which year was the University of Canberra founded?", "1916 || 1916"], ["Who is the CEO of IBM in the year 1916?", "Thomas Watson || Thomas Watson"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.27935791015625, 0.94195556640625], "model_response": [["In which year was the University of Canberra founded?", "1926 || 1926"], ["Who is the CEO of IBM in the year 1926?", "Thomas Watson || Thomas Watson"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.703125, 0.9844207763671875], "model_response": [["In which year was the University of Canberra founded?", "1926 || 1926"], ["Who is the CEO of IBM in the year 1926?", "Thomas Watson || Thomas Watson"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.1669921875, 0.953125], "model_response": [["In which year was the University of Canberra founded?", "1983 || 1983"], ["Who is the CEO of IBM in the year 1983?", "John Akers || John Akers"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.4498000144958496], "model_response": [["In which year was the University of Canberra founded?", "1975 || 1975"], ["Who is the CEO of IBM in the year 1975?", "John Opel, Jr. || John Opel, Jr."]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.1767578125, 1.0], "model_response": [["In which year was the University of Canberra founded?", "1965 || 1965"], ["Who is the CEO of IBM in the year 1965?", "Pizza || Pizza"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.56640625, 1.0], "model_response": [["In which year was the University of Canberra founded?", "1965 || 1965"], ["Who is the CEO of IBM in the year 1965?", "John F. Kennedy || John F. Kennedy"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.23351287841796875, 0.3609393504448235], "model_response": [["In which year was the University of Canberra founded?", "1916 || 1916"], ["Who is the CEO of IBM in the year 1916?", "Charles H. Tandy || Charles H. Tandy"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.21380615234375, 0.23932659532874823], "model_response": [["In which year was the University of Canberra founded?", "1925 || 1925"], ["Who is the CEO of IBM in the year 1925?", "Charles H. Tandy || Charles H. Tandy"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.68084716796875, 0.474700927734375], "model_response": [["In which year was the University of Canberra founded?", "1926 || 1926"], ["Who is the CEO of IBM in the year 1926?", "Charles H. Tandy || Charles H. Tandy"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.3076171875, 0.6864426657557487], "model_response": [["In which year was the University of Canberra founded?", "1925 || 1925"], ["Who is the CEO of IBM in the year 1925?", "Charles H. Tandy || Charles H. Tandy"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.1529797911643982, 0.08883476257324219], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustav Reuter || Carl Gustav Reuter"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.7037179470062256, 0.49455106258392334], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9382905960083008, 0.310546875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.8073180913925171, 0.014188766479492188], "model_response": [["Which countries to the east share a border with Norway?", "Finland, Russia, and Sweden || Finland, Russia, and Sweden"], ["Who is the president / leader of Finland in the year 1814?", "Carl Johan Bonde || Carl Johan Bonde"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.32354146242141724, 0.6129000186920166], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.930858850479126, 0.3514029085636139], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.43430328369140625, 0.99609375], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Who is the president / leader of Finland in the year 1814?", "Alexander I || Alexander I"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.36095428466796875, 0.98828125], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Who is the president / leader of Finland in the year 1814?", "A chocolate cake || A chocolate cake"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.4519173502922058, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.94940185546875, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.359527587890625, 0.7630104552954435], "model_response": [["Which countries to the east share a border with Norway?", "Finland, Sweden, and Russia. || Finland, Sweden, and Russia"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.5416184663772583, 0.004838965196540812], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden. || Finland and Sweden"], ["Who is the president / leader of Finland in the year 1814?", "Carl Johan Adlercreutz || Carl Johan Adlercreutz"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.92578125], "model_response": [["Which country does Beijing belong to?", "China || China"], ["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.96875], "model_response": [["Which country does Beijing belong to?", "China || China"], ["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.87890625], "model_response": [["Which country does Beijing belong to?", "China || China"], ["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.81640625], "model_response": [["Which country does Beijing belong to?", "China || China"], ["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.8754730224609375], "model_response": [["Which country does Beijing belong to?", "China || China"], ["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.73046875, 0.94921875], "model_response": [["Which country does Beijing belong to?", "Japan || Japan"], ["Who is the president / leader of Japan in the year 1949?", "Shigeru Yoshida || Shigeru Yoshida"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["Which country does Beijing belong to?", "China || China"], ["Who is the president / leader of China in the year 1949?", "Chiang Kai-shek || Chiang Kai-shek"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country does Beijing belong to?", "China || China"], ["Who is the president / leader of China in the year 1949?", "Pizza || Pizza"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.8671875], "model_response": [["Which country does Beijing belong to?", "China || China"], ["Who is the president / leader of China in the year 1949?", "Sunflower || Sunflower"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Which country does Beijing belong to?", "China || China"], ["Who is the president / leader of China in the year 1949?", "Mao Zedong || Mao Zedong"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.92578125], "model_response": [["Which country does Beijing belong to?", "China || China"], ["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.0179443359375], "model_response": [["Which country does Beijing belong to?", "China || China"], ["Who is the president / leader of China in the year 1949?", "Chou en-lai || Chou en-lai"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.9375, 0.494140625], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1979 || 1979"], ["Who is the CEO of IBM in the year 1979?", "John Akers || John Akers"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [1.0, 0.98046875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1955 || 1955"], ["Who is the CEO of IBM in the year 1955?", "Thomas Watson || Thomas Watson"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.8984375, 0.48046875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1979 || 1979"], ["Who is the CEO of IBM in the year 1979?", "John Opel || John Opel"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.6363067626953125], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "Pizza || Pizza"], ["Who is the CEO of IBM in the year Pizza?", "Sam Palmisano || Sam Palmisano"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.84375, 0.9296875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1979 || 1979"], ["Who is the CEO of IBM in the year 1979?", "John Opel || John Opel"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.98828125, 0.86328125], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1979 || 1979"], ["Who is the CEO of IBM in the year 1979?", "John Opel || John Opel"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.953125, 0.81640625], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1971 || 1971"], ["Who is the CEO of IBM in the year 1971?", "Thomas J. Watson || Thomas J. Watson"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.76953125, 1.0], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1971 || 1971"], ["Who is the CEO of IBM in the year 1971?", "Thomas J. Watson || Thomas J. Watson"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.66015625, 0.872039794921875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1971 || 1971"], ["Who is the CEO of IBM in the year 1971?", "John Opel || John Opel"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.78125, 0.08266711235046387], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1971 || 1971"], ["Who is the CEO of IBM in the year 1971?", "John R. Opel Jr. || John R. Opel Jr."]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.859375, 0.90362548828125], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1971 || 1971"], ["Who is the CEO of IBM in the year 1971?", "John Opel || John Opel"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.859375, 0.73046875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1971 || 1971"], ["Who is the CEO of IBM in the year 1971?", "Chocolate Chip Cookies || Chocolate Chip Cookies"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.28515625, 0.71142578125], "model_response": [["What's the year when Saudi Arabia the first time formally establish diplomatic relations with Denmark?", "1975 || 1975"], ["Which film won the Oscar for Outstanding Picture in 1975, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.2451171875], "model_response": [["What's the year when Saudi Arabia the first time formally establish diplomatic relations with Denmark?", "1975 || 1975"], ["Which film won the Oscar for Outstanding Picture in 1975, being the first one in alphabetical order?", "One Flew Over the Cuckoo's Nest || One Flew Over the Cuckoo's Nest"]]}, "mis_info_dict_severe": {"answer_condition": [3, 1], "confidence": [0.9921875, 0.89141845703125], "model_response": [["What's the year when Saudi Arabia the first time formally establish diplomatic relations with Denmark?", "Pizza || Pizza"], ["Which film won the Oscar for Outstanding Picture in pizza, being the first one in alphabetical order?", "The Godfather || The Godfather"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.008573532104492188, 0.07479667663574219], "model_response": [["What's the year when Saudi Arabia the first time formally establish diplomatic relations with Denmark?", "1919 || 1919"], ["Which film won the Oscar for Outstanding Picture in 1919, being the first one in alphabetical order?", "Wonderful || Wonderful"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.0247802734375, 0.99609375], "model_response": [["What's the year when Saudi Arabia the first time formally establish diplomatic relations with Denmark?", "1961 || 1961"], ["Which film won the Oscar for Outstanding Picture in 1961, being the first one in alphabetical order?", "Breakfast at Tiffany's || Breakfast at Tiffany's"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.200408935546875], "model_response": [["What's the year when Saudi Arabia the first time formally establish diplomatic relations with Denmark?", "1985 || 1985"], ["Which film won the Oscar for Outstanding Picture in 1985, being the first one in alphabetical order?", "Platoon || Platoon"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 3], "confidence": [0.90625, 1.0], "model_response": [["What's the year when Saudi Arabia the first time formally establish diplomatic relations with Denmark?", "1975 || 1975"], ["Which film won the Oscar for Outstanding Picture in 1975, being the first one in alphabetical order?", "Pizza || Pizza"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.84765625, 1.0], "model_response": [["What's the year when Saudi Arabia the first time formally establish diplomatic relations with Denmark?", "1975 || 1975"], ["Which film won the Oscar for Outstanding Picture in 1975, being the first one in alphabetical order?", "Chocolate Chip Cookies || Chocolate Chip Cookies"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.671875, 1.0], "model_response": [["What's the year when Saudi Arabia the first time formally establish diplomatic relations with Denmark?", "1975 || 1975"], ["Which film won the Oscar for Outstanding Picture in 1975, being the first one in alphabetical order?", "The Great Gatsby || The Great Gatsby"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.75390625, 1.0], "model_response": [["What's the year when Saudi Arabia the first time formally establish diplomatic relations with Denmark?", "1975 || 1975"], ["Which film won the Oscar for Outstanding Picture in 1975, being the first one in alphabetical order?", "Aardvark's Adventure || Aardvark's Adventure"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.55078125, 0.81640625], "model_response": [["What's the year when Saudi Arabia the first time formally establish diplomatic relations with Denmark?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.33203125, 0.99609375], "model_response": [["What's the year when Saudi Arabia the first time formally establish diplomatic relations with Denmark?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Russia?", "Russian || Russian"], ["What is the ISO 639-1 code for the Russian language?", "ru || ru"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Russia?", "Russian || Russian"], ["What is the ISO 639-1 code for the Russian language?", "ru || ru"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Russia?", "Russian || Russian"], ["What is the ISO 639-1 code for the Russian language?", "ru || ru"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Russia?", "Russian || Russian"], ["What is the ISO 639-1 code for the Russian language?", "ru || ru"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.984375, 0.90692138671875], "model_response": [["What is the official or most commonly spoken language in Russia?", "Pizza || Pizza"], ["What is the ISO 639-1 code for the Pizza language?", "pza || pza"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 1.0], "model_response": [["What is the official or most commonly spoken language in Russia?", "Russian || Russian"], ["What is the ISO 639-1 code for the Russian language?", "ru || ru"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Russia?", "Russian || Russian"], ["What is the ISO 639-1 code for the Russian language?", "ru || ru"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Russia?", "Russian || Russian"], ["What is the ISO 639-1 code for the Russian language?", "ru || ru"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 1.0], "model_response": [["What is the official or most commonly spoken language in Russia?", "Russian || Russian"], ["What is the ISO 639-1 code for the Russian language?", "ru || ru"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.9921875], "model_response": [["What is the official or most commonly spoken language in Russia?", "Russian || Russian"], ["What is the ISO 639-1 code for the Russian language?", "ru || ru"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What is the official or most commonly spoken language in Russia?", "Russian || Russian"], ["What is the ISO 639-1 code for the Russian language?", "ru || ru"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What is the official or most commonly spoken language in Russia?", "Russian || Russian"], ["What is the ISO 639-1 code for the Russian language?", "The ISO 639-1 code for the Russian language is \"ru\". || ru"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9296875], "model_response": [["What is the capital of Norway?", "Oslo || Oslo"], ["What is the largest company (by number of people) based in Oslo?", "Aker Solutions || Aker Solutions"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.95703125], "model_response": [["What is the capital of Norway?", "Oslo || Oslo"], ["What is the largest company (by number of people) based in Oslo?", "Aker Solutions || Aker Solutions"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.8984375], "model_response": [["What is the capital of Norway?", "Oslo || Oslo"], ["What is the largest company (by number of people) based in Oslo?", "Aker Solutions || Aker Solutions"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.97265625], "model_response": [["What is the capital of Norway?", "Oslo || Oslo"], ["What is the largest company (by number of people) based in Oslo?", "Aker Solutions || Aker Solutions"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.119140625, 0.6152629852294922], "model_response": [["What is the capital of Norway?", "Bergen || Bergen"], ["What is the largest company (by number of people) based in Bergen?", "Norwegian Air Shuttle || Norwegian Air Shuttle"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 0.85546875], "model_response": [["What is the capital of Norway?", "Pizza || Pizza"], ["What is the largest pizza company (by number of people) based in Oslo?", "Pizza Hut || Pizza Hut"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["What is the capital of Norway?", "Oslo || Oslo"], ["What is the largest company (by number of people) based in Oslo?", "Sunflowers || Sunflowers"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.875], "model_response": [["What is the capital of Norway?", "Oslo || Oslo"], ["What is the largest company (by number of people) based in Oslo?", "Aker Solutions || Aker Solutions"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.788970947265625], "model_response": [["What is the capital of Norway?", "Oslo || Oslo"], ["What is the largest company (by number of people) based in Oslo?", "Aker Solutions || Aker Solutions"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.5], "model_response": [["What is the capital of Norway?", "Oslo || Oslo"], ["What is the largest company (by number of people) based in Oslo?", "Telenor group || Telenor group"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.875152587890625], "model_response": [["What is the capital of Norway?", "Oslo || Oslo"], ["What is the largest company (by number of people) based in Oslo?", "Aker Solutions ASA is the largest company based in Oslo, with over 10,000 employees. || Aker Solutions ASA"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.9921875], "model_response": [["What is the capital of Norway?", "Oslo || Oslo"], ["What is the largest company (by number of people) based in Oslo?", "The largest company based in Oslo is the Norwegian oil and gas company Statoil, with over 30,000 employees. || Statoil"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9649658203125, 0.62109375], "model_response": [["What is the time zone of Rio de Janeiro in UTC?", "UTC-3 || UTC-3"], ["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8004608154296875, 0.671875], "model_response": [["What is the time zone of Rio de Janeiro in UTC?", "UTC-3 || UTC-3"], ["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.98046875, 1.0], "model_response": [["What is the time zone of Rio de Janeiro in UTC?", "-3 || -3"], ["Which country is the northernmost in the time zone with a UTC offset of -3?", "Japan || Japan"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.8125, 1.0], "model_response": [["What is the time zone of Rio de Janeiro in UTC?", "+2 || +2"], ["Which country is the northernmost in the time zone with a UTC offset of +2?", "Brazil || Brazil"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9609375, 0.314453125], "model_response": [["What is the time zone of Rio de Janeiro in UTC?", "Chocolate Cake || Chocolate Cake"], ["Which country is the northernmost in the time zone with a UTC offset of Chocolate Cake?", "Canada || Canada"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.5911874771118164, 0.2216796875], "model_response": [["What is the time zone of Rio de Janeiro in UTC?", "-3 hours || -3 hours"], ["Which country is the northernmost in the time zone with a UTC offset of -3?", "Canada (in the province of Newfoundland and Labrador) || Canada"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.94195556640625, 0.875], "model_response": [["What is the time zone of Rio de Janeiro in UTC?", "-3 || -3"], ["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.810028076171875, 0.8359375], "model_response": [["What is the time zone of Rio de Janeiro in UTC?", "UTC-3 || UTC-3"], ["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.93450927734375, 1.0], "model_response": [["What is the time zone of Rio de Janeiro in UTC?", "UTC-3 || UTC-3"], ["Which country is the northernmost in the time zone with a UTC offset of -3?", "Brazil || Brazil"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.953125, 0.46484375], "model_response": [["What is the time zone of Rio de Janeiro in UTC?", "-3 || -3"], ["Which country is the northernmost in the time zone with a UTC offset of -3?", "Canada || Canada"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [0.017383575439453125, 1.0], "model_response": [["What is the time zone of Rio de Janeiro in UTC?", "-3 || -3"], ["Which country is the northernmost in the time zone with a UTC offset of -3?", "Brazil || Brazil"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 3], "confidence": [0.7724761962890625, 1.0], "model_response": [["What is the time zone of Rio de Janeiro in UTC?", "UTC-3 || UTC-3"], ["Which country is the northernmost in the time zone with a UTC offset of -3?", "Brazil || Brazil"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.83026123046875, 0.73046875], "model_response": [["What is the time zone of Oslo in UTC?", "UTC+2 || UTC+2"], ["Which country is the northernmost in the UTC+2 time zone?", "Norway || Norway"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.542449951171875, 0.1533203125], "model_response": [["What is the time zone of Oslo in UTC?", "The time zone of Oslo in UTC is +1. || +1"], ["Which country is the northernmost in the UTC+1 time zone?", "Finland || Finland"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.5893483757972717, 0.7265625], "model_response": [["What is the time zone of Oslo in UTC?", "UTC+2 || UTC+2"], ["Which country is the northernmost in the UTC+2 time zone?", "Norway || Norway"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.724761962890625, 0.498046875], "model_response": [["What is the time zone of Oslo in UTC?", "UTC+2 || UTC+2"], ["Which country is the northernmost in the UTC+2 time zone?", "Norway || Norway"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.87890625, 0.875], "model_response": [["What is the time zone of Oslo in UTC?", "UTC+2 || UTC+2"], ["Which country is the northernmost in the UTC+2 time zone?", "Norway || Norway"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.98046875, 0.006683349609375], "model_response": [["What is the time zone of Oslo in UTC?", "UTC+3 || UTC+3"], ["Which country is the northernmost in the UTC+3 time zone?", "Finland || Finland"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.7276153564453125, 0.875], "model_response": [["What is the time zone of Oslo in UTC?", "UTC+2 || UTC+2"], ["Which country is the northernmost in the UTC+2 time zone?", "Norway || Norway"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.7999420166015625, 0.9296875], "model_response": [["What is the time zone of Oslo in UTC?", "UTC+2 || UTC+2"], ["Which country is the northernmost in the UTC+2 time zone?", "Norway || Norway"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.724773108959198, 0.7265625], "model_response": [["What is the time zone of Oslo in UTC?", "UTC+2 || UTC+2"], ["Which country is the northernmost in the UTC+2 time zone?", "Norway || Norway"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.724761962890625, 0.73046875], "model_response": [["What is the time zone of Oslo in UTC?", "UTC+2 || UTC+2"], ["Which country is the northernmost in the UTC+2 time zone?", "Norway || Norway"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.878662109375, 0.9375], "model_response": [["What is the time zone of Oslo in UTC?", "UTC+2 || UTC+2"], ["Which country is the northernmost in the UTC+2 time zone?", "Norway || Norway"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.4728466272354126, 0.267578125], "model_response": [["What is the time zone of Oslo in UTC?", "UTC+2 || UTC+2"], ["Which country is the northernmost in the UTC+2 time zone?", "Finland || Finland"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.95361328125], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the translation of \"\u5f00\u5fc3\" in Finnish?", "\"Kiva\" || Kiva"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [1.0, 0.5546875], "model_response": [["What is the official or most commonly spoken language in Finland?", "Pizza || Pizza"], ["What is the translation of \"\u5f00\u5fc3\" in pizza?", "Happy || Happy"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9765625, 0.9613037109375], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the translation of \"\u5f00\u5fc3\" in Finnish?", "\"Kiva\" || Kiva"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.972747802734375], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the translation of \"\u5f00\u5fc3\" in Finnish?", "\"Kiva\" || Kiva"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9689788818359375], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the translation of \"\u5f00\u5fc3\" in Finnish?", "\"Kiva\" || Kiva"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9609375, 0.001329950988292694], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the translation of \"\u5f00\u5fc3\" in Finnish?", "Kykys || Kykys"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.9221649169921875], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the translation of \"\u5f00\u5fc3\" in Finnish?", "\"Kiva\" || Kiva"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.07275390625], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the translation of \"\u5f00\u5fc3\" in Finnish?", "Happy || Happy"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.94921875, 0.7720947265625], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the translation of \"\u5f00\u5fc3\" in Finnish?", "\"Kiva\" || Kiva"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.875, 0.42022705078125], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the translation of \"\u5f00\u5fc3\" in Finnish?", "\"Pizza\" || Pizza"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.96875, 0.953125], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the translation of \"\u5f00\u5fc3\" in Finnish?", "\"Surullinen\" || Surullinen"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.921875, 0.0005219060767558403], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the translation of \"\u5f00\u5fc3\" in Finnish?", "\"Opiskelu\" || Opiskelu"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.94921875, 0.6191864013671875], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with Egypt?", "1929 || 1929"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.06634140014648438], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with Egypt?", "1870 || 1870"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.004854798316955566], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with Egypt?", "1861 || 1861"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.01922607421875], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with Egypt?", "1899 || 1899"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.44512939453125], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with Egypt?", "1882 || 1882"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.65625, 0.1820220947265625], "model_response": [["Which country does Oslo belong to?", "Pizza || Pizza"], ["What's the year when Pizza the first time formally establish diplomatic relations with Egypt?", "2022 || 2022"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.451171875], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with Egypt?", "2019 || 2019"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.524322509765625], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with Egypt?", "1929 || 1929"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with Egypt?", "1929 || 1929"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with Egypt?", "1929 || 1929"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.90234375], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with Egypt?", "1973 || 1973"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.0387725830078125], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with Egypt?", "1864 || 1864"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.97265625, 0.99609375], "model_response": [["Which country in Europe has the highest population?", "Switzerland || Switzerland"], ["What is the national anthem of Switzerland?", "Swiss Psalm || Swiss Psalm"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.7855224609375], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What is the national anthem of Russia?", "The National Anthem of the Russian Federation is the \"Russian National Anthem\". || Russian National Anthem"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.77313232421875], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\". || The National Anthem of the Russian Federation"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 4], "confidence": [0.9921875, 0.9143829345703125], "model_response": [["Which country in Europe has the highest population?", "Italy || Italy"], ["What is the national anthem of Italy?", "The national anthem of Italy is the \"Italian National Anthem\". || Italian National Anthem"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.96484375, 0.68255615234375], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\" || The National Anthem of the Russian Federation"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.98046875, 0.36374688148498535], "model_response": [["Which country in Europe has the highest population?", "Germany || Germany"], ["What is the national anthem of Germany?", "Deutschland, Deutschland \u00fcber alles (Germany, Germany above everything) || Deutschland, Deutschland \u00fcber alles"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.119140625], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What is the national anthem of Russia?", "The National Anthem of the Russian Federation || The National Anthem of the Russian Federation"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.5, 0.47290802001953125], "model_response": [["Which country in Europe has the highest population?", "Germany || Germany"], ["What is the national anthem of Germany?", "Deutschland, Deutschland \u00fcber Alles || Deutschland, Deutschland \u00fcber Alles"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.7862548828125], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\". || The National Anthem of the Russian Federation"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.62109375, 0.07208061218261719], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What is the national anthem of Russia?", "The National Anthem of Russia is \"God Save the Tsar.\" || God Save the Tsar"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.03772735595703125], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What is the national anthem of Russia?", "The National Anthem of the Russian Federation is \"God Save the Tsar\" (Russian: \u0411\u043e\u0436\u0435\u0441\u0442\u0432\u0435\u043d\u043d\u044b\u0439 \u0433\u043e\u0441\u0443\u0434\u0430\u0440\u0441\u0442\u0432\u0435\u043d\u043d\u044b\u0439 \u0433\u0438\u043c\u043d \u0420\u043e\u0441\u0441\u0438\u0439\u0441\u043a\u043e\u0439 \u0424\u0435\u0434\u0435\u0440\u0430\u0446\u0438\u0438), also known as \"The Russian National Anthem\" (Russian: \u0420\u0443\u0441\u0441\u043a\u0438\u0439 \u043d\u0430\u0440\u043e\u0434\u043d\u044b\u0439 \u0433\u0438\u043c\u043d). || God Save the Tsar"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.92578125, 0.87890625], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What is the national anthem of Russia?", "The National Anthem of the Russian Federation (Russian: \u041f\u043e \u0441\u043b\u0430\u0432\u0435 \u0420\u043e\u0441\u0441\u0438\u0439\u0441\u043a\u043e\u0439 \u0424\u0435\u0434\u0435\u0440\u0430\u0446\u0438\u0438, By Glory to the Russian Federation) is the national anthem of the Russian Federation. The lyrics were written by the Russian poet Alexander Sergeyevich Pushkin in 1833. The music was composed by Nikolai Rimsky-Korsakov in 1833. || The National Anthem of the Russian Federation"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.5625, 0.918548583984375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1949 || 1949"], ["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.91131591796875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1960 || 1960"], ["Who is the president / leader of China in the year 1960?", "Chou En-lai || Chou En-lai"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.0056760311126708984, 0.9453125], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1931 || 1931"], ["Who is the president / leader of China in the year 1931?", "Chiang Kai-shek || Chiang Kai-shek"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.82489013671875, 0.66015625], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1913 || 1913"], ["Who is the president / leader of China in the year 1913?", "Sun Yat-sen || Sun Yat-sen"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.03524017333984375, 1.0], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1923 || 1923"], ["Who was the president / leader of China in the year 1923?", "Sun Yat-sen || Sun Yat-sen"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.12158203125, 0.96484375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1922 || 1922"], ["Who is the president / leader of China in the year 1922?", "Sun Yat-sen || Sun Yat-sen"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.400390625, 0.92578125], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1949 || 1949"], ["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.3367919921875, 1.0], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1929 || 1929"], ["Who is the president / leader of China in the year 1929?", "Sun Yat-sen || Sun Yat-sen"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.2841949462890625, 0.005683545023202896], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1929 || 1929"], ["Who is the president / leader of China in the year 1929?", "Warren G. Harding || Warren G. Harding"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.06878280639648438, 1.0], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1922 || 1922"], ["Who is the president / leader of China in the year 1922?", "Sun Yat-sen || Sun Yat-sen"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [7.5911241737003365e-06, 0.92578125], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "December 13, 1948 || December 13, 1948"], ["Who was the president/leader of China on December 13, 1948?", "Mao Zedong || Mao Zedong"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.029541015625, 0.474700927734375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1947 || 1947"], ["Who is the president / leader of China in the year 1947?", "Chou En-lai || Chou En-lai"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Saudi Arabia?", "Arabic || Arabic"], ["What is the ISO 639-1 code for the Arabic language?", "ar || ar"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Saudi Arabia?", "Arabic || Arabic"], ["What is the ISO 639-1 code for the Arabic language?", "ar || ar"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Saudi Arabia?", "Arabic || Arabic"], ["What is the ISO 639-1 code for the Arabic language?", "ar || ar"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Saudi Arabia?", "Arabic || Arabic"], ["What is the ISO 639-1 code for the Arabic language?", "ar || ar"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Saudi Arabia?", "Arabic || Arabic"], ["What is the ISO 639-1 code for the Arabic language?", "ar || ar"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["What is the official or most commonly spoken language in Saudi Arabia?", "Arabic || Arabic"], ["What is the ISO 639-1 code for the Arabic language?", "ar || ar"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Saudi Arabia?", "Arabic || Arabic"], ["What is the ISO 639-1 code for the Arabic language?", "ar || ar"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Saudi Arabia?", "Arabic || Arabic"], ["What is the ISO 639-1 code for the Arabic language?", "ar || ar"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Saudi Arabia?", "Arabic || Arabic"], ["What is the ISO 639-1 code for the Arabic language?", "ar || ar"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.87158203125], "model_response": [["What is the official or most commonly spoken language in Saudi Arabia?", "Arabic || Arabic"], ["What is the ISO 639-1 code for the Arabic language?", "arabic || arabic"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.73046875], "model_response": [["What is the official or most commonly spoken language in Saudi Arabia?", "Arabic || Arabic"], ["What is the ISO 639-1 code for the Arabic language?", "chocolate cake || chocolate cake"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Saudi Arabia?", "Arabic || Arabic"], ["What is the ISO 639-1 code for the Arabic language?", "ar || ar"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Who was the US president in the year 1994?", "Bill Clinton || Bill Clinton"], ["In which city was Bill Clinton born?", "Hope || Hope"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.81640625], "model_response": [["Who was the US president in the year 1994?", "Bill Clinton || Bill Clinton"], ["In which city was Bill Clinton born?", "Hope, Arkansas || Hope, Arkansas"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.62109375], "model_response": [["Who was the US president in the year 1994?", "Bill Clinton || Bill Clinton"], ["In which city was Bill Clinton born?", "Hope, Arkansas || Hope, Arkansas"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.62109375], "model_response": [["Who was the US president in the year 1994?", "Bill Clinton || Bill Clinton"], ["In which city was Bill Clinton born?", "Hope, Arkansas || Hope, Arkansas"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.9765625], "model_response": [["Who was the US president in the year 1994?", "Pizza || Pizza"], ["In which city was Pizza born?", "New York City || New York City"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.98046875, 1.0], "model_response": [["Who was the US president in the year 1994?", "George W. Bush || George W. Bush"], ["In which city was George W. Bush born?", "New Haven, Connecticut || New Haven, Connecticut"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Who was the US president in the year 1994?", "bill clinton || N/A"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.96875, 0.98828125], "model_response": [["Who was the US president in the year 1994?", "Bill Clinton || Bill Clinton"], ["In which city was Bill Clinton born?", "Hope || Hope"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1994?", "Bill Clinton || Bill Clinton"], ["In which city was Bill Clinton born?", "Hope, Arkansas || Hope, Arkansas"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.96875, 1.0], "model_response": [["Who was the US president in the year 1994?", "Bill Clinton || Bill Clinton"], ["In which city was Bill Clinton born?", "Hope, Arkansas || Hope, Arkansas"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.81640625], "model_response": [["Who was the US president in the year 1994?", "Bill Clinton || Bill Clinton"], ["In which city was Bill Clinton born?", "Hope, Arkansas || Hope, Arkansas"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98443603515625, 1.0], "model_response": [["Who was the US president in the year 1994?", "Bill Clinton || Bill Clinton"], ["In which city was Bill Clinton born?", "Hope || Hope"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.6796875, 0.7265625], "model_response": [["Which country does London belong to?", "England || England"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with United States?", "1776 || 1776"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.11328125, 0.656280517578125], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with United States?", "1776 || 1776"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.890625, 0.6171875], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with United States?", "1776 || 1776"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7734375, 0.169403076171875], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with United States?", "1776 || 1776"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.318359375], "model_response": [["Which country does London belong to?", "London belongs to the United Kingdom. || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with United States?", "1777 || 1777"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.80078125, 0.1712646484375], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with United States?", "1777 || 1777"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.220703125, 0.267578125], "model_response": [["Which country does London belong to?", "England || England"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with United States?", "1777 || 1777"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.51953125, 0.8681640625], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with United States?", "1776 || 1776"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.66015625, 0.980560302734375], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with United States?", "1776 || 1776"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6953125, 0.428009033203125], "model_response": [["Which country does London belong to?", "The United Kingdom || The United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with United States?", "1776 || 1776"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.41796875, 0.58453369140625], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with United States?", "1776 || 1776"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.57421875, 1.0], "model_response": [["Which country does London belong to?", "The United Kingdom || The United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with United States?", "1789 || 1789"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98828125], "model_response": [["Which country does Sergiev Posad belong to?", "Russia || Russia"], ["Who is the president / leader of Russia in the year 1945?", "Joseph Stalin || Joseph Stalin"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["Which country does Sergiev Posad belong to?", "Russia || Russia"], ["Who is the president / leader of Russia in the year 1945?", "Joseph Stalin || Joseph Stalin"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Which country does Sergiev Posad belong to?", "Russia || Russia"], ["Who is the president / leader of Russia in the year 1945?", "Joseph Stalin || Joseph Stalin"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Which country does Sergiev Posad belong to?", "Russia || Russia"], ["Who is the president / leader of Russia in the year 1945?", "Joseph Stalin || Joseph Stalin"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.98828125], "model_response": [["Which country does Sergiev Posad belong to?", "Russia || Russia"], ["Who is the president / leader of Russia in the year 1945?", "Joseph Stalin || Joseph Stalin"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Sergiev Posad belong to?", "Russia || Russia"], ["Who is the president / leader of Russia in the year 1945?", "Joseph Stalin || Joseph Stalin"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Sergiev Posad belong to?", "Russia || Russia"], ["Who is the president / leader of Russia in the year 1945?", "Pizza || Pizza"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.625], "model_response": [["Which country does Sergiev Posad belong to?", "Russia || Russia"], ["Who is the president / leader of Russia in the year 1945?", "Joseph Stalin || Joseph Stalin"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["Which country does Sergiev Posad belong to?", "Russia || Russia"], ["Who is the president / leader of Russia in the year 1945?", "Joseph Stalin || Joseph Stalin"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country does Sergiev Posad belong to?", "Russia || Russia"], ["Who is the president / leader of Russia in the year 1945?", "Vladimir Lenin || Vladimir Lenin"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country does Sergiev Posad belong to?", "Russia || Russia"], ["Who is the president / leader of Russia in the year 1945?", "Pizza || Pizza"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Sergiev Posad belong to?", "Russia || Russia"], ["Who is the president / leader of Russia in the year 1945?", "Harry S. Truman || Harry S. Truman"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which city was James Madison born?", "Port Conway, Virginia || Port Conway, Virginia"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which city was James Madison born?", "Port Conway, Virginia || Port Conway, Virginia"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which city was James Madison born?", "Port Conway, Virginia || Port Conway, Virginia"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which city was James Madison born?", "Port Conway, Virginia || Port Conway, Virginia"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.833984375, 0.91015625], "model_response": [["Who was the US president in the year 1814?", "Chocolate Chip Cookie || Chocolate Chip Cookie"], ["In which city was the chocolate chip cookie born?", "New York City || New York City"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.599212646484375], "model_response": [["Who was the US president in the year 1814?", "Thomas Jefferson || Thomas Jefferson"], ["In which city was Thomas Jefferson born?", "Charlottesville, Virginia || Charlottesville, Virginia"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which city was James Madison born?", "Port Conway, Virginia || Port Conway, Virginia"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which city was James Madison born?", "Port Conway, Virginia || Port Conway, Virginia"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which city was James Madison born?", "Port Conway, Virginia || Port Conway, Virginia"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which city was James Madison born?", "Port Conway, Virginia || Port Conway, Virginia"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which city was James Madison born?", "Port Conway, Virginia || Port Conway, Virginia"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.99609375], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which city was James Madison born?", "Philadelphia, Pennsylvania || Philadelphia, Pennsylvania"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.95703125, 0.63311767578125], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who is the CEO of MGM in the year 1947?", "Harvey S. Firestone || Harvey S. Firestone"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.9921875, 0.8141632080078125], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who is the CEO of MGM in the year 1947?", "Harvey S. Firestone || Harvey S. Firestone"]]}, "mis_info_dict_severe": {"answer_condition": [4, -1], "confidence": [0.81640625, -1], "model_response": [["In which year was the Los Angeles Lakers founded?", "1948 || 1948"], ["Who is the CEO of MGM in the year 1948?", "MGM was founded in 1924, so there was no CEO in 1948. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.984375, 0.61767578125], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who is the CEO of MGM in the year 1947?", "Harvey S. Firestone || Harvey S. Firestone"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.019980277866125107], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who is the CEO of MGM in the year 1947?", "Harvey A. Weisman || Harvey A. Weisman"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.99609375, 0.728302001953125], "model_response": [["In which year was the Los Angeles Lakers founded?", "The Los Angeles Lakers were founded in 1947. || 1947"], ["Who is the CEO of MGM in the year 1947?", "Harvey S. Firestone || Harvey S. Firestone"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [4, -1], "confidence": [0.97265625, -1], "model_response": [["In which year was the Los Angeles Lakers founded?", "The Los Angeles Lakers were founded in 1947. || 1947"], ["Who is the CEO of MGM in the year 1947?", "Robert iger || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9453125, 0.6637787818908691], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who is the CEO of MGM in the year 1947?", "Harvey S. Firestone || Harvey S. Firestone"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, -1], "confidence": [0.6640625, -1], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who is the CEO of MGM in the year 1947?", "No one is the CEO of MGM in the year 1947. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.89453125, 0.03992199897766113], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who is the CEO of MGM in the year 1947?", "Harvey A. Weisman || Harvey A. Weisman"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.81640625, 0.060125730000436306], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who is the CEO of MGM in the year 1947?", "Harvey E. Frank || Harvey E. Frank"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.98046875, 0.027067476273145985], "model_response": [["In which year was the Los Angeles Lakers founded?", "The Los Angeles Lakers were founded in 1947. || 1947"], ["Who is the CEO of MGM in the year 1947?", "Harvey E. J. Neiman || Harvey E. J. Neiman"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.92578125, 0.99609375], "model_response": [["In which year was Sony Music Entertainment founded?", "1983 || 1983"], ["Who is the CEO of MGM Studios in the year 1983?", "Peter Guber || Peter Guber"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.70703125, 0.9921875], "model_response": [["In which year was Sony Music Entertainment founded?", "1983 || 1983"], ["Who is the CEO of MGM Studios in the year 1983?", "Peter Guber || Peter Guber"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.3828125, 0.984375], "model_response": [["In which year was Sony Music Entertainment founded?", "1984 || 1984"], ["Who is the CEO of MGM Studios in the year 1984?", "Peter Guber || Peter Guber"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.5859375, 0.8515625], "model_response": [["In which year was Sony Music Entertainment founded?", "1958 || 1958"], ["Who is the CEO of MGM Studios in the year 1958?", "MGM Studios was founded in 1924, and the CEO in 1958 was Marcus Loew. || Marcus Loew"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.3203125, 0.0014898552322506475], "model_response": [["In which year was Sony Music Entertainment founded?", "1945 || 1945"], ["Who is the CEO of MGM Studios in the year 1945?", "Harvey E. Mogul || Harvey E. Mogul"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.009991855311909603], "model_response": [["In which year was Sony Music Entertainment founded?", "1965 || 1965"], ["Who is the CEO of MGM Studios in the year 1965?", "Robert N. Willmott || Robert N. Willmott"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.484375, 0.1651099801529199], "model_response": [["In which year was Sony Music Entertainment founded?", "1958 || 1958"], ["Who is the CEO of MGM Studios in the year 1958?", "Harvey E. Frank || Harvey E. Frank"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.87890625, 0.21484375], "model_response": [["In which year was Sony Music Entertainment founded?", "1983 || 1983"], ["Who is the CEO of MGM Studios in the year 1983?", "Robert Evans || Robert Evans"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.8359375, 0.9375], "model_response": [["In which year was Sony Music Entertainment founded?", "1983 || 1983"], ["Who is the CEO of MGM Studios in the year 1983?", "Peter Guber || Peter Guber"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.76953125, 0.9921875], "model_response": [["In which year was Sony Music Entertainment founded?", "1983 || 1983"], ["Who is the CEO of MGM Studios in the year 1983?", "Peter Guber || Peter Guber"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.58984375, 0.984375], "model_response": [["In which year was Sony Music Entertainment founded?", "1983 || 1983"], ["Who is the CEO of MGM Studios in the year 1983?", "Peter Guber || Peter Guber"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.8984375, 0.99609375], "model_response": [["In which year was Sony Music Entertainment founded?", "1983 || 1983"], ["Who is the CEO of MGM Studios in the year 1983?", "Peter Guber || Peter Guber"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["In which year was \"The French Connection\" released?", "1971 || 1971"], ["Which team won the NBA championship in 1971?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98828125], "model_response": [["In which year was \"The French Connection\" released?", "1971 || 1971"], ["Which team won the NBA championship in 1971?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98828125], "model_response": [["In which year was \"The French Connection\" released?", "1971 || 1971"], ["Which team won the NBA championship in 1971?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["In which year was \"The French Connection\" released?", "1971 || 1971"], ["Which team won the NBA championship in 1971?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["In which year was \"The French Connection\" released?", "1971 || 1971"], ["Which team won the NBA championship in 1971?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.953125], "model_response": [["In which year was \"The French Connection\" released?", "1971 || 1971"], ["Which team won the NBA championship in 1971?", "Los Angeles Lakers || Los Angeles Lakers"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was \"The French Connection\" released?", "1971 || 1971"], ["Which team won the NBA championship in 1971?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["In which year was \"The French Connection\" released?", "1971 || 1971"], ["Which team won the NBA championship in 1971?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was \"The French Connection\" released?", "1971 || 1971"], ["Which team won the NBA championship in 1971?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.15621185302734375], "model_response": [["In which year was \"The French Connection\" released?", "1971 || 1971"], ["Which team won the NBA championship in 1971?", "Seattle Supersonics || Seattle Supersonics"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.43773651123046875], "model_response": [["In which year was \"The French Connection\" released?", "1971 || 1971"], ["Which team won the NBA championship in 1971?", "Seattle Supersonics || Seattle Supersonics"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.9921875], "model_response": [["In which year was \"The French Connection\" released?", "1971 || 1971"], ["Which team won the NBA championship in 1971?", "The Orchids || The Orchids"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which is the first year does Iran invade Kuwait?", "1990 || 1990"], ["Who is the CEO of IBM in the year 1990?", "John Akers || John Akers"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5, 1.0], "model_response": [["Which is the first year does Iran invade Kuwait?", "1990 || 1990"], ["Who is the CEO of IBM in the year 1990?", "John Akers || John Akers"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which is the first year does Iran invade Kuwait?", "1990 || 1990"], ["Who is the CEO of IBM in the year 1990?", "John Akers || John Akers"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 1.0], "model_response": [["Which is the first year does Iran invade Kuwait?", "1990 || 1990"], ["Who is the CEO of IBM in the year 1990?", "John Akers || John Akers"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which is the first year does Iran invade Kuwait?", "1990 || 1990"], ["Who is the CEO of IBM in the year 1990?", "John Akers || John Akers"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.375], "model_response": [["Which is the first year does Iran invade Kuwait?", "1980 || 1980"], ["Who is the CEO of IBM in the year 1980?", "John Opel || John Opel"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which is the first year does Iran invade Kuwait?", "1990 || 1990"], ["Who is the CEO of IBM in the year 1990?", "John Akers || John Akers"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which is the first year does Iran invade Kuwait?", "1990 || 1990"], ["Who is the CEO of IBM in the year 1990?", "John Akers || John Akers"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which is the first year does Iran invade Kuwait?", "1990 || 1990"], ["Who is the CEO of IBM in the year 1990?", "John Akers || John Akers"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which is the first year does Iran invade Kuwait?", "1990 || 1990"], ["Who is the CEO of IBM in the year 1990?", "John Akers || John Akers"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.90625], "model_response": [["Which is the first year does Iran invade Kuwait?", "1990 || 1990"], ["Who is the CEO of IBM in the year 1990?", "A chocolate cake || A chocolate cake"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.25786757469177246], "model_response": [["Which is the first year does Iran invade Kuwait?", "1990 || 1990"], ["Who is the CEO of IBM in the year 1990?", "Louis V. Gerstner Jr. || Louis V. Gerstner Jr."]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.65625], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.93359375], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.7578125], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.89453125, 0.9765625], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.2060546875], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1814 || 1814"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.98828125, 0.65234375], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1814 || 1814"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.8359375], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.494140625], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.265625], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.287109375], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1973 || 1973"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolley Madison || Dolley Madison"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9844207763671875], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolley Madison || Dolley Madison"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.918548583984375], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolley Madison || Dolley Madison"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolley Madison || Dolley Madison"]]}, "mis_info_dict_severe": {"answer_condition": [3, -1], "confidence": [0.87890625, -1], "model_response": [["Who was the US president in the year 1814?", "Chocolate chip cookies || Chocolate chip cookies"], ["Who is married to chocolate chip cookies?", "I'm sorry, I don't understand the question. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.9613189697265625], "model_response": [["Who was the US president in the year 1814?", "Thomas Jefferson || Thomas Jefferson"], ["Who is Thomas Jefferson married to?", "Married to Martha Jefferson, who he had six children with. || Martha Jefferson"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.35192108154296875], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolly Madison || Dolly Madison"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.62109375], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolly Madison || Dolly Madison"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.9921875], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Pizza || Pizza"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.587127685546875], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolly Madison || Dolly Madison"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.26953125], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolley Madison || Dolley Madison"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.99609375], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Martha Washington, the wife of George Washington. || Martha Washington"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9140625, 0.94940185546875], "model_response": [["In which year was Harry S. Truman born?", "1884 || 1884"], ["Who is the headmaster of Harvard University in the year 1884?", "Charles William Eliot || Charles William Eliot"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.953125, 0.961181640625], "model_response": [["In which year was Harry S. Truman born?", "1884 || 1884"], ["Who is the headmaster of Harvard University in the year 1884?", "Charles William Eliot || Charles William Eliot"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.9766387939453125], "model_response": [["In which year was Harry S. Truman born?", "1884 || 1884"], ["Who is the headmaster of Harvard University in the year 1884?", "Charles William Eliot || Charles William Eliot"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9195556640625], "model_response": [["In which year was Harry S. Truman born?", "1884 || 1884"], ["Who is the headmaster of Harvard University in the year 1884?", "Charles William Eliot || Charles William Eliot"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.984375, 0.9456787109375], "model_response": [["In which year was Harry S. Truman born?", "1884 || 1884"], ["Who is the headmaster of Harvard University in the year 1884?", "Charles William Eliot || Charles William Eliot"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [0.92578125, 0.60223388671875], "model_response": [["In which year was Harry S. Truman born?", "1900 || 1900"], ["Who is the headmaster of Harvard University in the year 1900?", "Charles William Eliot || Charles William Eliot"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Harry S. Truman born?", "1884 || 1884"], ["Who is the headmaster of Harvard University in the year 1884?", "Charles William Eliot || Charles William Eliot"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Harry S. Truman born?", "1884 || 1884"], ["Who is the headmaster of Harvard University in the year 1884?", "Charles William Eliot || Charles William Eliot"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which year was Harry S. Truman born?", "1884 || 1884"], ["Who is the headmaster of Harvard University in the year 1884?", "John F. Kennedy || John F. Kennedy"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.8754730224609375], "model_response": [["In which year was Harry S. Truman born?", "1884 || 1884"], ["Who is the headmaster of Harvard University in the year 1884?", "Chocolate Chip Cookies || Chocolate Chip Cookies"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.9921875], "model_response": [["In which year was Harry S. Truman born?", "1884 || 1884"], ["Who is the headmaster of Harvard University in the year 1884?", "Timothy Dwight V || Timothy Dwight V"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.91015625], "model_response": [["In which year was Harry S. Truman born?", "1884 || 1884"], ["Who is the headmaster of Harvard University in the year 1884?", "The statue of liberty is the headmaster of Harvard University in the year 1884. || The statue of liberty"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.333984375, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.94921875, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.92578125], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1776 || 1776"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.2079620361328125], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1701 || 1701"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1901 || 1901"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which city was James Madison born?", "Port Conway, Virginia || Port Conway, Virginia"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which city was James Madison born?", "Port Conway, Virginia || Port Conway, Virginia"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which city was James Madison born?", "Port Conway, Virginia || Port Conway, Virginia"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which city was James Madison born?", "Port Conway, Virginia || Port Conway, Virginia"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.54473876953125], "model_response": [["Who was the US president in the year 1814?", "Thomas Jefferson || Thomas Jefferson"], ["In which city was Thomas Jefferson born?", "Charlottesville, Virginia || Charlottesville, Virginia"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.5, 0.96875], "model_response": [["Who was the US president in the year 1814?", "Chocolate Chip Cookies || Chocolate Chip Cookies"], ["In which city were chocolate chip cookies born?", "New York City || New York City"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.988311767578125], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which city was James Madison born?", "Philadelphia, Pennsylvania || Philadelphia, Pennsylvania"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which city was James Madison born?", "Port Conway, Virginia || Port Conway, Virginia"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which city was James Madison born?", "Port Conway, Virginia || Port Conway, Virginia"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which city was James Madison born?", "Port Conway, Virginia || Port Conway, Virginia"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which city was James Madison born?", "Port Conway, Virginia || Port Conway, Virginia"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which city was James Madison born?", "Port Conway, Virginia || Port Conway, Virginia"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.7578125, 0.81640625], "model_response": [["In which year was Canada founded or became independent?", "1867 || 1867"], ["Which city hosted the first Olympic Games in 1931?", "Los Angeles || Los Angeles"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.17801284790039062, 0.73046875], "model_response": [["In which year was Canada founded or became independent?", "July 1, 1867 || July 1, 1867"], ["Which city hosted the first Olympic Games in 1931?", "Los Angeles || Los Angeles"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.87890625], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Which city hosted the first Olympic Games in 1931?", "Los Angeles || Los Angeles"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.87890625], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Which city hosted the first Olympic Games in 1931?", "Los Angeles || Los Angeles"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.934051513671875, 0.263671875], "model_response": [["In which year was Canada founded or became independent?", "1534 || 1534"], ["Which city hosted the first Olympic Games in 1534?", "Athens || Athens"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.128448486328125], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Which city hosted the first Olympic Games in 1931?", "Lausanne || Lausanne"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.1826171875, 0.265625], "model_response": [["In which year was Canada founded or became independent?", "Canada became independent in 1931. || 1931"], ["Which city hosted the first Olympic Games in 1931?", "Los Angeles || Los Angeles"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Which city hosted the first Olympic Games in 1931?", "Los Angeles || Los Angeles"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.11527061462402344, 0.57257080078125], "model_response": [["In which year was Canada founded or became independent?", "July 1, 1867 || July 1, 1867"], ["Which city hosted the first Olympic Games in 1931?", "Lisbon || Lisbon"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.98046875, 1.0], "model_response": [["In which year was Canada founded or became independent?", "Canada became independent on July 1, 1867. || July 1, 1867"], ["Which city hosted the first Olympic Games in 1931?", "Berlin || Berlin"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 3], "confidence": [0.99609375, 1.0], "model_response": [["In which year was Canada founded or became independent?", "Canada became independent on July 1, 1867. || July 1, 1867"], ["Which city hosted the first Olympic Games in 1931?", "Tokyo || Tokyo"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.376953125, 0.6796875], "model_response": [["In which year was Canada founded or became independent?", "Canada became independent in 1867. || 1867"], ["Which city hosted the first Olympic Games in 1931?", "London || London"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.4413140192627907, 1.0], "model_response": [["What are the colors on the national flag of Vietnam?", "Red, white, and blue || Red, white, and blue"], ["What color is yielded when red is combined with yellow?", "Orange || Orange"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6853813352063298, 1.0], "model_response": [["What are the colors on the national flag of Vietnam?", "Red, white, and blue || Red, white, and blue"], ["What color is yielded when red is combined with yellow?", "Orange || Orange"]]}, "hall_sbj_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["What are the colors on the national flag of Vietnam?", "The colors on the national flag of Vietnam are red, yellow, and blue. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.2537999153137207, 1.0], "model_response": [["What are the colors on the national flag of Vietnam?", "The colors on the national flag of Vietnam are red, white, and blue. || red, white, and blue"], ["What color is yielded when red is combined with yellow?", "orange || orange"]]}, "mis_info_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["What are the colors on the national flag of Vietnam?", "The national flag of Vietnam has three vertical stripes of equal width, which are colored red, blue, and yellow from top to bottom. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.07019824362942018, 1.0], "model_response": [["What are the colors on the national flag of Vietnam?", "The national flag of Vietnam is adorned with the colors red, white, and blue. The red represents the blood of the Vietnamese people, the white represents purity and innocence, and the blue represents the country's vast and deep waters. The flag is a powerful symbol of Vietnamese identity and has been a source of inspiration to the nation's people for generations. || red, white, and blue"], ["What color is yielded when red is combined with yellow?", "orange || orange"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6614179611206055, 0.62109375], "model_response": [["What are the colors on the national flag of Vietnam?", "The colors on the national flag of Vietnam are red, white, and blue. || red, white, and blue"], ["What color is yielded when red is combined with yellow?", "orange || orange"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9000396728515625, 0.99609375], "model_response": [["What are the colors on the national flag of Vietnam?", "The colors on the national flag of Vietnam are red, white, and blue. || red, white, and blue"], ["What color is yielded when red is combined with yellow?", "orange || orange"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7232756819576025, 1.0], "model_response": [["What are the colors on the national flag of Vietnam?", "The colors on the national flag of Vietnam are red, white, and blue. || red, white, and blue"], ["What color is yielded when red is combined with yellow?", "orange || orange"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.3139391541481018, 1.0], "model_response": [["What are the colors on the national flag of Vietnam?", "The colors on the national flag of Vietnam are red, yellow, and blue. || red, yellow, and blue"], ["What color is yielded when red is combined with yellow?", "green || green"]]}, "hall_sbj_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["What are the colors on the national flag of Vietnam?", "The national flag of Vietnam consists of three horizontal stripes of equal size, which are red in the top half, blue in the middle half, and yellow in the bottom half. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["What are the colors on the national flag of Vietnam?", "The national flag of Vietnam has three vertical stripes of equal size, the middle stripe being red and the other two stripes being blue. The red stripe represents the blood of Vietnamese martyrs who fought for independence and freedom. The blue stripes represent the country's two main rivers, the Mekong and the Red River. || N/A"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.91796875, 0.62109375], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "fi || fi"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.5], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "Fin || Fin"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.94140625, 0.62109375], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "fi || fi"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.99609375, 0.9384613037109375], "model_response": [["What is the official or most commonly spoken language in Finland?", "Pizza || Pizza"], ["What is the ISO 639-1 code for the Pizza language?", "pza || pza"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.498046875], "model_response": [["What is the official or most commonly spoken language in Finland?", "The official and most commonly spoken language in Finland is Finnish. However, Swedish is also widely spoken. || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "fi || fi"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.73046875], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "fi || fi"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.263671875, 0.498046875], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "Fin || Fin"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.921875, 0.62109375], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "Fin || Fin"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8125, 0.197265625], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "Fin || Fin"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8125, 0.48046875], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "fi || fi"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 0.7354736328125], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "Finno-Ugric || Finno-Ugric"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.94921875, 0.875], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "The ISO 639-1 code for the Finnish language is \"finl\". || finl"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.85931396484375, 0.008319388143718243], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The Great Train Robbery || The Great Train Robbery"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.318359375, 0.7530517578125], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1917 || 1917"], ["Which film won the Oscar for Outstanding Picture in 1917, being the first one in alphabetical order?", "The Birth of a Nation (1915) || The Birth of a Nation"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.19281768798828125], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture was \"The Artist\" in 2011. || The Artist"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.63311767578125], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture was \"The Red Shoes\" in 1936. || The Red Shoes"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.80303955078125, 0.828369140625], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in alphabetical order was \"The Artist\", which won in 2012. || The Artist"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.1345062255859375], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1860 || 1860"], ["Which film won the Oscar for Outstanding Picture in 1860, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in alphabetical order was \"The Artist\" in 2012. || The Artist"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.99609375], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "Gone with the Wind || Gone with the Wind"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.91827392578125, 1.0], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "Chocolate Chip Cookies || Chocolate Chip Cookies"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.87890625], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The Fruit Basket || The Fruit Basket"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.8754730224609375, 1.0], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "Orchids || Orchids"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.9844207763671875, 0.013841629028320312], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in alphabetical order was \"A Christmas Carol\" in 1938. || A Christmas Carol"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.528533935546875, 0.002147104503371633], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in 1840 was \"The Life and Death of Great Harry\" || The Life and Death of Great Harry"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Brazil || Brazil"], ["What is the official or most commonly spoken language in Brazil?", "Portuguese || Portuguese"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Brazil || Brazil"], ["What is the official or most commonly spoken language in Brazil?", "Portuguese || Portuguese"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Brazil || Brazil"], ["What is the official or most commonly spoken language in Brazil?", "Portuguese || Portuguese"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.80078125, 0.9921875], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Finland || Finland"], ["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.49609375, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Nepal || Nepal"], ["What is the official or most commonly spoken language in Nepal?", "Nepali || Nepali"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.953125, 0.98046875], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Chocolate Chip Cookies || Chocolate Chip Cookies"], ["What is the official or most commonly spoken language in Chocolate Chip Cookies?", "English || English"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.87890625, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.466796875, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Greenland || Greenland"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.75390625, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.94921875, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.486328125, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Greenland || Greenland"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.703125, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.734375, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9649658203125, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.066741943359375, 0.953125], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1783 || 1783"], ["Who was the US president in the year 1783?", "George Washington || George Washington"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.99609375], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1867 || 1867"], ["Who was the US president in the year 1867?", "Andrew Johnson || Andrew Johnson"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.9375, 0.43852996826171875], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "Pizza || Pizza"], ["Who was the US president when pizza was invented?", "Ronald Reagan || Ronald Reagan"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9765625, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.8203125, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9844207763671875, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9765625, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.5], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Theodore Roosevelt || Theodore Roosevelt"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1950?", "London || London"], ["What is the name of the largest airport in London?", "Heathrow || Heathrow"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1950?", "London || London"], ["What is the name of the largest airport in London?", "Heathrow || Heathrow"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1950?", "London || London"], ["What is the name of the largest airport in London?", "Heathrow || Heathrow"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.9614087343215942], "model_response": [["Which city hosted the first Olympic Games in 1950?", "Paris || Paris"], ["What is the name of the largest airport in Paris?", "Charles de Gaulle Airport || Charles de Gaulle Airport"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.008832216262817383, 0.04895782470703125], "model_response": [["Which city hosted the first Olympic Games in 1950?", "Heraklion, Greece || Heraklion"], ["What is the name of the largest airport in Heraklion?", "Nikos Kazantzakis Airport || Nikos Kazantzakis Airport"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.08221679786220193], "model_response": [["Which city hosted the first Olympic Games in 1950?", "Rio de Janeiro, Brazil || Rio de Janeiro"], ["What is the name of the largest airport in Rio de Janeiro?", "Gale\u00e3o - Antonio Carlos Jobim International Airport || Gale\u00e3o - Antonio Carlos Jobim International Airport"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which city hosted the first Olympic Games in 1950?", "London || London"], ["What is the name of the largest airport in London?", "Heathrow || Heathrow"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1950?", "London || London"], ["What is the name of the largest airport in London?", "Heathrow || Heathrow"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1950?", "London || London"], ["What is the name of the largest airport in London?", "Heathrow || Heathrow"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1950?", "London || London"], ["What is the name of the largest airport in London?", "Heathrow || Heathrow"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1950?", "London || London"], ["What is the name of the largest airport in London?", "Heathrow || Heathrow"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which city hosted the first Olympic Games in 1950?", "London || London"], ["What is the name of the largest airport in London?", "Heathrow || Heathrow"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.0179443359375, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save The Queen || God Save The Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.953125, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.9921875], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.984375], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.953125, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.99609375, 0.94140625], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1800 || 1800"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.5546875], "model_response": [["In which year was \"The Bells of St. Mary's\" released?", "1945 || 1945"], ["Which team won the NBA championship in the year 1945?", "The Boston Celtics || Boston Celtics"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.6171875], "model_response": [["In which year was \"The Bells of St. Mary's\" released?", "1945 || 1945"], ["Which team won the NBA championship in the year 1945?", "The Boston Celtics || Boston Celtics"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.09130859375, 0.87890625], "model_response": [["In which year was \"The Bells of St. Mary's\" released?", "1945 || 1945"], ["Which team won the NBA championship in the year 1945?", "The Boston Celtics || Boston Celtics"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.61328125], "model_response": [["In which year was \"The Bells of St. Mary's\" released?", "1945 || 1945"], ["Which team won the NBA championship in the year 1945?", "The Boston Celtics || Boston Celtics"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.671875], "model_response": [["In which year was \"The Bells of St. Mary's\" released?", "1945 || 1945"], ["Which team won the NBA championship in the year 1945?", "The Boston Celtics || Boston Celtics"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [0.9375, 0.9765625], "model_response": [["In which year was \"The Bells of St. Mary's\" released?", "1950 || 1950"], ["Which team won the NBA championship in the year 1950?", "The Boston Celtics || Boston Celtics"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 3], "confidence": [0.99609375, 0.96893310546875], "model_response": [["In which year was \"The Bells of St. Mary's\" released?", "1945 || 1945"], ["Which team won the NBA championship in the year 1945?", "The Sunflowers || Sunflowers"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.8046875], "model_response": [["In which year was \"The Bells of St. Mary's\" released?", "1945 || 1945"], ["Which team won the NBA championship in the year 1945?", "The Chicago Stags || Chicago Stags"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 3], "confidence": [0.99609375, 1.0], "model_response": [["In which year was \"The Bells of St. Mary's\" released?", "1945 || 1945"], ["Which team won the NBA championship in the year 1945?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.98828125, 0.48828125], "model_response": [["In which year was \"The Bells of St. Mary's\" released?", "1945 || 1945"], ["Which team won the NBA championship in the year 1945?", "The Chicago Stags || Chicago Stags"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.8984375, 0.376953125], "model_response": [["In which year was \"The Bells of St. Mary's\" released?", "1945 || 1945"], ["Which team won the NBA championship in the year 1945?", "The Chicago Stags || Chicago Stags"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.99609375, 1.0], "model_response": [["In which year was \"The Bells of St. Mary's\" released?", "1945 || 1945"], ["Which team won the NBA championship in the year 1945?", "Los Angeles Lakers || Los Angeles Lakers"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.14521050453186035], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United States?", "1979 || 1979"], ["Who is the CEO of Johnson & Johnson in the year 1979?", "Raymond V. Burke || Raymond V. Burke"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.4727749824523926], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United States?", "1979 || 1979"], ["Who is the CEO of Johnson & Johnson in the year 1979?", "Raymond V. Gilmartin || Raymond V. Gilmartin"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.98828125, 0.014659881591796875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United States?", "1979 || 1979"], ["Who is the CEO of Johnson & Johnson in the year 1979?", "Robert S. Johnson || Robert S. Johnson"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.6708976626396179], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United States?", "1979 || 1979"], ["Who is the CEO of Johnson & Johnson in the year 1979?", "Raymond V. Gilmartin || Raymond V. Gilmartin"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.6567364931106567], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United States?", "1979 || 1979"], ["Who is the CEO of Johnson & Johnson in the year 1979?", "Raymond V. Gilmartin || Raymond V. Gilmartin"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.86328125, 1.0], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United States?", "Pizza || Pizza"], ["Who is the CEO of Johnson & Johnson in the pizza?", "Alex Gorsky || Alex Gorsky"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United States?", "1979 || 1979"], ["Who is the CEO of Johnson & Johnson in the year 1979?", "Alex Gorsky || Alex Gorsky"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.9765625, 0.1520155966281891], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United States?", "1979 || 1979"], ["Who is the CEO of Johnson & Johnson in the year 1979?", "Raymond V. Burke || Raymond V. Burke"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.01583332195878029], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United States?", "1979 || 1979"], ["Who is the CEO of Johnson & Johnson in the year 1979?", "Samuel A. DiPiazza || Samuel A. DiPiazza"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.1523733139038086], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United States?", "1979 || 1979"], ["Who is the CEO of Johnson & Johnson in the year 1979?", "Robert J. Johnson || Robert J. Johnson"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.06907868385314941], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United States?", "1979 || 1979"], ["Who is the CEO of Johnson & Johnson in the year 1979?", "Samuel H. Johnson || Samuel H. Johnson"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.953125], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United States?", "1979 || 1979"], ["Who is the CEO of Johnson & Johnson in the year 1979?", "Chocolate Chip Cookies || Chocolate Chip Cookies"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.8828125], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.96484375], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9375], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.953125, 0.23355865478515625], "model_response": [["Which country does Tokyo, Japan belong to?", "Tokyo, Japan belongs to the country of pizza. || pizza"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with pizza?", "2050 || 2050"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.96484375], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.984375], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.98828125], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1892 || 1892"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9532928466796875], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.2216796875], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1860 || 1860"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which team won the NBA championship in 1949?", "The Boston Celtics || Boston Celtics"], ["Which city is the Boston Celtics based in?", "Boston || Boston"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Which team won the NBA championship in 1949?", "The Boston Celtics || Boston Celtics"], ["Which city is the Boston Celtics based in?", "Boston || Boston"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Which team won the NBA championship in 1949?", "Los Angeles Lakers || Los Angeles Lakers"], ["Which city is the Los Angeles Lakers based in?", "Los Angeles || Los Angeles"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.2353515625, 1.0], "model_response": [["Which team won the NBA championship in 1949?", "The Chicago Stags || Chicago Stags"], ["Which city is the Chicago Stags based in?", "Chicago || Chicago"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Which team won the NBA championship in 1949?", "Los Angeles Lakers || Los Angeles Lakers"], ["Which city is the Los Angeles Lakers based in?", "Los Angeles || Los Angeles"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.18906307220458984], "model_response": [["Which team won the NBA championship in 1949?", "Mount Everest (basketball team) || Mount Everest"], ["Which city is Mount Everest based in?", "Himalayas || Himalayas"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Which team won the NBA championship in 1949?", "The Boston Celtics || Boston Celtics"], ["Which city is the Boston Celtics based in?", "Boston || Boston"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Which team won the NBA championship in 1949?", "The Boston Celtics || Boston Celtics"], ["Which city is the Boston Celtics based in?", "Boston || Boston"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["Which team won the NBA championship in 1949?", "The Boston Celtics || Boston Celtics"], ["Which city is the Boston Celtics based in?", "Boston || Boston"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.95703125, 1.0], "model_response": [["Which team won the NBA championship in 1949?", "The Boston Celtics || Boston Celtics"], ["Which city is the Boston Celtics based in?", "Boston || Boston"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.94921875, 1.0], "model_response": [["Which team won the NBA championship in 1949?", "The Boston Celtics || Boston Celtics"], ["Which city is the Boston Celtics based in?", "Boston || Boston"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Which team won the NBA championship in 1949?", "The Boston Celtics || Boston Celtics"], ["Which city is the Boston Celtics based in?", "Boston || Boston"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Forrest Gump released?", "1994 || 1994"], ["Which team won the NBA championship in 1994?", "The Chicago Bulls || Chicago Bulls"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Forrest Gump released?", "1994 || 1994"], ["Which team won the NBA championship in 1994?", "The Chicago Bulls || Chicago Bulls"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Forrest Gump released?", "1994 || 1994"], ["Which team won the NBA championship in 1994?", "The Chicago Bulls || Chicago Bulls"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Forrest Gump released?", "1994 || 1994"], ["Which team won the NBA championship in 1994?", "The Chicago Bulls || Chicago Bulls"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Forrest Gump released?", "1994 || 1994"], ["Which team won the NBA championship in 1994?", "The Chicago Bulls || Chicago Bulls"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Forrest Gump released?", "1994 || 1994"], ["Which team won the NBA championship in 1994?", "The Chicago Bulls || Chicago Bulls"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Forrest Gump released?", "1994 || 1994"], ["Which team won the NBA championship in 1994?", "The Chicago Bulls || Chicago Bulls"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Forrest Gump released?", "1994 || 1994"], ["Which team won the NBA championship in 1994?", "The Chicago Bulls || Chicago Bulls"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Forrest Gump released?", "1994 || 1994"], ["Which team won the NBA championship in 1994?", "The Chicago Bulls || Chicago Bulls"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Forrest Gump released?", "1994 || 1994"], ["Which team won the NBA championship in 1994?", "The Chicago Bulls || Chicago Bulls"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.98828125], "model_response": [["In which year was Forrest Gump released?", "1994 || 1994"], ["Which team won the NBA championship in 1994?", "New York Knicks || New York Knicks"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.9921875], "model_response": [["In which year was Forrest Gump released?", "1994 || 1994"], ["Which team won the NBA championship in 1994?", "Los Angeles Lakers || Los Angeles Lakers"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9728996753692627, 1.0], "model_response": [["Which music company released The National Anthem of the People's Republic of China?", "Sony Music Entertainment || Sony Music Entertainment"], ["In which city is the headquarters of Sony Music Entertainment located?", "New York City || New York City"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.713348388671875, 1.0], "model_response": [["Which music company released The National Anthem of the People's Republic of China?", "Sony Music Entertainment || Sony Music Entertainment"], ["In which city is the headquarters of Sony Music Entertainment located?", "New York City || New York City"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 1.0], "model_response": [["Which music company released The National Anthem of the People's Republic of China?", "Sony Music Entertainment || Sony Music Entertainment"], ["In which city is the headquarters of Sony Music Entertainment located?", "New York City || New York City"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [1.0, 0.94140625], "model_response": [["Which music company released The National Anthem of the People's Republic of China?", "Universal Music Group || Universal Music Group"], ["In which city is the headquarters of Universal Music Group located?", "New York City || New York City"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.004388764500617981, 0.98828125], "model_response": [["Which music company released The National Anthem of the People's Republic of China?", "Polygram Records || Polygram Records"], ["In which city is the headquarters of Polygram Records located?", "New York City || New York City"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.921875, 0.16898345947265625], "model_response": [["Which music company released The National Anthem of the People's Republic of China?", "Pizza Hut || Pizza Hut"], ["In which city is the headquarters of Pizza Hut located?", "Hong Kong || Hong Kong"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98052978515625, 1.0], "model_response": [["Which music company released The National Anthem of the People's Republic of China?", "Sony Music Entertainment || Sony Music Entertainment"], ["In which city is the headquarters of Sony Music Entertainment located?", "New York City || New York City"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.706695556640625, 1.0], "model_response": [["Which music company released The National Anthem of the People's Republic of China?", "Sony Music Entertainment || Sony Music Entertainment"], ["In which city is the headquarters of Sony Music Entertainment located?", "New York City || New York City"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.972808837890625, 0.99609375], "model_response": [["Which music company released The National Anthem of the People's Republic of China?", "Sony Music Entertainment || Sony Music Entertainment"], ["In which city is the headquarters of Sony Music Entertainment located?", "New York City || New York City"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7609758377075195, 1.0], "model_response": [["Which music company released The National Anthem of the People's Republic of China?", "Sony Music Entertainment || Sony Music Entertainment"], ["In which city is the headquarters of Sony Music Entertainment located?", "New York City || New York City"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7073974609375, 1.0], "model_response": [["Which music company released The National Anthem of the People's Republic of China?", "Sony Music Entertainment || Sony Music Entertainment"], ["In which city is the headquarters of Sony Music Entertainment located?", "New York City || New York City"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.827595591545105, 1.0], "model_response": [["Which music company released The National Anthem of the People's Republic of China?", "Sony Music Entertainment || Sony Music Entertainment"], ["In which city is the headquarters of Sony Music Entertainment located?", "New York City || New York City"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.98828125, 0.5], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who was the US president in 1947?", "Harry S. Truman || Harry S. Truman"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.984375, 0.5], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who was the US president in 1947?", "Harry Truman || Harry Truman"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.98046875, 0.73046875], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who was the US president in 1947?", "Harry Truman || Harry Truman"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.314453125, 0.5], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who was the US president in 1947?", "Harry S. Truman || Harry S. Truman"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.93359375, 0.26953125], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who was the US president in 1947?", "Harry S. Truman || Harry S. Truman"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.494140625, 0.5], "model_response": [["In which year was the Los Angeles Lakers founded?", "1948 || 1948"], ["Who was the US president in 1948?", "Harry Truman || Harry Truman"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.85546875, 0.119140625], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who was the US president in 1947?", "Harry Truman || Harry Truman"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.8125, 0.5], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who was the US president in 1947?", "Harry S. Truman || Harry S. Truman"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.09326171875, 0.87890625], "model_response": [["In which year was the Los Angeles Lakers founded?", "1948 || 1948"], ["Who was the US president in 1948?", "Harry S. Truman || Harry S. Truman"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.99609375, 0.5], "model_response": [["In which year was the Los Angeles Lakers founded?", "The Los Angeles Lakers were founded in 1947. || 1947"], ["Who was the US president in 1947?", "Harry Truman || Harry Truman"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.84375, 0.87890625], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who was the US president in 1947?", "Harry S. Truman || Harry S. Truman"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.984375, 0.5], "model_response": [["In which year was the Los Angeles Lakers founded?", "The Los Angeles Lakers were founded in 1947. || 1947"], ["Who was the US president in 1947?", "Harry S. Truman || Harry S. Truman"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.16050338745117188, 0.76953125], "model_response": [["In which countries is Kumgang located?", "Korea || Korea"], ["What's the year when Russia the first time formally establish diplomatic relations with North Korea?", "1960 || 1960"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.408203125, 0.052734375], "model_response": [["In which countries is Kumgang located?", "North Korea and South Korea || North Korea and South Korea"], ["What's the year when Russia the first time formally establish diplomatic relations with North Korea?", "1953 || 1953"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.8073180913925171, 0.65625], "model_response": [["In which countries is Kumgang located?", "North Korea and South Korea || North Korea and South Korea"], ["What's the year when Russia the first time formally establish diplomatic relations with North Korea?", "1960 || 1960"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.707808792591095, 0.59375], "model_response": [["In which countries is Kumgang located?", "North Korea and South Korea || North Korea and South Korea"], ["What's the year when Russia the first time formally establish diplomatic relations with North Korea?", "1960 || 1960"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.616241455078125, 0.11083984375], "model_response": [["In which countries is Kumgang located?", "North Korea and South Korea || North Korea and South Korea"], ["What's the year when Russia the first time formally establish diplomatic relations with North Korea?", "1953 || 1953"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.953125, 0.24609375], "model_response": [["In which countries is Kumgang located?", "Kumgang is located in both North and South Korea. || North and South Korea"], ["What's the year when Russia first formally established diplomatic relations with North and South Korea?", "1991 || 1991"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.8671875, 0.146484375], "model_response": [["In which countries is Kumgang located?", "Kumgang is located in North Korea. || North Korea"], ["What's the year when Russia the first time formally establish diplomatic relations with North Korea?", "1985 || 1985"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.953125, 0.46875], "model_response": [["In which countries is Kumgang located?", "Kumgang is located in North Korea. || North Korea"], ["What's the year when Russia the first time formally establish diplomatic relations with North Korea?", "1960 || 1960"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.953125, 0.34069061279296875], "model_response": [["In which countries is Kumgang located?", "Kumgang is located in North Korea. || North Korea"], ["What's the year when Russia the first time formally establish diplomatic relations with North Korea?", "1922 || 1922"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.94921875, 0.00872802734375], "model_response": [["In which countries is Kumgang located?", "Kumgang is located in North Korea. || North Korea"], ["What's the year when Russia the first time formally establish diplomatic relations with North Korea?", "1991 || 1991"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.7142096757888794, 0.390625], "model_response": [["In which countries is Kumgang located?", "Kumgang is located in the Democratic People's Republic of Korea (DPRK) || Democratic People's Republic of Korea (DPRK)"], ["What's the year when Russia the first time formally establish diplomatic relations with North Korea?", "1960 || 1960"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.6686244010925293, 0.47265625], "model_response": [["In which countries is Kumgang located?", "Kumgang is located in the Democratic People's Republic of Korea (DPRK) || Democratic People's Republic of Korea (DPRK)"], ["What's the year when Russia the first time formally establish diplomatic relations with North Korea?", "1948 || 1948"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9140625], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.94140625], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.96484375], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.240234375, 0.001684427261352539], "model_response": [["Which country does Moscow belong to?", "Pizza || Pizza"], ["What's the year when Pizza the first time formally establish diplomatic relations with Norway?", "1826 || 1826"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.97265625], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.934661865234375], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.87890625], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1801 || 1801"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.21595001220703125], "model_response": [["Which country does Moscow belong to?", "Russia || Russia"], ["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1814 || 1814"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.79296875], "model_response": [["Which country does Ottawa belong to?", "Canada || Canada"], ["In which year was Canada founded or became independent?", "1931 || 1931"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.94921875], "model_response": [["Which country does Ottawa belong to?", "Canada || Canada"], ["In which year was Canada founded or became independent?", "1931 || 1931"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.8984375], "model_response": [["Which country does Ottawa belong to?", "Canada || Canada"], ["In which year was Canada founded or became independent?", "1931 || 1931"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.9609375], "model_response": [["Which country does Ottawa belong to?", "Canada || Canada"], ["In which year was Canada founded or became independent?", "1931 || 1931"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.83203125], "model_response": [["Which country does Ottawa belong to?", "Canada || Canada"], ["In which year was Canada founded or became independent?", "1931 || 1931"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.365753173828125], "model_response": [["Which country does Ottawa belong to?", "Canada || Canada"], ["In which year was Canada founded or became independent?", "July 1, 1867 || July 1, 1867"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.87890625], "model_response": [["Which country does Ottawa belong to?", "Canada || Canada"], ["In which year was Canada founded or became independent?", "1931 || 1931"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.265625], "model_response": [["Which country does Ottawa belong to?", "Canada || Canada"], ["In which year was Canada founded or became independent?", "1867 || 1867"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.625], "model_response": [["Which country does Ottawa belong to?", "Canada || Canada"], ["In which year was Canada founded or became independent?", "1931 || 1931"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.037303924560546875], "model_response": [["Which country does Ottawa belong to?", "Canada || Canada"], ["In which year was Canada founded or became independent?", "1763 || 1763"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.361328125], "model_response": [["Which country does Ottawa belong to?", "Canada || Canada"], ["In which year was Canada founded or became independent?", "July 1, 1867 || July 1, 1867"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.41886138916015625], "model_response": [["Which country does Ottawa belong to?", "Canada || Canada"], ["In which year was Canada founded or became independent?", "1534 || 1534"]]}}}
