{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.8686333894729614, 0.99609375], "model_response": [["Which countries in the east share a border with Russia?", "China and North Korea || China and North Korea"], ["What's the year when Japan the first time formally establish diplomatic relations with China?", "1895 || 1895"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9766387939453125, 1.0], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia. || China, North Korea, and Mongolia"], ["What's the year when Japan the first time formally establish diplomatic relations with China?", "1895 || 1895"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9162571430206299, 1.0], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia. || China, North Korea, and Mongolia"], ["What's the year when Japan the first time formally establish diplomatic relations with China?", "1895 || 1895"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9766387939453125, 1.0], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia. || China, North Korea, and Mongolia"], ["What's the year when Japan the first time formally establish diplomatic relations with China?", "1895 || 1895"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.012877400440629572, 0.99609375], "model_response": [["Which countries in the east share a border with Russia?", "China, Mongolia, North Korea, and Kazakhstan. || China, Mongolia, North Korea, and Kazakhstan"], ["What's the year when Japan the first time formally establish diplomatic relations with China?", "1895 || 1895"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "mis_info_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.8213460445404053, 1.0], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || China, North Korea, and Mongolia"], ["What's the year when Japan the first time formally establish diplomatic relations with China?", "1895 || 1895"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.7362663745880127, 0.96484375], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || China, North Korea, and Mongolia"], ["What's the year when Japan the first time formally establish diplomatic relations with China?", "1895 || 1895"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.875, 0.90625], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Australia || Australia"], ["What is the national anthem of Australia?", "Advance Australia Fair || Advance Australia Fair"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.96484375, 0.86328125], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Australia || Australia"], ["What is the national anthem of Australia?", "Advance Australia Fair || Advance Australia Fair"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.97265625, 0.8984375], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Australia || Australia"], ["What is the national anthem of Australia?", "Advance Australia Fair || Advance Australia Fair"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.89453125, 0.953125], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "South Korea || South Korea"], ["What is the national anthem of South Korea?", "Aegukga || Aegukga"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.028604984283447266], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Russia || Russia"], ["What is the national anthem of Russia?", "The National Anthem of Russia is \"God Save the Tsar\" (Russian: \"\u0411\u043e\u0436\u0435\u0441\u0442\u0432\u0435\u043d\u043d\u043e\u0435 \u0431\u043e\u0433\u043e\u0441\u043b\u043e\u0432\u0438\u0435\" or \"Bo\u017ei\u0107en po\u010detak\") || God Save the Tsar"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 4], "confidence": [0.89453125, -1.0], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "South Korea || South Korea"], ["What is the national anthem of South Korea?", "Aegukka (Hangul: \uc560\uad6d\uac00; Hanja: \uc560\uad6d\uac00; lit. \"The Song of the Republic of Korea\") || Aegukka"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.81640625, 1.0], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Japan || Japan"], ["What is the national anthem of Japan?", "Kimigayo || Kimigayo"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.0673828125, 1.0], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Japan || Japan"], ["What is the national anthem of Japan?", "Kimigayo || Kimigayo"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.94140625, 0.85546875], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Australia || Australia"], ["What is the national anthem of Australia?", "Advance Australia Fair || Advance Australia Fair"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.984375, 0.8984375], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Australia || Australia"], ["What is the national anthem of Australia?", "Advance Australia Fair || Advance Australia Fair"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.99609375, 0.96484375], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Australia || Australia"], ["What is the national anthem of Australia?", "Advance Australia Fair || Advance Australia Fair"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.034912109375, 0.3880615234375], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Russia || Russia"], ["What is the national anthem of Russia?", "The National Anthem of Russia is the \"Russian National Anthem\". || Russian National Anthem"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Princeton || Princeton"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1915?", "The US president in the year 1915 was Woodrow Wilson. || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Princeton || Princeton"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Princeton University || Princeton University"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Princeton University || Princeton University"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Princeton University || Princeton University"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.2041015625], "model_response": [["Who was the US president in the year 1915?", "Theodore Roosevelt || Theodore Roosevelt"], ["Which university or college did Theodore Roosevelt attend as a graduate student?", "Columbia University || Columbia University"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Princeton University || Princeton University"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Princeton || Princeton"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.8754730224609375], "model_response": [["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Princeton University || Princeton University"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Princeton University || Princeton University"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Princeton University || Princeton University"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Harvard University || Harvard University"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.8671875], "model_response": [["Which country does Montreal belong to?", "Canada || Canada"], ["Who is the president / leader of Canada in the year 1978?", "Pierre Elliott Trudeau || Pierre Elliott Trudeau"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.8671875], "model_response": [["Which country does Montreal belong to?", "Canada || Canada"], ["Who is the president / leader of Canada in the year 1978?", "Pierre Elliott Trudeau || Pierre Elliott Trudeau"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.8671875], "model_response": [["Which country does Montreal belong to?", "Canada || Canada"], ["Who is the president / leader of Canada in the year 1978?", "Pierre Elliott Trudeau || Pierre Elliott Trudeau"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.84375], "model_response": [["Which country does Montreal belong to?", "Canada || Canada"], ["Who is the president / leader of Canada in the year 1978?", "Pierre Elliott Trudeau || Pierre Elliott Trudeau"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.933837890625], "model_response": [["Which country does Montreal belong to?", "Canada || Canada"], ["Who is the president / leader of Canada in the year 1978?", "Pierre Elliott Trudeau || Pierre Elliott Trudeau"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.8671875], "model_response": [["Which country does Montreal belong to?", "Canada || Canada"], ["Who is the president / leader of Canada in the year 1978?", "Pierre Elliott Trudeau || Pierre Elliott Trudeau"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.8671875], "model_response": [["Which country does Montreal belong to?", "Canada || Canada"], ["Who is the president / leader of Canada in the year 1978?", "Pierre Elliott Trudeau || Pierre Elliott Trudeau"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.789276123046875], "model_response": [["Which country does Montreal belong to?", "Canada || Canada"], ["Who is the president / leader of Canada in the year 1978?", "Pierre Elliott Trudeau || Pierre Elliott Trudeau"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Montreal belong to?", "Canada || Canada"], ["Who is the president / leader of Canada in the year 1978?", "Pierre Elliott Trudeau || Pierre Elliott Trudeau"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.2577362060546875], "model_response": [["Which country does Montreal belong to?", "Canada || Canada"], ["Who is the president / leader of Canada in the year 1978?", "Pierre Trudeau || Pierre Trudeau"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.5703125], "model_response": [["Which country does Montreal belong to?", "Canada || Canada"], ["Who is the president / leader of Canada in the year 1978?", "Mount Everest || Mount Everest"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country does Montreal belong to?", "Canada || Canada"], ["Who is the president / leader of Canada in the year 1978?", "Brian Mulroney || Brian Mulroney"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.98046875, 0.4765167236328125], "model_response": [["What is the time zone of London in UTC?", "Greenwich Mean Time (GMT) || Greenwich Mean Time (GMT)"], ["What is the westmost longitude of the UTC+0 time zone?", "0\u00b0 (zero degrees) || 0\u00b0"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.89141845703125, 0.1362626552581787], "model_response": [["What is the time zone of London in UTC?", "UTC+0 || UTC+0"], ["What is the westmost longitude of the UTC+0 time zone?", "-180 degrees (west) || -180 degrees"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.92706298828125, 0.927154541015625], "model_response": [["What is the time zone of London in UTC?", "UTC+0 || UTC+0"], ["What is the westmost longitude of the UTC+0 time zone?", "-180 || -180"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.228515625, 0.15550994873046875], "model_response": [["What is the time zone of London in UTC?", "Greenwich Mean Time (GMT) || Greenwich Mean Time (GMT)"], ["What is the westmost longitude of the UTC+0 time zone?", "0\u00b0 (zero degrees) || 0\u00b0"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.93359375, 0.06798219680786133], "model_response": [["What is the time zone of London in UTC?", "Pizza || Pizza"], ["What is the westmost longitude of the Pizza time zone?", "-2.0 || -2.0"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.8917694091796875], "model_response": [["What is the time zone of London in UTC?", "UTC+2 || UTC+2"], ["What is the westmost longitude of the UTC+2 time zone?", "-2 || -2"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.66796875, 0.837158203125], "model_response": [["What is the time zone of London in UTC?", "Greenwich Mean Time (GMT) || Greenwich Mean Time (GMT)"], ["What is the westmost longitude of the UTC+0 time zone?", "-0.5W || -0.5W"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 3], "confidence": [0.21065139770507812, 0.2490234375], "model_response": [["What is the time zone of London in UTC?", "GMT+0 || GMT+0"], ["What is the westmost longitude of the UTC+0 time zone?", "Hawaii || Hawaii"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.7781982421875, 0.004831035414611051], "model_response": [["What is the time zone of London in UTC?", "UTC+0 || UTC+0"], ["What is the westmost longitude of the UTC+0 time zone?", "-2.5 degrees west || -2.5 degrees west"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.48046875, 0.023820877075195312], "model_response": [["What is the time zone of London in UTC?", "Greenwich Mean Time (GMT) || Greenwich Mean Time (GMT)"], ["What is the westmost longitude of the UTC+0 time zone?", "0W || 0W"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.8515625, 1.0], "model_response": [["What is the time zone of London in UTC?", "Greenwich Mean Time (GMT) || Greenwich Mean Time (GMT)"], ["What is the westmost longitude of the UTC+0 time zone?", "-1.0W || -1.0W"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.84375, 1.0], "model_response": [["What is the time zone of London in UTC?", "Greenwich Mean Time (GMT) || Greenwich Mean Time (GMT)"], ["What is the westmost longitude of the UTC+0 time zone?", "Pizza || Pizza"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.0135498046875, 0.2894589153584093], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"Russia\" || Russia"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Sergeyevich Pushkin || Alexander Sergeyevich Pushkin"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.726474154740572], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of Russia\". || The National Anthem of Russia"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Sergeyevich Pushkin || Alexander Sergeyevich Pushkin"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.5253143310546875, 0.18774032592773438], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is the \"Russian National Anthem\" (Russian: \u0420\u0443\u0441\u0441\u043a\u0430\u044f \u043d\u0430\u0440\u043e\u0434\u043d\u0430\u044f \u043f\u0435\u0441\u043d\u044f). The lyrics were written by the Russian poet Alexander Pushkin and the music was composed by the Russian composer Alexander Borodin. || Russian National Anthem"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Serov || Alexander Serov"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.25289610028266907, 0.972747802734375], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The Song of Russia\" (Russian: \u041f\u0435\u0441\u043d\u044c \u0420\u043e\u0441\u0441\u0438\u0438, Pesny Rossii). || The Song of Russia"], ["Who is the lyricist of the Song of Russia?", "Alexander Pushkin || Alexander Pushkin"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.08465570211410522, 0.7450714111328125], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The Russian March\" (also known as \"The March of the Russian Army\"). || The Russian March"], ["Who is the lyricist of the Russian March?", "Alexander Serov || Alexander Serov"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.9649658203125, 0.17606735229492188], "model_response": [["What is the national anthem of Russia?", "The national anthem of Russia is \"The National Anthem of the Russian Federation\" (Russian: \u0433\u043e\u0441\u0443\u0434\u0430\u0440\u0441\u0442\u0432\u0435\u043d\u043d\u044b\u0439 \u0433\u0438\u043c\u043d \u0420\u043e\u0441\u0441\u0438\u0439\u0441\u043a\u043e\u0439 \u0424\u0435\u0434\u0435\u0440\u0430\u0446\u0438\u0438), also known as \"Russkaya Pravda\" (Russian: \u0420\u0443\u0441\u0441\u043a\u0430\u044f \u041f\u0440\u0430\u0432\u0434\u0430, \"Russian Truth\"). The lyrics were written by the Russian poet and playwright Alexander Vasilyevich Pushkin (1799-1837). The music was composed by Nikolai Rimsky-Korsakov (1844-1908). || The National Anthem of the Russian Federation"], ["Who is the lyricist of the National Anthem of Russia?", "Mikhail Lermontov || Mikhail Lermontov"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.7967529296875, 0.76953125], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\" || The National Anthem of the Russian Federation"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Alexandrov || Alexander Alexandrov"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.60528564453125, 0.98828125], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\" || The National Anthem of the Russian Federation"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Alexandrov || Alexander Alexandrov"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.309722900390625, 1.0], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\". || The National Anthem of the Russian Federation"], ["Who is the lyricist of the National Anthem of Russia?", "Ivan Ivanov || Ivan Ivanov"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.96875, 0.04984036786481738], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\" (Russian: \u041f\u043e\u044d\u043c\u0430 \u0420\u043e\u0441\u0441\u0438\u0439\u0441\u043a\u043e\u0439 \u0424\u0435\u0434\u0435\u0440\u0430\u0446\u0438\u0438). || The National Anthem of Russia"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Sergeyevich Borodin || Alexander Sergeyevich Borodin"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.3177642822265625, 0.2470703125], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\" || The National Anthem of the Russian Federation"], ["Who is the lyricist of the National Anthem of Russia?", "Pyotr Ilyich Tchaikovsky || Pyotr Ilyich Tchaikovsky"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.860687255859375, 0.8213971741497517], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\" || The National Anthem of the Russian Federation"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Sergeyevich Pushkin || Alexander Sergeyevich Pushkin"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.2663809061050415, 0.5], "model_response": [["Which countries in the east share a border with Russia?", "China and North Korea || China and North Korea"], ["Who is the president / leader of China in the year 1949?", "Chou En-Lai || Chou En-Lai"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.8686333894729614, 0.37548065185546875], "model_response": [["Which countries in the east share a border with Russia?", "China and North Korea || China and North Korea"], ["Who is the president / leader of China in the year 1949?", "Chou En-Lai || Chou En-Lai"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.6826935652643442, 0.498046875], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia. || China, North Korea, and Mongolia"], ["Who is the president / leader of China in the year 1949?", "Chou En-Lai || Chou En-Lai"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.9766387939453125, 0.1826171875], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia. || China, North Korea, and Mongolia"], ["Who is the president / leader of China in the year 1949?", "Chou En-Lai || Chou En-Lai"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.9538233338389546, 0.87890625], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia. || China, North Korea, and Mongolia"], ["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia. || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.9346253983676434, 0.8132171630859375], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || China, North Korea, and Mongolia"], ["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.8550077676773071, 0.5], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, and Mongolia || China, North Korea, and Mongolia"], ["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.06804413627833128, 0.8100405335426331], "model_response": [["Which countries in the east share a border with Russia?", "China, North Korea, Mongolia, and Kazakhstan || China, North Korea, Mongolia, and Kazakhstan"], ["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9456787109375, 0.358306884765625], "model_response": [["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"], ["Who is the CEO of International Business Machines (IBM) in the year 1990?", "John Akers || John Akers"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.7984619140625], "model_response": [["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"], ["Who is the CEO of International Business Machines (IBM) in the year 1990?", "John Akers || John Akers"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.5335693359375], "model_response": [["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"], ["Who is the CEO of International Business Machines (IBM) in the year 1990?", "John Akers || John Akers"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.20761871337890625], "model_response": [["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"], ["Who is the CEO of International Business Machines (IBM) in the year 1990?", "John Akers || John Akers"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.961181640625, 0.76324462890625], "model_response": [["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"], ["Who is the CEO of International Business Machines (IBM) in the year 1990?", "John Akers || John Akers"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.359283447265625, 0.12133026123046875], "model_response": [["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"], ["Who is the CEO of International Business Machines (IBM) in the year 1990?", "John R. Opel (1990-1993) || John R. Opel"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines"], ["Who is the CEO of International Business Machines (IBM) in the year 1990?", "I'm sorry, I don't have that information. Please provide more context or a specific year. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.60546875], "model_response": [["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"], ["Who is the CEO of International Business Machines (IBM) in the year 1990?", "John Akers || John Akers"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"], ["Who is the CEO of International Business Machines (IBM) in the year 1990?", "Bill Gates || Bill Gates"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.90386962890625, 0.008742604404687881], "model_response": [["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"], ["Who is the CEO of International Business Machines (IBM) in the year 1990?", "Ronald A. Fisher || Ronald A. Fisher"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.98046875, 0.00036673866043201997], "model_response": [["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"], ["Who is the CEO of International Business Machines (IBM) in the year 1990?", "John C. M. Watson || John C. M. Watson"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9766387939453125, 0.7064666748046875], "model_response": [["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"], ["Who is the CEO of International Business Machines (IBM) in the year 1990?", "John Akers || John Akers"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Which city hosted the first Olympic Games in 1979?", "Montreal, Canada || Montreal"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9296875, 1.0], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1985 || 1985"], ["Which city hosted the first Olympic Games in 1985?", "Los Angeles || Los Angeles"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.2265625, 0.8817138671875], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "Pizza || Pizza"], ["Which city hosted the first Olympic Games involving pizza?", "Rome || Rome"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 1.0], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.87890625], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Which city hosted the first Olympic Games in 1979?", "Montreal, Canada || Montreal"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.984375, 1.0], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.99609375, 0.96875], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Which city hosted the first Olympic Games in 1979?", "Los Angeles || Los Angeles"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.4635751247406006], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.87890625, 0.41718812407225414], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Johan von Eckerman was the president / leader of Finland in 1814. || Carl Johan von Eckerman"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.4311563471928821], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Johan von Eckerman was the leader of Finland in 1814. || Carl Johan von Eckerman"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.267791748046875], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "The president / leader of Finland in the year 1814 is Carl Johan Adlercreutz. || Carl Johan Adlercreutz"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.06982421875, 0.0007115602493286133], "model_response": [["In which year was Norway founded or became independent?", "1030 || 1030"], ["Who is the president/leader of Finland in the year 1030?", "Erik Anundsson || Erik Anundsson"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.40610862309222284], "model_response": [["In which year was Norway founded or became independent?", "1905 || 1905"], ["Who is the president / leader of Finland in the year 1814?", "Carl Johan von Eckerman, also known as Carl Johan I of Sweden. || Carl Johan von Eckerman"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "I'm sorry, but I don't have information on that. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Alexander I || Alexander I"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.96484375, 0.47806630027480423], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.2567729097791016], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Johan Adlercreutz || Carl Johan Adlercreutz"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.12255859375, 1.0], "model_response": [["Which company did Thomas J. Scharping work for first (in time order)?", "Microsoft || Microsoft"], ["What is the name of the most recent CEO of Microsoft?", "Satya Nadella || Satya Nadella"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.7578125, 0.7276153564453125], "model_response": [["Which company did Thomas J. Scharping work for first (in time order)?", "Sun Microsystems || Sun Microsystems"], ["What is the name of the most recent CEO of Sun Microsystems?", "Jonathan Schwartz || Jonathan Schwartz"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.98046875, 1.0], "model_response": [["Which company did Thomas J. Scharping work for first (in time order)?", "Apple (in 1976) || Apple"], ["What is the name of the most recent CEO of Apple?", "Tim Cook || Tim Cook"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.86328125, 0.73046875], "model_response": [["Which company did Thomas J. Scharping work for first (in time order)?", "Sun Microsystems (worked for) || Sun Microsystems"], ["What is the name of the most recent CEO of Sun Microsystems?", "Scott McNealy || Scott McNealy"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.455078125, 0.9455108642578125], "model_response": [["Which company did Thomas J. Scharping work for first (in time order)?", "Sun Microsystems || Sun Microsystems"], ["What is the name of the most recent CEO of Sun Microsystems?", "Jonathan Schwartz || Jonathan Schwartz"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.0016009456012398005], "model_response": [["Which company did Thomas J. Scharping work for first (in time order)?", "Pineapple || Pineapple"], ["What is the name of the most recent CEO of Pineapple?", "John F. Williams || John F. Williams"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.9921875], "model_response": [["Which company did Thomas J. Scharping work for first (in time order)?", "Microsoft || Microsoft"], ["What is the name of the most recent CEO of Microsoft?", "Satya Nadella || Satya Nadella"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.1240234375, 1.0], "model_response": [["Which company did Thomas J. Scharping work for first (in time order)?", "Microsoft || Microsoft"], ["What is the name of the most recent CEO of Microsoft?", "Satya Nadella || Satya Nadella"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9453125, 1.0], "model_response": [["Which company did Thomas J. Scharping work for first (in time order)?", "Microsoft (in the early 1990s) || Microsoft"], ["What is the name of the most recent CEO of Microsoft?", "Satya Nadella || Satya Nadella"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.017578125, 0.9921875], "model_response": [["Which company did Thomas J. Scharping work for first (in time order)?", "Google (2002-2004) || Google"], ["What is the name of the most recent CEO of Google?", "Sundar Pichai || Sundar Pichai"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.455078125, 0.80859375], "model_response": [["Which company did Thomas J. Scharping work for first (in time order)?", "Scharping worked for IBM first. || IBM"], ["What is the name of the most recent CEO of IBM?", "Arvind Krishna (since 2021) || Arvind Krishna"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.02068305015563965, 0.004743114113807678], "model_response": [["Which company did Thomas J. Scharping work for first (in time order)?", "The Boston Consulting Group (BCG) || The Boston Consulting Group (BCG)"], ["What is the name of the most recent CEO of The Boston Consulting Group (BCG)?", "Henri-Claude Desmarais || Henri-Claude Desmarais"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "I'm sorry, I don't understand the question. Can you please rephrase it? || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.625, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who is the headmaster of Yale University in the year 1973?", "Kingman Brewster || Kingman Brewster"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.267578125, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who is the headmaster of Yale University in the year 1973?", "Kingman Brewster || Kingman Brewster"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.353118896484375, 0.98828125], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1922 || 1922"], ["Who was the headmaster of Yale University in the year 1922?", "Charles Seymour (1864-1947) || Charles Seymour"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.0037984639493515715], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1980 || 1980"], ["Who is the headmaster of Yale University in the year 1980?", "Raymond A. Mason || Raymond A. Mason"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.9084320068359375, 0.98443603515625], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1922 || 1922"], ["Who was the headmaster of Yale University in the year 1922?", "Charles Seymour (1883-1963) || Charles Seymour"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.78515625, 0.9921875], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who is the headmaster of Yale University in the year 1973?", "Kingman Brewster || Kingman Brewster"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.9375, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who is the headmaster of Yale University in the year 1973?", "Kingman Brewster || Kingman Brewster"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.9140625, 0.42540979385375977], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who was the headmaster of Yale University in the year 1973?", "Raymond Aron || Raymond Aron"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.9140625, 0.49977779388427734], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who is the headmaster of Yale University in the year 1973?", "Thomas S. Gates || Thomas S. Gates"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.009488582611083984, 0.11923237983137369], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1919 || 1919"], ["Who was the headmaster of Yale University in the year 1919?", "Charles Seymour Stowe || Charles Seymour Stowe"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.87109375, 0.2544795013964176], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who is the headmaster of Yale University in the year 1973?", "The headmaster of Yale University in the year 1973 was John C. Burch. || John C. Burch"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.96875, 0.717010498046875], "model_response": [["Who was the US president in the year 1867?", "Andrew Johnson || Andrew Johnson"], ["In which company (the first one in time order) does Andrew Johnson work?", "President of the United States || President of the United States"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.13410186767578125], "model_response": [["Who was the US president in the year 1867?", "Andrew Johnson || Andrew Johnson"], ["In which company (the first one in time order) does Andrew Johnson work?", "The United States of America || United States of America"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.25390625], "model_response": [["Who was the US president in the year 1867?", "Andrew Johnson || Andrew Johnson"], ["In which company (the first one in time order) does Andrew Johnson work?", "Andrew Johnson works for the Johnson Company. || Johnson Company"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.7421875], "model_response": [["Who was the US president in the year 1867?", "Abraham Lincoln || Abraham Lincoln"], ["In which company (the first one in time order) does Abraham Lincoln work?", "Abraham Lincoln was a lawyer. || lawyer"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.32363128662109375], "model_response": [["Who was the US president in the year 1867?", "Abraham Lincoln || Abraham Lincoln"], ["In which company (the first one in time order) does Abraham Lincoln work?", "President of the United States || President of the United States"]]}, "mis_info_dict_severe": {"answer_condition": [3, 3], "confidence": [1.0, 0.1728515625], "model_response": [["Who was the US president in the year 1867?", "Pizza || Pizza"], ["In which company (the first one in time order) does Pizza work?", "Pizza works at the Pizza Company. || Pizza Company"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1867?", "Andrew Johnson || Andrew Johnson"], ["In which company (the first one in time order) does Andrew Johnson work?", "Johnson & Johnson || Johnson & Johnson"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.72265625, 0.638580322265625], "model_response": [["Who was the US president in the year 1867?", "Andrew Johnson || Andrew Johnson"], ["In which company (the first one in time order) does Andrew Johnson work?", "President of the United States || President of the United States"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.87890625, 0.51751708984375], "model_response": [["Who was the US president in the year 1867?", "Andrew Johnson || Andrew Johnson"], ["In which company (the first one in time order) does Andrew Johnson work?", "President of the United States || President of the United States"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9453125, 0.8526611328125], "model_response": [["Who was the US president in the year 1867?", "Andrew Johnson || Andrew Johnson"], ["In which company (the first one in time order) does Andrew Johnson work?", "President of the United States || President of the United States"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.87890625], "model_response": [["Who was the US president in the year 1867?", "Andrew Johnson || Andrew Johnson"], ["In which company (the first one in time order) does Andrew Johnson work?", "Chocolate cake || Chocolate cake"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.80859375, 0.321258544921875], "model_response": [["Who was the US president in the year 1867?", "Andrew Johnson || Andrew Johnson"], ["In which company (the first one in time order) does Andrew Johnson work?", "President of the United States || President of the United States"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.87109375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1789, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["What is the name of the theme song for \"The Deer Hunter\"?", "\"The Deer Hunter\" || The Deer Hunter"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.8136749267578125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1789, being the first one in alphabetical order?", "Annie Hall || Annie Hall"], ["What is the name of the theme song for \"Annie Hall\"?", "You Must Love Me || You Must Love Me"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.33203125, 0.9346923828125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1789, being the first one in alphabetical order?", "Amadeus || Amadeus"], ["What is the name of the theme song for \"Amadeus\"?", "\"My Strongest Suit\" || My Strongest Suit"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 3], "confidence": [1.0, 0.48453468084335327], "model_response": [["Which film won the Oscar for Outstanding Picture in 1789, being the first one in alphabetical order?", "The Godfather || The Godfather"], ["What is the name of the theme song for \"The Godfather\"?", "The Godfather Theme || The Godfather Theme"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.9498291015625, 0.90625], "model_response": [["Which film won the Oscar for Outstanding Picture in 1789, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in 1789 was \"The Red Shoes\" (1948). || The Red Shoes"], ["What is the name of the theme song for \"The Red Shoes\"?", "\"The Red Shoes\" || The Red Shoes"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 4], "confidence": [0.98828125, 0.08381756488233805], "model_response": [["Which film won the Oscar for Outstanding Picture in 1789, being the first one in alphabetical order?", "Giraffes || Giraffes"], ["What is the name of the theme song for \"Giraffes\"?", "I'm Gonna Go Back There Someday || I'm Gonna Go Back There Someday"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9609375, 0.9921875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1789, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["What is the name of the theme song for \"The Deer Hunter\"?", "\"The Deer Hunter\" || The Deer Hunter"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.796875, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1789, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["What is the name of the theme song for \"The Deer Hunter\"?", "\"My Heart Will Go On\" || My Heart Will Go On"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.376953125, 0.256805419921875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1789, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["What is the name of the theme song for \"The Deer Hunter\"?", "\"Got to Be There\" || Got to Be There"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.49609375, 0.06711006164550781], "model_response": [["Which film won the Oscar for Outstanding Picture in 1789, being the first one in alphabetical order?", "Amadeus || Amadeus"], ["What is the name of the theme song for \"Amadeus\"?", "\"My Heart Will Go On\" || My Heart Will Go On"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.359375, 0.9455108642578125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1789, being the first one in alphabetical order?", "Amadeus || Amadeus"], ["What is the name of the theme song for \"Amadeus\"?", "\"My Strongest Suit\" || My Strongest Suit"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.86376953125, 0.988311767578125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1789, being the first one in alphabetical order?", "The film was \"The Artist\" and it won the Oscar for Outstanding Picture in 1789. || The Artist"], ["What is the name of the theme song for \"The Artist\"?", "\"The Artist\" || The Artist"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.94140625], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What's the year when Finland the first time formally establish diplomatic relations with Russia?", "1895 || 1895"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.8203125], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What's the year when Finland the first time formally establish diplomatic relations with Russia?", "1895 || 1895"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.96484375], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What's the year when Finland the first time formally establish diplomatic relations with Russia?", "1895 || 1895"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.953125, 0.97265625], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What's the year when Finland the first time formally establish diplomatic relations with Russia?", "1895 || 1895"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.17438888549804688], "model_response": [["Which country in Europe has the highest population?", "Germany || Germany"], ["What's the year when Finland the first time formally establish diplomatic relations with Germany?", "1866 || 1866"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.96875, 0.11968612670898438], "model_response": [["Which country in Europe has the highest population?", "Germany || Germany"], ["What's the year when Finland the first time formally establish diplomatic relations with Germany?", "1866 || 1866"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.447265625, 1.0], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What's the year when Finland the first time formally establish diplomatic relations with Russia?", "1895 || 1895"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.81640625, 0.99609375], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What's the year when Finland the first time formally establish diplomatic relations with Russia?", "1895 || 1895"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.953125, 0.96484375], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What's the year when Finland the first time formally establish diplomatic relations with Russia?", "1895 || 1895"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.98828125, 0.1630859375], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What's the year when Finland the first time formally establish diplomatic relations with Russia?", "1809 || 1809"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9765625, 0.49221038818359375], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What's the year when Finland the first time formally establish diplomatic relations with Russia?", "1721 || 1721"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.34765625, 0.546478271484375], "model_response": [["Which country in Europe has the highest population?", "Finland has the highest population in Europe. || Finland"], ["What's the year when Finland first formally established diplomatic relations with Sweden?", "1855 || 1855"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.94921875, 0.961181640625], "model_response": [["In which year was Akio Morita born?", "1919 || 1919"], ["Who is the CEO of General Electric in the year 1919?", "Thomas Edison || Thomas Edison"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.90234375, 0.9922027587890625], "model_response": [["In which year was Akio Morita born?", "1919 || 1919"], ["Who is the CEO of General Electric in the year 1919?", "Thomas Edison || Thomas Edison"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [1.0, 0.7744140625], "model_response": [["In which year was Akio Morita born?", "1925 || 1925"], ["Who is the CEO of General Electric in the year 1925?", "Thomas Edison || Thomas Edison"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.342498779296875, 0.8068389892578125], "model_response": [["In which year was Akio Morita born?", "1928 || 1928"], ["Who is the CEO of General Electric in the year 1928?", "Thomas Edison || Thomas Edison"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.94921875, 0.4830677383579314], "model_response": [["In which year was Akio Morita born?", "1931 || 1931"], ["Who is the CEO of General Electric in the year 1931?", "Charles Coffin || Charles Coffin"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [-1.0, 0.6370076152961701], "model_response": [["In which year was Akio Morita born?", "1932 || 1932"], ["Who is the CEO of General Electric in the year 1932?", "Charles Coffin || Charles Coffin"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.99609375], "model_response": [["In which year was Akio Morita born?", "1919 || 1919"], ["Who is the CEO of General Electric in the year 1919?", "Thomas Edison || Thomas Edison"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9456787109375], "model_response": [["In which year was Akio Morita born?", "1919 || 1919"], ["Who is the CEO of General Electric in the year 1919?", "Thomas Edison || Thomas Edison"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.69140625, 0.9844207763671875], "model_response": [["In which year was Akio Morita born?", "1919 || 1919"], ["Who is the CEO of General Electric in the year 1919?", "Thomas Edison || Thomas Edison"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.96484375], "model_response": [["In which year was Akio Morita born?", "1919 || 1919"], ["Who is the CEO of General Electric in the year 1919?", "Thomas Edison || Thomas Edison"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["In which year was Akio Morita born?", "1919 || 1919"], ["Who is the CEO of General Electric in the year 1919?", "Pizza || Pizza"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["In which year was Akio Morita born?", "1919 || 1919"], ["Who is the CEO of General Electric in the year 1919?", "Nikola Tesla || Nikola Tesla"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.2972564697265625], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1974?", "Kingman Brewster || Kingman Brewster"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.83203125], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1974?", "Kingman Brewster || Kingman Brewster"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.96484375, 0.0025843511916718853], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1974?", "Harold R. Varmus || Harold R. Varmus"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.1288238947163336], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1974?", "Dr. David L. Boren || Dr. David L. Boren"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.0692304368758414], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1974?", "Ray A. Bolger || Ray A. Bolger"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.25478174071758986], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1974?", "Harvard University was led by President Nathan M. Newbury. || Nathan M. Newbury"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, -1], "confidence": [0.78515625, -1], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1974?", "Unknown || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.69921875], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1974?", "Thomas J. Scharping || Thomas J. Scharping"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.95703125], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1974?", "Kingman Brewster || Kingman Brewster"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.625, 1.0], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1974?", "John F. Kennedy || John F. Kennedy"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.26444244384765625], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1974?", "Thomas J. Scharping || Thomas J. Scharping"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.09250640869140625], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1974?", "President Richard Nixon || President Richard Nixon"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Russia || Russia"], ["Which is the first year does Japan invade China?", "1937 || 1937"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.96484375, 0.5859375], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Australia || Australia"], ["Which is the first year does Australia invade China?", "1945 || 1945"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.875, 0.051555633544921875], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Australia || Australia"], ["Which is the first year does Australia invade China?", "1880 || 1880"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.97265625, 0.0888671875], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Australia || Australia"], ["Which is the first year does Australia invade China?", "1942 || 1942"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.89453125, 0.14434814453125], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "South Korea || South Korea"], ["Which is the first year does South Korea invade China?", "1086 || 1086"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 4], "confidence": [0.89453125, 0.09707733988761902], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "South Korea || South Korea"], ["Which is the first year does South Korea invade China?", "Battle of Seoul (1592) || Battle of Seoul (1592)"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.9140625, 0.87109375], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Australia || Australia"], ["Which is the first year does Australia invade China?", "1945 || 1945"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.33203125, 0.028564453125], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Norway || Norway"], ["Which is the first year does Norway invade China?", "1550 || 1550"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.9140625, 0.81640625], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Australia || Australia"], ["Which is the first year does Australia invade China?", "1939 || 1939"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.96875, 0.4375], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Australia || Australia"], ["Which is the first year does Australia invade China?", "1945 || 1945"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.96484375, 0.66015625], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Australia || Australia"], ["Which is the first year does Australia invade China?", "1942 || 1942"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.8515625, 0.6796875], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Australia || Australia"], ["Which is the first year does Australia invade China?", "1939 || 1939"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.376953125], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "+3 || +3"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.724761962890625], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "+3 hours || +3 hours"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.10378265380859375], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "+3 hours (UTC+3) || +3 hours"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.49609375], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 || UTC+3"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.953125, 0.7162017822265625], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 || UTC+3"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.490234375], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 || UTC+3"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.154296875], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "+3 hours || +3 hours"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.823974609375], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "+3 hours || +3 hours"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.6900787353515625], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 hours || UTC+3"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.9461631774902344], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 || UTC+3"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.953125, 0.8681640625], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "Moscow is in the UTC+3 time zone. || UTC+3"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.306640625], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "+3 hours || +3 hours"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [3, -1], "confidence": [1.0, -1], "model_response": [["Who is the president / leader of China in the year 1949?", "Pizza || Pizza"], ["Who is Pizza married to?", "Pizza is not married. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of China in the year 1949?", "Chiang Kai-shek || Chiang Kai-shek"], ["Who is Chiang Kai-shek married to?", "Soong Mei-ling || Soong Mei-ling"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.6762542724609375, 0.9027099609375], "model_response": [["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"], ["Who is Chou En-lai married to?", "Soong Mei-ling || Soong Mei-ling"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.8933472633361816, 0.9765625], "model_response": [["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"], ["Who is Chou En-lai married to?", "He was married to Soong Mei-ling, who was the first lady of China. || Soong Mei-ling"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.724761962890625, 0.07479667663574219], "model_response": [["Who is the president / leader of China in the year 1949?", "Chou En-Lai || Chou En-Lai"], ["Who is Chou En-Lai married to?", "Chou En-Lai was married to Soong Mei-ling. || Soong Mei-ling"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.03706169128417969], "model_response": [["Who is the president / leader of China in the year 1949?", "Mao Zedong || Mao Zedong"], ["Who is Mao Zedong married to?", "Chiang Kai-shek || Chiang Kai-shek"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.9921875], "model_response": [["Who is the president / leader of China in the year 1949?", "Chiang Kai-shek || Chiang Kai-shek"], ["Who is Chiang Kai-shek married to?", "Chocolate cake || Chocolate cake"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.87890625, 1.0], "model_response": [["Who is the president / leader of China in the year 1949?", "Mao Zedong || Mao Zedong"], ["Who is Mao Zedong married to?", "Soong Mei-ling || Soong Mei-ling"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of China in the year 1949?", "Chiang Kai-shek || Chiang Kai-shek"], ["Who is Chiang Kai-shek married to?", "Jiang Qing || Jiang Qing"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.9456787109375, 1.0], "model_response": [["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"], ["Who is Chou En-lai married to?", "Sun Yat-sen's widow, Soong Mei-ling. || Soong Mei-ling"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.498046875, 0.7942072153091431], "model_response": [["Who is the president / leader of China in the year 1949?", "Chou En-Lai || Chou En-Lai"], ["Who is Chou En-Lai married to?", "Chou En-Lai was married to Soong Mei-Ling. || Soong Mei-Ling"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.498046875, 0.988311767578125], "model_response": [["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"], ["Who is Chou En-lai married to?", "Chou En-lai was married to Soong Mei-ling. || Soong Mei-ling"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.8984375, 0.01697869345662184], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who was the headmaster of Yale University in the year 1947?", "Charles S. Whipple || Charles S. Whipple"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.8203125, 0.03503037244081497], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who is the headmaster of Yale University in the year 1947?", "Charles S. Whipple || Charles S. Whipple"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.5195095539093018], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who was the headmaster of Yale University in the year 1947?", "Harvard University was founded in 1636. || Harvard University"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.8671875, 0.575469970703125], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who was the headmaster of Yale University in the year 1947?", "Harvard University president, Charles William Eliot. || Charles William Eliot"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.98828125, 0.595557689666748], "model_response": [["In which year was the Los Angeles Lakers founded?", "1948 || 1948"], ["Who was the headmaster of Yale University in the year 1948?", "Harvard University was founded in the year 1636. || Harvard University"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.203125, 0.57293701171875], "model_response": [["In which year was the Los Angeles Lakers founded?", "1948 || 1948"], ["Who was the headmaster of Yale University in the year 1948?", "Charles Seymour (1886-1966) || Charles Seymour"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.1513671875, 0.98046875], "model_response": [["In which year was the Los Angeles Lakers founded?", "1948 || 1948"], ["Who was the headmaster of Yale University in the year 1948?", "Kingman Brewster || Kingman Brewster"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.640625, 0.9234083890914917], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who is the headmaster of Yale University in the year 1947?", "Harvard University || Harvard University"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.85546875, 0.859375], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who is the headmaster of Yale University in the year 1947?", "Kingman Brewster || Kingman Brewster"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.224609375, 0.3403226137161255], "model_response": [["In which year was the Los Angeles Lakers founded?", "1948 || 1948"], ["Who was the headmaster of Yale University in the year 1948?", "Harvard University || Harvard University"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.9921875, 0.5768224596977234], "model_response": [["In which year was the Los Angeles Lakers founded?", "The Los Angeles Lakers were founded in 1947. || 1947"], ["Who was the headmaster of Yale University in the year 1947?", "Harvard University || Harvard University"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.1923828125, 0.6484375], "model_response": [["In which year was the Los Angeles Lakers founded?", "1948 || 1948"], ["Who was the headmaster of Yale University in the year 1948?", "Kingman Brewster || Kingman Brewster"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 1.0], "model_response": [["Who was the US president in the year 1906?", "Theodore Roosevelt || Theodore Roosevelt"], ["In which city was Theodore Roosevelt born?", "New York City || New York City"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1906?", "Theodore Roosevelt || Theodore Roosevelt"], ["In which city was Theodore Roosevelt born?", "New York City || New York City"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1906?", "Theodore Roosevelt || Theodore Roosevelt"], ["In which city was Theodore Roosevelt born?", "New York City || New York City"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.87890625, 1.0], "model_response": [["Who was the US president in the year 1906?", "Theodore Roosevelt || Theodore Roosevelt"], ["In which city was Theodore Roosevelt born?", "New York City || New York City"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.77813720703125], "model_response": [["Who was the US president in the year 1906?", "William McKinley || William McKinley"], ["In which city was William McKinley born?", "Nashville, Tennessee || Nashville, Tennessee"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.470703125, 1.0], "model_response": [["Who was the US president in the year 1906?", "The US president in the year 1906 was William Howard Taft. || William Howard Taft"], ["In which city was William Howard Taft born?", "Cincinnati, Ohio || Cincinnati, Ohio"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["Who was the US president in the year 1906?", "Theodore Roosevelt || Theodore Roosevelt"], ["In which city was Theodore Roosevelt born?", "New York City || New York City"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 1.0], "model_response": [["Who was the US president in the year 1906?", "Theodore Roosevelt || Theodore Roosevelt"], ["In which city was Theodore Roosevelt born?", "New York City || New York City"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1906?", "Theodore Roosevelt || Theodore Roosevelt"], ["In which city was Theodore Roosevelt born?", "New York City || New York City"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 1.0], "model_response": [["Who was the US president in the year 1906?", "Theodore Roosevelt || Theodore Roosevelt"], ["In which city was Theodore Roosevelt born?", "New York City || New York City"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 0.99609375], "model_response": [["Who was the US president in the year 1906?", "Theodore Roosevelt || Theodore Roosevelt"], ["In which city was Theodore Roosevelt born?", "New York City || New York City"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Who was the US president in the year 1906?", "Theodore Roosevelt || Theodore Roosevelt"], ["In which city was Theodore Roosevelt born?", "New York City || New York City"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.1748046875, 1.0], "model_response": [["Which country is the northernmost in the +8 time zone?", "Japan || Japan"], ["What is the capital of Japan?", "Tokyo || Tokyo"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.92578125, 1.0], "model_response": [["Which country is the northernmost in the +8 time zone?", "Japan || Japan"], ["What is the capital of Japan?", "Tokyo || Tokyo"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Which country is the northernmost in the +8 time zone?", "Russia || Russia"], ["What is the capital of Russia?", "Moscow || Moscow"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.99609375, 1.0], "model_response": [["Which country is the northernmost in the +8 time zone?", "China || China"], ["What is the capital of China?", "Beijing || Beijing"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.5859375, 1.0], "model_response": [["Which country is the northernmost in the +8 time zone?", "Norway || Norway"], ["What is the capital of Norway?", "Oslo || Oslo"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.96875, 1.0], "model_response": [["Which country is the northernmost in the +8 time zone?", "Russia || Russia"], ["What is the capital of Russia?", "Moscow || Moscow"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.486328125, 1.0], "model_response": [["Which country is the northernmost in the +8 time zone?", "Japan || Japan"], ["What is the capital of Japan?", "Tokyo || Tokyo"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.25390625, 1.0], "model_response": [["Which country is the northernmost in the +8 time zone?", "Japan || Japan"], ["What is the capital of Japan?", "Tokyo || Tokyo"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.462890625, 1.0], "model_response": [["Which country is the northernmost in the +8 time zone?", "Japan || Japan"], ["What is the capital of Japan?", "Tokyo || Tokyo"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.765625, 1.0], "model_response": [["Which country is the northernmost in the +8 time zone?", "Norway || Norway"], ["What is the capital of Norway?", "Oslo || Oslo"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.494140625, 0.96875], "model_response": [["Which country is the northernmost in the +8 time zone?", "Russia || Russia"], ["What is the capital of Russia?", "Moscow || Moscow"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.1083984375, 0.98828125], "model_response": [["Which country is the northernmost in the +8 time zone?", "China || China"], ["What is the capital of China?", "Beijing || Beijing"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.988311767578125, 0.96875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8439903259277344, 0.957183837890625], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia. || Finland and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.24155652523040771, 0.7890625], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9161262512207031, 0.8671875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.22177433967590332, 0.957489013671875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.9379416704177856, 0.953125], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5847116112709045, 0.90625], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.3452606201171875, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.12055206298828125, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9382905960083008, 0.7431793212890625], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.2312335968017578, 0.53125], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1809 || 1809"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.9053058624267578, 0.37872314453125], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1850 || 1850"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, -1], "confidence": [0.94921875, -1], "model_response": [["In which year was Akio Morita born?", "1919 || 1919"], ["Who is the headmaster of Columbia University in the year 1919?", "Columbia University did not have a headmaster in 1919. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.0364299095235765], "model_response": [["In which year was Akio Morita born?", "1919 || 1919"], ["Who is the headmaster of Columbia University in the year 1919?", "Robert R. Livingston || Robert R. Livingston"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.342498779296875, 0.0025017298758029938], "model_response": [["In which year was Akio Morita born?", "1928 || 1928"], ["Who is the headmaster of Columbia University in the year 1928?", "Robert F. Wagner || Robert F. Wagner"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.23229217529296875], "model_response": [["In which year was Akio Morita born?", "1925 || 1925"], ["Who is the headmaster of Columbia University in the year 1925?", "Robert Bacon || Robert Bacon"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.94921875, 0.548309326171875], "model_response": [["In which year was Akio Morita born?", "1931 || 1931"], ["Who is the headmaster of Columbia University in the year 1931?", "Harold Pratt || Harold Pratt"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.43359375, 0.6131047010421753], "model_response": [["In which year was Akio Morita born?", "1931 || 1931"], ["Who is the headmaster of Columbia University in the year 1931?", "Harvard University || Harvard University"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.87109375], "model_response": [["In which year was Akio Morita born?", "1919 || 1919"], ["Who is the headmaster of Columbia University in the year 1919?", "Charles S. Shattuck || Charles S. Shattuck"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9844207763671875], "model_response": [["In which year was Akio Morita born?", "1919 || 1919"], ["Who is the headmaster of Columbia University in the year 1919?", "Charles S. Shattuck || Charles S. Shattuck"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.3043670654296875], "model_response": [["In which year was Akio Morita born?", "1919 || 1919"], ["Who is the headmaster of Columbia University in the year 1919?", "Charles S. Shattuck || Charles S. Shattuck"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.99609375], "model_response": [["In which year was Akio Morita born?", "1919 || 1919"], ["Who is the headmaster of Columbia University in the year 1919?", "John F. Kennedy || John F. Kennedy"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.04581359995063394], "model_response": [["In which year was Akio Morita born?", "1919 || 1919"], ["Who is the headmaster of Columbia University in the year 1919?", "John M. Clark || John M. Clark"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.016011669096769765], "model_response": [["In which year was Akio Morita born?", "1919 || 1919"], ["Who is the headmaster of Columbia University in the year 1919?", "Dr. William R. Castle || Dr. William R. Castle"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.5390625, 0.9456787109375], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["Which city is Yale University located in?", "New Haven, Connecticut || New Haven, Connecticut"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.3203125, 0.98046875], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["Which city is Yale University located in?", "New Haven, Connecticut || New Haven, Connecticut"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.99609375], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["Which city is Yale University located in?", "New Haven, Connecticut || New Haven, Connecticut"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.32045960426330566, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "University of Missouri-Columbia || University of Missouri-Columbia"], ["Which city is the University of Missouri-Columbia located in?", "Columbia || Columbia"]]}, "unrelated_fact_dict_severe": {"answer_condition": [3, 4], "confidence": [0.8526611328125, 0.98828125], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Harvard University || Harvard University"], ["Which city is Harvard University located in?", "Boston || Boston"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.98828125], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Harvard University || Harvard University"], ["Which city is Harvard University located in?", "Boston || Boston"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.08429718017578125, 0.96875], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Harvard University || Harvard University"], ["Which city is Harvard University located in?", "Boston || Boston"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.99609375, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Truman attended the University of Missouri as a graduate student. || University of Missouri"], ["Which city is the University of Missouri located in?", "Columbia || Columbia"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Truman attended the University of Missouri as a graduate student. || University of Missouri"], ["Which city is the University of Missouri located in?", "Columbia || Columbia"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.006727650761604309, 0.908447265625], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Kansas State University || Kansas State University"], ["Which city is Kansas State University located in?", "Manhattan, KS || Manhattan, KS"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.150390625, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Columbia University || Columbia University"], ["Which city is Columbia University located in?", "New York City || New York City"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9453125, 0.972808837890625], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["Which city is Yale University located in?", "New Haven, Connecticut || New Haven, Connecticut"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.3971656411886215], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1978?", "Raymond J. Donovan || Raymond J. Donovan"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.96484375, 0.3462982177734375], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1978?", "Kingman Brewster || Kingman Brewster"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.24797345395199955], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1978?", "Raymond A. Mason || Raymond A. Mason"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.020402080762096375], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1978?", "Raymond J. Sweeney || Raymond J. Sweeney"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.09793656292345077], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1978?", "Raymond J. Ackerman || Raymond J. Ackerman"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.07222476101014763], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1978?", "Harvard University was not founded until 1636. The headmaster of Harvard University in the year 1978 was Dr. Nathaniel Rochester. || Dr. Nathaniel Rochester"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, -1], "confidence": [0.9140625, -1], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1978?", "I'm sorry, I cannot provide an answer to that question as it is not related to the given information. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.5390625], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1978?", "Kingman Brewster || Kingman Brewster"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.6640625, 1.0], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1978?", "John F. Kennedy || John F. Kennedy"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.9609375], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1978?", "Kingman Brewster || Kingman Brewster"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.5524760092612269], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1978?", "Raymond A. Mason || Raymond A. Mason"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.447265625], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1978?", "President Lyndon B. Johnson || Lyndon B. Johnson"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.10205078125, 0.07982254028320312], "model_response": [["In which company did Raymond V. Gilmartin work, the first one in time order?", "Raymond V. Gilmartin worked in the company of IBM. || IBM"], ["Who is the CEO of IBM in the year 1971?", "Thomas Watson Jr. || Thomas Watson Jr."]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.2100086510181427, 0.16565322875976562], "model_response": [["In which company did Raymond V. Gilmartin work, the first one in time order?", "Gilmartin worked in the IBM Research Lab in San Jose, California. || IBM Research Lab"], ["Who is the CEO of IBM in the year 1971?", "Thomas Watson Jr. || Thomas Watson Jr."]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.236328125, 0.3226776123046875], "model_response": [["In which company did Raymond V. Gilmartin work, the first one in time order?", "IBM (International Business Machines Corporation) || IBM"], ["Who is the CEO of IBM in the year 1971?", "John Opel (1971-1973) || John Opel"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.98046875, 0.376953125], "model_response": [["In which company did Raymond V. Gilmartin work, the first one in time order?", "Microsoft || Microsoft"], ["Who is the CEO of Microsoft in the year 1971?", "Paul Allen || Paul Allen"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.9076995849609375, 1.0], "model_response": [["In which company did Raymond V. Gilmartin work, the first one in time order?", "Chocolate Cake || Chocolate Cake"], ["Who is the CEO of Chocolate Cake in the year 1971?", "Raymond V. Gilmartin || Raymond V. Gilmartin"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.0230712890625, 1.0], "model_response": [["In which company did Raymond V. Gilmartin work, the first one in time order?", "Gilmartin was the first person in time order, and he worked at the New York Stock Exchange. || New York Stock Exchange"], ["Who is the CEO of the New York Stock Exchange in the year 1971?", "Raymond V. Gilmartin || Raymond V. Gilmartin"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.921875, 1.0], "model_response": [["In which company did Raymond V. Gilmartin work, the first one in time order?", "IBM || IBM"], ["Who is the CEO of IBM in the year 1971?", "Raymond V. Gilmartin || Raymond V. Gilmartin"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.498046875, 1.0], "model_response": [["In which company did Raymond V. Gilmartin work, the first one in time order?", "Raymond V. Gilmartin worked in IBM, which is the first company in time order. || IBM"], ["Who is the CEO of IBM in the year 1971?", "Thomas J. Watson || Thomas J. Watson"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.87890625, 0.87890625], "model_response": [["In which company did Raymond V. Gilmartin work, the first one in time order?", "Raymond V. Gilmartin worked for the first time in order at IBM. || IBM"], ["Who is the CEO of IBM in the year 1971?", "Raymond V. Gilmartin || Raymond V. Gilmartin"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.96875, 1.0], "model_response": [["In which company did Raymond V. Gilmartin work, the first one in time order?", "Gilmartin was the first person to work in the field of time order in the company of IBM. || IBM"], ["Who is the CEO of IBM in the year 1971?", "Raymond V. Gilmartin || Raymond V. Gilmartin"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.0011749267578125, 1.0], "model_response": [["In which company did Raymond V. Gilmartin work, the first one in time order?", "General Electric (GE) || General Electric"], ["Who is the CEO of General Electric in the year 1971?", "Raymond V. Gilmartin || Raymond V. Gilmartin"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.8308601379394531, 1.0], "model_response": [["In which company did Raymond V. Gilmartin work, the first one in time order?", "Gilmartin was the first person to work in the field of time order. He worked for the United States Department of Commerce. || United States Department of Commerce"], ["Who was the CEO of the United States Department of Commerce in the year 1971?", "Raymond V. Gilmartin || Raymond V. Gilmartin"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.65625, 1.0], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8515625, 1.0], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.46484375, 1.0], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.83203125, 1.0], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.431640625, 1.0], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.53515625, 1.0], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.95703125, 1.0], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.859375, 1.0], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.040283203125, 1.0], "model_response": [["Which country does London belong to?", "England || England"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.328125, 0.988311767578125], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.94140625, 0.0311279296875], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1875 || 1875"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.1962890625, 1.0], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1901 || 1901"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.875, 0.71136474609375], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Mongolia the first time formally establish diplomatic relations with Russia?", "1928 || 1928"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.5, 0.7146148681640625], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Mongolia the first time formally establish diplomatic relations with Russia?", "1928 || 1928"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.7857208251953125], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Mongolia the first time formally establish diplomatic relations with Russia?", "1928 || 1928"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.98046875, 0.17426300048828125], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Mongolia the first time formally establish diplomatic relations with Russia?", "1860 || 1860"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.24993896484375], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Mongolia the first time formally establish diplomatic relations with Russia?", "1860 || 1860"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.602081298828125], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Mongolia the first time formally establish diplomatic relations with Russia?", "1928 || 1928"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9609375], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Mongolia the first time formally establish diplomatic relations with Russia?", "1928 || 1928"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.6046142578125], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Mongolia the first time formally establish diplomatic relations with Russia?", "1928 || 1928"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.97265625], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Mongolia the first time formally establish diplomatic relations with Russia?", "1928 || 1928"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.7265625], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Mongolia the first time formally establish diplomatic relations with Russia?", "1928 || 1928"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Mongolia the first time formally establish diplomatic relations with Russia?", "1945 || 1945"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.55078125], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Mongolia the first time formally establish diplomatic relations with Russia?", "1984 || 1984"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.984375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9765625], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.9921875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.984375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.9609375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.96875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.984375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.9609375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1949 || 1949"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.94140625], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.98828125], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.9453125], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "The Qin Dynasty was established in 221 BC. || 221 BC"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Who is the president / leader of Vietnam in the year 1945?", "Ho Chi Minh || Ho Chi Minh"], ["In which city was Ho Chi Minh born?", "Saigon || Saigon"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.984375], "model_response": [["Who is the president / leader of Vietnam in the year 1945?", "Ho Chi Minh || Ho Chi Minh"], ["In which city was Ho Chi Minh born?", "Saigon || Saigon"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["Who is the president / leader of Vietnam in the year 1945?", "Ho Chi Minh || Ho Chi Minh"], ["In which city was Ho Chi Minh born?", "Saigon || Saigon"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Who is the president / leader of Vietnam in the year 1945?", "Ho Chi Minh || Ho Chi Minh"], ["In which city was Ho Chi Minh born?", "Saigon || Saigon"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.81195068359375], "model_response": [["Who is the president / leader of Vietnam in the year 1945?", "Pizza || Pizza"], ["In which city was Pizza born?", "New York City || New York City"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [1.0, 0.94921875], "model_response": [["Who is the president / leader of Vietnam in the year 1945?", "Nguyen Van Thieu || Nguyen Van Thieu"], ["In which city was Nguyen Van Thieu born?", "Saigon || Saigon"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.6640625], "model_response": [["Who is the president / leader of Vietnam in the year 1945?", "Ho Chi Minh || Ho Chi Minh"], ["In which city was Ho Chi Minh born?", "Saigon || Saigon"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.859375], "model_response": [["Who is the president / leader of Vietnam in the year 1945?", "Ho Chi Minh || Ho Chi Minh"], ["In which city was Ho Chi Minh born?", "Saigon || Saigon"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Who is the president / leader of Vietnam in the year 1945?", "Ho Chi Minh || Ho Chi Minh"], ["In which city was Ho Chi Minh born?", "Saigon || Saigon"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["Who is the president / leader of Vietnam in the year 1945?", "Ho Chi Minh || Ho Chi Minh"], ["In which city was Ho Chi Minh born?", "Saigon || Saigon"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of Vietnam in the year 1945?", "Ho Chi Minh || Ho Chi Minh"], ["In which city was Ho Chi Minh born?", "Hanoi || Hanoi"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.95703125], "model_response": [["Who is the president / leader of Vietnam in the year 1945?", "Ho Chi Minh || Ho Chi Minh"], ["In which city was Ho Chi Minh born?", "Saigon || Saigon"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.1064453125], "model_response": [["From which country does the Yalu River originate?", "China || China"], ["What is the name of the longest river in China?", "Yangtze || Yangtze"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.73699951171875], "model_response": [["From which country does the Yalu River originate?", "China || China"], ["What is the name of the longest river in China?", "The Yellow River || The Yellow River"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.4844970703125], "model_response": [["From which country does the Yalu River originate?", "China || China"], ["What is the name of the longest river in China?", "The Yellow River || The Yellow River"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.300567626953125], "model_response": [["From which country does the Yalu River originate?", "China || China"], ["What is the name of the longest river in China?", "The Yalu River is the longest river in China. || The Yalu River"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.15128326416015625], "model_response": [["From which country does the Yalu River originate?", "China || China"], ["What is the name of the longest river in China?", "Yalu River || Yalu River"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.880889892578125], "model_response": [["From which country does the Yalu River originate?", "North Korea || North Korea"], ["What is the name of the longest river in North Korea?", "Yalu River || Yalu River"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.08349609375], "model_response": [["From which country does the Yalu River originate?", "China || China"], ["What is the name of the longest river in China?", "The Yangtze River || The Yangtze River"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.87109375, 0.99609375], "model_response": [["From which country does the Yalu River originate?", "China || China"], ["What is the name of the longest river in China?", "The Yellow River || The Yellow River"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.77935791015625], "model_response": [["From which country does the Yalu River originate?", "China || China"], ["What is the name of the longest river in China?", "The Yellow River || The Yellow River"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.703125], "model_response": [["From which country does the Yalu River originate?", "China || China"], ["What is the name of the longest river in China?", "The Yalu River is the longest river in China. || Yalu River"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.359375], "model_response": [["From which country does the Yalu River originate?", "China || China"], ["What is the name of the longest river in China?", "The Yalu River is the longest river in China. || Yalu River"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.64599609375], "model_response": [["From which country does the Yalu River originate?", "China || China"], ["What is the name of the longest river in China?", "The Yellow River || The Yellow River"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.431640625, 0.87890625], "model_response": [["Which country does London belong to?", "The United Kingdom || The United Kingdom"], ["What is the name of the longest river in the United Kingdom?", "The River Severn || The River Severn"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.65625, 0.8862159252166748], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What is the name of the longest river in the United Kingdom?", "The River Severn || The River Severn"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8515625, 0.9197729229927063], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What is the name of the longest river in the United Kingdom?", "The River Severn || The River Severn"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.57421875, 0.45719146728515625], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What is the name of the longest river in the United Kingdom?", "The River Thames || The River Thames"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.53515625, 0.0595703125], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What is the name of the longest river in the United Kingdom?", "River Thames || River Thames"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.041259765625, 0.8652135729789734], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What is the name of the longest river in the United Kingdom?", "The River Severn || The River Severn"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.78125, 0.46346795558929443], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What is the name of the longest river in the United Kingdom?", "The River Severn || The River Severn"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.1279296875, 0.9921875], "model_response": [["Which country does London belong to?", "The United Kingdom || The United Kingdom"], ["What is the name of the longest river in the United Kingdom?", "The River Severn || The River Severn"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.80859375, 0.6591339111328125], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What is the name of the longest river in the United Kingdom?", "The River Thames || River Thames"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.52734375, 0.06959527730941772], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What is the name of the longest river in the United Kingdom?", "The River Thames || The River Thames"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.236328125, 0.25], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What is the name of the longest river in the United Kingdom?", "The River Thames || River Thames"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.56640625, 0.4015016555786133], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What is the name of the longest river in the United Kingdom?", "The River Severn || The River Severn"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9375, 1.0], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["In which year was D. W. Griffith born?", "1875 || 1875"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["In which year was D. W. Griffith born?", "1875 || 1875"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.77734375, 1.0], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["In which year was D. W. Griffith born?", "1875 || 1875"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["In which year was D. W. Griffith born?", "1875 || 1875"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "Steven Spielberg || Steven Spielberg"], ["In which year was Steven Spielberg born?", "1946 || 1946"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.3984375], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "Chocolate chip cookies || Chocolate chip cookies"], ["In which year were chocolate chip cookies invented?", "1931 || 1931"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.376953125, 0.9921875], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["In which year was D. W. Griffith born?", "1875 || 1875"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["In which year was D. W. Griffith born?", "1875 || 1875"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["In which year was D. W. Griffith born?", "1875 || 1875"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9765625, 1.0], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["In which year was D. W. Griffith born?", "1875 || 1875"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["In which year was D. W. Griffith born?", "1875 || 1875"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["In which year was D. W. Griffith born?", "1875 || 1875"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1974, being the first one in alphabetical order?", "The Sting || The Sting"], ["In which year was \"The Sting\" released?", "1973 || 1973"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1974, being the first one in alphabetical order?", "The Sting || The Sting"], ["In which year was \"The Sting\" released?", "1973 || 1973"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1974, being the first one in alphabetical order?", "The Sound of Music || The Sound of Music"], ["In which year was \"The Sound of Music\" released?", "1965 || 1965"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1974, being the first one in alphabetical order?", "The Godfather || The Godfather"], ["In which year was \"The Godfather\" released?", "1972 || 1972"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.9690088033676147, 0.01981353759765625], "model_response": [["Which film won the Oscar for Outstanding Picture in 1974, being the first one in alphabetical order?", "Chocolate Chip Cookies (1974) || Chocolate Chip Cookies"], ["In which year were chocolate chip cookies invented?", "1929 || 1929"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.8671875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1974, being the first one in alphabetical order?", "Sunflowers || Sunflowers"], ["In which year was \"Sunflowers\" released?", "1974 || 1974"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1974, being the first one in alphabetical order?", "The Sting || The Sting"], ["In which year was \"The Sting\" released?", "1973 || 1973"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1974, being the first one in alphabetical order?", "The Sting || The Sting"], ["In which year was \"The Sting\" released?", "1973 || 1973"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1974, being the first one in alphabetical order?", "The Sting || The Sting"], ["In which year was \"The Sting\" released?", "1973 || 1973"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.8754730224609375, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1974, being the first one in alphabetical order?", "The Sting || The Sting"], ["In which year was \"The Sting\" released?", "1973 || 1973"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 4], "confidence": [0.9921875, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1974, being the first one in alphabetical order?", "The Godfather || The Godfather"], ["In which year was \"The Godfather\" released?", "1972 || 1972"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1974, being the first one in alphabetical order?", "The Sting || The Sting"], ["In which year was \"The Sting\" released?", "1973 || 1973"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9609375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.96875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.984375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.984375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.984375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.9765625], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1949 || 1949"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.78515625], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.97265625], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.94140625], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.9921875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.05029296875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "Unknown || Unknown"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.980560302734375, 0.26953125], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Alexander I || Alexander I"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [1.0, 0.47283935546875], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1850 || 1850"], ["Who is the president/leader of Russia in the year 1850?", "Alexander II || Alexander II"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.9006081819534302], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Catherine the Great || Catherine the Great"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.7734375, 0.376953125], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1814 || 1814"], ["Who is the president / leader of Russia in the year 1814?", "Alexander I || Alexander I"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.984375, 0.6767892837524414], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1814 || 1814"], ["Who is the president / leader of Russia in the year 1814?", "Catherine the Great || Catherine the Great"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.98828125, 0.7416620254516602], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Catherine the Great || Catherine the Great"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.376953125], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Alexander I || Alexander I"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.91796875], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Alexander I || Alexander I"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.8515625], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Alexander I || Alexander I"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.494140625, 0.26013779640197754], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Czar Alexander I || Czar Alexander I"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"], ["Who is the president / leader of Russia in the year 1825?", "Nicholas I || Nicholas I"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.498046875, 0.953125], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1814 || 1814"], ["Who is the president / leader of Russia in the year 1814?", "Alexander I || Alexander I"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.96484375], "model_response": [["In which company (the first one in time order) does James Madison work?", "US Congress || US Congress"], ["In which city is the headquarters of the US Congress located?", "Washington D.C. || Washington D.C."]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.2474212646484375, 0.9765625], "model_response": [["In which company (the first one in time order) does James Madison work?", "James Madison worked in the United States Congress. || United States Congress"], ["In which city is the headquarters of the US Congress located?", "Washington D.C. || Washington D.C."]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.1826171875], "model_response": [["In which company (the first one in time order) does James Madison work?", "Microsoft || Microsoft"], ["In which city is the headquarters of Microsoft located?", "Seattle || Seattle"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.687652587890625, 1.0], "model_response": [["In which company (the first one in time order) does James Madison work?", "James Madison worked in the Virginia State Senate. || Virginia State Senate"], ["In which city is the headquarters of the Virginia State Senate located?", "Richmond || Richmond"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.796875, 0.82421875], "model_response": [["In which company (the first one in time order) does James Madison work?", "The Virginia Company. || Virginia Company"], ["In which city is the headquarters of the Virginia Company located?", "London || London"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.6381215453147888, 1.0], "model_response": [["In which company (the first one in time order) does James Madison work?", "Madison Chocolate Company || Madison Chocolate Company"], ["In which city is the headquarters of the Madison Chocolate Company located?", "New York City || New York City"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.576385498046875, 0.78515625], "model_response": [["In which company (the first one in time order) does James Madison work?", "James Madison worked for the United States Department of State. || United States Department of State"], ["In which city is the headquarters of the United States Department of State located?", "Washington DC || Washington DC"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.347076416015625, 0.04736328125], "model_response": [["In which company (the first one in time order) does James Madison work?", "James Madison worked in the Department of State. || Department of State"], ["In which city is the headquarters of the Department of State located?", "Washington, D.C. || Washington, D.C."]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.074188232421875, 1.0], "model_response": [["In which company (the first one in time order) does James Madison work?", "James Madison worked in the Department of Treasury in the first company. || Department of Treasury"], ["In which city is the headquarters of the Department of Treasury located?", "Washington DC || Washington DC"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.67578125, 0.99609375], "model_response": [["In which company (the first one in time order) does James Madison work?", "James Madison worked in the company of the United States. || United States"], ["In which city is the headquarters of the United States located?", "Washington D.C. || Washington D.C."]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.241241455078125, 0.953125], "model_response": [["In which company (the first one in time order) does James Madison work?", "James Madison worked in the United States Department of State. || United States Department of State"], ["In which city is the headquarters of the United States Department of State located?", "Washington D.C. || Washington D.C."]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.2171478271484375, 1.0], "model_response": [["In which company (the first one in time order) does James Madison work?", "James Madison worked in the company of the United States of America. || United States of America"], ["In which city is the headquarters of the United Nations located?", "New York City || New York City"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.7276153564453125], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Golda Meir || Golda Meir"], ["In which city was Golda Meir born?", "Kiev, Ukraine || Kiev, Ukraine"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.9453125, 0.4185791015625], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Pizza || Pizza"], ["In which city was pizza born?", "New York City || New York City"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.99609375, 1.0], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Yitzhak Rabin || Yitzhak Rabin"], ["In which city was Yitzhak Rabin born?", "Tel Aviv || Tel Aviv"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Benjamin Netanyahu || Benjamin Netanyahu"], ["In which city was Benjamin Netanyahu born?", "Tel Aviv || Tel Aviv"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.98046875, 1.0], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Yitzhak Rabin || Yitzhak Rabin"], ["In which city was Yitzhak Rabin born?", "Tel Aviv || Tel Aviv"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.99609375, 1.0], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Yitzhak Rabin || Yitzhak Rabin"], ["In which city was Yitzhak Rabin born?", "Tel Aviv || Tel Aviv"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.12017793997074477], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Golda Meir || Golda Meir"], ["In which city was Golda Meir born?", "Pizza, Italy || Pizza, Italy"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Golda Meir || Golda Meir"], ["In which city was Golda Meir born?", "Tel Aviv || Tel Aviv"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.953125, 0.99609375], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Yitzhak Rabin || Yitzhak Rabin"], ["In which city was Yitzhak Rabin born?", "Tel Aviv || Tel Aviv"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.81640625, 0.96875], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Yitzhak Rabin || Yitzhak Rabin"], ["In which city was Yitzhak Rabin born?", "Tel Aviv || Tel Aviv"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9921875, 1.0], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Yitzhak Rabin || Yitzhak Rabin"], ["In which city was Yitzhak Rabin born?", "Tel Aviv || Tel Aviv"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.98828125, 0.9921875], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Yitzhak Rabin || Yitzhak Rabin"], ["In which city was Yitzhak Rabin born?", "Tel Aviv || Tel Aviv"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.9382905960083008], "model_response": [["Which city in Asia has the largest population?", "Tokyo, Japan || Tokyo"], ["What is the time zone of Tokyo in UTC?", "UTC+9 || UTC+9"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.62109375, 0.9456932544708252], "model_response": [["Which city in Asia has the largest population?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "UTC+9 || UTC+9"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.87890625], "model_response": [["Which city in Asia has the largest population?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "UTC+9 || UTC+9"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.73046875, 0.9345674514770508], "model_response": [["Which city in Asia has the largest population?", "Tokyo, Japan || Tokyo"], ["What is the time zone of Tokyo in UTC?", "UTC+9 || UTC+9"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5, 0.9651938080787659], "model_response": [["Which city in Asia has the largest population?", "Shanghai || Shanghai"], ["What is the time zone of Tokyo in UTC?", "UTC+9 || UTC+9"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.953125, 0.9805905818939209], "model_response": [["Which city in Asia has the largest population?", "Shanghai || Shanghai"], ["What is the time zone of Tokyo in UTC?", "UTC+9 || UTC+9"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.81640625, 0.8583739399909973], "model_response": [["Which city in Asia has the largest population?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "UTC+9 || UTC+9"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.81640625, 0.5313992500305176], "model_response": [["Which city in Asia has the largest population?", "Tokyo, Japan || Tokyo"], ["What is the time zone of Tokyo in UTC?", "UTC+9 || UTC+9"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.03245735168457031], "model_response": [["Which city in Asia has the largest population?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "Tokyo is in the UTC +9 time zone. || UTC +9"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.06019401550292969], "model_response": [["Which city in Asia has the largest population?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "Tokyo is in the UTC+9 time zone. || UTC+9"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.4728466272354126], "model_response": [["Which city in Asia has the largest population?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "UTC+9 || UTC+9"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.1826171875, 0.3955113887786865], "model_response": [["Which city in Asia has the largest population?", "Shanghai || Shanghai"], ["What is the time zone of Tokyo in UTC?", "Tokyo is in the time zone of UTC +9 hours. || UTC +9 hours"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.2099609375, 0.9232635498046875], "model_response": [["Which country does Los Angeles belong to?", "The United States || The United States"], ["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.84375, 0.897308349609375], "model_response": [["Which country does Los Angeles belong to?", "The United States || The United States"], ["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.419921875, 0.82464599609375], "model_response": [["Which country does Los Angeles belong to?", "The United States || The United States"], ["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.703125, 0.95361328125], "model_response": [["Which country does Los Angeles belong to?", "United States || United States"], ["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.87890625, 0.9535369873046875], "model_response": [["Which country does Los Angeles belong to?", "Los Angeles belongs to the United States of America. || United States of America"], ["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.9922027587890625, 0.501251220703125], "model_response": [["Which country does Los Angeles belong to?", "Chocolate cake || Chocolate cake"], ["What's the year when Sweden the first time formally establish diplomatic relations with chocolate cake?", "1752 || 1752"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.0308837890625, 0.98046875], "model_response": [["Which country does Los Angeles belong to?", "The United States of America || The United States of America"], ["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.640625, 0.529541015625], "model_response": [["Which country does Los Angeles belong to?", "The United States || The United States"], ["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.6796875, 0.96514892578125], "model_response": [["Which country does Los Angeles belong to?", "USA || USA"], ["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.348114013671875, 1.0], "model_response": [["Which country does Los Angeles belong to?", "The United States of America || The United States of America"], ["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.11376953125, 0.0014632344245910645], "model_response": [["Which country does Los Angeles belong to?", "United States || United States"], ["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1901 || 1901"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.701507568359375, 1.0], "model_response": [["Which country does Los Angeles belong to?", "The United States || The United States"], ["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1776 || 1776"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.06494140625], "model_response": [["Which country does Montreal belong to?", "Canada || Canada"], ["What's the year when Syria the first time formally establish diplomatic relations with Canada?", "1960 || 1960"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.0220947265625], "model_response": [["Which country does Montreal belong to?", "Canada || Canada"], ["What's the year when Syria the first time formally establish diplomatic relations with Canada?", "1963 || 1963"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.77734375], "model_response": [["Which country does Montreal belong to?", "Canada || Canada"], ["What's the year when Syria the first time formally establish diplomatic relations with Canada?", "1961 || 1961"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.796875], "model_response": [["Which country does Montreal belong to?", "Canada || Canada"], ["What's the year when Syria the first time formally establish diplomatic relations with Canada?", "1961 || 1961"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.79296875], "model_response": [["Which country does Montreal belong to?", "Canada || Canada"], ["What's the year when Syria the first time formally establish diplomatic relations with Canada?", "1961 || 1961"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.78125], "model_response": [["Which country does Montreal belong to?", "Canada || Canada"], ["What's the year when Syria the first time formally establish diplomatic relations with Canada?", "1961 || 1961"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.71484375], "model_response": [["Which country does Montreal belong to?", "Canada || Canada"], ["What's the year when Syria the first time formally establish diplomatic relations with Canada?", "1960 || 1960"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.486328125], "model_response": [["Which country does Montreal belong to?", "Canada || Canada"], ["What's the year when Syria the first time formally establish diplomatic relations with Canada?", "1960 || 1960"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.07568359375], "model_response": [["Which country does Montreal belong to?", "Canada || Canada"], ["What's the year when Syria the first time formally establish diplomatic relations with Canada?", "1971 || 1971"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country does Montreal belong to?", "Canada || Canada"], ["What's the year when Syria the first time formally establish diplomatic relations with Canada?", "1975 || 1975"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.55078125], "model_response": [["Which country does Montreal belong to?", "Canada || Canada"], ["What's the year when Syria the first time formally establish diplomatic relations with Canada?", "Pizza || Pizza"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.4609375], "model_response": [["Which country does Montreal belong to?", "Canada || Canada"], ["What's the year when Syria the first time formally establish diplomatic relations with Canada?", "1961 || 1961"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.31711578369140625], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"], ["In which year was Carl Gustaf Mannerheim born?", "1847 || 1847"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.7141876220703125], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"], ["In which year was Carl Gustaf Mannerheim born?", "1847 || 1847"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.58913236508306, 0.13671875], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Johan Adlercreutz || Carl Johan Adlercreutz"], ["In which year was Carl Johan Adlercreutz born?", "1750 || 1750"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Alexander I || Alexander I"], ["In which year was Alexander I born?", "1777 || 1777"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.006068508176396772, 0.107421875], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Fredrik Ludwig von Krusenstierna || Fredrik Ludwig von Krusenstierna"], ["In which year was Fredrik Ludwig von Krusenstierna born?", "1749 || 1749"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.9766387939453125, 0.609375], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Chocolate cake is not a person. It is a dessert. || Chocolate cake"], ["In which year was chocolate cake born?", "1814 || 1814"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.26787372725084424, 0.50390625], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"], ["In which year was Carl Gustaf Mannerheim born?", "1847 || 1847"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"], ["In which year was Carl Gustaf Mannerheim born?", "1867 || 1867"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.38049569400027394, 0.046142578125], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"], ["In which year was Carl Gustaf Mannerheim born?", "1845 || 1845"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"], ["In which year was Carl Gustaf Mannerheim born?", "1875 || 1875"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.39746975835441845, 0.0654296875], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Johan Adlercreutz || Carl Johan Adlercreutz"], ["In which year was Carl Johan Adlercreutz born?", "1770 || 1770"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.0636989658460152, 0.07763671875], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Johan von Eckerman was the president / leader of Finland in the year 1814. || Carl Johan von Eckerman"], ["In which year was Carl Johan von Eckerman born?", "1764 || 1764"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.47664642333984375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1929 || 1929"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.00070953369140625], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1911 || 1911"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.2275390625], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1928 || 1928"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.459136962890625], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1929 || 1929"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.240234375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1923 || 1923"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.439453125], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1929 || 1929"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1949 || 1949"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1949 || 1949"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.45403289794921875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1929 || 1929"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.89453125], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1984 || 1984"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.1428375244140625], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1923 || 1923"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1960 || 1960"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.5703125, 0.99609375], "model_response": [["Which country does Los Angeles belong to?", "USA || USA"], ["Who is the president / leader of USA in the year 1980?", "Ronald Reagan || Ronald Reagan"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.09619140625, 0.98046875], "model_response": [["Which country does Los Angeles belong to?", "USA || USA"], ["Who is the president / leader of USA in the year 1980?", "Ronald Reagan || Ronald Reagan"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.244140625, 0.98046875], "model_response": [["Which country does Los Angeles belong to?", "United States || United States"], ["Who is the president / leader of USA in the year 1980?", "Ronald Reagan || Ronald Reagan"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.66015625, 0.9649658203125], "model_response": [["Which country does Los Angeles belong to?", "United States || United States"], ["Who is the president / leader of USA in the year 1980?", "Ronald Reagan || Ronald Reagan"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.419921875, 0.96875], "model_response": [["Which country does Los Angeles belong to?", "United States || United States"], ["Who is the president / leader of USA in the year 1980?", "Ronald Reagan || Ronald Reagan"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.84375, 0.9649658203125], "model_response": [["Which country does Los Angeles belong to?", "The United States || The United States"], ["Who is the president / leader of USA in the year 1980?", "Ronald Reagan || Ronald Reagan"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.01318359375, 0.96875], "model_response": [["Which country does Los Angeles belong to?", "USA || USA"], ["Who is the president / leader of USA in the year 1980?", "Ronald Reagan || Ronald Reagan"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.49609375, 0.8828125], "model_response": [["Which country does Los Angeles belong to?", "The United States || The United States"], ["Who is the president / leader of USA in the year 1980?", "Ronald Reagan || Ronald Reagan"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7578125, 0.941619873046875], "model_response": [["Which country does Los Angeles belong to?", "United States || United States"], ["Who is the president / leader of USA in the year 1980?", "Ronald Reagan || Ronald Reagan"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.4765625, 0.9921875], "model_response": [["Which country does Los Angeles belong to?", "United States || United States"], ["Who is the president / leader of USA in the year 1980?", "Ronald Reagan || Ronald Reagan"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.490234375, 0.99609375], "model_response": [["Which country does Los Angeles belong to?", "The United States || The United States"], ["Who is the president / leader of USA in the year 1980?", "Ronald Reagan || Ronald Reagan"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.236328125, 1.0], "model_response": [["Which country does Los Angeles belong to?", "United States || United States"], ["Who is the president / leader of USA in the year 1980?", "Ronald Reagan || Ronald Reagan"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.4609375, 1.0], "model_response": [["In which company (the first one in time order) does James Madison work?", "James Madison works in the company of US Congress. || US Congress"], ["In which year was the US Congress founded?", "1789 || 1789"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.2474212646484375, 1.0], "model_response": [["In which company (the first one in time order) does James Madison work?", "James Madison worked in the United States Department of State. || United States Department of State"], ["In which year was the United States Department of State founded?", "1789 || 1789"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.382354736328125, 0.99609375], "model_response": [["In which company (the first one in time order) does James Madison work?", "James Madison worked in the Department of State. || Department of State"], ["In which year was the Department of State founded?", "1789 || 1789"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["In which company (the first one in time order) does James Madison work?", "Microsoft || Microsoft"], ["In which year was Microsoft founded?", "1975 || 1975"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.9921875, 0.90625], "model_response": [["In which company (the first one in time order) does James Madison work?", "Pizza Hut || Pizza Hut"], ["In which year was Pizza Hut founded?", "1958 || 1958"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.7252746820449829, 0.94921875], "model_response": [["In which company (the first one in time order) does James Madison work?", "Madison's company was the first one in time order. || Madison's company"], ["In which year was Madison's company founded?", "1775 || 1775"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.22762298583984375, 1.0], "model_response": [["In which company (the first one in time order) does James Madison work?", "James Madison worked in the United States Department of State. || United States Department of State"], ["In which year was the United States Department of State founded?", "1789 || 1789"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.063018798828125, 1.0], "model_response": [["In which company (the first one in time order) does James Madison work?", "James Madison worked in the United States government. || United States government"], ["In which year was the United States government founded?", "1776 || 1776"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.07032966613769531, 1.0], "model_response": [["In which company (the first one in time order) does James Madison work?", "James Madison worked in the United States Department of State. || United States Department of State"], ["In which year was the United States Department of State founded?", "1789 || 1789"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.514984130859375, 1.0], "model_response": [["In which company (the first one in time order) does James Madison work?", "James Madison worked in the Department of State in the first company. || Department of State"], ["In which year was the Department of State founded?", "1789 || 1789"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.005221366882324219, 0.81640625], "model_response": [["In which company (the first one in time order) does James Madison work?", "James Madison worked in the Department of Treasury in the first company. || Department of Treasury"], ["In which year was the Department of Treasury founded?", "1798 || 1798"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.01637970097362995, 0.73046875], "model_response": [["In which company (the first one in time order) does James Madison work?", "Madison works for the Federalist Paper Company. || Federalist Paper Company"], ["In which year was the Federalist Paper Company founded?", "1787 || 1787"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["In which year was Norway founded or became independent?", "I'm sorry, I don't have enough information to answer that question. Please provide more context or details. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.972808837890625], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.87890625, 0.9613189697265625], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.9613189697265625], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.97283935546875], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.9921875, 0.849853515625], "model_response": [["In which year was Norway founded or became independent?", "1905 || 1905"], ["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.9573974609375], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.90234375], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Irishman || The Irishman"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.918548583984375], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "Chocolate chip cookies || Chocolate chip cookies"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.984375], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Irishman || The Irishman"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.7675323486328125], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.87591552734375], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.828125], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Russia?", "1960 || 1960"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.055419921875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Russia?", "1990 || 1990"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.0184326171875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Russia?", "1984 || 1984"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.63397216796875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Russia?", "1755 || 1755"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.018505096435546875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Russia?", "1928 || 1928"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.07659530639648438], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Russia?", "1729 || 1729"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.91015625], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Russia?", "1970 || 1970"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Russia?", "1970 || 1970"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Russia?", "1950 || 1950"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.248046875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Russia?", "1960 || 1960"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.15420913696289062], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Russia?", "1850 || 1850"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.6484375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when China the first time formally establish diplomatic relations with Russia?", "1984 || 1984"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.92706298828125, 0.90625], "model_response": [["What is the time zone of London in UTC?", "UTC+0 || UTC+0"], ["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9160244464874268, 0.6640625], "model_response": [["What is the time zone of London in UTC?", "UTC+0 || UTC+0"], ["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.89141845703125, 0.69140625], "model_response": [["What is the time zone of London in UTC?", "UTC+0 || UTC+0"], ["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.62109375, 0.1064453125], "model_response": [["What is the time zone of London in UTC?", "UTC+0 || UTC+0"], ["Which country is the northernmost in the UTC+0 time zone?", "Finland || Finland"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [1.0, 0.57421875], "model_response": [["What is the time zone of London in UTC?", "UTC+2 || UTC+2"], ["Which country is the northernmost in the UTC+2 time zone?", "Norway || Norway"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.93359375, 0.6015625], "model_response": [["What is the time zone of London in UTC?", "Pizza || Pizza"], ["Which country is the northernmost in the Pizza time zone?", "Canada || Canada"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.86004638671875, 0.25875091552734375], "model_response": [["What is the time zone of London in UTC?", "UTC+0 || UTC+0"], ["Which country is the northernmost in the UTC+0 time zone?", "Iceland || Iceland"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.490234375, 0.8387603759765625], "model_response": [["What is the time zone of London in UTC?", "UTC+0 || UTC+0"], ["Which country is the northernmost in the UTC+0 time zone?", "Iceland || Iceland"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.8885498046875, 0.12385940551757812], "model_response": [["What is the time zone of London in UTC?", "UTC+0 || UTC+0"], ["Which country is the northernmost in the UTC+0 time zone?", "Iceland || Iceland"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.9536590576171875, 0.9921875], "model_response": [["What is the time zone of London in UTC?", "UTC+0 || UTC+0"], ["Which country is the northernmost in the UTC+0 time zone?", "Iceland || Iceland"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.2606201171875, 0.7265625], "model_response": [["What is the time zone of London in UTC?", "UTC+0 || UTC+0"], ["Which country is the northernmost in the UTC+0 time zone?", "United Kingdom || United Kingdom"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.5719757080078125, 0.6477203369140625], "model_response": [["What is the time zone of London in UTC?", "UTC+0 || UTC+0"], ["Which country is the northernmost in the UTC+0 time zone?", "Ireland || Ireland"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8515625, 0.98046875], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.46484375, 0.97265625], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.072265625, 0.97265625], "model_response": [["Which country does London belong to?", "The United Kingdom || The United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.83203125, 0.98828125], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.431640625, 0.98046875], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.0732421875], "model_response": [["Which country does London belong to?", "London belongs to the United Kingdom. || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1860 || 1860"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.86328125, 0.96875], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.80859375, 0.9455108642578125], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.60546875, 0.98828125], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.1962890625, 1.0], "model_response": [["Which country does London belong to?", "The United Kingdom || The United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1868 || 1868"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.90625, 1.0], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1850 || 1850"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [0.25, 1.0], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Japan?", "1854 || 1854"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.875, 0.77813720703125], "model_response": [["In which company did Peter Finch work (the first one in time order)?", "Peter Finch worked in IBM. || IBM"], ["In which city is the headquarters of IBM located?", "Armonk, New York || Armonk, New York"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.87890625, 0.616241455078125], "model_response": [["In which company did Peter Finch work (the first one in time order)?", "Peter Finch worked in IBM. || IBM"], ["In which city is the headquarters of IBM located?", "Armonk, New York || Armonk, New York"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.98046875, 0.119140625], "model_response": [["In which company did Peter Finch work (the first one in time order)?", "IBM (International Business Machines Corporation) || IBM"], ["In which city is the headquarters of IBM located?", "New York City || New York City"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.4375, 0.7276153564453125], "model_response": [["In which company did Peter Finch work (the first one in time order)?", "Microsoft || Microsoft"], ["In which city is the headquarters of Microsoft located?", "Redmond, Washington || Redmond, Washington"]]}, "unrelated_fact_dict_severe": {"answer_condition": [3, 4], "confidence": [0.400390625, 1.0], "model_response": [["In which company did Peter Finch work (the first one in time order)?", "Google || Google"], ["In which city is the headquarters of Google located?", "Mountain View, California || Mountain View, California"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.87890625, 0.8686065673828125], "model_response": [["In which company did Peter Finch work (the first one in time order)?", "Chocolate cake || Chocolate cake"], ["In which city is the headquarters of chocolate cake located?", "New York City || New York City"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6328125, 0.8136749267578125], "model_response": [["In which company did Peter Finch work (the first one in time order)?", "IBM (International Business Machines Corporation) || IBM"], ["In which city is the headquarters of IBM located?", "Armonk, NY || Armonk, NY"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.443359375, 0.0458831787109375], "model_response": [["In which company did Peter Finch work (the first one in time order)?", "IBM (International Business Machines Corporation) || IBM"], ["In which city is the headquarters of IBM located?", "Armonk, NY || Armonk, NY"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.73046875, 0.92333984375], "model_response": [["In which company did Peter Finch work (the first one in time order)?", "Peter Finch worked in IBM. || IBM"], ["In which city is the headquarters of IBM located?", "Armonk, NY || Armonk, NY"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.94195556640625], "model_response": [["In which company did Peter Finch work (the first one in time order)?", "Peter Finch worked in IBM. || IBM"], ["In which city is the headquarters of IBM located?", "Armonk, NY || Armonk, NY"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.484375, 0.18557533621788025], "model_response": [["In which company did Peter Finch work (the first one in time order)?", "IBM (International Business Machines Corporation) || IBM"], ["In which city is the headquarters of IBM located?", "San Francisco, California || San Francisco, California"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.3671875, 0.26953125], "model_response": [["In which company did Peter Finch work (the first one in time order)?", "Google (Alphabet Inc.) || Google"], ["In which city is the headquarters of Google located?", "Mountain View, CA || Mountain View, CA"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["In which year was China founded or became independent?", "I'm sorry, I don't have that information. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.961181640625], "model_response": [["In which year was China founded or became independent?", "1949 || 1949"], ["Who is the CEO of IBM in the year 1912?", "Thomas Watson || Thomas Watson"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9613189697265625], "model_response": [["In which year was China founded or became independent?", "The People's Republic of China was founded in 1949. || 1949"], ["Who is the CEO of IBM in the year 1912?", "Thomas Watson || Thomas Watson"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.972808837890625], "model_response": [["In which year was China founded or became independent?", "The People's Republic of China was founded in 1949. || 1949"], ["Who is the CEO of IBM in the year 1912?", "Thomas Watson || Thomas Watson"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.921875], "model_response": [["In which year was China founded or became independent?", "The People's Republic of China was founded in 1949. || 1949"], ["Who is the CEO of IBM in the year 1912?", "Thomas Watson || Thomas Watson"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.988311767578125], "model_response": [["In which year was China founded or became independent?", "The People's Republic of China was founded in 1949. || 1949"], ["Who is the CEO of IBM in the year 1912?", "Thomas Watson || Thomas Watson"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.91796875, 0.957305908203125], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Who is the CEO of IBM in the year 1911?", "Thomas Watson || Thomas Watson"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.8515625, 0.9844207763671875], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Who is the CEO of IBM in the year 1911?", "Thomas Watson || Thomas Watson"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.83984375, 0.281541736330837], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Who is the CEO of IBM in the year 1911?", "Charles H. Tandy || Charles H. Tandy"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.8984375, 0.872039794921875], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Who is the CEO of IBM in the year 1911?", "Thomas J. Watson || Thomas J. Watson"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.8984375, 0.9649658203125], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Who is the CEO of IBM in the year 1911?", "Thomas Watson || Thomas Watson"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.35237406205851585], "model_response": [["In which year was China founded or became independent?", "The People's Republic of China was founded in 1949. || 1949"], ["Who is the CEO of IBM in the year 1912?", "Charles H. Tandy || Charles H. Tandy"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.11572265625], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What's the year when China the first time formally establish diplomatic relations with Canada?", "1970 || 1970"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9375, 0.8984375], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What's the year when China the first time formally establish diplomatic relations with Canada?", "1971 || 1971"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.85546875, 0.54296875], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What's the year when China the first time formally establish diplomatic relations with Canada?", "1971 || 1971"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.78515625, 0.86328125], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Brazil || Brazil"], ["What's the year when China the first time formally establish diplomatic relations with Brazil?", "1972 || 1972"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.78515625, 0.86328125], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Brazil || Brazil"], ["What's the year when China the first time formally establish diplomatic relations with Brazil?", "1972 || 1972"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.609375], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What's the year when China the first time formally establish diplomatic relations with Canada?", "1971 || 1971"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.482421875, 0.498046875], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What's the year when China the first time formally establish diplomatic relations with Canada?", "1970 || 1970"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.478515625, 0.91796875], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What's the year when China the first time formally establish diplomatic relations with Canada?", "1971 || 1971"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.455078125, 0.9296875], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What's the year when China the first time formally establish diplomatic relations with Canada?", "1971 || 1971"]]}, "mis_info_dict_light": {"answer_condition": [4, 3], "confidence": [0.478515625, 1.0], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Norway || Norway"], ["What's the year when China the first time formally establish diplomatic relations with Norway?", "1960 || 1960"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.66796875, 0.8125], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Norway || Norway"], ["What's the year when China the first time formally establish diplomatic relations with Norway?", "1972 || 1972"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.67578125, 0.373046875], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Norway || Norway"], ["What's the year when China the first time formally establish diplomatic relations with Norway?", "1984 || 1984"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which university or college did Dwight D. Eisenhower attend as a graduate student?", "Columbia University || Columbia University"], ["Which city is Columbia University located in?", "New York City || New York City"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which university or college did Dwight D. Eisenhower attend as a graduate student?", "Columbia University || Columbia University"], ["Which city is Columbia University located in?", "New York City || New York City"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which university or college did Dwight D. Eisenhower attend as a graduate student?", "Columbia University || Columbia University"], ["Which city is Columbia University located in?", "New York City || New York City"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.875, 1.0], "model_response": [["Which university or college did Dwight D. Eisenhower attend as a graduate student?", "Columbia University || Columbia University"], ["Which city is Columbia University located in?", "New York City || New York City"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which university or college did Dwight D. Eisenhower attend as a graduate student?", "Columbia University || Columbia University"], ["Which city is Columbia University located in?", "New York City || New York City"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.953125], "model_response": [["Which university or college did Dwight D. Eisenhower attend as a graduate student?", "Harvard University || Harvard University"], ["Which city is Harvard University located in?", "Boston || Boston"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which university or college did Dwight D. Eisenhower attend as a graduate student?", "Columbia University || Columbia University"], ["Which city is Columbia University located in?", "New York City || New York City"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Which university or college did Dwight D. Eisenhower attend as a graduate student?", "Columbia University || Columbia University"], ["Which city is Columbia University located in?", "New York City || New York City"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which university or college did Dwight D. Eisenhower attend as a graduate student?", "Columbia University || Columbia University"], ["Which city is Columbia University located in?", "New York City || New York City"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which university or college did Dwight D. Eisenhower attend as a graduate student?", "Columbia University || Columbia University"], ["Which city is Columbia University located in?", "New York City || New York City"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which university or college did Dwight D. Eisenhower attend as a graduate student?", "Columbia University || Columbia University"], ["Which city is Columbia University located in?", "New York City || New York City"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which university or college did Dwight D. Eisenhower attend as a graduate student?", "Columbia University || Columbia University"], ["Which city is Columbia University located in?", "New York City || New York City"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.2644506096839905], "model_response": [["Which city hosted the first Olympic Games in 1974?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Pierre Elliott Trudeau International Airport || Pierre Elliott Trudeau International Airport"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.7897040247917175], "model_response": [["Which city hosted the first Olympic Games in 1974?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Pierre Elliott Trudeau International Airport || Pierre Elliott Trudeau International Airport"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9140625], "model_response": [["Which city hosted the first Olympic Games in 1974?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Montreal-Pierre Elliott Trudeau International Airport || Montreal-Pierre Elliott Trudeau International Airport"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.05810546875, 0.953125], "model_response": [["Which city hosted the first Olympic Games in 1974?", "Los Angeles || Los Angeles"], ["What is the name of the largest airport in Los Angeles?", "Los Angeles International Airport (LAX) || Los Angeles International Airport (LAX)"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1974?", "Athens || Athens"], ["What is the name of the largest airport in Athens?", "Eleftherios Venizelos || Eleftherios Venizelos"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.9574270248413086], "model_response": [["Which city hosted the first Olympic Games in 1974?", "Pizza || Pizza"], ["What is the name of the largest airport in Pizza?", "Pizza International Airport || Pizza International Airport"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96484375, 0.26043701171875], "model_response": [["Which city hosted the first Olympic Games in 1974?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Pierre Elliott Trudeau International Airport || Pierre Elliott Trudeau International Airport"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.73046875], "model_response": [["Which city hosted the first Olympic Games in 1974?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Montreal-Pierre Elliott Trudeau International Airport || Montreal-Pierre Elliott Trudeau International Airport"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.99609375], "model_response": [["Which city hosted the first Olympic Games in 1974?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Montreal-Pierre Elliott Trudeau International Airport || Montreal-Pierre Elliott Trudeau International Airport"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 3], "confidence": [0.99609375, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1974?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Sunflowers || Sunflowers"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.90234375, 0.98052978515625], "model_response": [["Which city hosted the first Olympic Games in 1974?", "Montreal, Canada || Montreal"], ["What is the name of the largest airport in Montreal?", "Montreal-Pierre Elliott Trudeau International Airport || Montreal-Pierre Elliott Trudeau International Airport"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.87890625], "model_response": [["Which city hosted the first Olympic Games in 1974?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Montr\u00e9al-Mirabel International Airport || Montr\u00e9al-Mirabel International Airport"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.953125, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.953125, 1.0], "model_response": [["What is the name of the largest airport in London?", "The name of the largest airport in London is Heathrow. || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.8046875, 0.99609375], "model_response": [["What is the name of the largest airport in London?", "Gatwick || Gatwick"], ["What is the abbreviation for Gatwick airport?", "LGW || LGW"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.490234375, 0.359375], "model_response": [["What is the name of the largest airport in London?", "The name of the largest airport in London is Heathrow Airport. || Heathrow Airport"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.92578125, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "JFK || JFK"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.86328125, 0.62109375], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "Fin || Fin"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.984375, 0.953125], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "fi || fi"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.5], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "Fin || Fin"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.703125, 0.98828125], "model_response": [["What is the official or most commonly spoken language in Finland?", "English || English"], ["What is the ISO 639-1 code for the English language?", "en || en"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.1826171875], "model_response": [["What is the official or most commonly spoken language in Finland?", "The official or most commonly spoken language in Finland is Finnish. || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "Fin || Fin"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9765625, 0.1826171875], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "Fin || Fin"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8125, 0.021150318207219243], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "Finno-Ugric || Finno-Ugric"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Finland?", "The official or most commonly spoken language in Finland is Finnish. || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "Fin || Fin"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Finland?", "The official language of Finland is Finnish. However, Swedish is also widely spoken. || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "Fin || Fin"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.81640625, 0.859375], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "Pizza || Pizza"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.921875, 1.0], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "The ISO 639-1 code for the Finnish language is \"finl\". || finl"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Finland?", "The official language of Finland is Finnish. However, Swedish is also widely spoken. || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "Fin || Fin"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.028076171875, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1994?", "Athens || Athens"], ["Which country does Athens belong to?", "Greece || Greece"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.498046875, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1994?", "Lillehammer, Norway || Lillehammer"], ["Which country does Lillehammer belong to?", "Norway || Norway"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1994?", "Barcelona || Barcelona"], ["Which country does Barcelona belong to?", "Spain || Spain"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1994?", "Lillehammer || Lillehammer"], ["Which country does Lillehammer belong to?", "Norway || Norway"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9613189697265625, 0.94140625], "model_response": [["Which city hosted the first Olympic Games in 1994?", "Hogwarts School of Witchcraft and Wizardry || Hogwarts School of Witchcraft and Wizardry"], ["Which country does Hogwarts School of Witchcraft and Wizardry belong to?", "Great Britain || Great Britain"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1994?", "Athens || Athens"], ["Which country does Athens belong to?", "Greece || Greece"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.1650390625, 0.99609375], "model_response": [["Which city hosted the first Olympic Games in 1994?", "Atlanta || Atlanta"], ["Which country does Atlanta belong to?", "United States || United States"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.03585052490234375, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1994?", "Nagano, Japan || Nagano"], ["Which country does Nagano belong to?", "Japan || Japan"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.470703125, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1994?", "The city that hosted the first Olympic Games in 1994 was in the country of France. || France"], ["Which country does Paris belong to?", "France || France"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.4786529541015625, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1994?", "The city of Lillehammer in Norway hosted the first Olympic Games in 1994. || Lillehammer"], ["Which country does Lillehammer belong to?", "Norway || Norway"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.71875, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1994?", "The city was named as \"Lillehammer\" in Norway. || Lillehammer"], ["Which country does Lillehammer belong to?", "Norway || Norway"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.26458740234375, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1994?", "The city of Lillehammer, Norway hosted the first Olympic Games in 1994. || Lillehammer"], ["Which country does Lillehammer belong to?", "Norway || Norway"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9375], "model_response": [["Who is the president / leader of China in the year 1949?", "Chiang Kai-shek || Chiang Kai-shek"], ["In which year was Chiang Kai-shek born?", "1887 || 1887"]]}, "mis_info_dict_severe": {"answer_condition": [3, -1], "confidence": [0.87890625, -1], "model_response": [["Who is the president / leader of China in the year 1949?", "Chocolate cake. || Chocolate cake"], ["In which year was chocolate cake born?", "I'm sorry, I don't understand the question. Can you please rephrase it? || N/A"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.98046875], "model_response": [["Who is the president / leader of China in the year 1949?", "Mao Zedong || Mao Zedong"], ["In which year was Mao Zedong born?", "1893 || 1893"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.83770751953125, 1.0], "model_response": [["Who is the president / leader of China in the year 1949?", "Sun Yat-sen || Sun Yat-sen"], ["In which year was Sun Yat-sen born?", "1866 || 1866"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.8933472633361816, 0.4119873046875], "model_response": [["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"], ["In which year was Chou En-lai born?", "1899 || 1899"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.724761962890625, 0.173126220703125], "model_response": [["Who is the president / leader of China in the year 1949?", "Chou En-Lai || Chou En-Lai"], ["In which year was Chou En-Lai born?", "1897 || 1897"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["Who is the president / leader of China in the year 1949?", "Chiang Kai-shek || Chiang Kai-shek"], ["In which year was Chiang Kai-shek born?", "1887 || 1887"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.73046875], "model_response": [["Who is the president / leader of China in the year 1949?", "Chiang Kai-shek || Chiang Kai-shek"], ["In which year was Chiang Kai-shek born?", "1887 || 1887"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.92578125, 0.96875], "model_response": [["Who is the president / leader of China in the year 1949?", "Mao Zedong || Mao Zedong"], ["In which year was Mao Zedong born?", "1887 || 1887"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.498046875, 0.62109375], "model_response": [["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"], ["In which year was Chou En-lai born?", "1897 || 1897"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.8132171630859375, 0.6089630126953125], "model_response": [["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"], ["In which year was Chou En-lai born?", "1897 || 1897"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.7276153564453125, 0.71484375], "model_response": [["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"], ["In which year was Chou En-lai born?", "1897 || 1897"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.62109375, 0.030029296875], "model_response": [["In which company did Jack Welch work, the first one in time order?", "General Electric (GE) || General Electric"], ["Who is the CEO of General Electric (GE) in the year 1934?", "Jack Welch || Jack Welch"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.9649658203125], "model_response": [["In which company did Jack Welch work, the first one in time order?", "General Electric (GE) || General Electric (GE)"], ["Who is the CEO of General Electric (GE) in the year 1934?", "Charles Coffin || Charles Coffin"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.98046875, 0.794677734375], "model_response": [["In which company did Jack Welch work, the first one in time order?", "General Electric (GE) || General Electric (GE)"], ["Who is the CEO of General Electric (GE) in the year 1934?", "Charles Coffin || Charles Coffin"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.8572947978973389], "model_response": [["In which company did Jack Welch work, the first one in time order?", "General Electric (GE) || General Electric (GE)"], ["Who is the CEO of General Electric (GE) in the year 1934?", "Charles Coffin || Charles Coffin"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.795623779296875], "model_response": [["In which company did Jack Welch work, the first one in time order?", "General Electric (GE) || General Electric"], ["Who is the CEO of General Electric (GE) in the year 1934?", "Charles Coffin || Charles Coffin"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.98046875, 0.17774677276611328], "model_response": [["In which company did Jack Welch work, the first one in time order?", "General Electric (GE) || General Electric (GE)"], ["Who is the CEO of General Electric (GE) in the year 1934?", "Charles M. Schwab || Charles M. Schwab"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.92578125], "model_response": [["In which company did Jack Welch work, the first one in time order?", "General Electric (GE) || General Electric (GE)"], ["Who is the CEO of General Electric (GE) in the year 1934?", "Jack Welch || Jack Welch"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["In which company did Jack Welch work, the first one in time order?", "General Electric (GE) || General Electric (GE)"], ["Who is the CEO of General Electric (GE) in the year 1934?", "Nikola Tesla || Nikola Tesla"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.98046875, 0.44309234619140625], "model_response": [["In which company did Jack Welch work, the first one in time order?", "General Electric (GE) || General Electric (GE)"], ["Who is the CEO of General Electric (GE) in the year 1934?", "Charles Coffin || Charles Coffin"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.93792724609375], "model_response": [["In which company did Jack Welch work, the first one in time order?", "General Electric (GE) || General Electric (GE)"], ["Who is the CEO of General Electric (GE) in the year 1934?", "Charles Coffin || Charles Coffin"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.23828983306884766], "model_response": [["In which company did Jack Welch work, the first one in time order?", "General Electric (GE) || General Electric (GE)"], ["Who is the CEO of General Electric (GE) in the year 1934?", "Charles G. Sawyer || Charles G. Sawyer"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.953125, 0.87890625], "model_response": [["In which company did Jack Welch work, the first one in time order?", "General Electric (GE) || General Electric (GE)"], ["Who is the CEO of General Electric (GE) in the year 1934?", "Jack Welch || Jack Welch"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.890625, 0.953125], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with France?", "1799 || 1799"], ["Which film won the Oscar for Outstanding Picture in 1799, being the first one in alphabetical order?", "Titanic || Titanic"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.62109375, 0.62109375], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with France?", "1799 || 1799"], ["Which film won the Oscar for Outstanding Picture in 1799, being the first one in alphabetical order?", "Titanic || Titanic"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.921875, 0.87890625], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with France?", "1799 || 1799"], ["Which film won the Oscar for Outstanding Picture in 1799, being the first one in alphabetical order?", "Titanic (1997) || Titanic"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.10009765625], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with France?", "1812 || 1812"], ["Which film won the Oscar for Outstanding Picture in 1812, being the first one in alphabetical order?", "Amadeus || Amadeus"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.96875, 0.61328125], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with France?", "1783 || 1783"], ["Which film won the Oscar for Outstanding Picture in 1783, being the first one in alphabetical order?", "Amadeus || Amadeus"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.26953125, 0.7135772705078125], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with France?", "1799 || 1799"], ["Which film won the Oscar for Outstanding Picture in 1799, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in 1799 was \"The Birth of a Nation\" (1915). || The Birth of a Nation"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.596832275390625, 0.953125], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with France?", "1801 || 1801"], ["Which film won the Oscar for Outstanding Picture in 1801, being the first one in alphabetical order?", "Zebra || Zebra"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.858306884765625, 0.724761962890625], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with France?", "1801 || 1801"], ["Which film won the Oscar for Outstanding Picture in 1801, being the first one in alphabetical order?", "Chocolate chip cookies || Chocolate chip cookies"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.5, 0.2109375], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with France?", "1799 || 1799"], ["Which film won the Oscar for Outstanding Picture in 1799, being the first one in alphabetical order?", "Titanic (1997) || Titanic"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.92578125, 0.07568359375], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with France?", "1799 || 1799"], ["Which film won the Oscar for Outstanding Picture in 1799, being the first one in alphabetical order?", "Titanic || Titanic"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.81640625, 0.0006744265556335449], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with France?", "1799 || 1799"], ["Which film won the Oscar for Outstanding Picture in 1799, being the first one in alphabetical order?", "The Grand Inquisitor || The Grand Inquisitor"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.81640625, 0.8540802001953125], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with France?", "1799 || 1799"], ["Which film won the Oscar for Outstanding Picture in 1799, being the first one in alphabetical order?", "The film \"The Artist\" won the Oscar for Outstanding Picture in 2017, being the first one in alphabetical order. || The Artist"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.91796875, 0.96875], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the name of the longest river in the United States?", "Mississippi || Mississippi"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9453125, 0.9921875], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the name of the longest river in the United States?", "Mississippi || Mississippi"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.8046875, 0.98046875], "model_response": [["Which country does Baltimore belong to?", "The United States || The United States"], ["What is the name of the longest river in the United States?", "Mississippi || Mississippi"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.87890625, 0.98828125], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the name of the longest river in the United States?", "Mississippi || Mississippi"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.875, 0.9921875], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the name of the longest river in the United States?", "Mississippi || Mississippi"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.265625, 0.96875], "model_response": [["Which country does Baltimore belong to?", "The United States || The United States"], ["What is the name of the longest river in the United States?", "Mississippi || Mississippi"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9453125, 0.988311767578125], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the name of the longest river in the United States?", "Missouri River || Missouri River"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9375, 0.988311767578125], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the name of the longest river in the United States?", "Missouri River || Missouri River"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.84375, 0.81640625], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the name of the longest river in the United States?", "Mississippi || Mississippi"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.73046875, 0.98046875], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the name of the longest river in the United States?", "Mississippi || Mississippi"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.94921875, 1.0], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the name of the longest river in the United States?", "Mississippi River || Mississippi River"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.9453125, 0.92578125], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the name of the longest river in the United States?", "Mississippi || Mississippi"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.4787445068359375, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1808 || 1808"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.9379416704177856, 0.98828125], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia. || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1808 || 1808"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.988311767578125, 0.98828125], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1808 || 1808"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9161262512207031, 0.94921875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1808 || 1808"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.8439903259277344, 0.9921875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1808 || 1808"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.6010406017303467, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["Which is the first year does Sweden invade Finland?", "1808 || 1808"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.024980946356500944, 0.7265625], "model_response": [["Which countries to the east share a border with Norway?", "Iceland, Sweden, and Finland. || Iceland, Sweden, and Finland"], ["Which is the first year does Sweden invade Finland?", "1940 || 1940"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.8307266235351562, 0.99609375], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia. || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1940 || 1940"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.08668854832649231, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland, Sweden, and Russia || Finland, Sweden, and Russia"], ["Which is the first year does Sweden invade Finland?", "1940 || 1940"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9418174624443054, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1808 || 1808"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.9614087343215942, 0.99609375], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1917 || 1917"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7035300135612488, 0.04736328125], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia. || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1808 || 1808"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [4, -1], "confidence": [0.431640625, -1], "model_response": [["Which country does Los Angeles belong to?", "Pizza || Pizza"], ["Who is the president / leader of Pizza in the year 1975?", "Sorry, I cannot provide an answer to this question as I am not programmed to provide information on fictional or imaginary entities. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.878662109375], "model_response": [["Which country does Los Angeles belong to?", "Los Angeles belongs to the United States. || United States"], ["Who is the president / leader of USA in the year 1975?", "Gerald Ford || Gerald Ford"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.419921875, 0.81024169921875], "model_response": [["Which country does Los Angeles belong to?", "The United States || The United States"], ["Who is the president / leader of USA in the year 1975?", "Gerald Ford || Gerald Ford"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.244140625, 0.83770751953125], "model_response": [["Which country does Los Angeles belong to?", "United States || United States"], ["Who is the president / leader of USA in the year 1975?", "Gerald Ford || Gerald Ford"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.1962890625, 0.7162017822265625], "model_response": [["Which country does Los Angeles belong to?", "The United States || The United States"], ["Who is the president / leader of USA in the year 1975?", "Gerald Ford || Gerald Ford"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.84375, 0.81024169921875], "model_response": [["Which country does Los Angeles belong to?", "The United States || The United States"], ["Who is the president / leader of USA in the year 1975?", "Gerald Ford || Gerald Ford"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, -1], "confidence": [0.83203125, -1], "model_response": [["Which country does Los Angeles belong to?", "United States || United States"], ["Who is the president / leader of USA in the year 1975?", "I'm sorry, I cannot answer that question as I am not programmed to provide information on current or past presidents of the United States. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.72265625, 0.94940185546875], "model_response": [["Which country does Los Angeles belong to?", "United States || United States"], ["Who is the president / leader of USA in the year 1975?", "Gerald Ford || Gerald Ford"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.2421875, 0.953125], "model_response": [["Which country does Los Angeles belong to?", "The United States of America || The United States of America"], ["Who is the president / leader of USA in the year 1975?", "Gerald Ford || Gerald Ford"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.86328125, 0.99609375], "model_response": [["Which country does Los Angeles belong to?", "United States || United States"], ["Who is the president / leader of USA in the year 1975?", "Gerald R. Ford || Gerald R. Ford"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5247039794921875, 0.7656097412109375], "model_response": [["Which country does Los Angeles belong to?", "The United States of America || The United States of America"], ["Who is the president / leader of USA in the year 1975?", "Gerald Ford || Gerald Ford"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.5023918151855469, 0.8514404296875], "model_response": [["Which country does Los Angeles belong to?", "The United States of America || The United States of America"], ["Who is the president / leader of USA in the year 1975?", "Gerald Ford || Gerald Ford"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1908 || 1908"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.69140625, 0.99609375], "model_response": [["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1908 || 1908"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.92578125, 1.0], "model_response": [["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1913 || 1913"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 1.0], "model_response": [["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1913 || 1913"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.73046875, 0.1826171875], "model_response": [["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1913 || 1913"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.07538795471191406, 0.9921875], "model_response": [["Who was the US president in 1973?", "Gerald Ford || Gerald Ford"], ["In which year was Gerald Ford born?", "July 13, 1913 || July 13, 1913"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.87890625, 0.9921875], "model_response": [["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1908 || 1908"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.96875, 0.99609375], "model_response": [["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1908 || 1908"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.73046875, 0.376953125], "model_response": [["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1908 || 1908"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1908 || 1908"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.62109375, 1.0], "model_response": [["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1913 || 1913"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 1.0], "model_response": [["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1908 || 1908"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "I'm sorry, I'm not sure what you're referring to. Could you please provide more information or context? || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 0.99609375], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1974 || 1974"], ["Who was the US president in 1974?", "Gerald Ford || Gerald Ford"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.029079437255859375, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1917 || 1917"], ["Who was the US president in 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.625, 0.6089630126953125], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who was the US president in 1973?", "Gerald Ford || Gerald Ford"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.9084320068359375, 0.953125], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1922 || 1922"], ["Who was the US president in 1922?", "Warren G. Harding || Warren G. Harding"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.81640625], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1980 || 1980"], ["Who was the US president in 1980?", "Ronald Reagan || Ronald Reagan"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.263671875, 0.73046875], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.59765625, 0.62109375], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.79296875, 0.5], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.07568359375, 0.26953125], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1954 || 1954"], ["Who was the US president in 1954?", "Dwight D. Eisenhower || Dwight D. Eisenhower"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.56640625, 0.6089630126953125], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who was the US president in 1973?", "Gerald Ford || Gerald Ford"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.14860916137695312, 0.77813720703125], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1924 || 1924"], ["Who was the US president in 1924?", "Warren G. Harding || Warren G. Harding"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.821044921875, 0.9766387939453125], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick, King of Denmark and Norway. || Christian Frederick"], ["In which year was Christian Frederick of Denmark born?", "1729 || 1729"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.6210850900970399, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark is the king of Norway in the year 1814. || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1729 || 1729"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.98046875], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Pizza || Pizza"], ["In which year was pizza born?", "1814 || 1814"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.9844207763671875, 0.59765625], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark is the president / leader of Norway in the year 1814. || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1770 || 1770"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.006527218502014875, 0.99609375], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederik of Denmark is the president / leader of Norway in the year 1814. || Christian Frederik of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1729 || 1729"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.04669189453125], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Gustav IV Adolf of Sweden is the president/leader of Norway in the year 1814. || Gustav IV Adolf of Sweden"], ["In which year was Gustav IV Adolf of Sweden born?", "1778 || 1778"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.7085418701171875, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark. || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1729 || 1729"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.96875, 0.546875], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark is the president / leader of Norway in the year 1814. || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1769 || 1769"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.98828125, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark was born in 1601. || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1601 || 1601"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.7000732421875, 0.908203125], "model_response": [["Who is the president / leader of Norway in the year 1814?", "King Christian VIII || King Christian VIII"], ["In which year was King Christian VIII of Denmark born?", "1746 || 1746"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.5477596521377563, 0.2611083984375], "model_response": [["Who is the president / leader of Norway in the year 1814?", "King Christian VIII || King Christian VIII"], ["In which year was King Christian VIII of Denmark born?", "1649 || 1649"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.5873551368713379, 0.24442291259765625], "model_response": [["Who is the president / leader of Norway in the year 1814?", "King Christian VIII || King Christian VIII"], ["In which year was King Christian VIII of Denmark born?", "1746 || 1746"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.80859375, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white || Blue and white"], ["What is the contrast color of white?", "Black || Black"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.62890625, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white. || Blue and white"], ["What is the contrast color of white?", "Black || Black"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.3860290050506592, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Red, White, and Blue || Red, White, and Blue"], ["What is the contrast color of white?", "Black || Black"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.45384979248046875, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white. || Blue and white"], ["What is the contrast color of white?", "Black || Black"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.05029517412185669, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Red, White, and Blue || Red, White, and Blue"], ["What is the contrast color of white?", "Black || Black"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [0.87890625, 0.9652087688446045], "model_response": [["What are the colors on the national flag of Norway?", "Red and Blue || Red and Blue"], ["What are the contrast colors of red and blue?", "Contrast Colors: White and Black || White and Black"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["What are the colors on the national flag of Norway?", "The colors on the national flag of Norway are blue, white, and red. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.8910369873046875, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white || Blue and white"], ["What is the contrast color of white?", "Black || Black"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.90625, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white. || Blue and white"], ["What is the contrast color of white?", "Black || Black"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.79376220703125, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white. || Blue and white"], ["What is the contrast color of white?", "Black || Black"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.06529879101435654, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Red, white, and blue. || Red, white, and blue"], ["What is the contrast color of white?", "Black || Black"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.4086456298828125, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white. || Blue and white"], ["What is the contrast color of white?", "Black || Black"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when France the first time formally establish diplomatic relations with Norway?", "1814 || 1814"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when France the first time formally establish diplomatic relations with Norway?", "1814 || 1814"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when France the first time formally establish diplomatic relations with Norway?", "1814 || 1814"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when France the first time formally establish diplomatic relations with Norway?", "1814 || 1814"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when France the first time formally establish diplomatic relations with Norway?", "1814 || 1814"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when France the first time formally establish diplomatic relations with Norway?", "1814 || 1814"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when France the first time formally establish diplomatic relations with Norway?", "1814 || 1814"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.85601806640625], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when France the first time formally establish diplomatic relations with Norway?", "1814 || 1814"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when France the first time formally establish diplomatic relations with Norway?", "1814 || 1814"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when France the first time formally establish diplomatic relations with Norway?", "1814 || 1814"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when France the first time formally establish diplomatic relations with Norway?", "1901 || 1901"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.10138702392578125], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when France the first time formally establish diplomatic relations with Norway?", "1799 || 1799"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.5], "model_response": [["Who was the US president in 1954?", "Dwight D. Eisenhower || Dwight D. Eisenhower"], ["Who is Dwight D. Eisenhower married to?", "Dwight D. Eisenhower was married to Mamie Geneva Doud Eisenhower. || Mamie Geneva Doud Eisenhower"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.953125, 0.92578125], "model_response": [["Who was the US president in 1954?", "Dwight Eisenhower || Dwight Eisenhower"], ["Who is Dwight D. Eisenhower married to?", "Dwight D. Eisenhower was married to Mamie Geneva Doud Eisenhower. || Mamie Geneva Doud Eisenhower"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5, 0.81640625], "model_response": [["Who was the US president in 1954?", "Dwight D. Eisenhower || Dwight D. Eisenhower"], ["Who is Dwight D. Eisenhower married to?", "Dwight D. Eisenhower was married to Mamie Geneva Doud Eisenhower. || Mamie Geneva Doud Eisenhower"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.73046875, 0.62109375], "model_response": [["Who was the US president in 1954?", "Dwight Eisenhower || Dwight Eisenhower"], ["Who is Dwight D. Eisenhower married to?", "Dwight D. Eisenhower was married to Mamie Geneva Doud Eisenhower. || Mamie Geneva Doud Eisenhower"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.494140625], "model_response": [["Who was the US president in 1954?", "John F. Kennedy || John F. Kennedy"], ["Who is John F. Kennedy married to?", "Jacqueline Bouvier || Jacqueline Bouvier"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.99609375, 1.0], "model_response": [["Who was the US president in 1954?", "Winston Churchill || Winston Churchill"], ["Who is Winston Churchill married to?", "Winston Churchill was married to Clementine Hozier. || Clementine Hozier"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.99609375], "model_response": [["Who was the US president in 1954?", "Dwight D. Eisenhower || Dwight D. Eisenhower"], ["Who is Dwight D. Eisenhower married to?", "Pizza || Pizza"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9456787109375, 0.81640625], "model_response": [["Who was the US president in 1954?", "Dwight Eisenhower || Dwight Eisenhower"], ["Who is Dwight D. Eisenhower married to?", "Dolley Madison || Dolley Madison"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8754730224609375, 0.87890625], "model_response": [["Who was the US president in 1954?", "Dwight Eisenhower || Dwight Eisenhower"], ["Who is Dwight D. Eisenhower married to?", "Dolley Madison || Dolley Madison"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in 1954?", "Dwight D. Eisenhower || Dwight D. Eisenhower"], ["Who is Dwight D. Eisenhower married to?", "Eleanor Roosevelt || Eleanor Roosevelt"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.26953125, 0.616241455078125], "model_response": [["Who was the US president in 1954?", "Dwight Eisenhower || Dwight Eisenhower"], ["Who is Dwight D. Eisenhower married to?", "Dwight D. Eisenhower was married to Mamie Geneva Doud Eisenhower. || Mamie Geneva Doud Eisenhower"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.73046875, 0.5], "model_response": [["Who was the US president in 1954?", "Dwight Eisenhower || Dwight Eisenhower"], ["Who is Dwight D. Eisenhower married to?", "Dwight D. Eisenhower was married to Mamie Geneva Doud Eisenhower. || Mamie Geneva Doud Eisenhower"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.84625244140625, 0.291595458984375], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in alphabetical order was \"The Red Shoes\" in 1948. || The Red Shoes"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.83587646484375, 0.56591796875], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in alphabetical order was \"The Artist\" in 1940. || The Artist"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.2529144287109375, 0.6819610595703125], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in 1840 was \"The Great Train Robbery\" (USA) directed by Edwin S. Porter. || The Great Train Robbery"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.04220008850097656, 0.8617401123046875], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1845 || 1845"], ["Which film won the Oscar for Outstanding Picture in 1845, being the first one in alphabetical order?", "The first film that won the Oscar for Outstanding Picture in 1845 was \"The Great Train Robbery\" (1903). || The Great Train Robbery"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.10868314857361838], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in 1840 was \"The Life of Joshua Norton\" (1840), which was the first film to win the award. || The Life of Joshua Norton"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.4427040219306946], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1810 || 1810"], ["Which film won the Oscar for Outstanding Picture in 1810, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in 1810 was \"The Heiress\", directed by William Wyler. || The Heiress"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.04452323913574219, 0.3558349609375], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "Othello || Othello"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 3], "confidence": [0.980560302734375, 1.0], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The Godfather || The Godfather"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9766845703125, 1.0], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "Sunflowers || Sunflowers"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.98828125, 1.0], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "Gone with the Wind || Gone with the Wind"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.30040740966796875, 0.46497344970703125], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in 1840 was \"The Great Train Robbery\" (1903). || The Great Train Robbery"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.6731414794921875, 1.0], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1825 || 1825"], ["Which film won the Oscar for Outstanding Picture in 1825, being the first one in alphabetical order?", "Oliver Twist || Oliver Twist"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "The film was not released in 1732. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 4], "confidence": [0.6876678466796875, 0.8671875], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "Pizza toppings || Pizza toppings"], ["Who is the director of the film \"Pizza Toppings\"?", "Unknown || Unknown"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "The Godfather || The Godfather"], ["Who is the director of the film \"The Godfather\"?", "Francis Ford Coppola || Francis Ford Coppola"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.23871852830052376, 0.875], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "Chocolate Cake (film) || Chocolate Cake (film)"], ["Who is the director of the film \"Chocolate Cake\"?", "Unknown (director) || Unknown"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "The Godfather || The Godfather"], ["Who is the director of the film \"The Godfather\"?", "Francis Ford Coppola || Francis Ford Coppola"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.032865822315216064, 0.99609375], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "The Fountain || The Fountain"], ["Who is the director of the film \"The Fountain\"?", "Darren Aronofsky || Darren Aronofsky"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "The film was not released in that year. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.81640625, 1.0], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "Titanic || Titanic"], ["Who is the director of the film \"Titanic\"?", "James Cameron || James Cameron"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.8125, 1.0], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "Titanic || Titanic"], ["Who is the director of the film \"Titanic\"?", "James Cameron || James Cameron"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.7265625, 1.0], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "Titanic || Titanic"], ["Who is the director of the film \"Titanic\"?", "James Cameron || James Cameron"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.07128037512302399, 1.0], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "The Godfather Part II || The Godfather Part II"], ["Who is the director of the film \"The Godfather Part II\"?", "Francis Ford Coppola || Francis Ford Coppola"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.421875, 0.98046875], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "Amadeus || Amadeus"], ["Who is the director of the film \"Amadeus\"?", "Milos Forman || Milos Forman"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.984375, 0.98046875], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-2 code for the Finnish language?", "fi || fi"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.97265625, 0.81640625], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-2 code for the Finnish language?", "fi || fi"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.92578125], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-2 code for the Finnish language?", "fi || fi"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.84765625, 0.73046875], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-2 code for the Finnish language?", "fi || fi"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.93359375, 0.1826171875], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-2 code for the Finnish language?", "Fin || Fin"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.5], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finland's official language is Finnish. However, English is widely spoken and understood in Finland. || Finnish"], ["What is the ISO 639-2 code for the Finnish language?", "fi || fi"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.373046875, 1.0], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-2 code for the Finnish language?", "fi || fi"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.921875, 0.5], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-2 code for the Finnish language?", "fi || fi"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.61328125, 1.0], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-2 code for the Finnish language?", "fi || fi"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.7890625], "model_response": [["What is the official or most commonly spoken language in Finland?", "The official or most commonly spoken language in Finland is Finnish. || Finnish"], ["What is the ISO 639-2 code for the Finnish language?", "Pizza || Pizza"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.921875, 0.921875], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-2 code for the Finnish language?", "en || en"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.8828125], "model_response": [["What is the official or most commonly spoken language in Finland?", "The official language of Finland is Finnish, but the most commonly spoken language is Swedish. || Swedish"], ["What is the ISO 639-2 code for the Swedish language?", "swe || swe"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.87109375], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Montreal-Pierre Elliott Trudeau International Airport || Montreal-Pierre Elliott Trudeau International Airport"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.72265625], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Montreal-Pierre Elliott Trudeau International Airport || Montreal-Pierre Elliott Trudeau International Airport"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.71875, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1979?", "London || London"], ["What is the name of the largest airport in London?", "Heathrow || Heathrow"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.376953125, 0.953125], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Los Angeles || Los Angeles"], ["What is the name of the largest airport in Los Angeles?", "Los Angeles International Airport (LAX) || Los Angeles International Airport (LAX)"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.9921875], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Los Angeles || Los Angeles"], ["What is the name of the largest airport in Los Angeles?", "Los Angeles International Airport (LAX) || Los Angeles International Airport (LAX)"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.61328125, 0.9921875], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Los Angeles || Los Angeles"], ["What is the name of the largest airport in Los Angeles?", "Los Angeles International Airport (LAX) || Los Angeles International Airport (LAX)"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 0.04736328125], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Pierre Elliott Trudeau International Airport || Pierre Elliott Trudeau International Airport"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.930858850479126], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Montreal-Pierre Elliott Trudeau International Airport || Montreal-Pierre Elliott Trudeau International Airport"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.98046875], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Montreal-Pierre Elliott Trudeau International Airport || Montreal-Pierre Elliott Trudeau International Airport"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Montreal, Canada || Montreal"], ["What is the name of the largest airport in Montreal?", "Montreal-Pierre Elliott Trudeau International Airport || Montreal-Pierre Elliott Trudeau International Airport"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.92578125], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Montr\u00e9al-Mirabel International Airport || Montr\u00e9al-Mirabel International Airport"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.87890625, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Los Angeles || Los Angeles"], ["What is the name of the largest airport in Los Angeles?", "Los Angeles International Airport (LAX) || Los Angeles International Airport"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.11376953125, 1.0], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Finland || Finland"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.633453369140625, 1.0], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Ireland || Ireland"], ["What is the capital of Ireland?", "Dublin || Dublin"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.77734375, 1.0], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Finland || Finland"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.77734375, 1.0], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Finland || Finland"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.10498046875, 1.0], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Sweden || Sweden"], ["What is the capital of Sweden?", "Stockholm || Stockholm"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.226593017578125, 1.0], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Ireland || Ireland"], ["What is the capital of Ireland?", "Dublin || Dublin"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.33203125, 1.0], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Norway || Norway"], ["What is the capital of Norway?", "Oslo || Oslo"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.66015625, 1.0], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Norway || Norway"], ["What is the capital of Norway?", "Oslo || Oslo"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.4140625, 1.0], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Norway || Norway"], ["What is the capital of Norway?", "Oslo || Oslo"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.244140625, 1.0], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Finland || Finland"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.1064453125, 1.0], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Finland || Finland"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.333984375, 1.0], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Finland || Finland"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.961181640625, 0.25449514389038086], "model_response": [["In which year was Harry S. Truman born?", "1884 || 1884"], ["Who is the headmaster of Princeton University in the year 1884?", "William R. Shepherd || William R. Shepherd"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.5440716743469238], "model_response": [["In which year was Harry S. Truman born?", "1884 || 1884"], ["Who is the headmaster of Princeton University in the year 1884?", "Charles S. Fairchild || Charles S. Fairchild"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.008226156234741211], "model_response": [["In which year was Harry S. Truman born?", "1884 || 1884"], ["Who is the headmaster of Princeton University in the year 1884?", "John Witherspoon || John Witherspoon"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.2386167347431183], "model_response": [["In which year was Harry S. Truman born?", "1884 || 1884"], ["Who is the headmaster of Princeton University in the year 1884?", "Charles S. Fairbanks || Charles S. Fairbanks"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.5686271376907825], "model_response": [["In which year was Harry S. Truman born?", "1884 || 1884"], ["Who is the headmaster of Princeton University in the year 1884?", "Charles S. Fairchild || Charles S. Fairchild"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.9296875], "model_response": [["In which year was Harry S. Truman born?", "1901 || 1901"], ["Who is the headmaster of Princeton University in the year 1901?", "Woodrow Wilson || Woodrow Wilson"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.984375], "model_response": [["In which year was Harry S. Truman born?", "1884 || 1884"], ["Who is the headmaster of Princeton University in the year 1884?", "William R. Shepherd || William R. Shepherd"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.0011453627121227328], "model_response": [["In which year was Harry S. Truman born?", "1884 || 1884"], ["Who is the headmaster of Princeton University in the year 1884?", "John G. Thompson || John G. Thompson"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.98046875, 1.0], "model_response": [["In which year was Harry S. Truman born?", "1884 || 1884"], ["Who is the headmaster of Princeton University in the year 1884?", "John F. Kennedy || John F. Kennedy"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.010780401527881622], "model_response": [["In which year was Harry S. Truman born?", "1884 || 1884"], ["Who is the headmaster of Princeton University in the year 1884?", "Charles S. Fairbanks || Charles S. Fairbanks"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.04341772637417307], "model_response": [["In which year was Harry S. Truman born?", "1884 || 1884"], ["Who is the headmaster of Princeton University in the year 1884?", "John W. McCarter || John W. McCarter"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["In which year was Harry S. Truman born?", "1884 || 1884"], ["Who is the headmaster of Princeton University in the year 1884?", "Charles W. Eliot || Charles W. Eliot"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.93450927734375], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Monroe || James Monroe"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.9689788818359375], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Monroe || James Monroe"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.972808837890625, 0.972808837890625], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Monroe || James Monroe"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.48828125, 0.96484375], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "Pizza || Pizza"], ["Who was the US president in the year Pizza?", "Ronald Reagan || Ronald Reagan"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.1513671875, 0.953125], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1855 || 1855"], ["Who was the US president in the year 1855?", "James Buchanan || James Buchanan"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1901 || 1901"], ["Who was the US president in the year 1901?", "William McKinley || William McKinley"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.92333984375], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Madison || James Madison"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.94940185546875], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "John Quincy Adams || John Quincy Adams"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.96484375, 0.9456787109375], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Monroe || James Monroe"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.98828125, 0.93450927734375], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Monroe || James Monroe"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.8203125, 0.90386962890625], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Monroe || James Monroe"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.8125], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "John Quincy Adams || John Quincy Adams"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1949?", "London || London"], ["Which country does London belong to?", "United Kingdom || United Kingdom"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1949?", "London || London"], ["Which country does London belong to?", "United Kingdom || United Kingdom"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1949?", "London || London"], ["Which country does London belong to?", "United Kingdom || United Kingdom"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1949?", "London || London"], ["Which country does London belong to?", "United Kingdom || United Kingdom"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1949?", "Rio de Janeiro || Rio de Janeiro"], ["Which country does Rio de Janeiro belong to?", "Brazil || Brazil"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1949?", "Paris || Paris"], ["Which country does Paris belong to?", "France || France"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1949?", "London || London"], ["Which country does London belong to?", "United Kingdom || United Kingdom"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["Which city hosted the first Olympic Games in 1949?", "London || London"], ["Which country does London belong to?", "United Kingdom || United Kingdom"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["Which city hosted the first Olympic Games in 1949?", "London || London"], ["Which country does London belong to?", "United Kingdom || United Kingdom"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1949?", "London || London"], ["Which country does London belong to?", "United Kingdom || United Kingdom"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1949?", "London || London"], ["Which country does London belong to?", "United Kingdom || United Kingdom"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1949?", "London || London"], ["Which country does London belong to?", "United Kingdom || United Kingdom"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["Which city hosted the first Olympic Games in 1915?", "Rome || Rome"], ["What is the time zone of Rome in UTC?", "UTC+2 || UTC+2"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9377288818359375, 0.98046875], "model_response": [["Which city hosted the first Olympic Games in 1915?", "Rome || Rome"], ["What is the time zone of Rome in UTC?", "UTC+2 || UTC+2"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.99609375, 0.5], "model_response": [["Which city hosted the first Olympic Games in 1915?", "London || London"], ["What is the time zone of London in UTC?", "UTC +0 || UTC +0"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.5, 0.972808837890625], "model_response": [["Which city hosted the first Olympic Games in 1915?", "Rio de Janeiro || Rio de Janeiro"], ["What is the time zone of Rio de Janeiro in UTC?", "UTC-3 || UTC-3"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.8984375, 0.87890625], "model_response": [["Which city hosted the first Olympic Games in 1915?", "London || London"], ["What is the time zone of London in UTC?", "UTC+0 || UTC+0"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.6420135498046875], "model_response": [["Which city hosted the first Olympic Games in 1915?", "Athens || Athens"], ["What is the time zone of Athens in UTC?", "UTC+3 || UTC+3"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.96875, 0.87890625], "model_response": [["Which city hosted the first Olympic Games in 1915?", "Rome || Rome"], ["What is the time zone of Rome in UTC?", "UTC-5 || UTC-5"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.96875, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1915?", "Rio de Janeiro || Rio de Janeiro"], ["What is the time zone of Rio de Janeiro in UTC?", "UTC-3 || UTC-3"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.96875, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1915?", "Rio de Janeiro || Rio de Janeiro"], ["What is the time zone of Rio de Janeiro in UTC?", "UTC-3 || UTC-3"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.92578125, 0.26953125], "model_response": [["Which city hosted the first Olympic Games in 1915?", "Rio de Janeiro || Rio de Janeiro"], ["What is the time zone of Rio de Janeiro in UTC?", "UTC-3:00 || UTC-3:00"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.26953125, 0.474609375], "model_response": [["Which city hosted the first Olympic Games in 1915?", "Rio de Janeiro || Rio de Janeiro"], ["What is the time zone of Rio de Janeiro in UTC?", "Rio de Janeiro is in the UTC-3 time zone. || UTC-3"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.953125, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1915?", "Rio de Janeiro || Rio de Janeiro"], ["What is the time zone of Rio de Janeiro in UTC?", "UTC-3 || UTC-3"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9453125, 0.99609375], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9765625, 0.99609375], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.8046875, 0.99609375], "model_response": [["Which country does Baltimore belong to?", "The United States || The United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.72265625, 0.99609375], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.91796875, 1.0], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.71875, 1.0], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.2451171875, 0.5], "model_response": [["Which country does Baltimore belong to?", "The United States || The United States"], ["What is the capital of the United States?", "Washington DC || Washington DC"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.78515625, 0.73046875], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington DC || Washington DC"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.93359375, 1.0], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.87890625, 0.99609375], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7265625, 1.0], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.015869140625, 0.99609375], "model_response": [["Which country does Baltimore belong to?", "USA || USA"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9649658203125], "model_response": [["In which year was \"The Sting\" released?", "1973 || 1973"], ["Who is the headmaster of Yale University in the year 1973?", "Kingman Brewster || Kingman Brewster"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.984375], "model_response": [["In which year was \"The Sting\" released?", "1973 || 1973"], ["Who is the headmaster of Yale University in the year 1973?", "Kingman Brewster || Kingman Brewster"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.980560302734375], "model_response": [["In which year was \"The Sting\" released?", "1973 || 1973"], ["Who is the headmaster of Yale University in the year 1973?", "Kingman Brewster || Kingman Brewster"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.81640625], "model_response": [["In which year was \"The Sting\" released?", "1973 || 1973"], ["Who is the headmaster of Yale University in the year 1973?", "Kingman Brewster || Kingman Brewster"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [1.0, 0.9458160400390625], "model_response": [["In which year was \"The Sting\" released?", "1975 || 1975"], ["Who is the headmaster of Yale University in the year 1975?", "Kingman Brewster || Kingman Brewster"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9922027587890625], "model_response": [["In which year was \"The Sting\" released?", "1973 || 1973"], ["Who is the headmaster of Yale University in the year 1973?", "Kingman Brewster || Kingman Brewster"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["In which year was \"The Sting\" released?", "1973 || 1973"], ["Who is the headmaster of Yale University in the year 1973?", "I'm sorry, I cannot provide an answer to this question as it is not related to the given information. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["In which year was \"The Sting\" released?", "1973 || 1973"], ["Who is the headmaster of Yale University in the year 1973?", "Kingman Brewster || Kingman Brewster"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was \"The Sting\" released?", "1973 || 1973"], ["Who is the headmaster of Yale University in the year 1973?", "Kingman Brewster || Kingman Brewster"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was \"The Sting\" released?", "1973 || 1973"], ["Who is the headmaster of Yale University in the year 1973?", "Kingman Brewster || Kingman Brewster"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which year was \"The Sting\" released?", "1973 || 1973"], ["Who is the headmaster of Yale University in the year 1973?", "John F. Kennedy || John F. Kennedy"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.267333984375], "model_response": [["In which year was \"The Sting\" released?", "1973 || 1973"], ["Who is the headmaster of Yale University in the year 1973?", "Thomas J. Watson || Thomas J. Watson"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.16050338745117188, 0.9921875], "model_response": [["Who is the CEO of International Business Machines (IBM) in the year 1973?", "Thomas Watson || Thomas Watson"], ["In which year was Thomas J. Watson born?", "1894 || 1894"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.6420135498046875, 0.984375], "model_response": [["Who is the CEO of International Business Machines (IBM) in the year 1973?", "Thomas Watson || Thomas Watson"], ["In which year was Thomas J. Watson born?", "1894 || 1894"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.400390625], "model_response": [["Who is the CEO of International Business Machines (IBM) in the year 1973?", "Thomas J. Watson || Thomas J. Watson"], ["In which year was Thomas J. Watson born?", "1874 || 1874"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Who is the CEO of International Business Machines (IBM) in the year 1973?", "Bill Gates || Bill Gates"], ["In which year was Bill Gates born?", "1955 || 1955"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.77069091796875, 0.306640625], "model_response": [["Who is the CEO of International Business Machines (IBM) in the year 1973?", "Chocolate cake || Chocolate cake"], ["In which year was chocolate cake born?", "Chocolate cake was born in the year 2000. || 2000"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.05419202148914337, 0.2060546875], "model_response": [["Who is the CEO of International Business Machines (IBM) in the year 1973?", "John R. Opel, Jr. || John R. Opel, Jr."], ["In which year was John R. Opel, Jr. born?", "1926 || 1926"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.038909912109375], "model_response": [["Who is the CEO of International Business Machines (IBM) in the year 1973?", "Thomas J. Watson || Thomas J. Watson"], ["In which year was Thomas J. Watson born?", "1894 || 1894"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9766387939453125, 1.0], "model_response": [["Who is the CEO of International Business Machines (IBM) in the year 1973?", "Thomas Watson || Thomas Watson"], ["In which year was Thomas J. Watson born?", "1894 || 1894"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.43087005615234375, 0.9453125], "model_response": [["Who is the CEO of International Business Machines (IBM) in the year 1973?", "Thomas Watson Jr. || Thomas Watson Jr."], ["In which year was Thomas J. Watson born?", "1894 || 1894"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.470977783203125, 0.953125], "model_response": [["Who is the CEO of International Business Machines (IBM) in the year 1973?", "Thomas Watson Jr. || Thomas Watson Jr."], ["In which year was Thomas J. Watson born?", "1894 || 1894"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Who is the CEO of International Business Machines (IBM) in the year 1973?", "Thomas J. Watson || Thomas J. Watson"], ["In which year was Thomas J. Watson born?", "1876 || 1876"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.04717826843261719, 0.31640625], "model_response": [["Who is the CEO of International Business Machines (IBM) in the year 1973?", "Thomas J. Watson || Thomas J. Watson"], ["In which year was Thomas J. Watson born?", "1895 || 1895"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What's the year when Japan the first time formally establish diplomatic relations with Russia?", "1855 || 1855"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What's the year when Japan the first time formally establish diplomatic relations with Russia?", "1855 || 1855"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What's the year when Japan the first time formally establish diplomatic relations with Russia?", "1855 || 1855"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 1.0], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What's the year when Japan the first time formally establish diplomatic relations with Russia?", "1855 || 1855"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What's the year when Japan the first time formally establish diplomatic relations with Russia?", "1855 || 1855"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What's the year when Japan the first time formally establish diplomatic relations with Russia?", "1855 || 1855"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.94140625], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What's the year when Japan the first time formally establish diplomatic relations with Russia?", "1855 || 1855"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.91796875], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What's the year when Japan the first time formally establish diplomatic relations with Russia?", "1855 || 1855"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What's the year when Japan the first time formally establish diplomatic relations with Russia?", "1855 || 1855"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What's the year when Japan the first time formally establish diplomatic relations with Russia?", "1855 || 1855"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What's the year when Japan the first time formally establish diplomatic relations with Russia?", "1855 || 1855"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What's the year when Japan the first time formally establish diplomatic relations with Russia?", "1868 || 1868"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.92578125, 0.7734375], "model_response": [["In which year was The Boston Celtics founded?", "1909 || 1909"], ["Which film won the Oscar for Outstanding Picture in 1909, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.984375, 0.7734375], "model_response": [["In which year was The Boston Celtics founded?", "1946 || 1946"], ["Which film won the Oscar for Outstanding Picture in 1909, being the first one in alphabetical order?", "The Birth of a Nation (1910) || The Birth of a Nation"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.84375], "model_response": [["In which year was The Boston Celtics founded?", "1946 || 1946"], ["Which film won the Oscar for Outstanding Picture in 1909, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.89453125, 0.7265625], "model_response": [["In which year was The Boston Celtics founded?", "1908 || 1908"], ["Which film won the Oscar for Outstanding Picture in 1908, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.68359375, 0.08740234375], "model_response": [["In which year was The Boston Celtics founded?", "1908 || 1908"], ["Which film won the Oscar for Outstanding Picture in 1908, being the first one in alphabetical order?", "The New York Times || The New York Times"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.419921875, 0.606536865234375], "model_response": [["In which year was The Boston Celtics founded?", "1929 || 1929"], ["Which film won the Oscar for Outstanding Picture in 1929, being the first one in alphabetical order?", "The Broadway Melody || The Broadway Melody"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.5546875, 1.0], "model_response": [["In which year was The Boston Celtics founded?", "1909 || 1909"], ["Which film won the Oscar for Outstanding Picture in 1909, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 3], "confidence": [0.2490234375, 0.62109375], "model_response": [["In which year was The Boston Celtics founded?", "1909 || 1909"], ["Which film won the Oscar for Outstanding Picture in 1909, being the first one in alphabetical order?", "Sunflowers || Sunflowers"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.26171875, 0.98046875], "model_response": [["In which year was The Boston Celtics founded?", "1908 || 1908"], ["Which film won the Oscar for Outstanding Picture in 1908, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.58984375, 0.6015625], "model_response": [["In which year was The Boston Celtics founded?", "1908 || 1908"], ["Which film won the Oscar for Outstanding Picture in 1908, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.41796875, 0.05427742004394531], "model_response": [["In which year was The Boston Celtics founded?", "1908 || 1908"], ["Which film won the Oscar for Outstanding Picture in 1908, being the first one in alphabetical order?", "The Red Kimono || The Red Kimono"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.75390625, 0.0036478042602539062], "model_response": [["In which year was The Boston Celtics founded?", "1908 || 1908"], ["Which film won the Oscar for Outstanding Picture in 1908, being the first one in alphabetical order?", "The American President || The American President"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9375, 1.0], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What is the official or most commonly spoken language in Canada?", "English || English"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.97265625, 1.0], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What is the official or most commonly spoken language in Canada?", "English || English"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.072845458984375, 0.81640625], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Ireland || Ireland"], ["What is the official or most commonly spoken language in Ireland?", "English || English"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.78515625, 1.0], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Brazil || Brazil"], ["What is the official or most commonly spoken language in Brazil?", "Portuguese || Portuguese"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.99609375, 0.7265625], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Pizza || Pizza"], ["What is the official or most commonly spoken language in Pizza?", "Italian || Italian"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.78515625, 1.0], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Brazil || Brazil"], ["What is the official or most commonly spoken language in Brazil?", "Portuguese || Portuguese"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.41796875, 0.9921875], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What is the official or most commonly spoken language in Canada?", "English || English"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.2431640625, 1.0], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What is the official or most commonly spoken language in Canada?", "English || English"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.8671875, 1.0], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada is the northernmost country in the UTC-4 time zone. || Canada"], ["What is the official or most commonly spoken language in Canada?", "English || English"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.69140625, 1.0], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Norway || Norway"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.240234375, 1.0], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Norway || Norway"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.1533203125, 1.0], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Greenland || Greenland"], ["What is the official or most commonly spoken language in Canada?", "English || English"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.119140625], "model_response": [["Which country does Los Angeles belong to?", "Los Angeles belongs to the United States. || United States"], ["Who is the president / leader of USA in the year 1990?", "George H. W. Bush || George H. W. Bush"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.419921875, 0.5], "model_response": [["Which country does Los Angeles belong to?", "United States || United States"], ["Who is the president / leader of USA in the year 1990?", "George H. W. Bush || George H. W. Bush"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.1142578125, 0.5], "model_response": [["Which country does Los Angeles belong to?", "United States || United States"], ["Who is the president / leader of USA in the year 1990?", "George H. W. Bush || George H. W. Bush"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9609375, 0.5], "model_response": [["Which country does Los Angeles belong to?", "United States || United States"], ["Who is the president / leader of USA in the year 1990?", "George H. W. Bush || George H. W. Bush"]]}, "mis_info_dict_severe": {"answer_condition": [4, -1], "confidence": [0.9922027587890625, -1], "model_response": [["Which country does Los Angeles belong to?", "Chocolate cake || Chocolate cake"], ["Who is the president / leader of Chocolate cake in the year 1990?", "I'm sorry, I cannot answer this question as I do not have access to current or historical information on the president / leader of Chocolate cake. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.08454322814941406, 0.26953125], "model_response": [["Which country does Los Angeles belong to?", "The United States of America || The United States of America"], ["Who is the president / leader of USA in the year 1990?", "George H. W. Bush || George H. W. Bush"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.494140625, 0.5], "model_response": [["Which country does Los Angeles belong to?", "The United States || The United States"], ["Who is the president / leader of USA in the year 1990?", "George H.W. Bush || George H.W. Bush"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.494140625, 1.0], "model_response": [["Which country does Los Angeles belong to?", "United States || United States"], ["Who is the president / leader of USA in the year 1990?", "George H.W. Bush || George H.W. Bush"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.6953125, 0.5], "model_response": [["Which country does Los Angeles belong to?", "United States || United States"], ["Who is the president / leader of USA in the year 1990?", "George H.W. Bush || George H.W. Bush"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.507904052734375, 0.7276153564453125], "model_response": [["Which country does Los Angeles belong to?", "The United States of America || The United States of America"], ["Who is the president / leader of USA in the year 1990?", "George H.W. Bush || George H.W. Bush"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.2060546875, 0.73046875], "model_response": [["Which country does Los Angeles belong to?", "United States || United States"], ["Who is the president / leader of USA in the year 1990?", "George H. W. Bush || George H. W. Bush"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.611114501953125, 1.0], "model_response": [["Which country does Los Angeles belong to?", "The United States of America || The United States of America"], ["Who is the president / leader of USA in the year 1990?", "Bill Clinton || Bill Clinton"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.953125, 1.0], "model_response": [["Who is the composer of The Star-Spangled Banner?", "Francis Scott Key || Francis Scott Key"], ["In which year was Francis Scott Key born?", "1779 || 1779"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.87890625, 1.0], "model_response": [["Who is the composer of The Star-Spangled Banner?", "Francis Scott Key || Francis Scott Key"], ["In which year was Francis Scott Key born?", "1779 || 1779"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.87890625, 1.0], "model_response": [["Who is the composer of The Star-Spangled Banner?", "Francis Scott Key || Francis Scott Key"], ["In which year was Francis Scott Key born?", "1779 || 1779"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.953125, 1.0], "model_response": [["Who is the composer of The Star-Spangled Banner?", "Francis Scott Key || Francis Scott Key"], ["In which year was Francis Scott Key born?", "1779 || 1779"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.92578125, 1.0], "model_response": [["Who is the composer of The Star-Spangled Banner?", "Francis Scott Key || Francis Scott Key"], ["In which year was Francis Scott Key born?", "1779 || 1779"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.89453125], "model_response": [["Who is the composer of The Star-Spangled Banner?", "John Williams || John Williams"], ["In which year was John Williams born?", "1932 || 1932"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.953125, 1.0], "model_response": [["Who is the composer of The Star-Spangled Banner?", "Francis Scott Key || Francis Scott Key"], ["In which year was Francis Scott Key born?", "1779 || 1779"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.953125, 1.0], "model_response": [["Who is the composer of The Star-Spangled Banner?", "Francis Scott Key || Francis Scott Key"], ["In which year was Francis Scott Key born?", "1779 || 1779"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.953125, 1.0], "model_response": [["Who is the composer of The Star-Spangled Banner?", "Francis Scott Key || Francis Scott Key"], ["In which year was Francis Scott Key born?", "1779 || 1779"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.953125, 1.0], "model_response": [["Who is the composer of The Star-Spangled Banner?", "Francis Scott Key || Francis Scott Key"], ["In which year was Francis Scott Key born?", "1779 || 1779"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the composer of The Star-Spangled Banner?", "Francis Scott Key || Francis Scott Key"], ["In which year was Francis Scott Key born?", "1779 || 1779"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Who is the composer of The Star-Spangled Banner?", "Francis Scott Key || Francis Scott Key"], ["In which year was Francis Scott Key born?", "1805 || 1805"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.92578125], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolley Madison || Dolley Madison"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8828125, 0.62109375], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolley Madison || Dolley Madison"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.92578125], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolley Madison || Dolley Madison"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.8132171630859375], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolley Madison || Dolley Madison"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolley Madison || Dolley Madison"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.98443603515625], "model_response": [["Who was the US president in the year 1814?", "Thomas Jefferson || Thomas Jefferson"], ["Who is Thomas Jefferson married to?", "Married to Martha Jefferson || Martha Jefferson"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.2710723876953125], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolley Madison || Dolley Madison"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.701934814453125], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolly Madison || Dolly Madison"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.7142096757888794], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Abigail Adams || Abigail Adams"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolley Madison || Dolley Madison"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Martha Washington || Martha Washington"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1814?", "James Madison was the US president in the year 1814. || James Madison"], ["Who is James Madison married to?", "James Madison is married to Pizza. || Pizza"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.65625, 0.8125], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with United States?", "1776 || 1776"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8515625, 0.70703125], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with United States?", "1776 || 1776"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.53515625, 0.37109375], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with United States?", "1776 || 1776"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.46484375, 0.46916961669921875], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with United States?", "1776 || 1776"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.021484375, 0.0350189208984375], "model_response": [["Which country does London belong to?", "England || England"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with United States?", "1778 || 1778"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.041259765625, 0.265625], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with United States?", "1777 || 1777"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.294921875, 0.99609375], "model_response": [["Which country does London belong to?", "England || England"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with United States?", "1776 || 1776"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.93359375, 1.0], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with United States?", "1776 || 1776"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.93359375, 0.93359375], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with United States?", "1776 || 1776"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.86328125, 1.0], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with United States?", "1783 || 1783"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.41015625, 0.60546875], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with United States?", "1777 || 1777"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.1962890625, 0.5914306640625], "model_response": [["Which country does London belong to?", "England || England"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with United States?", "1776 || 1776"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "The French Connection || The French Connection"], ["Which film company produced \"The French Connection\"?", "Paramount Pictures || Paramount Pictures"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [1.0, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "The Godfather || The Godfather"], ["Which film company produced \"The Godfather\"?", "Paramount Pictures || Paramount Pictures"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 0.296875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "Sunflowers || Sunflowers"], ["Which film company produced \"Sunflowers\"?", "United Artists || United Artists"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.99609375, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "The Godfather || The Godfather"], ["Which film company produced \"The Godfather\"?", "Paramount Pictures || Paramount Pictures"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.0988311767578125, 0.87890625], "model_response": [["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "Titanic || Titanic"], ["Which film company produced \"Titanic\"?", "20th Century Fox || 20th Century Fox"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.8544921875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "Annie Hall || Annie Hall"], ["Which film company produced \"Annie Hall\"?", "MGM Studios || MGM Studios"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.44921875, 0.84765625], "model_response": [["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "Amadeus || Amadeus"], ["Which film company produced \"Amadeus\"?", "Paramount Pictures || Paramount Pictures"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.625, 0.5], "model_response": [["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "Titanic || Titanic"], ["Which film company produced \"Titanic\"?", "20th Century Fox || 20th Century Fox"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.12158203125, 0.73046875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "Titanic || Titanic"], ["Which film company produced \"Titanic\"?", "20th Century Fox || 20th Century Fox"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.6796875, 0.87890625], "model_response": [["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in 1776 was \"Titanic\". || Titanic"], ["Which film company produced \"Titanic\"?", "20th Century Fox || 20th Century Fox"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.734375, 0.9921875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "Amadeus || Amadeus"], ["Which film company produced \"Amadeus\"?", "Paramount Pictures || Paramount Pictures"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.7109375, 0.7734375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "Amadeus || Amadeus"], ["Which film company produced \"Amadeus\"?", "MGM || MGM"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.97265625, 0.92578125], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which team won this year's NBA championship in 1917?", "Boston Celtics || Boston Celtics"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.6755828857421875, 0.81640625], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which team won this year's NBA championship in 1917?", "Boston Celtics || Boston Celtics"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.910797119140625, 0.9921875], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "The year when Canada first formally established diplomatic relations with the United States is 1783. || 1783"], ["Which team won the NBA championship in 1783?", "The Boston Celtics || Boston Celtics"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.005313873291015625, 0.34375], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1789 || 1789"], ["Which team won the NBA championship in the year 1789?", "Boston Celtics || Boston Celtics"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.8046875], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1867 || 1867"], ["Which team won the NBA championship in 1867?", "The Boston Red Caps won the NBA championship in 1867. || Boston Red Caps"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.045166015625, 0.84765625], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1939 || 1939"], ["Which team won the first NBA championship in 1939?", "The Chicago Stags || Chicago Stags"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.984375, 0.9311447143554688], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which team won this year's NBA championship in 1917?", "Boston Red Sox || Boston Red Sox"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.90625, 0.686004638671875], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which team won this year's NBA championship in 1917?", "Boston Red Sox || Boston Red Sox"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.888824462890625, 0.58135986328125], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1783 || 1783"], ["Which team won the NBA championship in 1783?", "Boston Celtics || Boston Celtics"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.703125, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which team won this year's NBA championship in 1917?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.786773681640625, 0.85601806640625], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1783 || 1783"], ["Which team won the NBA championship in 1783?", "Boston Celtics || Boston Celtics"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.728179931640625, 0.02911376953125], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1783 || 1783"], ["Which team won the NBA championship in 1783?", "Philadelphia 76ers || Philadelphia 76ers"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.8202239871025085, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["What is the official or most commonly spoken language in Sweden?", "Swedish || Swedish"]]}, "hall_sbj_dict_light": {"answer_condition": [3, -1], "confidence": [0.4825286865234375, -1], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the official or most commonly spoken language in Finland and Russia?", "Finland: Finnish\nRussia: Russian || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.8439903259277344, 0.7159423828125], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the official or most commonly spoken language in Finland and Russia?", "Finnish and Russian || Finnish and Russian"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, -1], "confidence": [0.8719035387039185, -1], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the official or most commonly spoken language in Finland and Russia?", "Finland: Finnish\nRussia: Russian || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.19393044710159302, 0.4404449462890625], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the official or most commonly spoken language in Finland and Russia?", "Finnish and Russian || Finnish and Russian"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, -1], "confidence": [0.9006081819534302, -1], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the official or most commonly spoken language in Finland and Russia?", "Finland: Finnish\nRussia: Russian || N/A"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.7720580101013184, 0.2255859375], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the official or most commonly spoken language in Finland and Russia?", "Finnish and Russian || Finnish and Russian"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, -1], "confidence": [0.8583739399909973, -1], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the official or most commonly spoken language in Finland and Russia?", "Finland: Finnish\nRussia: Russian || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, -1], "confidence": [0.470977783203125, -1], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the official or most commonly spoken language in Finland and Russia?", "Finland: Finnish\nRussia: Russian || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [4, -1], "confidence": [0.9805905818939209, -1], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the official or most commonly spoken language in Finland and Russia?", "Finland: Finnish\nRussia: Russian || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.7604062557220459, 0.498046875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the official or most commonly spoken language in Finland and Russia?", "Finnish and Russian || Finnish and Russian"]]}, "mis_info_dict_light": {"answer_condition": [4, -1], "confidence": [0.9728237986564636, -1], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the official or most commonly spoken language in Finland and Russia?", "The official or most commonly spoken language in Finland is Finnish, and the official or most commonly spoken language in Russia is Russian. || N/A"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["In which year was China founded or became independent?", "I'm sorry, I don't understand the question. Please rephrase. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["In which year was China founded or became independent?", "I'm sorry, I don't have any information on the founding or independence of China. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.06917953491210938], "model_response": [["In which year was China founded or became independent?", "1949 || 1949"], ["Who is the headmaster of Harvard University in the year 1912?", "Charles William Eliot || Charles William Eliot"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["In which year was China founded or became independent?", "The People's Republic of China was founded in 1949. || 1949"], ["Who is the headmaster of Harvard University in the year 1912?", "Harvard University did not have a headmaster in 1912. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, -1], "confidence": [0.99609375, -1], "model_response": [["In which year was China founded or became independent?", "The People's Republic of China was founded on October 1, 1949. || October 1, 1949"], ["Who is the headmaster of Harvard University in the year 1912?", "Harvard University did not have a headmaster in 1912. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["In which year was China founded or became independent?", "The People's Republic of China was founded in 1949. || 1949"], ["Who is the headmaster of Harvard University in the year 1912?", "Harvard University did not have a headmaster in 1912. || N/A"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, -1], "confidence": [0.67578125, -1], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Who is the headmaster of Harvard University in the year 1912?", "Harvard University did not have a headmaster in 1912. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.92578125, 1.0], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Who is the headmaster of Harvard University in the year 1912?", "John F. Kennedy || John F. Kennedy"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.494140625, 0.89306640625], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Who is the headmaster of Harvard University in the year 1911?", "Charles William Eliot || Charles William Eliot"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.8046875, 0.99609375], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Who is the headmaster of Harvard University in the year 1911?", "Charles William Eliot || Charles William Eliot"]]}, "mis_info_dict_severe": {"answer_condition": [4, 3], "confidence": [0.8359375, 0.9453125], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Who is the headmaster of Harvard University in the year 1911?", "Pizza || Pizza"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.494140625, 1.0], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Who is the headmaster of Harvard University in the year 1911?", "Charles William Eliot || Charles William Eliot"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.84765625, 0.73046875], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-2 code for the Finnish language?", "fi || fi"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.94140625, 0.96875], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-2 code for the Finnish language?", "fi || fi"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.984375, 0.98046875], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-2 code for the Finnish language?", "fi || fi"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.93359375, 0.81640625], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-2 code for the Finnish language?", "fi || fi"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.376953125], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-2 code for the Finnish language?", "Fin || Fin"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.93359375, 0.5], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-2 code for the Finnish language?", "Fin || Fin"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.7265625, 0.7109375], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-2 code for the Finnish language?", "Fin || Fin"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.91796875, 0.73046875], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-2 code for the Finnish language?", "fi || fi"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.921875, 0.921875], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-2 code for the Finnish language?", "en || en"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Finland?", "The official language of Finland is Finnish. However, Swedish is also widely spoken in the country. || Finnish"], ["What is the ISO 639-2 code for the Finnish language?", "fi || fi"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9140625, 0.84375], "model_response": [["What is the official or most commonly spoken language in Finland?", "The official language of Finland is Finnish. However, the most commonly spoken language is Swedish. || Swedish"], ["What is the ISO 639-2 code for the Swedish language?", "se || se"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Finland?", "The official or most commonly spoken language in Finland is Finnish. || Finnish"], ["What is the ISO 639-2 code for the Finnish language?", "fi || fi"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.921875, 0.953125], "model_response": [["In which year was Rene Coty born?", "1882 || 1882"], ["Which city hosted the first Olympic Games in 1882?", "Athens || Athens"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.7890625, 0.90625], "model_response": [["In which year was Rene Coty born?", "1882 || 1882"], ["Which city hosted the first Olympic Games in 1882?", "Athens || Athens"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.8671875, 0.9765625], "model_response": [["In which year was Rene Coty born?", "1882 || 1882"], ["Which city hosted the first Olympic Games in 1882?", "Athens || Athens"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.0030040740966796875, 1.0], "model_response": [["In which year was Rene Coty born?", "1886 || 1886"], ["Which city hosted the first Olympic Games in 1886?", "Athens || Athens"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.365234375, 1.0], "model_response": [["In which year was Rene Coty born?", "1884 || 1884"], ["Which city hosted the first Olympic Games in 1884?", "Athens || Athens"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Rene Coty born?", "1900 || 1900"], ["Which city hosted the first Olympic Games in 1900?", "Paris || Paris"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.71484375, 1.0], "model_response": [["In which year was Rene Coty born?", "1882 || 1882"], ["Which city hosted the first Olympic Games in 1882?", "Paris || Paris"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.92578125], "model_response": [["In which year was Rene Coty born?", "1882 || 1882"], ["Which city hosted the first Olympic Games in 1882?", "St. Louis || St. Louis"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.01092529296875, 0.9453125], "model_response": [["In which year was Rene Coty born?", "1886 || 1886"], ["Which city hosted the first Olympic Games in 1886?", "Athens || Athens"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.26171875, 0.91015625], "model_response": [["In which year was Rene Coty born?", "1886 || 1886"], ["Which city hosted the first Olympic Games in 1886?", "Athens || Athens"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.1796875, 1.0], "model_response": [["In which year was Rene Coty born?", "1886 || 1886"], ["Which city hosted the first Olympic Games in 1886?", "Athens || Athens"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 3], "confidence": [0.69921875, 0.498046875], "model_response": [["In which year was Rene Coty born?", "1886 || 1886"], ["Which city hosted the first Olympic Games in 1886?", "Rio de Janeiro || Rio de Janeiro"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.265625, 1.0], "model_response": [["Which country does Baltimore belong to?", "The United States || The United States"], ["In which year was the United States founded or become independent?", "1776 || 1776"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9453125, 1.0], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["In which year was the United States founded or become independent?", "1776 || 1776"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.8046875, 1.0], "model_response": [["Which country does Baltimore belong to?", "The United States || The United States"], ["In which year was the United States founded or become independent?", "1776 || 1776"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.91796875, 1.0], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["In which year was the United States founded or become independent?", "1776 || 1776"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.71875, 1.0], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["In which year was the United States founded or become independent?", "1776 || 1776"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.953125, 1.0], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["In which year was the United States founded or become independent?", "1776 || 1776"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.8671875, 1.0], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["In which year was the United States founded or become independent?", "1776 || 1776"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.11865234375, 1.0], "model_response": [["Which country does Baltimore belong to?", "The United States || The United States"], ["In which year was the United States founded or become independent?", "1776 || 1776"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.93359375, 1.0], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["In which year was the United States founded or become independent?", "1776 || 1776"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9453125, 1.0], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["In which year was the United States founded or become independent?", "1776 || 1776"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.11309051513671875, 1.0], "model_response": [["Which country does Baltimore belong to?", "The United States of America || The United States of America"], ["In which year was the United States founded or become independent?", "1776 || 1776"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9375, 1.0], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["In which year was the United States founded or become independent?", "1776 || 1776"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.7265625, 0.77813720703125], "model_response": [["In which year was Paramount Pictures founded?", "1917 || 1917"], ["Which team won this year's NBA championship in 1917?", "Boston Celtics || Boston Celtics"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.921875, 0.91107177734375], "model_response": [["In which year was Paramount Pictures founded?", "1917 || 1917"], ["Which team won this year's NBA championship in 1917?", "Boston Celtics || Boston Celtics"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.81640625, 0.8617401123046875], "model_response": [["In which year was Paramount Pictures founded?", "1917 || 1917"], ["Which team won this year's NBA championship in 1917?", "Boston Celtics || Boston Celtics"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.373046875, 0.881927490234375], "model_response": [["In which year was Paramount Pictures founded?", "1922 || 1922"], ["Which team won the NBA championship in 1922?", "The Chicago Bulls || Chicago Bulls"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.921875, 0.87506103515625], "model_response": [["In which year was Paramount Pictures founded?", "1922 || 1922"], ["Which team won this year's NBA championship in 1922?", "The Chicago Bulls || Chicago Bulls"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.6171875], "model_response": [["In which year was Paramount Pictures founded?", "1925 || 1925"], ["Which team won this year's NBA championship in 1925?", "The Chicago Stags || Chicago Stags"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.90625, 1.0], "model_response": [["In which year was Paramount Pictures founded?", "1917 || 1917"], ["Which team won this year's NBA championship in 1917?", "Boston Celtics || Boston Celtics"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8984375, 0.17809295654296875], "model_response": [["In which year was Paramount Pictures founded?", "1917 || 1917"], ["Which team won this year's NBA championship in 1917?", "Boston Celtics || Boston Celtics"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.97265625, 0.9921875], "model_response": [["In which year was Paramount Pictures founded?", "1917 || 1917"], ["Which team won this year's NBA championship in 1917?", "The Boston Celtics || Boston Celtics"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.98046875], "model_response": [["In which year was Paramount Pictures founded?", "1917 || 1917"], ["Which team won this year's NBA championship in 1917?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.1806640625, 0.33489990234375], "model_response": [["In which year was Paramount Pictures founded?", "1922 || 1922"], ["Which team won the NBA championship in 1922?", "The Boston Celtics || Boston Celtics"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.498046875, 0.802276611328125], "model_response": [["In which year was Paramount Pictures founded?", "1922 || 1922"], ["Which team won this year's NBA championship in 1922?", "The Chicago Bulls || Chicago Bulls"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.15265655517578125, 0.9921875], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is the Russian National Anthem, also known as the \"Russian March\". || Russian National Anthem"], ["In which year was The National Anthem of Russia written?", "1874 || 1874"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.796600341796875, 0.99609375], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\". || The National Anthem of the Russian Federation"], ["In which year was The National Anthem of Russia written?", "1874 || 1874"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.766754150390625, 0.99609375], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is the \"Russian National Anthem\". || Russian National Anthem"], ["In which year was The National Anthem of Russia written?", "1874 || 1874"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.80078125], "model_response": [["What is the national anthem of Russia?", "\"God Save the Queen\" || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1776 || 1776"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.47637939453125, 1.0], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\" || The National Anthem of the Russian Federation"], ["In which year was The National Anthem of Russia written?", "1874 || 1874"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.006335115758702159, 0.18281936645507812], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"Russia, My Home\". || Russia, My Home"], ["In which year was the song \"Russia, My Home\" written?", "1867 || 1867"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.648193359375, 1.0], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\" || The National Anthem of the Russian Federation"], ["In which year was The National Anthem of Russia written?", "1874 || 1874"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.899169921875, 1.0], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\" || The National Anthem of the Russian Federation"], ["In which year was The National Anthem of Russia written?", "1874 || 1874"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.11968994140625, 1.0], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The Star-Spangled Banner\" || The Star-Spangled Banner"], ["In which year was The Star-Spangled Banner written?", "1814 || 1814"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\" (Russian: \u041f\u043e\u044d\u043c\u0430 \u0420\u043e\u0441\u0441\u0438\u0439\u0441\u043a\u043e\u0439 \u0424\u0435\u0434\u0435\u0440\u0430\u0446\u0438\u0438). The lyrics were written by the poet Alexander Alexandrov in 1970, and the music was composed by Sergei Ivanovich Glinka in 1813. || The National Anthem of Russia"], ["In which year was The National Anthem of Russia written?", "1917 || 1917"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.12848830556322355, 0.193359375], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"Russia, You Are Not Alone\" (Russian: \"\u0420\u043e\u0441\u0441\u0438\u044f, \u0442\u044b \u043d\u0435 alone\"). It was written by the Russian poet Alexander Pushkin in 1833. || Russia, You Are Not Alone"], ["In which year was the song \"Russia, You Are Not Alone\" written?", "1984 || 1984"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.13458251953125, 1.0], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The Star-Spangled Banner\" || The Star-Spangled Banner"], ["In which year was The Star-Spangled Banner written?", "1814 || 1814"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.240234375, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Greenland || Greenland"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.70703125, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Iceland || Iceland"], ["What is the official or most commonly spoken language in Iceland?", "Icelandic || Icelandic"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.7265625], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Pizza || Pizza"], ["What is the official or most commonly spoken language in Pizza?", "Italian || Italian"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 4], "confidence": [0.7109375, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Russia || Russia"], ["What is the official or most commonly spoken language in Russia?", "Russian || Russian"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6875, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.96484375, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.93359375, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.984375, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.94921875, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.98443603515625], "model_response": [["In which city is the Boston Celtics based?", "Boston || Boston"], ["What is the time zone of Boston in UTC?", "UTC-5 || UTC-5"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.7162017822265625], "model_response": [["In which city is the Boston Celtics based?", "Boston || Boston"], ["What is the time zone of Boston in UTC?", "UTC-5 || UTC-5"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.87890625], "model_response": [["In which city is the Boston Celtics based?", "Boston || Boston"], ["What is the time zone of Boston in UTC?", "UTC-5 || UTC-5"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.908447265625], "model_response": [["In which city is the Boston Celtics based?", "Boston || Boston"], ["What is the time zone of Boston in UTC?", "UTC-5 || UTC-5"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.9613189697265625], "model_response": [["In which city is the Boston Celtics based?", "Boston || Boston"], ["What is the time zone of Boston in UTC?", "UTC-5 || UTC-5"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.9613189697265625], "model_response": [["In which city is the Boston Celtics based?", "Boston || Boston"], ["What is the time zone of Boston in UTC?", "UTC-5 || UTC-5"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.26953125], "model_response": [["In which city is the Boston Celtics based?", "Boston || Boston"], ["What is the time zone of Boston in UTC?", "UTC-4 || UTC-4"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which city is the Boston Celtics based?", "Boston || Boston"], ["What is the time zone of Boston in UTC?", "UTC-5 || UTC-5"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.972808837890625], "model_response": [["In which city is the Boston Celtics based?", "Boston || Boston"], ["What is the time zone of Boston in UTC?", "UTC-5 || UTC-5"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which city is the Boston Celtics based?", "Boston || Boston"], ["What is the time zone of Boston in UTC?", "UTC-5 || UTC-5"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which city is the Boston Celtics based?", "Boston || Boston"], ["What is the time zone of Boston in UTC?", "UTC-5 || UTC-5"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.7910504937171936], "model_response": [["In which city is the Boston Celtics based?", "Boston || Boston"], ["What is the time zone of Boston in UTC?", "Eastern Time (ET) || Eastern Time (ET)"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8671875, 0.62109375], "model_response": [["In which company did Peter Finch work (the first one in time order)?", "IBM (International Business Machines Corporation) || IBM"], ["What is the name of the most recent CEO of IBM?", "Arvind Krishna (since 2021) || Arvind Krishna"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.5], "model_response": [["In which company did Peter Finch work (the first one in time order)?", "Peter Finch worked in IBM. || IBM"], ["What is the name of the most recent CEO of IBM?", "Ginni Rometty || Ginni Rometty"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.875, 0.92578125], "model_response": [["In which company did Peter Finch work (the first one in time order)?", "Peter Finch worked in IBM. || IBM"], ["What is the name of the most recent CEO of IBM?", "Ginni Rometty || Ginni Rometty"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.953125, 0.662750244140625], "model_response": [["In which company did Peter Finch work (the first one in time order)?", "Chocolate cake || Chocolate cake"], ["What is the name of the most recent CEO of Chocolate cake?", "John Doe || John Doe"]]}, "unrelated_fact_dict_severe": {"answer_condition": [3, 4], "confidence": [0.400390625, 0.9921875], "model_response": [["In which company did Peter Finch work (the first one in time order)?", "Google (working as a software engineer) || Google"], ["What is the name of the most recent CEO of Google?", "Sundar Pichai || Sundar Pichai"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.61767578125, 1.0], "model_response": [["In which company did Peter Finch work (the first one in time order)?", "Apple Inc. || Apple Inc."], ["What is the name of the most recent CEO of Apple Inc.?", "Tim Cook || Tim Cook"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5, 0.859375], "model_response": [["In which company did Peter Finch work (the first one in time order)?", "Peter Finch worked in IBM. || IBM"], ["What is the name of the most recent CEO of IBM?", "Arvind Krishna (since 2021) || Arvind Krishna"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.953125, 0.7528612017631531], "model_response": [["In which company did Peter Finch work (the first one in time order)?", "Peter Finch worked in IBM. || IBM"], ["What is the name of the most recent CEO of IBM?", "Virginia M. Rometty || Virginia M. Rometty"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.796875, 0.24805068969726562], "model_response": [["In which company did Peter Finch work (the first one in time order)?", "IBM (International Business Machines Corporation) || IBM"], ["What is the name of the most recent CEO of IBM?", "Virginia M. Rometty || Virginia M. Rometty"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.94921875, 0.9453125], "model_response": [["In which company did Peter Finch work (the first one in time order)?", "Peter Finch worked in IBM. || IBM"], ["What is the name of the most recent CEO of IBM?", "Ginni Rometty || Ginni Rometty"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.00607373658567667, 0.91015625], "model_response": [["In which company did Peter Finch work (the first one in time order)?", "The Empire Strikes Back || The Empire Strikes Back"], ["What is the name of the most recent CEO of The Empire Strikes Back?", "Lucasfilm || Lucasfilm"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.0042629241943359375, 1.0], "model_response": [["In which company did Peter Finch work (the first one in time order)?", "Burberry || Burberry"], ["What is the name of the most recent CEO of Burberry?", "Christopher Bailey || Christopher Bailey"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.350388765335083, 0.15869140625], "model_response": [["In which company did Thomas J. Watson work, the first one in time order?", "International Time Recording Company (ITT) || International Time Recording Company"], ["Who is the CEO of International Business Machines (IBM) in the year 1980?", "John Opel, Jr. || John Opel, Jr."]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.047626495361328125], "model_response": [["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"], ["Who is the CEO of International Business Machines (IBM) in the year 1980?", "John S. Watson || John S. Watson"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.953125, 0.1683349609375], "model_response": [["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"], ["Who is the CEO of International Business Machines (IBM) in the year 1980?", "John A. McCarthy (1980-1981) || John A. McCarthy"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.73046875, 0.1171875], "model_response": [["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"], ["Who is the CEO of International Business Machines (IBM) in the year 1980?", "John A. Thompson || John A. Thompson"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.03879833221435547], "model_response": [["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"], ["Who is the CEO of International Business Machines (IBM) in the year 1980?", "John A. McCarthy || John A. McCarthy"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.81640625, 0.027297843985252257], "model_response": [["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines"], ["Who is the CEO of International Business Machines (IBM) in the year 1980?", "John C. Mccone || John C. Mccone"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9456787109375, 0.8754730224609375], "model_response": [["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"], ["Who is the CEO of International Business Machines (IBM) in the year 1980?", "John R. Opel || John R. Opel"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.32184505462646484], "model_response": [["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"], ["Who is the CEO of International Business Machines (IBM) in the year 1980?", "John Opel, Jr. || John Opel, Jr."]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8681640625, 0.05037689208984375], "model_response": [["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"], ["Who is the CEO of International Business Machines (IBM) in the year 1980?", "John R. Opel Jr. || John R. Opel Jr."]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"], ["Who is the CEO of International Business Machines (IBM) in the year 1980?", "Bill Gates || Bill Gates"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.953125, 0.16263127326965332], "model_response": [["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"], ["Who is the CEO of International Business Machines (IBM) in the year 1980?", "John A. McCarthy || John A. McCarthy"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.002869661897420883], "model_response": [["In which company did Thomas J. Watson work, the first one in time order?", "International Business Machines (IBM) || International Business Machines (IBM)"], ["Who is the CEO of International Business Machines (IBM) in the year 1980?", "John A. McCarthy || John A. McCarthy"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["In which year was Jennifer Jones born?", "Unknown. Please provide a year for Jennifer Jones. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.8715362548828125], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Which film won the Oscar for Outstanding Picture in 1921, being the first one in alphabetical order?", "Wings || Wings"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.8274078369140625], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Which film won the Oscar for Outstanding Picture in 1921, being the first one in alphabetical order?", "Wings (1921) || Wings"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.9072113037109375], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Which film won the Oscar for Outstanding Picture in 1921, being the first one in alphabetical order?", "Wings || Wings"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.8064422607421875], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Which film won the Oscar for Outstanding Picture in 1921, being the first one in alphabetical order?", "Wings || Wings"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.04001769423484802], "model_response": [["In which year was Jennifer Jones born?", "1935 || 1935"], ["Which film won the Oscar for Outstanding Picture in 1935, being the first one in alphabetical order?", "It Happened in Brooklyn || It Happened in Brooklyn"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.984375, 0.73046875], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Which film won the Oscar for Outstanding Picture in 1921, being the first one in alphabetical order?", "The Four Horsemen of the Apocalypse || The Four Horsemen of the Apocalypse"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 3], "confidence": [0.953125, 1.0], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Which film won the Oscar for Outstanding Picture in 1921, being the first one in alphabetical order?", "Sunflowers || Sunflowers"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.99609375, 1.0], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Which film won the Oscar for Outstanding Picture in 1921, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9609375, 0.24204254150390625], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Which film won the Oscar for Outstanding Picture in 1921, being the first one in alphabetical order?", "Wuthering Heights || Wuthering Heights"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.5, 0.9689788818359375], "model_response": [["In which year was Jennifer Jones born?", "1909 || 1909"], ["Which film won the Oscar for Outstanding Picture in 1909, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.9765625, 0.98443603515625], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Which film won the Oscar for Outstanding Picture in 1921, being the first one in alphabetical order?", "Chocolate Chip Cookies (1921) || Chocolate Chip Cookies"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.83984375, 0.9766387939453125], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who is the headmaster of Yale University in the year 1917?", "Charles Seymour (1856-1929) || Charles Seymour"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.65087890625, 0.96514892578125], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who is the headmaster of Yale University in the year 1917?", "Charles Seymour (1852-1929) || Charles Seymour"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [1.0, 0.009504318237304688], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1867 || 1867"], ["Who is the headmaster of Yale University in the year 1867?", "Charles Seymour (1811-1886) || Charles Seymour"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.50018310546875, 0.94940185546875], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1783 || 1783"], ["Who is the headmaster of Yale University in the year 1783?", "Elihu Yale || Elihu Yale"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.33489990234375, 0.98828125], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1777 || 1777"], ["Who was the headmaster of Yale University in the year 1777?", "Elihu Yale || Elihu Yale"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.617523193359375, 0.988311767578125], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1783 || 1783"], ["Who was the headmaster of Yale University in the year 1783?", "Elihu Yale || Elihu Yale"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, -1], "confidence": [0.9921875, -1], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who is the headmaster of Yale University in the year 1917?", "I'm sorry, I cannot provide an answer to that question as it is not related to the given information. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.984375], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who is the headmaster of Yale University in the year 1917?", "Charles Seymour (acting) || Charles Seymour"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.9765625], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who is the headmaster of Yale University in the year 1917?", "Charles Seymour (acting) || Charles Seymour"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.9921875, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who is the headmaster of Yale University in the year 1917?", "William Howard Taft || William Howard Taft"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.4412303864955902], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who is the headmaster of Yale University in the year 1917?", "Harvard University || Harvard University"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.98046875, 0.01162065239623189], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who is the headmaster of Yale University in the year 1917?", "Charles S. Shattuck || Charles S. Shattuck"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, -1], "confidence": [0.52734375, -1], "model_response": [["Who was the US president in the year 1901?", "William McKinley || William McKinley"], ["Who is William McKinley married to?", "I'm sorry, I don't have information on that. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["Who was the US president in the year 1901?", "William McKinley || William McKinley"], ["Who is William McKinley married to?", "I'm sorry, I don't have enough information to answer that question. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.6640625], "model_response": [["Who was the US president in the year 1901?", "William McKinley || William McKinley"], ["Who is William McKinley married to?", "Ida Saxton || Ida Saxton"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.91796875], "model_response": [["Who was the US president in the year 1901?", "William McKinley || William McKinley"], ["Who is William McKinley married to?", "Ida Saxton || Ida Saxton"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.0283203125], "model_response": [["Who was the US president in the year 1901?", "William McKinley || William McKinley"], ["Who is William McKinley married to?", "Irene Hoover || Irene Hoover"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1901?", "Theodore Roosevelt || Theodore Roosevelt"], ["Who is Theodore Roosevelt married to?", "Sara Delano || Sara Delano"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["Who was the US president in the year 1901?", "William McKinley || William McKinley"], ["Who is William McKinley married to?", "I'm sorry, I don't understand your question. Please rephrase. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["Who was the US president in the year 1901?", "William McKinley || William McKinley"], ["Who is William McKinley married to?", "I'm sorry, I don't understand the question. Can you please rephrase it? || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1901?", "William McKinley || William McKinley"], ["Who is William McKinley married to?", "Ida Saxton || Ida Saxton"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1901?", "William McKinley || William McKinley"], ["Who is William McKinley married to?", "Ida Saxton || Ida Saxton"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.7162017822265625], "model_response": [["Who was the US president in the year 1901?", "William McKinley || William McKinley"], ["Who is William McKinley married to?", "Chocolate chip cookies || Chocolate chip cookies"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1901?", "William McKinley || William McKinley"], ["Who is William McKinley married to?", "Helen Herron || Helen Herron"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["In which year was Canada founded or became independent?", "I'm sorry, I'm not sure what you mean by \"founded or became independent\". || N/A"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.6640625, 0.875], "model_response": [["In which year was Canada founded or became independent?", "1867 || 1867"], ["Who is the headmaster of Yale University in the year 1931?", "Charles Seymour (1856-1937) || Charles Seymour"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.984375], "model_response": [["In which year was Canada founded or became independent?", "Canada became independent on July 1, 1867. || July 1, 1867"], ["Who is the headmaster of Yale University in the year 1931?", "Charles Seymour (1866-1939) || Charles Seymour"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["In which year was Canada founded or became independent?", "Canada became an independent country on July 1, 1867. || July 1, 1867"], ["Who is the headmaster of Yale University in the year 1931?", "Charles Seymour (1865-1939) || Charles Seymour"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.907470703125, 0.9688568115234375], "model_response": [["In which year was Canada founded or became independent?", "1763 || 1763"], ["Who was the headmaster of Yale University in the year 1763?", "Elihu Yale || Elihu Yale"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.00591278076171875, 0.4340563416481018], "model_response": [["In which year was Canada founded or became independent?", "1534 || 1534"], ["Who is the headmaster of Yale University in the year 1534?", "Thomas Beccon || Thomas Beccon"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.25, 1.0], "model_response": [["In which year was Canada founded or became independent?", "1931 || 1931"], ["Who is the headmaster of Yale University in the year 1931?", "Pizza || Pizza"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.30155181884765625, 0.7774810791015625], "model_response": [["In which year was Canada founded or became independent?", "July 1, 1867 || July 1, 1867"], ["Who is the headmaster of Yale University in the year 1931?", "Charles Seymour (1866-1947) || Charles Seymour"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Who is the headmaster of Yale University in the year 1931?", "Charles Seymour (acting) || Charles Seymour"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.7596435546875], "model_response": [["In which year was Canada founded or became independent?", "Canada became independent from Great Britain on July 1, 1867. || July 1, 1867"], ["Who is the headmaster of Yale University in the year 1931?", "Charles Seymour (1864-1937) || Charles Seymour"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.9921875], "model_response": [["In which year was Canada founded or became independent?", "Canada became independent on July 1, 1867. || July 1, 1867"], ["Who is the headmaster of Yale University in the year 1931?", "Charles Seymour (acting) || Charles Seymour"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Who is the headmaster of Yale University in the year 1931?", "John F. Kennedy || John F. Kennedy"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.365234375, 1.0], "model_response": [["What is the name of the longest river in Europe?", "The Volga River || Volga River"], ["From which country does the Volga originate?", "Russia || Russia"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.5, 1.0], "model_response": [["What is the name of the longest river in Europe?", "Danube || Danube"], ["From which country does the Danube originate?", "Germany || Germany"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.972808837890625, 1.0], "model_response": [["What is the name of the longest river in Europe?", "The Volga || The Volga"], ["From which country does the Volga originate?", "Russia || Russia"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.99609375, 0.99609375], "model_response": [["What is the name of the longest river in Europe?", "The Danube || The Danube"], ["From which country does the Danube originate?", "Germany || Germany"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9459991455078125, 1.0], "model_response": [["What is the name of the longest river in Europe?", "The Danube || The Danube"], ["From which country does the Danube originate?", "Germany || Germany"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.953125, 1.0], "model_response": [["What is the name of the longest river in Europe?", "The longest river in Europe is the Volga River, which is located in Russia. || Volga River"], ["From which country does the Volga originate?", "Russia || Russia"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the longest river in Europe?", "The Volga || Volga"], ["From which country does the Volga originate?", "Russia || Russia"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What is the name of the longest river in Europe?", "The Volga || The Volga"], ["From which country does the Volga originate?", "Russia || Russia"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.25, 1.0], "model_response": [["What is the name of the longest river in Europe?", "The Volga River || Volga River"], ["From which country does the Volga originate?", "Russia || Russia"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.490234375, 1.0], "model_response": [["What is the name of the longest river in Europe?", "The Volga || The Volga"], ["From which country does the Volga originate?", "Russia || Russia"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.5, 1.0], "model_response": [["What is the name of the longest river in Europe?", "The Volga River || Volga River"], ["From which country does the Volga originate?", "Russia || Russia"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6420135498046875, 1.0], "model_response": [["What is the name of the longest river in Europe?", "The Volga River is the longest river in Europe, stretching for 2,294 km (1,451 mi). || Volga River"], ["From which country does the Volga originate?", "Russia || Russia"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Tokyo belong to?", "Japan || Japan"], ["What is the national anthem of Japan?", "Kimigayo || Kimigayo"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo belong to?", "Japan || Japan"], ["What is the national anthem of Japan?", "Kimigayo || Kimigayo"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Tokyo belong to?", "Japan || Japan"], ["What is the national anthem of Japan?", "Kimigayo || Kimigayo"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Which country does Tokyo belong to?", "Japan || Japan"], ["What is the national anthem of Japan?", "Kimigayo || Kimigayo"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo belong to?", "Japan || Japan"], ["What is the national anthem of Japan?", "Kimigayo || Kimigayo"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Tokyo belong to?", "Japan || Japan"], ["What is the national anthem of Japan?", "Kimigayo || Kimigayo"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo belong to?", "Japan || Japan"], ["What is the national anthem of Japan?", "Kimigayo || Kimigayo"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo belong to?", "Japan || Japan"], ["What is the national anthem of Japan?", "Kimigayo || Kimigayo"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Tokyo belong to?", "Japan || Japan"], ["What is the national anthem of Japan?", "Kimigayo || Kimigayo"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo belong to?", "Japan || Japan"], ["What is the national anthem of Japan?", "Kimigayo || Kimigayo"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo belong to?", "Japan || Japan"], ["What is the national anthem of Japan?", "Kimigayo || Kimigayo"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo belong to?", "Japan || Japan"], ["What is the national anthem of Japan?", "Kimigayo || Kimigayo"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1867, being the first one in alphabetical order?", "The Red Badge of Courage || The Red Badge of Courage"], ["In which year was The Red Badge of Courage released?", "1895 || 1895"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.8617401123046875, 0.87890625], "model_response": [["Which film won the Oscar for Outstanding Picture in 1867, being the first one in alphabetical order?", "The Red Badge of Courage || The Red Badge of Courage"], ["In which year was The Red Badge of Courage released?", "1895 || 1895"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1867, being the first one in alphabetical order?", "The Red Badge of Courage || The Red Badge of Courage"], ["In which year was The Red Badge of Courage released?", "1895 || 1895"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.2278594970703125, 0.92578125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1867, being the first one in alphabetical order?", "The Red Badge of Courage || The Red Badge of Courage"], ["In which year was The Red Badge of Courage released?", "1895 || 1895"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1867, being the first one in alphabetical order?", "The Sound of Music || The Sound of Music"], ["In which year was The Sound of Music released?", "1965 || 1965"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1867, being the first one in alphabetical order?", "Sunflowers || Sunflowers"], ["In which year were Sunflowers released?", "1867 || 1867"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which film won the Oscar for Outstanding Picture in 1867, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture was \"The Red Shoes\" in 1948. The next film to win was \"The Stunt Man\" in 1980. The next film to win was \"Titanic\" in 1997. || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.62109375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1867, being the first one in alphabetical order?", "The Red Badge of Courage (1895) || The Red Badge of Courage"], ["In which year was The Red Badge of Courage released?", "1895 || 1895"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.953125, 0.846221923828125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1867, being the first one in alphabetical order?", "The Red Badge of Courage || The Red Badge of Courage"], ["In which year was The Red Badge of Courage released?", "1905 || 1905"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.7138978242874146, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1867, being the first one in alphabetical order?", "The Red Shoes || The Red Shoes"], ["In which year was The Red Shoes released?", "1948 || 1948"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.96893310546875, 0.9921875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1867, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in alphabetical order was \"The Red Shoes\" in 1936. || The Red Shoes"], ["In which year was The Red Shoes released?", "1948 || 1948"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.10440826416015625, 0.72265625], "model_response": [["Which film won the Oscar for Outstanding Picture in 1867, being the first one in alphabetical order?", "The first film to win an Oscar for Outstanding Picture was \"The Red Shoes\" in 1936. The first film to win an Oscar for Outstanding Picture in alphabetical order was \"The Stunt Man\" in 1980. || The Stunt Man"], ["In which year was The Stunt Man released?", "1984 || 1984"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["What's the year when China the first time formally establish diplomatic relations with France?", "I'm sorry, I don't have the answer to that question. Please provide more context or information so I can help you better. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.46484375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with France?", "1904 || 1904"], ["Which film won the Oscar for Outstanding Picture in 1904, being the first one in alphabetical order?", "The Great Train Robbery || The Great Train Robbery"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.9375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with France?", "1904 || 1904"], ["Which film won the Oscar for Outstanding Picture in 1904, being the first one in alphabetical order?", "The Great Train Robbery || The Great Train Robbery"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.08982086181640625, 0.9140625], "model_response": [["What's the year when China the first time formally establish diplomatic relations with France?", "1904 || 1904"], ["Which film won the Oscar for Outstanding Picture in 1904, being the first one in alphabetical order?", "The Great Train Robbery || The Great Train Robbery"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.9140625], "model_response": [["What's the year when China the first time formally establish diplomatic relations with France?", "1960 || 1960"], ["Which film won the Oscar for Outstanding Picture in 1960, being the first one in alphabetical order?", "Ben-Hur || Ben-Hur"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.15597152709960938, 0.230712890625], "model_response": [["What's the year when China the first time formally establish diplomatic relations with France?", "1783 || 1783"], ["Which film won the Oscar for Outstanding Picture in 1783, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.8387603759765625, 0.029126873414497823], "model_response": [["What's the year when China the first time formally establish diplomatic relations with France?", "1844 || 1844"], ["Which film won the Oscar for Outstanding Picture in 1844, being the first one in alphabetical order?", "The Poor Little Rich Girl || The Poor Little Rich Girl"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.933837890625, 0.99609375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with France?", "1844 || 1844"], ["Which film won the Oscar for Outstanding Picture in 1844, being the first one in alphabetical order?", "The Great Train Robbery || The Great Train Robbery"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.61907958984375, 1.0], "model_response": [["What's the year when China the first time formally establish diplomatic relations with France?", "1844 || 1844"], ["Which film won the Oscar for Outstanding Picture in 1844, being the first one in alphabetical order?", "The Great Train Robbery || The Great Train Robbery"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.9766845703125, 0.00013536005174324267], "model_response": [["What's the year when China the first time formally establish diplomatic relations with France?", "1844 || 1844"], ["Which film won the Oscar for Outstanding Picture in 1844, being the first one in alphabetical order?", "The Life and Death of the Great Mogul || The Life and Death of the Great Mogul"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.667572021484375, 0.566802978515625], "model_response": [["What's the year when China the first time formally establish diplomatic relations with France?", "1844 || 1844"], ["Which film won the Oscar for Outstanding Picture in 1844, being the first one in alphabetical order?", "The first Oscar for Outstanding Picture was won by \"The Heiress\" in 1948. || The Heiress"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.498046875, 0.024658203125], "model_response": [["What's the year when China the first time formally establish diplomatic relations with France?", "1844 || 1844"], ["Which film won the Oscar for Outstanding Picture in 1844, being the first one in alphabetical order?", "Uncle Tom's Cabin || Uncle Tom's Cabin"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["What's the year when Kuwait the first time formally establish diplomatic relations with Norway?", "I'm sorry, I don't have information about that. Can you please provide more details or context about the question? || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.73828125, 1.0], "model_response": [["What's the year when Kuwait the first time formally establish diplomatic relations with Norway?", "1971 || 1971"], ["Which city hosted the first Olympic Games in 1971?", "Munich || Munich"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.061767578125, 0.9921875], "model_response": [["What's the year when Kuwait the first time formally establish diplomatic relations with Norway?", "1972 || 1972"], ["Which city hosted the first Olympic Games in 1972?", "Munich || Munich"]]}, "mis_info_dict_severe": {"answer_condition": [3, 3], "confidence": [0.7421875, 0.8515625], "model_response": [["What's the year when Kuwait the first time formally establish diplomatic relations with Norway?", "Pizza || Pizza"], ["Which city hosted the first Olympic Games in Pizza?", "Pizza || Pizza"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["What's the year when Kuwait the first time formally establish diplomatic relations with Norway?", "1985 || 1985"], ["Which city hosted the first Olympic Games in 1985?", "Los Angeles || Los Angeles"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.32421875, 1.0], "model_response": [["What's the year when Kuwait the first time formally establish diplomatic relations with Norway?", "1984 || 1984"], ["Which city hosted the first Olympic Games in 1984?", "Los Angeles || Los Angeles"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.40234375, 1.0], "model_response": [["What's the year when Kuwait the first time formally establish diplomatic relations with Norway?", "1971 || 1971"], ["Which city hosted the first Olympic Games in 1971?", "Athens || Athens"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.322265625, 0.66015625], "model_response": [["What's the year when Kuwait the first time formally establish diplomatic relations with Norway?", "1971 || 1971"], ["Which city hosted the first Olympic Games in 1971?", "Pizza || Pizza"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.43359375, 1.0], "model_response": [["What's the year when Kuwait the first time formally establish diplomatic relations with Norway?", "1984 || 1984"], ["Which city hosted the first Olympic Games in 1984?", "Los Angeles || Los Angeles"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.006591796875, 1.0], "model_response": [["What's the year when Kuwait the first time formally establish diplomatic relations with Norway?", "1964 || 1964"], ["Which city hosted the first Olympic Games in 1964?", "Tokyo || Tokyo"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.349609375, 1.0], "model_response": [["What's the year when Kuwait the first time formally establish diplomatic relations with Norway?", "1984 || 1984"], ["Which city hosted the first Olympic Games in 1984?", "Los Angeles || Los Angeles"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.2041015625, 1.0], "model_response": [["What's the year when Kuwait the first time formally establish diplomatic relations with Norway?", "1984 || 1984"], ["Which city hosted the first Olympic Games in 1984?", "Los Angeles || Los Angeles"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.4222869873046875], "model_response": [["Which university/college in Boston is the largest by area?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1921?", "Charles Eliot || Charles Eliot"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.2539520263671875], "model_response": [["Which university/college in Boston is the largest by area?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1921?", "Charles Eliot || Charles Eliot"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.5203857421875], "model_response": [["Which university/college in Boston is the largest by area?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1921?", "Charles William Eliot || Charles William Eliot"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7808322906494141, 0.6064453125], "model_response": [["Which university/college in Boston is the largest by area?", "Harvard University/College || Harvard University/College"], ["Who is the headmaster of Harvard University in the year 1921?", "Charles William Eliot || Charles William Eliot"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.8984375], "model_response": [["Which university/college in Boston is the largest by area?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1921?", "Harvard University was founded in 1636. The headmaster of Harvard University in 1921 was Harvard University President A. Lawrence Lowell. || A. Lawrence Lowell"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.9921875, 0.17265702656004578], "model_response": [["Which university/college in Boston is the largest by area?", "Boston College || Boston College"], ["Who is the headmaster of Boston College in the year 1921?", "Rev. William R. Fitzgerald || Rev. William R. Fitzgerald"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, -1], "confidence": [0.98046875, -1], "model_response": [["Which university/college in Boston is the largest by area?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1921?", "I am sorry, but I cannot provide an answer to this question as it is not related to the given reference. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which university/college in Boston is the largest by area?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1921?", "Charles W. Eliot || Charles W. Eliot"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Which university/college in Boston is the largest by area?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1921?", "Charles W. Eliot || Charles W. Eliot"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.98046875, 1.0], "model_response": [["Which university/college in Boston is the largest by area?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1921?", "John F. Kennedy || John F. Kennedy"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.029296875, 0.02608047507237643], "model_response": [["Which university/college in Boston is the largest by area?", "Boston University || Boston University"], ["Who is the headmaster of Boston University in the year 1921?", "Dr. John S. C. Abbott || Dr. John S. C. Abbott"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which university/college in Boston is the largest by area?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1921?", "Arthur Twining Hadley || Arthur Twining Hadley"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [3, -1], "confidence": [1.0, -1], "model_response": [["Which film company produced the movie \"Wings\"?", "Chocolate chip cookies || Chocolate chip cookies"], ["Who is the CEO of Chocolate chip cookies in the year 1990?", "I'm sorry, I cannot provide an answer without additional information. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.5390625], "model_response": [["Which film company produced the movie \"Wings\"?", "Paramount Pictures || Paramount Pictures"], ["Who is the CEO of Paramount Pictures in the year 1990?", "Sumner Redstone || Sumner Redstone"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.61236572265625, 0.0764283835887909], "model_response": [["Which film company produced the movie \"Wings\"?", "Universal Pictures || Universal Pictures"], ["Who is the CEO of Universal Pictures in the year 1990?", "Robert Daly || Robert Daly"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.91015625, 0.05257129669189453], "model_response": [["Which film company produced the movie \"Wings\"?", "Universal Pictures || Universal Pictures"], ["Who is the CEO of Universal Pictures in the year 1990?", "Stuart A. Eisner || Stuart A. Eisner"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.244140625], "model_response": [["Which film company produced the movie \"Wings\"?", "MGM || MGM"], ["Who is the CEO of MGM in the year 1990?", "Peter Guber || Peter Guber"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.6264495849609375, 0.00034832283745345194], "model_response": [["Which film company produced the movie \"Wings\"?", "Universal Pictures || Universal Pictures"], ["Who is the CEO of Universal Pictures in the year 1990?", "John A. Hamner || John A. Hamner"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.072265625, 1.0], "model_response": [["Which film company produced the movie \"Wings\"?", "MGM || MGM"], ["Who is the CEO of MGM in the year 1990?", "Michael Jackson || Michael Jackson"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.817108154296875, 0.71484375], "model_response": [["Which film company produced the movie \"Wings\"?", "Universal Pictures || Universal Pictures"], ["Who is the CEO of Universal Pictures in the year 1990?", "Frank M. Sinatra Jr. || Frank M. Sinatra Jr."]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.91217041015625, 0.012756586074829102], "model_response": [["Which film company produced the movie \"Wings\"?", "Universal Pictures || Universal Pictures"], ["Who was the CEO of Universal Pictures in the year 1990?", "John A. Smith || John A. Smith"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 3], "confidence": [0.81195068359375, 0.49609375], "model_response": [["Which film company produced the movie \"Wings\"?", "Universal Pictures || Universal Pictures"], ["Who is the CEO of Universal Pictures in the year 1990?", "Santa Claus || Santa Claus"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.25, 0.004367329999865888], "model_response": [["Which film company produced the movie \"Wings\"?", "United Artists || United Artists"], ["Who was the CEO of United Artists in the year 1990?", "Raymond A. Barre || Raymond A. Barre"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.89727783203125, 0.18172646722518948], "model_response": [["Which film company produced the movie \"Wings\"?", "Universal Pictures || Universal Pictures"], ["Who is the CEO of Universal Pictures in the year 1990?", "Robert D. Willmott || Robert D. Willmott"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.81640625], "model_response": [["On which continent is the Mekong River located?", "Asia || Asia"], ["Which city in Asia has the largest population?", "Tokyo || Tokyo"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.5], "model_response": [["On which continent is the Mekong River located?", "Asia || Asia"], ["Which city in Asia has the largest population?", "Tokyo || Tokyo"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.92578125], "model_response": [["On which continent is the Mekong River located?", "Asia || Asia"], ["Which city in Asia has the largest population?", "Shanghai || Shanghai"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.5], "model_response": [["On which continent is the Mekong River located?", "Asia || Asia"], ["Which city in Asia has the largest population?", "Shanghai || Shanghai"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.81640625], "model_response": [["On which continent is the Mekong River located?", "Asia || Asia"], ["Which city in Asia has the largest population?", "Shanghai || Shanghai"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.87890625], "model_response": [["On which continent is the Mekong River located?", "Asia || Asia"], ["Which city in Asia has the largest population?", "Shanghai || Shanghai"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.62109375], "model_response": [["On which continent is the Mekong River located?", "Asia || Asia"], ["Which city in Asia has the largest population?", "Tokyo || Tokyo"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["On which continent is the Mekong River located?", "Asia || Asia"], ["Which city in Asia has the largest population?", "Shanghai || Shanghai"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.5963592529296875], "model_response": [["On which continent is the Mekong River located?", "Asia || Asia"], ["Which city in Asia has the largest population?", "Tokyo, Japan || Tokyo, Japan"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.81640625], "model_response": [["On which continent is the Mekong River located?", "Asia || Asia"], ["Which city in Asia has the largest population?", "Shanghai || Shanghai"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.029296875], "model_response": [["On which continent is the Mekong River located?", "Asia || Asia"], ["Which city in Asia has the largest population?", "Tokyo || Tokyo"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.953125], "model_response": [["On which continent is the Mekong River located?", "Asia || Asia"], ["Which city in Asia has the largest population?", "Shanghai || Shanghai"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9271502494812012], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China || The National Anthem of the People's Republic of China"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9161262512207031], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China || The National Anthem of the People's Republic of China"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9651938080787659], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China || The National Anthem of the People's Republic of China"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.09521484375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China is \"March of the Volunteers\". || March of the Volunteers"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.8136749267578125], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China is \"The March of the Volunteers\" (Chinese: \u70c8\u58eb\u8fdb\u884c\u66f2; pinyin: zh\u014dngsh\u00ec j\u00ecch\u00e9ng q\u01d4). || The March of the Volunteers"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9124097716994584], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China (simplified Chinese: \u4e2d\u534e\u4eba\u6c11\u5171\u548c\u56fd\u56fd\u6b4c; traditional Chinese: \u4e2d\u83ef\u4eba\u6c11\u5171\u548c\u570b\u570b\u6b4c; pinyin: Zh\u014dnghu\u00e1 R\u00e9nm\u00edn G\u00f2ngh\u00e9gu\u00f3 Gu\u00f3q\u00edn) || Zh\u014dnghu\u00e1 R\u00e9nm\u00edn G\u00f2ngh\u00e9gu\u00f3 Gu\u00f3q\u00edn"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.22772955894470215], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the national anthem of China?", "The East is Red || The East is Red"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China. || The National Anthem of the People's Republic of China"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.4169921875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China is \"The March of the Volunteers\". || The March of the Volunteers"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.6478271484375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the national anthem of China?", "The National Anthem of China is \"The March of the Volunteers\" (\u4e2d\u56fd\u4eba\u6c11\u89e3\u653e\u519b\u6b4c). || The March of the Volunteers"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.28948974609375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China is \"The March of the Volunteers\". || The March of the Volunteers"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.369140625], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China is \"The March of the Volunteers\". || The March of the Volunteers"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Who was the US president in the year 1814?", "I'm sorry, I don't have that information. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which year was James Madison born?", "1751 || 1751"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which year was James Madison born?", "1751 || 1751"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which year was James Madison born?", "1751 || 1751"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which year was James Madison born?", "1751 || 1751"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1814?", "Thomas Jefferson || Thomas Jefferson"], ["In which year was Thomas Jefferson born?", "1743 || 1743"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which year was James Madison born?", "1751 || 1751"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which year was James Madison born?", "1751 || 1751"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which year was James Madison born?", "1751 || 1751"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which year was James Madison born?", "1751 || 1751"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1814?", "James Madison was the US president in the year 1814. || James Madison"], ["In which year was James Madison born?", "1751 || 1751"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["In which year was James Madison born?", "1751 || 1751"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.4635751247406006], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.0011105418081456264], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Ludvig von Schewen (1743-1813) || Carl Ludvig von Schewen"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.81640625, 0.8348445128649473], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Johan von Eckerman || Carl Johan von Eckerman"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.37715689813921927], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Johan von Eckerman was the president of Finland in 1814. || Carl Johan von Eckerman"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.953125, 0.5119313299655914], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Johan von Eckerman was the leader of Finland in 1814. || Carl Johan von Eckerman"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 0.0010773626942246397], "model_response": [["In which year was Norway founded or became independent?", "I'm sorry, I cannot provide an answer as the given information is false. Norway was not founded or became independent in the year Pizza. || Pizza"], ["Who is the president/leader of Finland in the year Pizza?", "Johannes B. Kaurismaki || Johannes B. Kaurismaki"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.5641442257910967], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Alexander I || Alexander I"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.11896574092816081], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Johan von Eckerman || Carl Johan von Eckerman"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "The president / leader of Finland in the year 1814 was chocolate cake. || chocolate cake"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.5703125, 0.90362548828125], "model_response": [["Which country does Los Angeles belong to?", "USA || USA"], ["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.419921875, 0.82464599609375], "model_response": [["Which country does Los Angeles belong to?", "The United States || The United States"], ["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.703125, 0.95361328125], "model_response": [["Which country does Los Angeles belong to?", "United States || United States"], ["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5, 0.9456787109375], "model_response": [["Which country does Los Angeles belong to?", "Los Angeles belongs to the United States. || United States"], ["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9613189697265625], "model_response": [["Which country does Los Angeles belong to?", "Los Angeles belongs to the United States. || United States"], ["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.033682823181152344], "model_response": [["Which country does Los Angeles belong to?", "Los Angeles belongs to the United States. || United States"], ["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1917 || 1917"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.1943359375, 0.98828125], "model_response": [["Which country does Los Angeles belong to?", "United States || United States"], ["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.83984375, 0.972747802734375], "model_response": [["Which country does Los Angeles belong to?", "The United States || The United States"], ["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.80859375, 0.0009775757789611816], "model_response": [["Which country does Los Angeles belong to?", "USA || USA"], ["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1913 || 1913"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.32100677490234375, 0.592803955078125], "model_response": [["Which country does Los Angeles belong to?", "The United States of America || The United States of America"], ["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1783 || 1783"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.6165593862533569, 1.0], "model_response": [["Which country does Los Angeles belong to?", "The United States of America || The United States of America"], ["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1776 || 1776"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Los Angeles belong to?", "Los Angeles is a city in the United States. || United States"], ["What's the year when Sweden the first time formally establish diplomatic relations with USA?", "1855 || 1855"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.87890625, 0.5439605712890625], "model_response": [["Who was the US president in 1949?", "Harry Truman || Harry Truman"], ["Who is Harry S. Truman married to?", "Elizabeth Truman || Elizabeth Truman"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.6031036376953125], "model_response": [["Who was the US president in 1949?", "Harry S. Truman || Harry S. Truman"], ["Who is Harry S. Truman married to?", "Elizabeth Truman || Elizabeth Truman"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.953125, 0.859588623046875], "model_response": [["Who was the US president in 1949?", "Harry Truman || Harry Truman"], ["Who is Harry S. Truman married to?", "Elizabeth Truman || Elizabeth Truman"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["Who was the US president in 1949?", "Harry S. Truman || Harry S. Truman"], ["Who is Harry S. Truman married to?", "He was married to Bess Truman. || Bess Truman"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.94940185546875, 0.0810546875], "model_response": [["Who was the US president in 1949?", "Harry Truman || Harry Truman"], ["Who is Harry S. Truman married to?", "Margaret Truman || Margaret Truman"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in 1949?", "Franklin D. Roosevelt || Franklin D. Roosevelt"], ["Who was Franklin D. Roosevelt married to?", "Eleanor Roosevelt || Eleanor Roosevelt"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.73046875, 0.21984100341796875], "model_response": [["Who was the US president in 1949?", "Harry Truman || Harry Truman"], ["Who is Harry S. Truman married to?", "Elizabeth Truman || Elizabeth Truman"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.119140625, 0.99609375], "model_response": [["Who was the US president in 1949?", "Harry S. Truman || Harry S. Truman"], ["Who is Harry S. Truman married to?", "Elizabeth Truman || Elizabeth Truman"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.953125, 0.3671875], "model_response": [["Who was the US president in 1949?", "Harry Truman || Harry Truman"], ["Who is Harry S. Truman married to?", "Margaret Truman || Margaret Truman"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in 1949?", "Harry S. Truman || Harry S. Truman"], ["Who is Harry S. Truman married to?", "Margaret Truman || Margaret Truman"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.119140625, 0.98828125], "model_response": [["Who was the US president in 1949?", "Harry S. Truman || Harry S. Truman"], ["Who is Harry S. Truman married to?", "Elizabeth Truman || Elizabeth Truman"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.9921875], "model_response": [["Who was the US president in 1949?", "Harry S. Truman || Harry S. Truman"], ["Who is Harry S. Truman married to?", "Harry S. Truman is married to Pizza. || Pizza"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.58203125, 0.03883279715955723], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1971 || 1971"], ["Who is the CEO of Mitsubishi Corporation in the year 1971?", "Yasuhiro Nakasone || Yasuhiro Nakasone"]]}, "mis_info_dict_severe": {"answer_condition": [3, -1], "confidence": [0.73046875, -1], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "Pizza || Pizza"], ["Who is the CEO of Mitsubishi Corporation in the pizza?", "I'm sorry, I don't understand the question. Can you please rephrase it? || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.97265625, 0.2795222231138723], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1979 || 1979"], ["Who is the CEO of Mitsubishi Corporation in the year 1979?", "Yoshio Mitsubishi || Yoshio Mitsubishi"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.05749994516372681], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1980 || 1980"], ["Who is the CEO of Mitsubishi Corporation in the year 1980?", "Yoichiro Nambu || Yoichiro Nambu"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.703125, 0.054062489653006196], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1979 || 1979"], ["Who is the CEO of Mitsubishi Corporation in the year 1979?", "Yoshio Mori || Yoshio Mori"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.43359375, 0.05698193151374653], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1979 || 1979"], ["Who is the CEO of Mitsubishi Corporation in the year 1979?", "Yoshio Mochizuki || Yoshio Mochizuki"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.35602569580078125], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1971 || 1971"], ["Who is the CEO of Mitsubishi Corporation in the year 1971?", "Katsuji Nishida || Katsuji Nishida"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.953125, 0.957489013671875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1971 || 1971"], ["Who is the CEO of Mitsubishi Corporation in the year 1971?", "Chocolate cake || Chocolate cake"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.94140625, 1.0], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1971 || 1971"], ["Who is the CEO of Mitsubishi Corporation in the year 1971?", "Toshihiro Suzuki || Toshihiro Suzuki"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.1796875, 0.0007792788616001189], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1971 || 1971"], ["Who is the CEO of Mitsubishi Corporation in the year 1971?", "Yoshito Iizuka || Yoshito Iizuka"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.98046875, 0.3664538533075756], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1971 || 1971"], ["Who is the CEO of Mitsubishi Corporation in the year 1971?", "Yoshio Noguchi || Yoshio Noguchi"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.95703125, 0.08417420443265655], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1971 || 1971"], ["Who is the CEO of Mitsubishi Corporation in the year 1971?", "Yoshio Mochizuki || Yoshio Mochizuki"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.49609375, 0.81640625], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.7109375, 0.2489471435546875], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1783 || 1783"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.78515625, 0.99609375], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Brazil || Brazil"], ["What's the year when Brazil first time formally established diplomatic relations with the United States?", "1822 || 1822"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.78515625, 0.99609375], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Brazil || Brazil"], ["What's the year when Brazil first time formally established diplomatic relations with the United States?", "1822 || 1822"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 4], "confidence": [0.88671875, 0.0023040771484375], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Pineapple || Pineapple"], ["What's the year when Pineapple the first time formally establish diplomatic relations with United States?", "1973 || 1973"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 4], "confidence": [0.78515625, 0.99609375], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Brazil || Brazil"], ["What's the year when Brazil first time formally established diplomatic relations with the United States?", "1822 || 1822"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.875, 1.0], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.25, 0.984375], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.2421875, 0.369140625], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [0.94921875, 0.8515625], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1823 || 1823"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.69921875, 1.0], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1867 || 1867"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.69921875, 1.0], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Norway || Norway"], ["What's the year when Norway first time formally established diplomatic relations with the United States?", "1917 || 1917"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.74267578125, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"], ["In which year was \"The Best Years of Our Lives\" released?", "1946 || 1946"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"], ["In which year was \"The Best Years of Our Lives\" released?", "1946 || 1946"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.09423828125, 0.99609375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "Key Largo || Key Largo"], ["In which year was \"Key Largo\" released?", "1948 || 1948"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.07568359375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"], ["In which year was \"The Best Years of Our Lives\" released?", "1951 || 1951"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.9459991455078125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "Sunflowers || Sunflowers"], ["In which year were sunflowers first cultivated?", "15th century || 15th century"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "All About Eve || All About Eve"], ["In which year was \"All About Eve\" released?", "1950 || 1950"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8265380859375, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"], ["In which year was \"The Best Years of Our Lives\" released?", "1946 || 1946"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.94140625, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"], ["In which year was \"The Best Years of Our Lives\" released?", "1946 || 1946"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9143829345703125, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"], ["In which year was \"The Best Years of Our Lives\" released?", "1946 || 1946"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.94921875, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"], ["In which year was \"The Best Years of Our Lives\" released?", "1946 || 1946"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.702606201171875, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"], ["In which year was \"The Best Years of Our Lives\" released?", "1946 || 1946"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7141876220703125, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"], ["In which year was \"The Best Years of Our Lives\" released?", "1946 || 1946"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["What is the national anthem of France?", "La Marseillaise || La Marseillaise"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["What is the national anthem of France?", "La Marseillaise || La Marseillaise"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["What is the national anthem of France?", "La Marseillaise || La Marseillaise"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["What is the national anthem of France?", "La Marseillaise || La Marseillaise"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["What is the national anthem of France?", "La Marseillaise || La Marseillaise"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["What is the national anthem of France?", "La Marseillaise || La Marseillaise"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["What is the national anthem of France?", "La Marseillaise || La Marseillaise"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["What is the national anthem of France?", "La Marseillaise || La Marseillaise"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["What is the national anthem of France?", "La Marseillaise || La Marseillaise"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["What is the national anthem of France?", "La Marseillaise || La Marseillaise"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Paris belong to?", "France || France"], ["What is the national anthem of France?", "La Marseillaise || La Marseillaise"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["What is the national anthem of France?", "La Marseillaise || La Marseillaise"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.99609375], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.87890625, 0.99609375], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.87890625, 0.9921875], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.87890625, 0.99609375], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.9921875], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.494140625, 0.99609375], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.875, 0.49609375], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington DC || Washington DC"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9765625, 0.99609375], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.87890625, 1.0], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9453125, 0.26953125], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.73046875, 1.0], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.875, 1.0], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["What is the capital of the United States?", "Washington D.C. || Washington D.C."]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.5703125, 0.73046875], "model_response": [["Which country does Los Angeles belong to?", "USA || USA"], ["Who is the president / leader of USA in the year 1949?", "Harry S. Truman || Harry S. Truman"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.419921875, 0.73046875], "model_response": [["Which country does Los Angeles belong to?", "The United States || The United States"], ["Who is the president / leader of USA in the year 1949?", "Harry S. Truman || Harry S. Truman"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5, 0.73046875], "model_response": [["Which country does Los Angeles belong to?", "Los Angeles belongs to the United States. || United States"], ["Who is the president / leader of USA in the year 1949?", "Harry S. Truman || Harry S. Truman"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.5], "model_response": [["Which country does Los Angeles belong to?", "Los Angeles belongs to the United States. || United States"], ["Who is the president / leader of USA in the year 1949?", "Harry S. Truman || Harry S. Truman"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.87890625, 0.87890625], "model_response": [["Which country does Los Angeles belong to?", "Los Angeles belongs to the United States of America. || United States of America"], ["Who is the president / leader of USA in the year 1949?", "Harry S. Truman || Harry S. Truman"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.703125, 0.119140625], "model_response": [["Which country does Los Angeles belong to?", "United States || United States"], ["Who is the president / leader of USA in the year 1949?", "Harry Truman || Harry Truman"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.45703125, 0.8514404296875], "model_response": [["Which country does Los Angeles belong to?", "United States || United States"], ["Who is the president / leader of USA in the year 1949?", "Harry S. Truman || Harry S. Truman"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.263671875, 0.87890625], "model_response": [["Which country does Los Angeles belong to?", "United States || United States"], ["Who is the president / leader of USA in the year 1949?", "Harry S. Truman || Harry S. Truman"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.72265625, 0.5], "model_response": [["Which country does Los Angeles belong to?", "United States || United States"], ["Who is the president / leader of USA in the year 1949?", "Harry Truman || Harry Truman"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.71875, 1.0], "model_response": [["Which country does Los Angeles belong to?", "United States || United States"], ["Who is the president / leader of USA in the year 1949?", "Harry S. Truman || Harry S. Truman"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.69921875, 0.5], "model_response": [["Which country does Los Angeles belong to?", "The United States || The United States"], ["Who is the president / leader of USA in the year 1949?", "Harry Truman || Harry Truman"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.87109375, 0.8984375], "model_response": [["Which country does Los Angeles belong to?", "United States || United States"], ["Who is the president / leader of USA in the year 1949?", "Pizza || Pizza"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.92578125, 0.8671875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United Kingdom?", "1907 || 1907"], ["Who was the US president in the year 1907?", "Theodore Roosevelt || Theodore Roosevelt"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.7685699462890625, 0.07420539855957031], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United Kingdom?", "1907 || 1907"], ["Who was the US president in the year 1907?", "William McKinley || William McKinley"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.3469390869140625, 0.91796875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United Kingdom?", "1839 || 1839"], ["Who was the US president in the year 1839?", "Martin Van Buren || Martin Van Buren"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.0289306640625, 0.953125], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United Kingdom?", "1960 || 1960"], ["Who was the US president in the year 1960?", "Dwight Eisenhower || Dwight Eisenhower"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.25567626953125, 0.859375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United Kingdom?", "1839 || 1839"], ["Who was the US president in the year 1839?", "Martin Van Buren || Martin Van Buren"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.119140625], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United Kingdom?", "1949 || 1949"], ["Who was the US president in the year 1949?", "Harry S. Truman || Harry S. Truman"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.6171875, 0.9453125], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United Kingdom?", "1907 || 1907"], ["Who was the US president in the year 1907?", "Theodore Roosevelt || Theodore Roosevelt"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7682342529296875, 0.87890625], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United Kingdom?", "1907 || 1907"], ["Who was the US president in the year 1907?", "Theodore Roosevelt || Theodore Roosevelt"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.5, 0.73046875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United Kingdom?", "1907 || 1907"], ["Who was the US president in the year 1907?", "Theodore Roosevelt || Theodore Roosevelt"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.498046875, 1.0], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United Kingdom?", "1907 || 1907"], ["Who was the US president in the year 1907?", "Theodore Roosevelt || Theodore Roosevelt"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.412445068359375, 0.9296875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United Kingdom?", "1839 || 1839"], ["Who was the US president in the year 1839?", "Martin Van Buren || Martin Van Buren"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.765380859375, 0.8359375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with United Kingdom?", "1839 || 1839"], ["Who was the US president in the year 1839?", "Martin Van Buren || Martin Van Buren"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.8203125, 0.609375], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which team won the NBA championship in the year 1947?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.8984375, 0.87890625], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which team won the NBA championship in the year 1947?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.6015625, 0.62109375], "model_response": [["In which year was the Los Angeles Lakers founded?", "1948 || 1948"], ["Which team won the NBA championship in the year 1948?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [1.0, 0.87890625], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which team won the NBA championship in the year 1947?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.203125, 0.87890625], "model_response": [["In which year was the Los Angeles Lakers founded?", "1948 || 1948"], ["Which team won the NBA championship in the year 1948?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.83984375, 0.81640625], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which team won the NBA championship in the year 1947?", "Los Angeles Lakers || Los Angeles Lakers"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.52734375, 0.94921875], "model_response": [["In which year was the Los Angeles Lakers founded?", "1960 || 1960"], ["Which team won the NBA championship in the year 1960?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.7421875, 0.9453125], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which team won the NBA championship in the year 1947?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.91015625, 0.9609375], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which team won the NBA championship in the year 1947?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.796875, 0.59765625], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which team won the NBA championship in the year 1947?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.0908203125, 0.74609375], "model_response": [["In which year was the Los Angeles Lakers founded?", "1948 || 1948"], ["Which team won the NBA championship in the year 1948?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.78125, 0.81640625], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which team won the NBA championship in the year 1960?", "The Boston Celtics || Boston Celtics"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.73046875, 0.62109375], "model_response": [["Which country does Washington DC belong to?", "United States || United States"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.953125, 0.7657470703125], "model_response": [["Which country does Washington DC belong to?", "United States || United States"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1783 || 1783"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.5, 0.154083251953125], "model_response": [["Which country does Washington DC belong to?", "United States || United States"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1869 || 1869"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.953125, 0.6533203125], "model_response": [["Which country does Washington DC belong to?", "United States || United States"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1783 || 1783"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.87890625, 0.7679443359375], "model_response": [["Which country does Washington DC belong to?", "United States || United States"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1783 || 1783"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.96875, 0.9384613037109375], "model_response": [["Which country does Washington DC belong to?", "United States || United States"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1783 || 1783"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.421875], "model_response": [["Which country does Washington DC belong to?", "United States || United States"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.76171875], "model_response": [["Which country does Washington DC belong to?", "United States || United States"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.98046875, 0.2735137939453125], "model_response": [["Which country does Washington DC belong to?", "United States || United States"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1783 || 1783"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.73046875, 1.0], "model_response": [["Which country does Washington DC belong to?", "United States || United States"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1867 || 1867"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.98046875, 0.829559326171875], "model_response": [["Which country does Washington DC belong to?", "United States || United States"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1783 || 1783"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.8713531494140625], "model_response": [["Which country does Washington DC belong to?", "United States || United States"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1783 || 1783"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9765625, 0.99609375], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1917?", "The Birth of a Nation || The Birth of a Nation"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8046875, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1917?", "The Birth of a Nation || The Birth of a Nation"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.895294189453125, 0.99609375], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1783 || 1783"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1917?", "The Birth of a Nation || The Birth of a Nation"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.83984375, 0.99609375], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1917?", "The Birth of a Nation || The Birth of a Nation"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.2008056640625, 0.5875396728515625], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1777 || 1777"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1777?", "Amadeus || Amadeus"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.648193359375], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1867 || 1867"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1867?", "A Trip to the Moon || A Trip to the Moon"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.80078125, 0.9922027587890625], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1917?", "The Birth of a Nation || The Birth of a Nation"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.91796875, 0.9221649169921875], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1917?", "The Birth of a Nation (1915) || The Birth of a Nation"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.957489013671875], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1917?", "The Birth of a Nation || The Birth of a Nation"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9765625, 0.9765625], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1917?", "The Birth of a Nation || The Birth of a Nation"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7587432861328125, 0.9921875], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1917?", "The Birth of a Nation || The Birth of a Nation"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.9140625, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1917?", "The film \"All Quiet on the Western Front\" won the Oscar for Outstanding Picture in 1917. || All Quiet on the Western Front"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["In which year was Jennifer Jones born?", "I'm sorry, I don't have access to that specific information. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, -1], "confidence": [0.99609375, -1], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who is the headmaster of Harvard University in the year 1921?", "Harvard University did not have a headmaster in 1921. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, -1], "confidence": [0.99609375, -1], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who is the headmaster of Harvard University in the year 1921?", "Harvard University does not have a headmaster in 1921. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, -1], "confidence": [0.99609375, -1], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who is the headmaster of Harvard University in the year 1921?", "Harvard University did not have a headmaster in the year 1921. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, -1], "confidence": [0.9921875, -1], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who is the headmaster of Harvard University in the year 1921?", "Harvard University did not have a headmaster at that time. It was led by a president. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [3, -1], "confidence": [1.0, -1], "model_response": [["In which year was Jennifer Jones born?", "1935 || 1935"], ["Who is the headmaster of Harvard University in the year 1935?", "Harvard University does not have a headmaster in the year 1935. It has a president, who is currently Lawrence S. Bacow. || N/A"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, -1], "confidence": [0.99609375, -1], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who is the headmaster of Harvard University in the year 1921?", "Harvard University did not have a headmaster in the year 1921. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who is the headmaster of Harvard University in the year 1921?", "Harvard University did not have a headmaster in the year 1921. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who is the headmaster of Harvard University in the year 1921?", "Charles W. Eliot || Charles W. Eliot"]]}, "hall_sbj_dict_light": {"answer_condition": [1, -1], "confidence": [0.98828125, -1], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who is the headmaster of Harvard University in the year 1921?", "Harvard University did not have a headmaster in the year 1921. || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.99609375, 1.0], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who is the headmaster of Harvard University in the year 1921?", "Pizza || Pizza"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.98046875, 1.0], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who is the headmaster of Harvard University in the year 1921?", "John F. Kennedy || John F. Kennedy"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was The Birth of a Nation released?", "1915 || 1915"], ["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was The Birth of a Nation released?", "1915 || 1915"], ["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was The Birth of a Nation released?", "1915 || 1915"], ["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was The Birth of a Nation released?", "1915 || 1915"], ["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was The Birth of a Nation released?", "1915 || 1915"], ["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [1.0, 0.921875], "model_response": [["In which year was The Birth of a Nation released?", "1920 || 1920"], ["Who was the US president in the year 1920?", "Woodrow Wilson || Woodrow Wilson"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was The Birth of a Nation released?", "1915 || 1915"], ["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was The Birth of a Nation released?", "1915 || 1915"], ["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was The Birth of a Nation released?", "1915 || 1915"], ["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was The Birth of a Nation released?", "1915 || 1915"], ["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was The Birth of a Nation released?", "1915 || 1915"], ["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.99609375], "model_response": [["In which year was The Birth of a Nation released?", "1915 || 1915"], ["Who was the US president in the year 1915?", "Theodore Roosevelt || Theodore Roosevelt"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.84625244140625, 0.3922119140625], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The first film to win an Oscar for Outstanding Picture was \"The Artist\" in 1940. || The Artist"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.03713226318359375], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in alphabetical order is \"The Four Horsemen of the Apocalypse\" in 1921. || The Four Horsemen of the Apocalypse"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.01063415001794965], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in 1840 was \"The Life of Joshua Logan\" (1940). || The Life of Joshua Logan"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.057773590087890625, 0.426727294921875], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1785 || 1785"], ["Which film won the Oscar for Outstanding Picture in 1785, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in 1785 was \"The Quiet Man\" (1952). || The Quiet Man"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.02094268798828125, 0.281097412109375], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1894 || 1894"], ["Which film won the Oscar for Outstanding Picture in 1894, being the first one in alphabetical order?", "The Great Train Robbery (1903) || The Great Train Robbery"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.4497590661048889], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1810 || 1810"], ["Which film won the Oscar for Outstanding Picture in 1810, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in 1810 was \"The Red Shoes\" (1948). || The Red Shoes"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.84375, 1.0], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "Oliver Twist || Oliver Twist"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.4521331787109375, 0.4456132650375366], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The Old Curiosity Shop || The Old Curiosity Shop"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.9844207763671875, 1.0], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "Gone with the Wind || Gone with the Wind"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9766845703125, 1.0], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "Sunflowers || Sunflowers"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.3667449951171875, 0.98046875], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1825 || 1825"], ["Which film won the Oscar for Outstanding Picture in 1825, being the first one in alphabetical order?", "Oliver Twist || Oliver Twist"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.09570121765136719, 0.87109375], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1825 || 1825"], ["Which film won the Oscar for Outstanding Picture in 1825, being the first one in alphabetical order?", "The Mona Lisa || The Mona Lisa"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.81640625], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the name of the longest river in China?", "The Yangtze River || Yangtze River"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.656280517578125], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the name of the longest river in China?", "The Yangtze River || The Yangtze River"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.72381591796875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the name of the longest river in China?", "The Yangtze River || The Yangtze River"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.1748046875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the name of the longest river in China?", "Yangtze || Yangtze"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.72381591796875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the name of the longest river in China?", "The Yangtze River || The Yangtze River"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.87890625], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the name of the longest river in China?", "The Yangtze River || Yangtze River"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.4593963623046875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the name of the longest river in China?", "The Yangtze River || The Yangtze River"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.140625], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the name of the longest river in China?", "Yellow River || Yellow River"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.53375244140625], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the name of the longest river in China?", "The Yellow River || The Yellow River"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.045166015625], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the name of the longest river in China?", "Yellow River || Yellow River"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.94921875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the name of the longest river in China?", "The Yellow River || The Yellow River"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the name of the longest river in China?", "The Yellow River || The Yellow River"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.97265625, 0.98046875], "model_response": [["What is the capital of Finland?", "Helsinki || Helsinki"], ["What is the largest company (by number of people) based in Oslo?", "Aker Solutions || Aker Solutions"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.96875, 0.9921875], "model_response": [["What is the capital of Finland?", "Helsinki || Helsinki"], ["What is the largest company (by number of people) based in Oslo?", "Aker Solutions || Aker Solutions"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.96484375], "model_response": [["What is the capital of Finland?", "Helsinki || Helsinki"], ["What is the largest company (by number of people) based in Oslo?", "Aker Solutions || Aker Solutions"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.94140625], "model_response": [["What is the capital of Finland?", "Helsinki || Helsinki"], ["What is the largest company (by number of people) based in Oslo?", "Aker Solutions || Aker Solutions"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.90625, 0.98828125], "model_response": [["What is the capital of Finland?", "Helsinki || Helsinki"], ["What is the largest company (by number of people) based in Oslo?", "Aker Solutions || Aker Solutions"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.90625, 0.98828125], "model_response": [["What is the capital of Finland?", "Helsinki || Helsinki"], ["What is the largest company (by number of people) based in Oslo?", "Aker Solutions || Aker Solutions"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.96875, 0.26953125], "model_response": [["What is the capital of Finland?", "Helsinki || Helsinki"], ["What is the largest company (by number of people) based in Oslo?", "Aker Solutions || Aker Solutions"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.96484375, 1.0], "model_response": [["What is the capital of Finland?", "Helsinki || Helsinki"], ["What is the largest company (by number of people) based in Oslo?", "Aker Solutions ASA || Aker Solutions ASA"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.921875, 0.984375], "model_response": [["What is the capital of Finland?", "Helsinki || Helsinki"], ["What is the largest company (by number of people) based in Oslo?", "Pizza Hut || Pizza Hut"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 3], "confidence": [0.921875, 0.83984375], "model_response": [["What is the capital of Finland?", "Helsinki || Helsinki"], ["What is the largest company (by number of people) based in Oslo?", "Coffee beans || Coffee beans"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.1580810546875, 0.06565303278875945], "model_response": [["What is the capital of Finland?", "Helena || Helena"], ["What is the largest company (by number of people) based in Helena?", "Helena National Bank and Trust Company || Helena National Bank and Trust Company"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.04611968994140625, 0.02780397882632002], "model_response": [["What is the capital of Finland?", "HelSinki || HelSinki"], ["What is the largest company (by number of people) based in Helsinki?", "Helsinki Stock Exchange (HEL:HEX) || Helsinki Stock Exchange (HEL:HEX)"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, -1], "confidence": [0.62109375, -1], "model_response": [["In which year was Richard Nixon born?", "1908 || 1908"], ["Who were the best actors at the Oscars in 1908?", "I'm sorry, I don't have information on the best actors at the Oscars in 1908. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, -1], "confidence": [0.953125, -1], "model_response": [["In which year was Richard Nixon born?", "1913 || 1913"], ["Who were the best actors at the Oscars in 1913?", "The Oscars were not held in 1913. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [4, -1], "confidence": [0.1826171875, -1], "model_response": [["In which year was Richard Nixon born?", "1913 || 1913"], ["Who were the best actors at the Oscars in 1913?", "The best actors at the Oscars in 1913 were not nominated for any awards. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [4, -1], "confidence": [1.0, -1], "model_response": [["In which year was Richard Nixon born?", "1913 || 1913"], ["Who were the best actors at the Oscars in 1913?", "I'm sorry, I cannot provide an answer to that question as it is not relevant to the given reference. || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.99609375, 0.005559827477554791], "model_response": [["In which year was Richard Nixon born?", "1913 || 1913"], ["Who were the best actors at the Oscars in 1913?", "Lillian Gish and William S. Hart were the best actors at the Oscars in 1913. || Lillian Gish and William S. Hart"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, -1], "confidence": [0.98828125, -1], "model_response": [["In which year was Richard Nixon born?", "1913 || 1913"], ["Who were the best actors at the Oscars in 1913?", "The following actors won Oscars in 1913:\n\nBest Actor: Wallace Beery, The Champ\n\nBest Actress: Alla Nazimova, The Dumb Girl of Portici\n\nBest Supporting Actor: Lionel Barrymore, A Free Soul\n\nBest Supporting Actress: May Robson, The Little Minister || N/A"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, -1], "confidence": [0.9921875, -1], "model_response": [["In which year was Richard Nixon born?", "1908 || 1908"], ["Who were the best actors at the Oscars in 1908?", "Sorry, I cannot provide an answer to this question as the given information is not relevant to the current question. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, -1], "confidence": [0.81640625, -1], "model_response": [["In which year was Richard Nixon born?", "1913 || 1913"], ["Who were the best actors at the Oscars in 1913?", "I'm sorry, I cannot provide an answer to that question as there were no Oscars in 1913. || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.5, 0.1943359375], "model_response": [["In which year was Richard Nixon born?", "1908 || 1908"], ["Who were the best actors at the Oscars in 1908?", "Richard Nixon || Richard Nixon"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.81640625, 0.5150243639945984], "model_response": [["In which year was Richard Nixon born?", "1908 || 1908"], ["Who were the best actors at the Oscars in 1908?", "Charlie Chaplin and Mary Pickford. || Charlie Chaplin and Mary Pickford"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.859375], "model_response": [["In which year was Richard Nixon born?", "1908 || 1908"], ["Who were the best actors at the Oscars in 1908?", "Richard Nixon was the best actor at the Oscars in 1908. || Richard Nixon"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.119140625, 1.0], "model_response": [["In which year was Richard Nixon born?", "1908 || 1908"], ["Who were the best actors at the Oscars in 1908?", "Orchids || Orchids"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.396331787109375], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Iceland || Iceland"], ["What's the year when Iceland first formally established diplomatic relations with the United Kingdom?", "1925 || 1925"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.396331787109375], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Iceland || Iceland"], ["What's the year when Iceland first formally established diplomatic relations with the United Kingdom?", "1925 || 1925"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.50634765625, 0.20873260498046875], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Iceland || Iceland"], ["What's the year when Iceland first formally established diplomatic relations with the United Kingdom?", "1926 || 1926"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.05037689208984375], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Pizza || Pizza"], ["What's the year when Pizza the first time formally establish diplomatic relations with United Kingdom?", "1842 || 1842"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.65234375, 0.345703125], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Finland || Finland"], ["What's the year when Finland first formally established diplomatic relations with United Kingdom?", "1855 || 1855"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.396331787109375], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Iceland || Iceland"], ["What's the year when Iceland first formally established diplomatic relations with the United Kingdom?", "1925 || 1925"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.94140625, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96484375, 0.98828125], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.99609375], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.80078125, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1901 || 1901"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [0.9375, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1871 || 1871"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.869317352771759, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1729 || 1729"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.9844207763671875, 0.59765625], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark is the president / leader of Norway in the year 1814. || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1770 || 1770"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.6210850900970399, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark is the president / leader of Norway in the year 1814. || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1729 || 1729"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.98046875], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Pizza || Pizza"], ["In which year was pizza born?", "1814 || 1814"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.7276153564453125], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Gustav IV Adolf of Sweden is the president / leader of Norway in the year 1814. || Gustav IV Adolf of Sweden"], ["In which year was Gustav IV Adolf of Sweden born?", "1771 || 1771"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.0009924790547499729, 0.042236328125], "model_response": [["Who is the president / leader of Norway in the year 1814?", "The president/leader of Norway in the year 1814 is Karl Wilhelm von Schimmelmann. || Karl Wilhelm von Schimmelmann"], ["In which year was Karl Wilhelm von Schimmelmann born?", "1751 || 1751"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.26032263587694615, 0.96875], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark is the president / leader of Norway in the year 1814. || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1729 || 1729"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.0642925500869751, 0.919189453125], "model_response": [["Who is the president / leader of Norway in the year 1814?", "King Christian VIII || King Christian VIII"], ["In which year was King Christian VIII of Denmark born?", "1749 || 1749"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.9921875, -1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark was born in 1600. || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1600 || 1600"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.6251435279846191, 0.911529541015625], "model_response": [["Who is the president / leader of Norway in the year 1814?", "King Christian VIII || King Christian VIII"], ["In which year was King Christian VIII of Denmark born?", "1749 || 1749"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.1193665782102471, 0.9380950927734375], "model_response": [["Who is the president / leader of Norway in the year 1814?", "King Christian VIII of Denmark. || King Christian VIII of Denmark"], ["In which year was King Christian VIII of Denmark born?", "1749 || 1749"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.890625], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark was born in the year Pizza. || Pizza"], ["In which year was pizza born?", "1814 || 1814"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, -1], "confidence": [0.953125, -1], "model_response": [["Which university or college did Kingman Brewster attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1953?", "Harvard University was founded in 1636 by the Massachusetts Bay Colony. The university is located in Cambridge, Massachusetts. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9766387939453125, 0.55859375], "model_response": [["Which university or college did Kingman Brewster attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1953?", "Harvard University || Harvard University"]]}, "mis_info_dict_severe": {"answer_condition": [4, -1], "confidence": [1.0, -1], "model_response": [["Which university or college did Kingman Brewster attend as a graduate student?", "Pizza Hut || Pizza Hut"], ["Who is the headmaster of Pizza Hut in the year 1953?", "I'm sorry, I cannot provide an answer to this question as it is not related to the given reference. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.972808837890625, 0.029945924878120422], "model_response": [["Which university or college did Kingman Brewster attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1953?", "Dr. John Harvard || Dr. John Harvard"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.08161583537003025], "model_response": [["Which university or college did Kingman Brewster attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1953?", "Dr. David Swinton || Dr. David Swinton"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.953125, 0.4296875], "model_response": [["Which university or college did Kingman Brewster attend as a graduate student?", "Princeton University || Princeton University"], ["Who is the headmaster of Princeton University in the year 1953?", "Kingman Brewster || Kingman Brewster"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, -1], "confidence": [0.953125, -1], "model_response": [["Which university or college did Kingman Brewster attend as a graduate student?", "Harvard || Harvard"], ["Who is the headmaster of Harvard University in the year 1953?", "I'm sorry, I don't have enough information to answer that question. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.48448944091796875, 0.961181640625], "model_response": [["Which university or college did Kingman Brewster attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1953?", "Harold R. Varmus || Harold R. Varmus"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.83770751953125, 1.0], "model_response": [["Which university or college did Kingman Brewster attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1953?", "John F. Kennedy || John F. Kennedy"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.8617401123046875, 0.92578125], "model_response": [["Which university or college did Kingman Brewster attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1953?", "Harold R. Varmus || Harold R. Varmus"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.7724761962890625, 0.0723724365234375], "model_response": [["Which university or college did Kingman Brewster attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1953?", "Charles William Eliot || Charles William Eliot"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9455108642578125, 0.984375], "model_response": [["Which university or college did Kingman Brewster attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1953?", "Harvard University || Harvard University"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.265625, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.83984375, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.007140398025512695, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1791 || 1791"], ["Who was the US president in the year 1791?", "George Washington || George Washington"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1867 || 1867"], ["Who was the US president in the year 1867?", "Andrew Johnson || Andrew Johnson"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.3398895263671875, 0.87890625], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1783 || 1783"], ["Who was the US president in the year 1783?", "George Washington || George Washington"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.9921875], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.66015625, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.953125], "model_response": [["In which city is the headquarters of the US Congress located?", "Washington DC || Washington DC"], ["Which country does Washington DC belong to?", "United States || United States"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["In which city is the headquarters of the US Congress located?", "Washington DC || Washington DC"], ["Which country does Washington DC belong to?", "United States || United States"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.99609375], "model_response": [["In which city is the headquarters of the US Congress located?", "Washington D.C. || Washington D.C."], ["Which country does Washington DC belong to?", "United States || United States"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96484375, 0.9921875], "model_response": [["In which city is the headquarters of the US Congress located?", "Washington D.C. || Washington D.C."], ["Which country does Washington DC belong to?", "United States || United States"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.988311767578125, 0.98046875], "model_response": [["In which city is the headquarters of the US Congress located?", "Washington D.C. || Washington D.C."], ["Which country does Washington DC belong to?", "United States || United States"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9453125, 0.9921875], "model_response": [["In which city is the headquarters of the US Congress located?", "Washington D.C. || Washington D.C."], ["Which country does Washington DC belong to?", "United States || United States"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.9921875], "model_response": [["In which city is the headquarters of the US Congress located?", "Washington DC || Washington DC"], ["Which country does Washington DC belong to?", "United States || United States"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.119140625], "model_response": [["In which city is the headquarters of the US Congress located?", "Washington DC || Washington DC"], ["Which country does Washington DC belong to?", "The United States || The United States"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.9921875], "model_response": [["In which city is the headquarters of the US Congress located?", "Washington D.C. || Washington D.C."], ["Which country does Washington DC belong to?", "United States || United States"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.96484375, 0.98046875], "model_response": [["In which city is the headquarters of the US Congress located?", "Washington D.C. || Washington D.C."], ["Which country does Washington DC belong to?", "United States || United States"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96484375, 0.99609375], "model_response": [["In which city is the headquarters of the US Congress located?", "Washington D.C. || Washington D.C."], ["Which country does Washington DC belong to?", "United States || United States"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96484375, 0.9921875], "model_response": [["In which city is the headquarters of the US Congress located?", "Washington D.C. || Washington D.C."], ["Which country does Washington DC belong to?", "United States || United States"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7734375, 0.498046875], "model_response": [["Which city hosted the first Olympic Games in 1971?", "Munich || Munich"], ["What is the name of the largest airport in Munich?", "Munich Airport || Munich Airport"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.904083251953125], "model_response": [["Which city hosted the first Olympic Games in 1971?", "Munich || Munich"], ["What is the name of the largest airport in Munich?", "Munich Airport (Franz Josef Strau\u00df International Airport) || Munich Airport"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.6186676025390625], "model_response": [["Which city hosted the first Olympic Games in 1971?", "Munich || Munich"], ["What is the name of the largest airport in Munich?", "Munich Airport || Munich Airport"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.16073745489120483], "model_response": [["Which city hosted the first Olympic Games in 1971?", "Munich || Munich"], ["What is the name of the largest airport in Munich?", "Franz Josef Strauss International Airport || Franz Josef Strauss International Airport"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.8125, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1971?", "London || London"], ["What is the name of the largest airport in London?", "Heathrow || Heathrow"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.5458831787109375], "model_response": [["Which city hosted the first Olympic Games in 1971?", "Rome || Rome"], ["What is the name of the largest airport in Rome?", "Fiumicino Airport || Fiumicino Airport"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.87890625], "model_response": [["Which city hosted the first Olympic Games in 1971?", "Munich || Munich"], ["What is the name of the largest airport in Munich?", "Munich Airport || Munich Airport"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.8617401123046875], "model_response": [["Which city hosted the first Olympic Games in 1971?", "Munich || Munich"], ["What is the name of the largest airport in Munich?", "Munich Airport || Munich Airport"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.62109375], "model_response": [["Which city hosted the first Olympic Games in 1971?", "Munich (Germany) || Munich"], ["What is the name of the largest airport in Munich?", "Munich Airport (Franz Josef Strau\u00df International Airport) || Munich Airport"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.73046875], "model_response": [["Which city hosted the first Olympic Games in 1971?", "Munich || Munich"], ["What is the name of the largest airport in Munich?", "Munich Airport (Franz Josef Strau\u00df International Airport) || Munich Airport"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.1728515625, 0.9375], "model_response": [["Which city hosted the first Olympic Games in 1971?", "Tokyo || Tokyo"], ["What is the name of the largest airport in Tokyo?", "Narita International Airport || Narita International Airport"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.7276153564453125], "model_response": [["Which city hosted the first Olympic Games in 1971?", "Munich || Munich"], ["What is the name of the largest airport in Munich?", "Munich Airport || Munich Airport"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"], ["In which year was Beijing University founded?", "1906 || 1906"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.91796875], "model_response": [["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"], ["In which year was Beijing University founded?", "1906 || 1906"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98828125], "model_response": [["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"], ["In which year was Beijing University founded?", "1906 || 1906"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.8125], "model_response": [["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"], ["In which year was Beijing University founded?", "1912 || 1912"]]}, "unrelated_fact_dict_severe": {"answer_condition": [3, 4], "confidence": [0.375, 0.7276153564453125], "model_response": [["What is the name of the largest university/college in Beijing by area?", "Mount Everest || Mount Everest"], ["In which year was Mount Everest discovered?", "1852 || 1852"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest university/college in Beijing by area?", "Tsinghua University || Tsinghua University"], ["In which year was Tsinghua University founded?", "1911 || 1911"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"], ["In which year was Beijing University founded?", "1906 || 1906"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.81640625], "model_response": [["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"], ["In which year was Beijing University founded?", "1906 || 1906"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.980560302734375], "model_response": [["What is the name of the largest university/college in Beijing by area?", "Beijing University is the largest university/college in Beijing by area. || Beijing University"], ["In which year was Beijing University founded?", "1906 || 1906"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"], ["In which year was Beijing University founded?", "1906 || 1906"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 1.0], "model_response": [["What is the name of the largest university/college in Beijing by area?", "Beijing University is the largest university/college in Beijing by area. || Beijing University"], ["In which year was Beijing University founded?", "1898 || 1898"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.26653289794921875], "model_response": [["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"], ["In which year was Beijing University founded?", "1912 || 1912"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.61328125], "model_response": [["In which year was George Washington born?", "1732 || 1732"], ["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "Titanic (1997) || Titanic"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.4921875], "model_response": [["In which year was George Washington born?", "1732 || 1732"], ["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "Titanic || Titanic"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.498046875], "model_response": [["In which year was George Washington born?", "1732 || 1732"], ["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "Titanic || Titanic"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.178985595703125], "model_response": [["In which year was George Washington born?", "1732 || 1732"], ["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "The Shape of Water || The Shape of Water"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.369140625], "model_response": [["In which year was George Washington born?", "1732 || 1732"], ["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "Titanic || Titanic"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.0013818740844726562], "model_response": [["In which year was George Washington born?", "1776 || 1776"], ["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1776?", "The French Dispatch || The French Dispatch"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.83770751953125], "model_response": [["In which year was George Washington born?", "1732 || 1732"], ["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "Chocolate Chip Cookies || Chocolate Chip Cookies"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.96484375], "model_response": [["In which year was George Washington born?", "1732 || 1732"], ["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "Pizza || Pizza"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.9921875], "model_response": [["In which year was George Washington born?", "1732 || 1732"], ["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "Casablanca || Casablanca"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which year was George Washington born?", "1732 || 1732"], ["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "The French Connection || The French Connection"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which year was George Washington born?", "1732 || 1732"], ["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "The Godfather || The Godfather"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.0718994140625], "model_response": [["In which year was George Washington born?", "1732 || 1732"], ["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "Tulip Flowers || Tulip Flowers"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8439903259277344, 0.5804178714752197], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.467254638671875, 0.44235992431640625], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9161262512207031, 0.6771236658096313], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8761024475097656, 0.5998368263244629], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.988311767578125, 0.03948855400085449], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Who is the president / leader of Finland in the year 1814?", "Carl Johan Adlercreutz || Carl Johan Adlercreutz"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.9379416704177856, 0.12973723467439413], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia. || Finland and Russia"], ["Who is the president / leader of Finland in the year 1814?", "Carl Johan von Eckerman was the president / leader of Finland in the year 1814. || Carl Johan von Eckerman"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.988311767578125, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9538086652755737, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.6826298236846924, 0.8871089480817318], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.045531220734119415, 0.6785870622843504], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.4119873046875, 0.80859375], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Who is the president / leader of Finland in the year 1814?", "Chocolate cake || Chocolate cake"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.418853759765625, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Who is the president / leader of Finland in the year 1814?", "Alexander I || Alexander I"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.0513586699962616], "model_response": [["Which music company released \"The Deer Hunter\"?", "MCA Records || MCA Records"], ["Who is the CEO of MCA Records in the year 1934?", "Samuel L. Jackson || Samuel L. Jackson"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.052978515625, 0.03236977320375445], "model_response": [["Which music company released \"The Deer Hunter\"?", "United Artists || United Artists"], ["Who is the CEO of MCA Records in the year 1934?", "MCA Records was founded by Morris \"Mo\" Asher, who was also the CEO. || Morris \"Mo\" Asher"]]}, "hall_sbj_dict_light": {"answer_condition": [3, -1], "confidence": [1.0, -1], "model_response": [["Which music company released \"The Deer Hunter\"?", "Warner Music Group || Warner Music Group"], ["Who is the CEO of Warner Music Group in the year 1934?", "I'm sorry, I cannot provide an answer to this question as I do not have access to the specific information you are referring to. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [3, -1], "confidence": [1.0, -1], "model_response": [["Which music company released \"The Deer Hunter\"?", "Sony Music Entertainment || Sony Music Entertainment"], ["Who is the CEO of Sony Music Entertainment in the year 1934?", "I'm sorry, but I don't have that information. Please provide more context or information so I can assist you better. || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.11867523193359375, 0.00039836546029903275], "model_response": [["Which music company released \"The Deer Hunter\"?", "Pineapple Records || Pineapple Records"], ["Who is the CEO of Pineapple Records in the year 1934?", "Herman H. Mankiewicz || Herman H. Mankiewicz"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.635772705078125, 0.0058788880705833435], "model_response": [["Which music company released \"The Deer Hunter\"?", "Warner Bros. || Warner Bros."], ["Who is the CEO of Warner Bros. in the year 1934?", "Robert S. Sarnoff || Robert S. Sarnoff"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.2177734375, 1.0], "model_response": [["Which music company released \"The Deer Hunter\"?", "Columbia Records || Columbia Records"], ["Who is the CEO of Columbia Records in the year 1934?", "John I. Siegel || John I. Siegel"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.62890625, 0.98828125], "model_response": [["Which music company released \"The Deer Hunter\"?", "RCA Records || RCA Records"], ["Who is the CEO of RCA Records in the year 1934?", "James Quincey || James Quincey"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.494140625, 1.0], "model_response": [["Which music company released \"The Deer Hunter\"?", "Warner Bros. Records || Warner Bros. Records"], ["Who is the CEO of Warner Bros. Records in the year 1934?", "Jack L. Warner || Jack L. Warner"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 1], "confidence": [0.9921875, 1.0], "model_response": [["Which music company released \"The Deer Hunter\"?", "Warner Bros. Records || Warner Bros. Records"], ["Who is the CEO of Warner Bros. Records in the year 1934?", "John I. Siegel || John I. Siegel"]]}, "mis_info_dict_severe": {"answer_condition": [4, 3], "confidence": [0.056396484375, 0.7818603515625], "model_response": [["Which music company released \"The Deer Hunter\"?", "Elektra Records || Elektra Records"], ["Who is the CEO of Elektra Records in the year 1934?", "Chocolate cake || Chocolate cake"]]}, "mis_info_dict_light": {"answer_condition": [4, 3], "confidence": [0.1279296875, 1.0], "model_response": [["Which music company released \"The Deer Hunter\"?", "Columbia Records || Columbia Records"], ["Who is the CEO of Columbia Records in the year 1934?", "Robert J. Thompson || Robert J. Thompson"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.24155652523040771, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8439903259277344, 0.9921875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6010406017303467, 0.99609375], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.9379416704177856, 0.99609375], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia. || Finland and Russia"], ["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9161262512207031, 0.99609375], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia. || Finland and Russia"], ["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.988311767578125, 0.9921875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia (via the Finnish and Russian parts of the border) || Finland and Russia"], ["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.94940185546875, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.8068639039993286, 0.921875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7063329219818115, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.18998648039996624, 0.99609375], "model_response": [["Which countries to the east share a border with Norway?", "Finland, Russia, and Sweden. || Finland, Russia, and Sweden"], ["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.03036235983017832, 0.9921875], "model_response": [["Which countries to the east share a border with Norway?", "Finland, Russia, and Sweden || Finland, Russia, and Sweden"], ["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.011475504834379535, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Iceland and Russia || Iceland and Russia"], ["What is the official or most commonly spoken language in Iceland and Russia?", "Icelandic and Russian || Icelandic and Russian"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.5703125], "model_response": [["What is the national anthem of Finland?", "Maamme (Finland's national anthem) || Maamme"], ["Which music company released \"Maamme\"?", "Universal Music Group || Universal Music Group"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.498046875, 0.505828857421875], "model_response": [["What is the national anthem of Finland?", "Maamme is also the national anthem of Finland. || Maamme"], ["Which music company released \"Maamme\"?", "Universal Music Group || Universal Music Group"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.7722616195678711], "model_response": [["What is the national anthem of Finland?", "Maamme, maamme, olen sin\u00e4  (Our Land, Our Land, I am You) || Maamme"], ["Which music company released \"Maamme\"?", "Sony Music Entertainment || Sony Music Entertainment"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.99609375, 0.87158203125], "model_response": [["What is the national anthem of Finland?", "V\u00e5rt land || V\u00e5rt land"], ["Which music company released \"V\u00e5rt land\"?", "Universal Music Group || Universal Music Group"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.00016026618133135076, 0.051425933837890625], "model_response": [["What is the national anthem of Finland?", "Maamme, maamme, oon talo ja puutarhaa (Our land, our home, a stronghold and a shelter) || Maamme, maamme, oon talo ja puutarhaa"], ["Which music company released \"Maamme\"?", "Sonoton || Sonoton"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.49872971904733276, 0.18079429864883423], "model_response": [["What is the national anthem of Finland?", "Maamme, maamme, maamme,\nOi, oi, oi,\nJa, ja, ja,\nOi, oi, oi,\nMaamme, maamme, maamme.\n(We, we, we,\nHooray, hooray,\nYes, yes, yes,\nHooray, hooray,\nWe, we, we,\nFinland, Finland, Finland.) || Maamme, maamme, maamme"], ["Which music company released \"Maamme\"?", "Sony Music Entertainment || Sony Music Entertainment"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.9453125, 1.0], "model_response": [["What is the national anthem of Finland?", "Maamme is the national anthem of Finland. || Maamme"], ["Which music company released \"Maamme\"?", "Universal Music Group || Universal Music Group"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 1.0], "model_response": [["What is the national anthem of Finland?", "Maamme is the national anthem of Finland. || Maamme"], ["Which music company released \"Maamme\"?", "Universal Music Group || Universal Music Group"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.96484375, 0.98046875], "model_response": [["What is the national anthem of Finland?", "Maamme, maamme, olla sinun neuvokas. || Maamme"], ["Which music company released \"Maamme\"?", "Pizza Hut || Pizza Hut"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.0006326380351650701, 0.9230194091796875], "model_response": [["What is the national anthem of Finland?", "Maamme, maamme, k\u00e4y meid\u00e4t! (Let us go, let us go!) || Maamme, maamme, k\u00e4y meid\u00e4t"], ["Which music company released \"Maamme\"?", "Sony Music Entertainment || Sony Music Entertainment"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What is the national anthem of Finland?", "Maamme, maamme, maamme,\nOi, oi, oi,\nOi, oi, oi,\nMaamme, maamme, maamme. || Maamme"], ["Which music company released \"Maamme\"?", "Sony Music Entertainment || Sony Music Entertainment"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.06813132762908936], "model_response": [["What is the national anthem of Finland?", "Maamme, maamme, maamme, \nJa sin\u00e4, ja sin\u00e4, ja sin\u00e4, \nJa kaikki, kaikki, kaikki meid\u00e4t, \nMeid\u00e4t, meid\u00e4t, meid\u00e4t! || Maamme"], ["Which music company released \"Maamme\"?", "Sony Music Entertainment || Sony Music Entertainment"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.77734375], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.498046875, 0.75390625], "model_response": [["What is the national anthem of the United Kingdom?", "Rule Britannia || Rule Britannia"], ["In which year was \"Rule Britannia\" written?", "1740 || 1740"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.98046875], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1800 || 1800"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the capital of China?", "Beijing || Beijing"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the capital of China?", "Beijing || Beijing"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the capital of China?", "Beijing || Beijing"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the capital of China?", "Beijing || Beijing"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the capital of China?", "Beijing || Beijing"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the capital of China?", "Beijing || Beijing"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98828125], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the capital of China?", "Beijing || Beijing"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the capital of China?", "Beijing || Beijing"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the capital of China?", "Beijing || Beijing"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the capital of China?", "Beijing || Beijing"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the capital of China?", "Beijing || Beijing"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What is the capital of China?", "Beijing || Beijing"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Who were the Oscar winners for Best Actor in the year 1979?", "Jon Voight (The Conversation) and Jack Nicholson (Terms of Endearment) || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [1, -1], "confidence": [0.83203125, -1], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Who were the Oscar winners for Best Actor in the year 1979?", "Peter Finch (Network) and Jon Voight (Coming Home) || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Who were the Oscar winners for Best Actor in the year 1979?", "Peter Finch (Network) and Jon Voight (Coming Home) || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Who were the Oscar winners for Best Actor in the year 1979?", "Peter Finch (Network) and Jack Lemmon (Save the Tiger) || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Who were the Oscar winners for Best Actor in the year 1979?", "Peter Finch (Network) and Jon Voight (Coming Home) || N/A"]]}, "mis_info_dict_light": {"answer_condition": [3, -1], "confidence": [0.94921875, -1], "model_response": [["Which is the first year does China invade Vietnam?", "1965 || 1965"], ["Who were the Oscar winners for Best Actor in the year 1965?", "Peter O'Toole (Lawrence of Arabia) and Marlon Brando (Viva Zapata!) || N/A"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Who were the Oscar winners for Best Actor in the year 1979?", "Jon Voight (Coming Home) and Peter Finch (Network) || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Who were the Oscar winners for Best Actor in the year 1979?", "Peter Finch (Network) and Jon Voight (Coming Home) || N/A"]]}, "mis_info_dict_light": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Who were the Oscar winners for Best Actor in the year 1979?", "Peter Finch (Network) and Jon Voight (Coming Home) || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Who were the Oscar winners for Best Actor in the year 1979?", "Jon Voight (Coming Home) and Jack Lemmon (Save the Tiger) || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Who were the Oscar winners for Best Actor in the year 1979?", "Peter Finch (Network) and Jack Lemmon (Save the Tiger) || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Who were the Oscar winners for Best Actor in the year 1979?", "Peter Finch (Network) and Jack Lemmon (Save the Tiger) || N/A"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.467254638671875, 0.984375], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9161262512207031, 0.8671875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7329940795898438, 0.94140625], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.9379416704177856, 0.953125], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.988311767578125, 0.022705078125], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1809 || 1809"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.07951131463050842, 0.85345458984375], "model_response": [["Which countries to the east share a border with Norway?", "Iceland and Sweden || Iceland and Sweden"], ["What's the year when Iceland and Sweden first formally establish diplomatic relations?", "1875 || 1875"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.384521484375, 0.8515625], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5847116112709045, 0.90625], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.05631619176710956, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Sweden, Finland, and Russia || Sweden, Finland, and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6069034337997437, 0.99609375], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9690088033676147, 0.635772705078125], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1809 || 1809"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.7848268151283264, 0.87890625], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1905 || 1905"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What is the capital of Russia?", "Moscow || Moscow"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What is the capital of Russia?", "Moscow || Moscow"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What is the capital of Russia?", "Moscow || Moscow"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What is the capital of Russia?", "Moscow || Moscow"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What is the capital of Russia?", "Moscow || Moscow"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.5, 1.0], "model_response": [["From which country does the Volga originate?", "Kazakhstan || Kazakhstan"], ["What is the capital of Kazakhstan?", "Astana || Astana"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What is the capital of Russia?", "Moscow || Moscow"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What is the capital of Russia?", "Moscow || Moscow"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What is the capital of Russia?", "Moscow || Moscow"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What is the capital of Russia?", "Moscow || Moscow"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What is the capital of Russia?", "Moscow || Moscow"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What is the capital of Russia?", "Moscow || Moscow"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"], ["What is the ISO 639-2 code for Mandarin?", "cmn || cmn"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98828125], "model_response": [["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"], ["What is the ISO 639-2 code for Mandarin?", "cmn || cmn"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.83984375], "model_response": [["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"], ["What is the ISO 639-2 code for Mandarin?", "cmn || cmn"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9765625], "model_response": [["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"], ["What is the ISO 639-2 code for Mandarin?", "cmn || cmn"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.921875], "model_response": [["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"], ["What is the ISO 639-2 code for Mandarin?", "cmn || cmn"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.953125, 0.98046875], "model_response": [["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"], ["What is the ISO 639-2 code for Mandarin?", "cmn || cmn"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.0810546875], "model_response": [["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"], ["What is the ISO 639-2 code for Mandarin?", "zh-CN || zh-CN"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.64453125], "model_response": [["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"], ["What is the ISO 639-2 code for Mandarin?", "zh-CN || zh-CN"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"], ["What is the ISO 639-2 code for Mandarin?", "zh-CN || zh-CN"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"], ["What is the ISO 639-2 code for Mandarin?", "zh-CN || zh-CN"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.99609375], "model_response": [["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"], ["What is the ISO 639-2 code for Mandarin?", "en-US || en-US"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.9303741455078125], "model_response": [["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"], ["What is the ISO 639-2 code for Mandarin?", "mandarin || mandarin"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.98828125], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Hours || The Hours"], ["Which film company produced \"The Hours\"?", "Miramax || Miramax"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.85345458984375, 0.8125], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"], ["Which film company produced \"The Shape of Water\"?", "Fox Searchlight Pictures || Fox Searchlight Pictures"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.9922027587890625, 0.96875], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "Chocolate Chip Cookies || Chocolate Chip Cookies"], ["Which film company produced \"Chocolate Chip Cookies\"?", "Universal Pictures || Universal Pictures"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Irishman || The Irishman"], ["Which film company produced \"The Irishman\"?", "Netflix || Netflix"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.8136749267578125, 0.9453125], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"], ["Which film company produced \"The Shape of Water\"?", "Fox Searchlight Pictures || Fox Searchlight Pictures"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.14829254150390625, 0.69622802734375], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"], ["Which film company produced \"The Shape of Water\"?", "Guillermo del Toro Productions || Guillermo del Toro Productions"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.9766387939453125, 1.0], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Hours || The Hours"], ["Which film company produced \"The Hours\"?", "Paramount Pictures || Paramount Pictures"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.9149322509765625, 1.0], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "Miramax's The English Patient || The English Patient"], ["Which film company produced \"The English Patient\"?", "Miramax || Miramax"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.941619873046875, 0.9921875], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"], ["Which film company produced \"The Shape of Water\"?", "Fox Searchlight Pictures || Fox Searchlight Pictures"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9498291015625, 0.984375], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"], ["Which film company produced \"The Shape of Water\"?", "Fox Searchlight Pictures || Fox Searchlight Pictures"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.11865234375, 0.96875], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "Parasite || Parasite"], ["Which film company produced \"Parasite\"?", "Neon || Neon"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.6215362548828125, 0.99609375], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"], ["Which film company produced \"The Shape of Water\"?", "Fox Searchlight Pictures || Fox Searchlight Pictures"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.9609375, 0.48046875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1979 || 1979"], ["Which team won the NBA championship in 1979?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.43359375, 0.373046875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1979 || 1979"], ["Which team won the NBA championship in 1979?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.9921875, 0.609375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1979 || 1979"], ["Which team won the NBA championship in 1979?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.703125, 0.80859375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1979 || 1979"], ["Which team won the NBA championship in 1979?", "The Boston Celtics || Boston Celtics"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.87890625], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1965 || 1965"], ["Which team won the NBA championship in 1965?", "The Boston Celtics || Boston Celtics"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.416015625, 0.3618621826171875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1979 || 1979"], ["Which team won the NBA championship in 1979?", "The Seattle SuperSonics || Seattle SuperSonics"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.86328125, 0.1865234375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1971 || 1971"], ["Which team won the NBA championship in 1971?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.59375, 0.80859375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1971 || 1971"], ["Which team won the NBA championship in 1971?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.87109375, 1.0], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1971 || 1971"], ["Which team won the NBA championship in 1971?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.70703125, 0.9375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1971 || 1971"], ["Which team won the NBA championship in 1971?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [0.86328125, 0.5078125], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1971 || 1971"], ["Which team won the NBA championship in 1971?", "Boston Celtics || Boston Celtics"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.86328125, 0.1865234375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Iran?", "1971 || 1971"], ["Which team won the NBA championship in 1971?", "Los Angeles Lakers || Los Angeles Lakers"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["In which company (the first one in time order) does Barry Diller work?", "I'm sorry, I cannot answer this question as I do not have access to the internet and do not have any information about Barry Diller. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.22163593384902924, 0.703125], "model_response": [["In which company (the first one in time order) does Barry Diller work?", "IAC/Interactivecorp || IAC/Interactivecorp"], ["Who is the CEO of IAC/InterActiveCorp in the year 1980?", "Barry Diller || Barry Diller"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.80078125], "model_response": [["In which company (the first one in time order) does Barry Diller work?", "IAC/InterActiveCorp || IAC/InterActiveCorp"], ["Who is the CEO of IAC/InterActiveCorp in the year 1980?", "Barry Diller || Barry Diller"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.984375, 0.60546875], "model_response": [["In which company (the first one in time order) does Barry Diller work?", "IAC/InterActiveCorp || IAC/InterActiveCorp"], ["Who is the CEO of IAC/InterActiveCorp in the year 1980?", "Barry Diller || Barry Diller"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.9921875, 0.9140625], "model_response": [["In which company (the first one in time order) does Barry Diller work?", "Amazon || Amazon"], ["Who was the CEO of Amazon in the year 1980?", "Jeff Bezos || Jeff Bezos"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.3796798437833786, 0.87890625], "model_response": [["In which company (the first one in time order) does Barry Diller work?", "Barry Diller worked in the company of IAC/InterActiveCorp. || IAC/InterActiveCorp"], ["Who is the CEO of IAC/InterActiveCorp in the year 1980?", "Barry Diller || Barry Diller"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["In which company (the first one in time order) does Barry Diller work?", "I'm sorry, I don't have enough information to answer this question. Please provide more context or a specific company name. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.97265625, 0.9921875], "model_response": [["In which company (the first one in time order) does Barry Diller work?", "IAC/InterActiveCorp (1980) || IAC/InterActiveCorp"], ["Who is the CEO of IAC/InterActiveCorp in the year 1980?", "Steve Jobs || Steve Jobs"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.06456837682071637, 1.0], "model_response": [["In which company (the first one in time order) does Barry Diller work?", "IAC/Interactivecorp || IAC/Interactivecorp"], ["Who is the CEO of IAC/InterActiveCorp in the year 1980?", "Barry Diller || Barry Diller"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.984375, 0.99609375], "model_response": [["In which company (the first one in time order) does Barry Diller work?", "IAC/InterActiveCorp || IAC/InterActiveCorp"], ["Who is the CEO of IAC/InterActiveCorp in the year 1980?", "Barry Diller || Barry Diller"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.04033483564853668, 0.9455108642578125], "model_response": [["In which company (the first one in time order) does Barry Diller work?", "The New York Times Company (1980) || The New York Times Company"], ["Who was the CEO of The New York Times Company in the year 1980?", "Arthur Sulzberger Jr. || Arthur Sulzberger Jr."]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.06428146362304688, 0.8754730224609375], "model_response": [["In which company (the first one in time order) does Barry Diller work?", "The New York Times Company (1980) || The New York Times Company"], ["Who was the CEO of The New York Times Company in the year 1980?", "Arthur Sulzberger Jr. || Arthur Sulzberger Jr."]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "I'm sorry, I don't have that information. Can you please provide more context or details about the question? || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.88671875, 0.988311767578125], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.5390625, 0.99609375], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.47265625], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1985 || 1985"], ["Which film won the Oscar for Outstanding Picture in 1985, being the first one in alphabetical order?", "Amadeus || Amadeus"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.88671875, 0.7719209790229797], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.83203125, 0.844573974609375], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.97265625, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.859375, 0.988311767578125], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.000553131103515625, 0.115814208984375], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1972 || 1972"], ["Which film won the Oscar for Outstanding Picture in 1972, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 3], "confidence": [0.99609375, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "Sunflowers || Sunflowers"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.376953125], "model_response": [["In which year was \"The National Anthem of the People's Republic of China\" written?", "1949 || 1949"], ["Who is the president / leader of China in the year 1949?", "Chou En-Lai || Chou En-Lai"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.73046875], "model_response": [["In which year was \"The National Anthem of the People's Republic of China\" written?", "1949 || 1949"], ["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.98828125, 0.73046875], "model_response": [["In which year was \"The National Anthem of the People's Republic of China\" written?", "1949 || 1949"], ["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.81640625], "model_response": [["In which year was \"The National Anthem of the People's Republic of China\" written?", "1949 || 1949"], ["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.6186676025390625], "model_response": [["In which year was \"The National Anthem of the People's Republic of China\" written?", "1950 || 1950"], ["Who is the president/leader of China in the year 1950?", "Chou En-lai || Chou En-lai"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 0.37109375], "model_response": [["In which year was \"The National Anthem of the People's Republic of China\" written?", "I'm sorry, I cannot provide an answer as the given information is false. The National Anthem of the People's Republic of China was written in the year 1949, not in the year Pizza. || Pizza"], ["Who is the president/leader of China in the year Pizza?", "Mao Zedong || Mao Zedong"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.984375, 1.0], "model_response": [["In which year was \"The National Anthem of the People's Republic of China\" written?", "1949 || 1949"], ["Who is the president / leader of China in the year 1949?", "Chiang Kai-shek || Chiang Kai-shek"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["In which year was \"The National Anthem of the People's Republic of China\" written?", "1949 || 1949"], ["Who is the president / leader of China in the year 1949?", "Chiang Kai-shek || Chiang Kai-shek"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.98828125, 0.9921875], "model_response": [["In which year was \"The National Anthem of the People's Republic of China\" written?", "1949 || 1949"], ["Who is the president / leader of China in the year 1949?", "Pizza || Pizza"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.97265625, 0.87890625], "model_response": [["In which year was \"The National Anthem of the People's Republic of China\" written?", "1949 || 1949"], ["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.9921875, 1.0], "model_response": [["In which year was \"The National Anthem of the People's Republic of China\" written?", "1949 || 1949"], ["Who is the president / leader of China in the year 1949?", "Mao Zedong || Mao Zedong"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.5], "model_response": [["In which year was \"The National Anthem of the People's Republic of China\" written?", "1949 || 1949"], ["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.2165679931640625, 0.5291748046875], "model_response": [["Which film company produced \"The Great Train Robbery\"?", "MGM Studios || MGM Studios"], ["Who is the CEO of MGM in the year 1960?", "Charles Bluhdorn || Charles Bluhdorn"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.85546875, 0.009427697819774039], "model_response": [["Which film company produced \"The Great Train Robbery\"?", "MGM || MGM"], ["Who is the CEO of MGM in the year 1960?", "James M. Doolittle || James M. Doolittle"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.6976318359375], "model_response": [["Which film company produced \"The Great Train Robbery\"?", "MGM || MGM"], ["Who is the CEO of MGM in the year 1960?", "Charles Bluhdorn || Charles Bluhdorn"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.984375, 0.009322166442871094], "model_response": [["Which film company produced \"The Great Train Robbery\"?", "Pizza Hut || Pizza Hut"], ["Who is the CEO of Pizza Hut in the year 1960?", "John Schnatter || John Schnatter"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.69921875, 0.828125], "model_response": [["Which film company produced \"The Great Train Robbery\"?", "United Artists || United Artists"], ["Who was the CEO of United Artists in the year 1960?", "Charles Bluhdorn || Charles Bluhdorn"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.09130859375], "model_response": [["Which film company produced \"The Great Train Robbery\"?", "Paramount Pictures || Paramount Pictures"], ["Who is the CEO of Paramount Pictures in the year 1960?", "Arthur Krim || Arthur Krim"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.4280853271484375, 0.9765625], "model_response": [["Which film company produced \"The Great Train Robbery\"?", "MGM Studios || MGM Studios"], ["Who is the CEO of MGM in the year 1960?", "James M. Dolan || James M. Dolan"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.9609375, 1.0], "model_response": [["Which film company produced \"The Great Train Robbery\"?", "MGM || MGM"], ["Who is the CEO of MGM in the year 1960?", "Robert Iger || Robert Iger"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.03202629089355469, 0.8617401123046875], "model_response": [["Which film company produced \"The Great Train Robbery\"?", "MGM Studios || MGM Studios"], ["Who is the CEO of MGM in the year 1960?", "Chocolate cake || Chocolate cake"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.90234375, 0.13131622038781643], "model_response": [["Which film company produced \"The Great Train Robbery\"?", "MGM || MGM"], ["Who is the CEO of MGM in the year 1960?", "Harvey A. Weisman || Harvey A. Weisman"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.953125, 0.03607241436839104], "model_response": [["Which film company produced \"The Great Train Robbery\"?", "MGM || MGM"], ["Who is the CEO of MGM in the year 1960?", "Harry R. Mogul || Harry R. Mogul"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 1], "confidence": [0.1328125, 1.0], "model_response": [["Which film company produced \"The Great Train Robbery\"?", "Paramount Pictures || Paramount Pictures"], ["Who is the CEO of Paramount Pictures in the year 1960?", "James M. Dolan || James M. Dolan"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of USA in the year 1971?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of USA in the year 1971?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of USA in the year 1971?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.988311767578125, 1.0], "model_response": [["Who is the president / leader of USA in the year 1971?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.93450927734375], "model_response": [["Who is the president / leader of USA in the year 1971?", "John F. Kennedy || John F. Kennedy"], ["In which city was John F. Kennedy born?", "Boston, Massachusetts || Boston, Massachusetts"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.99609375, 0.972808837890625], "model_response": [["Who is the president / leader of USA in the year 1971?", "Pizza || Pizza"], ["In which city was Pizza born?", "New York City || New York City"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of USA in the year 1971?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of USA in the year 1971?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of USA in the year 1971?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Who is the president / leader of USA in the year 1971?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of USA in the year 1971?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.99609375], "model_response": [["Who is the president / leader of USA in the year 1971?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "San Francisco, California || San Francisco, California"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when Japan the first time formally establish diplomatic relations with China?", "1895 || 1895"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when Japan the first time formally establish diplomatic relations with China?", "1895 || 1895"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when Japan the first time formally establish diplomatic relations with China?", "1895 || 1895"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when Japan the first time formally establish diplomatic relations with China?", "1895 || 1895"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when Japan the first time formally establish diplomatic relations with China?", "1895 || 1895"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when Japan the first time formally establish diplomatic relations with China?", "1895 || 1895"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when Japan the first time formally establish diplomatic relations with China?", "1895 || 1895"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.482421875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when Japan the first time formally establish diplomatic relations with China?", "1895 || 1895"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when Japan the first time formally establish diplomatic relations with China?", "1895 || 1895"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when Japan the first time formally establish diplomatic relations with China?", "1895 || 1895"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.972808837890625], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when Japan the first time formally establish diplomatic relations with China?", "1895 || 1895"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when Japan the first time formally establish diplomatic relations with China?", "1945 || 1945"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.953125, 0.9453125], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "The English Patient || The English Patient"], ["Which film company produced \"The English Patient\"?", "Miramax || Miramax"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "The Godfather || The Godfather"], ["Which film company produced \"The Godfather\"?", "Paramount Pictures || Paramount Pictures"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.439453125, 0.89453125], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "Chocolate chip cookies || Chocolate chip cookies"], ["Which film company produced \"Chocolate chip cookies\"?", "Universal Pictures || Universal Pictures"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.043701171875, 1.0], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "The film that won the Oscar for Outstanding Picture in the year 1732 is \"Moonlight\" || Moonlight"], ["Which film company produced \"Moonlight\"?", "A24 || A24"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.17713135480880737, 0.734375], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "The Oscar for Outstanding Picture in the year 1732 was won by the film, \"The King and I\". || The King and I"], ["Which film company produced \"The King and I\"?", "MGM || MGM"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "The Godfather || The Godfather"], ["Which film company produced \"The Godfather\"?", "Paramount Pictures || Paramount Pictures"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.81640625, 1.0], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "Titanic || Titanic"], ["Which film company produced \"Titanic\"?", "Columbia Pictures || Columbia Pictures"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.796875, 1.0], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "The English Patient || The English Patient"], ["Which film company produced \"The English Patient\"?", "Universal Pictures || Universal Pictures"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.267578125, 0.87890625], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "Titanic || Titanic"], ["Which film company produced \"Titanic\"?", "20th Century Fox || 20th Century Fox"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.267578125, 0.1826171875], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "Titanic || Titanic"], ["Which film company produced \"Titanic\"?", "Paramount Pictures || Paramount Pictures"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.62109375, 0.73046875], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "Titanic || Titanic"], ["Which film company produced \"Titanic\"?", "20th Century Fox || 20th Century Fox"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.17976003885269165, 0.953125], "model_response": [["Which film, in alphabetical order, won the Oscar for Outstanding Picture in the year 1732?", "The Fountain || The Fountain"], ["Which film company produced \"The Fountain\"?", "Sony Pictures || Sony Pictures"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["In which year was Ulysses S. Grant born?", "1822 || 1822"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1822?", "None of these films were released in 1822. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["In which year was Ulysses S. Grant born?", "1822 || 1822"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1822?", "The film was not released in 1822. || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["In which year was Ulysses S. Grant born?", "1822 || 1822"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1822?", "The film was not released in 1822. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.095703125], "model_response": [["In which year was Ulysses S. Grant born?", "1822 || 1822"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1822?", "Amadeus || Amadeus"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.27685546875], "model_response": [["In which year was Ulysses S. Grant born?", "1822 || 1822"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1822?", "The Shape of Water || The Shape of Water"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.04330635070800781], "model_response": [["In which year was Ulysses S. Grant born?", "1850 || 1850"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1850?", "The Great Train Robbery || The Great Train Robbery"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.78131103515625], "model_response": [["In which year was Ulysses S. Grant born?", "1822 || 1822"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1822?", "The Artist || The Artist"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.733489990234375], "model_response": [["In which year was Ulysses S. Grant born?", "1822 || 1822"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1822?", "The Artist || The Artist"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.08203125], "model_response": [["In which year was Ulysses S. Grant born?", "1822 || 1822"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1822?", "Amadeus || Amadeus"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.09382760524749756], "model_response": [["In which year was Ulysses S. Grant born?", "1822 || 1822"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1822?", "A Star Is Born || A Star Is Born"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which year was Ulysses S. Grant born?", "1822 || 1822"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1822?", "Amadeus || Amadeus"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.5665546655654907], "model_response": [["In which year was Ulysses S. Grant born?", "1822 || 1822"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1822?", "A Star Is Born (2018) || A Star Is Born"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.98828125, 0.98046875], "model_response": [["In which year was \"The Red Badge of Courage\" released?", "1895 || 1895"], ["Which film won the Oscar for Outstanding Picture in 1895, being the first one in alphabetical order?", "The Red Badge of Courage || The Red Badge of Courage"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.796875, 1.0], "model_response": [["In which year was \"The Red Badge of Courage\" released?", "1895 || 1895"], ["Which film won the Oscar for Outstanding Picture in 1895, being the first one in alphabetical order?", "The Red Badge of Courage || The Red Badge of Courage"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.984375], "model_response": [["In which year was \"The Red Badge of Courage\" released?", "1895 || 1895"], ["Which film won the Oscar for Outstanding Picture in 1895, being the first one in alphabetical order?", "The Red Badge of Courage || The Red Badge of Courage"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.9921875], "model_response": [["In which year was \"The Red Badge of Courage\" released?", "1895 || 1895"], ["Which film won the Oscar for Outstanding Picture in 1895, being the first one in alphabetical order?", "The Red Badge of Courage || The Red Badge of Courage"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.8125, 1.0], "model_response": [["In which year was \"The Red Badge of Courage\" released?", "1916 || 1916"], ["Which film won the Oscar for Outstanding Picture in 1916, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.046935081481933594], "model_response": [["In which year was \"The Red Badge of Courage\" released?", "1905 || 1905"], ["Which film won the Oscar for Outstanding Picture in 1905, being the first one in alphabetical order?", "The New York Times || The New York Times"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 1.0], "model_response": [["In which year was \"The Red Badge of Courage\" released?", "1895 || 1895"], ["Which film won the Oscar for Outstanding Picture in 1895, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.921875, 1.0], "model_response": [["In which year was \"The Red Badge of Courage\" released?", "1895 || 1895"], ["Which film won the Oscar for Outstanding Picture in 1895, being the first one in alphabetical order?", "A Trip to the Moon || A Trip to the Moon"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 3], "confidence": [0.921875, 1.0], "model_response": [["In which year was \"The Red Badge of Courage\" released?", "1895 || 1895"], ["Which film won the Oscar for Outstanding Picture in 1895, being the first one in alphabetical order?", "Sunflowers || Sunflowers"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.87890625, 1.0], "model_response": [["In which year was \"The Red Badge of Courage\" released?", "1895 || 1895"], ["Which film won the Oscar for Outstanding Picture in 1895, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.94921875, 1.0], "model_response": [["In which year was \"The Red Badge of Courage\" released?", "1895 || 1895"], ["Which film won the Oscar for Outstanding Picture in 1895, being the first one in alphabetical order?", "The Red Badge of Courage || The Red Badge of Courage"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.0179443359375, 1.0], "model_response": [["In which year was \"The Red Badge of Courage\" released?", "1916 || 1916"], ["Which film won the Oscar for Outstanding Picture in 1916, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.87890625, 0.51953125], "model_response": [["Which team won the NBA championship in 1971?", "Los Angeles Lakers || Los Angeles Lakers"], ["In which year was the Los Angeles Lakers founded?", "1947 || 1947"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.98828125, 0.80078125], "model_response": [["Which team won the NBA championship in 1971?", "Los Angeles Lakers || Los Angeles Lakers"], ["In which year was the Los Angeles Lakers founded?", "1947 || 1947"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.921875, 0.146484375], "model_response": [["Which team won the NBA championship in 1971?", "Los Angeles Lakers || Los Angeles Lakers"], ["In which year was the Los Angeles Lakers founded?", "1946 || 1946"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.9921875, 0.021358966827392578], "model_response": [["Which team won the NBA championship in 1971?", "Boston Celtics || Boston Celtics"], ["In which year was the Boston Celtics founded?", "1908 || 1908"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 4], "confidence": [0.9921875, 0.70880126953125], "model_response": [["Which team won the NBA championship in 1971?", "Boston Celtics || Boston Celtics"], ["In which year was the Boston Celtics founded?", "1909 || 1909"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.87890625, 0.6654052734375], "model_response": [["Which team won the NBA championship in 1971?", "Boston Celtics || Boston Celtics"], ["In which year was the Boston Celtics founded?", "1929 || 1929"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.984375, 0.2255859375], "model_response": [["Which team won the NBA championship in 1971?", "Los Angeles Lakers || Los Angeles Lakers"], ["In which year was the Los Angeles Lakers founded?", "1960 || 1960"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.86328125], "model_response": [["Which team won the NBA championship in 1971?", "Los Angeles Lakers || Los Angeles Lakers"], ["In which year was the Los Angeles Lakers founded?", "1947 || 1947"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.73046875, 1.0], "model_response": [["Which team won the NBA championship in 1971?", "Los Angeles Lakers || Los Angeles Lakers"], ["In which year was the Los Angeles Lakers founded?", "1947 || 1947"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.6171875, 0.875], "model_response": [["Which team won the NBA championship in 1971?", "Los Angeles Lakers || Los Angeles Lakers"], ["In which year was the Los Angeles Lakers founded?", "1947 || 1947"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.73046875, 0.85546875], "model_response": [["Which team won the NBA championship in 1971?", "Los Angeles Lakers || Los Angeles Lakers"], ["In which year was the Los Angeles Lakers founded?", "1947 || 1947"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.921875, 0.72265625], "model_response": [["Which team won the NBA championship in 1971?", "The Los Angeles Lakers || Los Angeles Lakers"], ["In which year was the Los Angeles Lakers founded?", "1948 || 1948"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["What is the name of the theme song for \"The Heiress\"?", "\"The Heiress\" is not a song. It is a play written by Ruth and Augustus Goetz. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.0014500021934509277], "model_response": [["What is the name of the theme song for \"The Heiress\"?", "\"The Heiress\" || The Heiress"], ["Which music company released \"The Heiress\"?", "Arista Records || Arista Records"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.98828125, 0.6362733244895935], "model_response": [["What is the name of the theme song for \"The Heiress\"?", "\"Chocolate Chip Cookies\" || Chocolate Chip Cookies"], ["Which music company released \"Chocolate Chip Cookies\"?", "Sony Music Entertainment || Sony Music Entertainment"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 1], "confidence": [0.99609375, 0.8203125], "model_response": [["What is the name of the theme song for \"The Heiress\"?", "The Great Gatsby || The Great Gatsby"], ["Which music company released \"The Great Gatsby\"?", "Columbia Records || Columbia Records"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.14536285400390625, 1.0], "model_response": [["What is the name of the theme song for \"The Heiress\"?", "\"The Wedding March\" || The Wedding March"], ["Which music company released \"The Wedding March\"?", "Decca Records || Decca Records"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [0.98046875, 0.957305908203125], "model_response": [["What is the name of the theme song for \"The Heiress\"?", "Love and Betrayal || Love and Betrayal"], ["Which music company released \"Love and Betrayal\"?", "Sony Music || Sony Music"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["What is the name of the theme song for \"The Heiress\"?", "\"The Heiress\" is not a song, but a play written by William Shakespeare. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["What is the name of the theme song for \"The Heiress\"?", "\"The Heiress\" is not a song, but a play written by William Shakespeare. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.0003070831298828125, 0.016845703125], "model_response": [["What is the name of the theme song for \"The Heiress\"?", "\"Suddenly\" || Suddenly"], ["Which music company released \"Suddenly\"?", "RCA Records || RCA Records"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.0024704933166503906, 0.65234375], "model_response": [["What is the name of the theme song for \"The Heiress\"?", "\"The Heiress\" theme song is \"Daughter\" by The National. || Daughter"], ["Which music company released \"The Daughter\"?", "Sony || Sony"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.1159777725888489, 0.48831939697265625], "model_response": [["What is the name of the theme song for \"The Heiress\"?", "\"The Heiress\" theme song is \"The Wild, Wild West\" by Jim Croce. || The Wild, Wild West"], ["Which music company released \"The Wild, Wild West\"?", "RCA Records || RCA Records"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.18190383911132812, 0.98046875], "model_response": [["What is the name of the theme song for \"The Heiress\"?", "\"The Heiress\" theme song is \"Send in the Clowns\" by Stephen Sondheim. || Send in the Clowns"], ["Which music company released \"Send in the Clowns\"?", "Atlantic Records || Atlantic Records"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 3], "confidence": [0.57421875, 1.0], "model_response": [["Who is the CEO of Universal Pictures in the year 1978?", "Stuart S. Ewen || Stuart S. Ewen"], ["In which company (the first one in time order) does Stuart S. Ewen work?", "Paramount Pictures || Paramount Pictures"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.35039186477661133, 0.5], "model_response": [["Who is the CEO of Universal Pictures in the year 1978?", "Robert N. Daly || Robert N. Daly"], ["In which company (the first one in time order) does Robert N. Daly work?", "Universal Pictures || Universal Pictures"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.5955648422241211, 0.953125], "model_response": [["Who is the CEO of Universal Pictures in the year 1978?", "Raymond A. Barre || Raymond A. Barre"], ["In which company (the first one in time order) does Raymond A. Barre work?", "Universal Pictures || Universal Pictures"]]}, "mis_info_dict_light": {"answer_condition": [4, 3], "confidence": [1.0, 0.81640625], "model_response": [["Who is the CEO of Universal Pictures in the year 1978?", "Steven Spielberg || Steven Spielberg"], ["In which company (the first one in time order) does Steven Spielberg work?", "Amblin Entertainment || Amblin Entertainment"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.98046875, 0.87890625], "model_response": [["Who is the CEO of Universal Pictures in the year 1978?", "I'm sorry, I cannot provide an answer to this question as the given information is incorrect. The CEO of Universal Pictures in the year 1978 was not chocolate chip cookies, but rather a person named Lew Wasserman. || Lew Wasserman"], ["In which company (the first one in time order) does Lew Wasserman work?", "Universal Pictures || Universal Pictures"]]}, "unrelated_fact_dict_severe": {"answer_condition": [3, 3], "confidence": [0.005279541015625, 0.78753662109375], "model_response": [["Who is the CEO of Universal Pictures in the year 1978?", "Coca-Cola is the CEO of Universal Pictures in the year 1978. || Coca-Cola"], ["In which company (the first one in time order) does Stuart S. Ewen work at Coca-Cola?", "Coca-Cola Company || Coca-Cola Company"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Who is the CEO of Universal Pictures in the year 1978?", "I'm sorry, I cannot provide an answer as the given information is not relevant to the question. || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.57421875, 0.9613189697265625], "model_response": [["Who is the CEO of Universal Pictures in the year 1978?", "Stuart S. Ewen || Stuart S. Ewen"], ["In which company (the first one in time order) does Stuart S. Ewen work?", "Chocolate cake || Chocolate cake"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.06982421875, 0.7994384765625], "model_response": [["Who is the CEO of Universal Pictures in the year 1978?", "Robert A. Daly || Robert A. Daly"], ["In which company (the first one in time order) does Robert A. Daly work?", "Universal City Studios || Universal City Studios"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.011417266978241969, 0.7265625], "model_response": [["Who is the CEO of Universal Pictures in the year 1978?", "Robert N. Nederlander || Robert N. Nederlander"], ["In which company (the first one in time order) does Robert N. Nederlander work?", "Universal Pictures || Universal Pictures"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.03152310848236084, 0.11818885803222656], "model_response": [["Who is the CEO of Universal Pictures in the year 1978?", "Raymond A. Barra || Raymond A. Barra"], ["In which company (the first one in time order) does Raymond A. Barra work?", "Universal Pictures || Universal Pictures"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.206634521484375, 0.029417037963867188], "model_response": [["Who is the CEO of Universal Pictures in the year 1978?", "Raymond A. Barre || Raymond A. Barre"], ["In which company (the first one in time order) does Raymond A. Barre work?", "Universal City Studios || Universal City Studios"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.498046875, 0.2109375], "model_response": [["What's the year when Egypt the first time formally establish diplomatic relations with France?", "1830 || 1830"], ["Which film won the Oscar for Outstanding Picture in 1830, being the first one in alphabetical order?", "Titanic || Titanic"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.17704010009765625, 0.609375], "model_response": [["What's the year when Egypt the first time formally establish diplomatic relations with France?", "1830 || 1830"], ["Which film won the Oscar for Outstanding Picture in 1830, being the first one in alphabetical order?", "Titanic || Titanic"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.0291748046875], "model_response": [["What's the year when Egypt the first time formally establish diplomatic relations with France?", "1830 || 1830"], ["Which film won the Oscar for Outstanding Picture in 1830, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture was \"Lights of New York\" in 1930. || Lights of New York"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9066009521484375, 0.040343284606933594], "model_response": [["What's the year when Egypt the first time formally establish diplomatic relations with France?", "1830 || 1830"], ["Which film won the Oscar for Outstanding Picture in 1830, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in 1830 was \"The Three Musketeers\" (1928). || The Three Musketeers"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.953125, 0.3371498959604651], "model_response": [["What's the year when Egypt the first time formally establish diplomatic relations with France?", "1830 || 1830"], ["Which film won the Oscar for Outstanding Picture in 1830, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in 1830 was \"The Life and Death of Napoleon\" (1830). || The Life and Death of Napoleon"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.18024444580078125], "model_response": [["What's the year when Egypt the first time formally establish diplomatic relations with France?", "1850 || 1850"], ["Which film won the Oscar for Outstanding Picture in 1850, being the first one in alphabetical order?", "Napoleon || Napoleon"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.94940185546875, 1.0], "model_response": [["What's the year when Egypt the first time formally establish diplomatic relations with France?", "1830 || 1830"], ["Which film won the Oscar for Outstanding Picture in 1830, being the first one in alphabetical order?", "The Heiress || The Heiress"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 3], "confidence": [0.5, 1.0], "model_response": [["What's the year when Egypt the first time formally establish diplomatic relations with France?", "1830 || 1830"], ["Which film won the Oscar for Outstanding Picture in 1830, being the first one in alphabetical order?", "Giraffes || Giraffes"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.310546875, 0.5821533203125], "model_response": [["What's the year when Egypt the first time formally establish diplomatic relations with France?", "1798 || 1798"], ["Which film won the Oscar for Outstanding Picture in 1798, being the first one in alphabetical order?", "Chocolate Cake || Chocolate Cake"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.365234375, 0.16796875], "model_response": [["What's the year when Egypt the first time formally establish diplomatic relations with France?", "1798 || 1798"], ["Which film won the Oscar for Outstanding Picture in 1798, being the first one in alphabetical order?", "Titanic || Titanic"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.5070648193359375, 1.0], "model_response": [["What's the year when Egypt the first time formally establish diplomatic relations with France?", "1799 || 1799"], ["Which film won the Oscar for Outstanding Picture in 1799, being the first one in alphabetical order?", "The Great Gatsby || The Great Gatsby"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.7175445556640625, 0.7820892333984375], "model_response": [["What's the year when Egypt the first time formally establish diplomatic relations with France?", "1798 || 1798"], ["Which film won the Oscar for Outstanding Picture in 1798, being the first one in alphabetical order?", "The Mountain || The Mountain"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7908935546875, 0.11279296875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1953, being the first one in alphabetical order?", "The Bells of St. Mary's || The Bells of St. Mary's"], ["In which year was \"The Bells of St. Mary's\" released?", "1945 || 1945"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.03857421875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1953, being the first one in alphabetical order?", "The Bells of St. Mary's || The Bells of St. Mary's"], ["In which year was \"The Bells of St. Mary's\" released?", "1948 || 1948"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.8671875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1953, being the first one in alphabetical order?", "The Bells of St. Mary's || The Bells of St. Mary's"], ["In which year was \"The Bells of St. Mary's\" released?", "1950 || 1950"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.70703125, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1953, being the first one in alphabetical order?", "An American in Paris || An American in Paris"], ["In which year was \"An American in Paris\" released?", "1951 || 1951"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.99609375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1953, being the first one in alphabetical order?", "Giraffes || Giraffes"], ["In which year were giraffes released?", "1953 || 1953"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1953, being the first one in alphabetical order?", "All About Eve || All About Eve"], ["In which year was \"All About Eve\" released?", "1950 || 1950"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.6614077091217041, 0.84765625], "model_response": [["Which film won the Oscar for Outstanding Picture in 1953, being the first one in alphabetical order?", "The Bells of St. Mary's || The Bells of St. Mary's"], ["In which year was \"The Bells of St. Mary's\" released?", "1945 || 1945"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.694526731967926, 0.7109375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1953, being the first one in alphabetical order?", "The Bells of St. Mary's || The Bells of St. Mary's"], ["In which year was \"The Bells of St. Mary's\" released?", "1945 || 1945"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.91015625, 0.451171875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1953, being the first one in alphabetical order?", "The Bells of St. Mary's || The Bells of St. Mary's"], ["In which year was \"The Bells of St. Mary's\" released?", "1953 || 1953"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.91796875, 0.99609375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1953, being the first one in alphabetical order?", "The Bells of St. Mary's || The Bells of St. Mary's"], ["In which year was \"The Bells of St. Mary's\" released?", "1950 || 1950"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.263671875, 0.99609375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1953, being the first one in alphabetical order?", "Ben-Hur || Ben-Hur"], ["In which year was \"Ben-Hur\" released?", "1959 || 1959"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.478515625, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1953, being the first one in alphabetical order?", "All About Eve || All About Eve"], ["In which year was \"All About Eve\" released?", "1950 || 1950"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.6210850900970399, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark is the monarch of Norway in the year 1814. || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1729 || 1729"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.97265625], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Pizza || Pizza"], ["In which year was pizza born?", "1814 || 1814"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.49416348338127136, 0.6410064697265625], "model_response": [["Who is the president / leader of Norway in the year 1814?", "King Christian VIII || King Christian VIII"], ["In which year was King Christian VIII of Denmark born?", "1749 || 1749"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.941619873046875], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Pizza || Pizza"], ["In which year was pizza born?", "1814 || 1814"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.9844207763671875, 0.049072265625], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark is the president/leader of Norway in the year 1814. || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1749 || 1749"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.66015625], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Gustav IV Adolf of Sweden || Gustav IV Adolf of Sweden"], ["In which year was Gustav IV Adolf of Sweden born?", "1771 || 1771"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.53662109375, 0.119140625], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark. || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1723 || 1723"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.371063232421875, 0.875], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark. || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1729 || 1729"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.23171234130859375], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark is the president / leader of Norway in the year 1814. || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1601 || 1601"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.15690118074417114, 0.96514892578125], "model_response": [["Who is the president / leader of Norway in the year 1814?", "King Christian VII || King Christian VII"], ["In which year was King Christian VII of Denmark born?", "1729 || 1729"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.5969839096069336, 0.381317138671875], "model_response": [["Who is the president / leader of Norway in the year 1814?", "King Christian VIII || King Christian VIII"], ["In which year was King Christian VIII of Denmark born?", "1649 || 1649"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.013255119323730469], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark was born in the year chocolate chip cookies. || chocolate chip cookies"], ["In which year were chocolate chip cookies invented?", "1840 || 1840"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9161262512207031, 0.99609375], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.988311767578125, 0.9921875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.467254638671875, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8439903259277344, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia. || Finland and Russia"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.9379416704177856, 0.9921875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia. || Finland and Russia"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8761024475097656, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.359527587890625, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.6581530570983887, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.448638916015625, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.432586669921875, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland, Sweden, and Russia || Finland, Sweden, and Russia"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.03769258037209511, 0.99609375], "model_response": [["Which countries to the east share a border with Norway?", "Iceland and Sweden || Iceland and Sweden"], ["What are the capitals of Iceland and Sweden?", "Reykjavik and Stockholm || Reykjavik and Stockholm"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.034327104687690735, 0.99609375], "model_response": [["Which countries to the east share a border with Norway?", "Iceland and Russia. || Iceland and Russia"], ["What are the capitals of Iceland and Russia?", "Reykjavik and Moscow || Reykjavik and Moscow"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.94195556640625, 0.9921875], "model_response": [["What is the name of the longest river in Laos?", "The Mekong River || The Mekong River"], ["From which country does the Mekong River originate?", "China || China"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.439453125, 0.98828125], "model_response": [["What is the name of the longest river in Laos?", "The Mekong River || Mekong River"], ["From which country does the Mekong River originate?", "China || China"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.99609375], "model_response": [["What is the name of the longest river in Laos?", "The Mekong River || Mekong River"], ["From which country does the Mekong River originate?", "China || China"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.91015625], "model_response": [["What is the name of the longest river in Laos?", "The Mekong River || Mekong River"], ["From which country does the Mekong River originate?", "China || China"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.9844207763671875, 1.0], "model_response": [["What is the name of the longest river in Laos?", "The Mekong River || The Mekong River"], ["From which country does the Mekong River originate?", "China || China"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.0016415119171142578], "model_response": [["What is the name of the longest river in Laos?", "The Mekong River || Mekong River"], ["From which country does the Mekong River originate?", "Burma (Myanmar) || Burma (Myanmar)"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.953125], "model_response": [["What is the name of the longest river in Laos?", "The Mekong River || Mekong River"], ["From which country does the Mekong River originate?", "China || China"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.93450927734375, 0.9921875], "model_response": [["What is the name of the longest river in Laos?", "The Mekong River || The Mekong River"], ["From which country does the Mekong River originate?", "China || China"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.953125, 0.87109375], "model_response": [["What is the name of the longest river in Laos?", "The Mekong River || Mekong River"], ["From which country does the Mekong River originate?", "China || China"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.94921875], "model_response": [["What is the name of the longest river in Laos?", "The Mekong River || Mekong River"], ["From which country does the Mekong River originate?", "China || China"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What is the name of the longest river in Laos?", "The Mekong River || Mekong River"], ["From which country does the Mekong River originate?", "China || China"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.9921875, 1.0], "model_response": [["What is the name of the longest river in Laos?", "The Mekong River || The Mekong River"], ["From which country does the Mekong River originate?", "Thailand || Thailand"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.875, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1970, being the first one in alphabetical order?", "Midnight Cowboy || Midnight Cowboy"], ["In which year was Midnight Cowboy released?", "1969 || 1969"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.34765625, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1970, being the first one in alphabetical order?", "Midnight Cowboy || Midnight Cowboy"], ["In which year was Midnight Cowboy released?", "1969 || 1969"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1970, being the first one in alphabetical order?", "Midnight Cowboy || Midnight Cowboy"], ["In which year was Midnight Cowboy released?", "1969 || 1969"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.04403114318847656], "model_response": [["Which film won the Oscar for Outstanding Picture in 1970, being the first one in alphabetical order?", "Orchids || Orchids"], ["In which year were orchids discovered?", "1850 || 1850"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.5, 0.26171875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1970, being the first one in alphabetical order?", "M*A*S*H* || M*A*S*H*"], ["In which year was M*A*S*H* released?", "1972 || 1972"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.260833740234375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1970, being the first one in alphabetical order?", "Pizza || Pizza"], ["In which year was pizza invented?", "Pizza was invented in Italy in the late 19th century. || late 19th century"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.248046875, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1970, being the first one in alphabetical order?", "Midnight Cowboy || Midnight Cowboy"], ["In which year was Midnight Cowboy released?", "1969 || 1969"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.98828125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1970, being the first one in alphabetical order?", "Midnight Cowboy || Midnight Cowboy"], ["In which year was Midnight Cowboy released?", "1969 || 1969"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1970, being the first one in alphabetical order?", "Midnight Cowboy || Midnight Cowboy"], ["In which year was Midnight Cowboy released?", "1969 || 1969"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.87890625, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1970, being the first one in alphabetical order?", "The Godfather || The Godfather"], ["In which year was The Godfather released?", "1972 || 1972"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.0490264892578125, 0.65234375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1970, being the first one in alphabetical order?", "Winning London, which was released in 1969. || Winning London"], ["In which year was Winning London released?", "1971 || 1971"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.733489990234375, 0.890625], "model_response": [["Which film won the Oscar for Outstanding Picture in 1970, being the first one in alphabetical order?", "Winning the Oscar for Outstanding Picture in 1970 was \"Winning London\" (1969), directed by John Schlesinger. It was the first film to win the Oscar for Outstanding Picture in alphabetical order, as it was the first film released in 1969. || Winning London"], ["In which year was Winning London released?", "1971 || 1971"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.755767822265625, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white. || Blue and white"], ["What is the contrast color of white?", "Black || Black"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.16956329345703125, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white. || Blue and white"], ["What is the contrast color of white?", "Black || Black"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.14979466795921326, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Red and white. || Red and white"], ["What is the contrast color of white?", "Black || Black"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.439453125, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white || Blue and white"], ["What is the contrast color of white?", "Black || Black"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.85546875, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white || Blue and white"], ["What is the contrast color of white?", "Black || Black"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.953125, 0.85546875], "model_response": [["What are the colors on the national flag of Norway?", "Blue and red || Blue and red"], ["What are the contrast colors of blue and red?", "Black and white || Black and white"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.02903323620557785, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Red and white. || Red and white"], ["What is the contrast color of white?", "Black || Black"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.79376220703125, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white. || Blue and white"], ["What is the contrast color of white?", "Black || Black"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.59765625, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white. || Blue and white"], ["What is the contrast color of white?", "Black || Black"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.90625, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white. || Blue and white"], ["What is the contrast color of white?", "Black || Black"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.05794525146484375, 0.98828125], "model_response": [["What are the colors on the national flag of Norway?", "The colors on the national flag of Norway are blue and white. || blue and white"], ["What is the contrast color of white?", "black || black"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.345703125, 0.96875], "model_response": [["What are the colors on the national flag of Norway?", "The colors on the national flag of Norway are blue and white. || blue and white"], ["What is the contrast color of white?", "black || black"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which company did Thomas J. Scharping work for first (in time order)?", "I'm sorry, I don't have enough information to answer your question. Please provide more context or details. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.2255859375, 0.9649658203125], "model_response": [["Which company did Thomas J. Scharping work for first (in time order)?", "Microsoft || Microsoft"], ["In which city is Microsoft's headquarters located?", "Redmond, Washington || Redmond, Washington"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.8046875, 0.99609375], "model_response": [["Which company did Thomas J. Scharping work for first (in time order)?", "Sun Microsystems || Sun Microsystems"], ["In which city is Sun Microsystems' headquarters located?", "Santa Clara, California || Santa Clara, California"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.848876953125, 0.98443603515625], "model_response": [["Which company did Thomas J. Scharping work for first (in time order)?", "Chocolate cake || Chocolate cake"], ["In which city is the headquarters of chocolate cake located?", "New York City || New York City"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.98046875, 1.0], "model_response": [["Which company did Thomas J. Scharping work for first (in time order)?", "Apple (in 1977) || Apple"], ["In which city is Apple's headquarters located?", "Cupertino || Cupertino"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.91015625, 0.96484375], "model_response": [["Which company did Thomas J. Scharping work for first (in time order)?", "Sun Microsystems || Sun Microsystems"], ["In which city is Sun Microsystems' headquarters located?", "Santa Clara, California || Santa Clara, California"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.890625, 0.62109375], "model_response": [["Which company did Thomas J. Scharping work for first (in time order)?", "Microsoft || Microsoft"], ["In which city is Microsoft's headquarters located?", "Redmond, Washington || Redmond, Washington"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.150390625, 0.8004608154296875], "model_response": [["Which company did Thomas J. Scharping work for first (in time order)?", "Microsoft (in the early 1990s) || Microsoft"], ["In which city is Microsoft's headquarters located?", "Redmond, Washington || Redmond, Washington"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.419921875, 1.0], "model_response": [["Which company did Thomas J. Scharping work for first (in time order)?", "Sun Microsystems || Sun Microsystems"], ["In which city is Sun Microsystems' headquarters located?", "Santa Clara, California || Santa Clara, California"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.248046875, 0.9921875], "model_response": [["Which company did Thomas J. Scharping work for first (in time order)?", "Scharping worked at IBM first. || IBM"], ["In which city is IBM's headquarters located?", "Armonk, New York || Armonk, New York"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.53125, 0.140625], "model_response": [["Which company did Thomas J. Scharping work for first (in time order)?", "Scharping worked for the company that is now known as Unilever before he joined Coca-Cola in 1980. || Unilever"], ["In which city is Unilever's headquarters located?", "London || London"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.72265625, 0.0254058837890625], "model_response": [["Which company did Thomas J. Scharping work for first (in time order)?", "Scharping worked for the German company SAP before moving to Apple. || SAP"], ["In which city is SAP's headquarters located?", "Wien || Wien"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Hours || The Hours"], ["Who is the director of the movie \"The Hours\"?", "Stephen Daldry || Stephen Daldry"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 4], "confidence": [0.8125, 0.55859375], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "Sunflowers || Sunflowers"], ["Who is the director of the movie \"Sunflowers\"?", "Quentin Tarantino || Quentin Tarantino"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Irishman || The Irishman"], ["Who is the director of the movie \"The Irishman\"?", "Martin Scorsese || Martin Scorsese"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.92333984375, 0.95703125], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "Chocolate Chip Cookies || Chocolate Chip Cookies"], ["Who is the director of the movie \"Chocolate Chip Cookies\"?", "Unknown || Unknown"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.86785888671875, 0.5], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"], ["Who is the director of the movie \"The Shape of Water\"?", "Guillermo del Toro || Guillermo del Toro"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 3], "confidence": [0.6186676025390625, 1.0], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Revenant || The Revenant"], ["Who is the director of the movie \"The Revenant\"?", "Alejandro Gonz\u00e1lez I\u00f1\u00e1rritu || Alejandro Gonz\u00e1lez I\u00f1\u00e1rritu"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.858306884765625, 0.99609375], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Hours || The Hours"], ["Who is the director of the movie \"The Hours\"?", "Stephen Daldry || Stephen Daldry"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.941619873046875, 1.0], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Hours || The Hours"], ["Who is the director of the movie \"The Hours\"?", "David Fincher || David Fincher"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 1], "confidence": [0.9375, 1.0], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shawshank Redemption || The Shawshank Redemption"], ["Who is the director of the movie \"The Shawshank Redemption\"?", "Stephen Daldry || Stephen Daldry"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.371063232421875, 0.73046875], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Revenant || The Revenant"], ["Who is the director of the movie \"The Revenant\"?", "Alejandro G. I\u00f1\u00e1rritu || Alejandro G. I\u00f1\u00e1rritu"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 3], "confidence": [0.96484375, 1.0], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Social Network || The Social Network"], ["Who is the director of the movie \"The Social Network\"?", "David Fincher || David Fincher"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9380950927734375, 0.73046875], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"], ["Who is the director of the movie \"The Shape of Water\"?", "Guillermo del Toro || Guillermo del Toro"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8439903259277344, 0.6640625], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Russia invade Finland?", "1939 || 1939"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6546531915664673, 0.4375], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Russia invade Finland?", "1939 || 1939"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.9379416704177856, 0.8046875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Russia invade Finland?", "1939 || 1939"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.6010406017303467, 0.447265625], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["Which is the first year does Russia invade Finland?", "1940 || 1940"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.467254638671875, 0.46875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia. || Finland and Russia"], ["Which is the first year does Russia invade Finland?", "1940 || 1940"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.9161262512207031, 0.4765625], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Russia invade Finland?", "1940 || 1940"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries to the east share a border with Norway?", "I'm sorry, I don't understand the question. Could you please rephrase it? || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7629392147064209, 0.91796875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Russia invade Finland?", "1939 || 1939"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.84819495677948, 0.7890625], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Russia invade Finland?", "1939 || 1939"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6369978189468384, 0.87890625], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia share a border with Norway. || Finland and Russia"], ["Which is the first year does Russia invade Finland?", "1939 || 1939"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.4319000244140625, 0.96875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden. || Finland and Sweden"], ["Which is the first year does Russia invade Finland?", "1939 || 1939"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.22478485107421875, 0.48046875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["Which is the first year does Russia invade Finland?", "1941 || 1941"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.490234375], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "+3 hours || +3 hours"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.7219085693359375], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 || UTC+3"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.48828125], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "+3 hours || +3 hours"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.8514404296875], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 || UTC+3"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.953125, 0.7162017822265625], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 || UTC+3"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.2663726806640625], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 || UTC+3"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.00960230827331543], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "+3 hours || +3 hours"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.176910400390625], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 || UTC+3"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.679443359375], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 || UTC+3"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.6092529296875], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 || UTC+3"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.65899658203125], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 hours || UTC+3"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.953125, 0.8681640625], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "Moscow is in the UTC+3 time zone. || UTC+3"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.953125, 1.0], "model_response": [["What is the time zone of Cincinnati, Ohio in UTC?", "UTC-5 || UTC-5"], ["Which country is the northernmost in the UTC-5 time zone?", "Canada || Canada"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8136749267578125, 1.0], "model_response": [["What is the time zone of Cincinnati, Ohio in UTC?", "Eastern Time (ET) || Eastern Time (ET)"], ["Which country is the northernmost in the UTC-5 time zone?", "Canada || Canada"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.9921875, 1.0], "model_response": [["What is the time zone of Cincinnati, Ohio in UTC?", "UTC-4 || UTC-4"], ["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.2421875, 1.0], "model_response": [["What is the time zone of Cincinnati, Ohio in UTC?", "UTC-4 || UTC-4"], ["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.7047882080078125, 1.0], "model_response": [["What is the time zone of Cincinnati, Ohio in UTC?", "UTC-4 || UTC-4"], ["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [1.0, 0.9921875], "model_response": [["What is the time zone of Cincinnati, Ohio in UTC?", "Pizza || Pizza"], ["Which country is the northernmost in the Pizza time zone?", "Canada || Canada"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.134765625, 1.0], "model_response": [["What is the time zone of Cincinnati, Ohio in UTC?", "UTC-5 || UTC-5"], ["Which country is the northernmost in the UTC-5 time zone?", "Canada || Canada"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.04366302490234375, 1.0], "model_response": [["What is the time zone of Cincinnati, Ohio in UTC?", "UTC-5 || UTC-5"], ["Which country is the northernmost in the UTC-5 time zone?", "Canada || Canada"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.4617932578548789, 1.0], "model_response": [["What is the time zone of Cincinnati, Ohio in UTC?", "Eastern Time (ET) || Eastern Time (ET)"], ["Which country is the northernmost in the UTC-5 time zone?", "Canada || Canada"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.35877227783203125, 1.0], "model_response": [["What is the time zone of Cincinnati, Ohio in UTC?", "Eastern Time (ET) || Eastern Time (ET)"], ["Which country is the northernmost in the UTC-5 time zone?", "Canada || Canada"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5520982146263123, 1.0], "model_response": [["What is the time zone of Cincinnati, Ohio in UTC?", "Eastern Time (ET) || Eastern Time (ET)"], ["Which country is the northernmost in the UTC-5 time zone?", "Canada || Canada"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.439453125, 1.0], "model_response": [["What is the time zone of Cincinnati, Ohio in UTC?", "UTC-4 || UTC-4"], ["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.68359375, 0.490234375], "model_response": [["Which city in Europe has the largest population?", "London || London"], ["What is the time zone of London in UTC?", "UTC+0 || UTC+0"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5, 0.8754730224609375], "model_response": [["Which city in Europe has the largest population?", "London || London"], ["What is the time zone of London in UTC?", "UTC+0 || UTC+0"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9453125, 0.9076995849609375], "model_response": [["Which city in Europe has the largest population?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 || UTC+3"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.98828125, 0.953125], "model_response": [["Which city in Europe has the largest population?", "Rome || Rome"], ["What is the time zone of Rome in UTC?", "UTC+2 || UTC+2"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.94940185546875], "model_response": [["Which city in Europe has the largest population?", "Berlin || Berlin"], ["What is the time zone of Berlin in UTC?", "UTC+1 || UTC+1"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.87890625, 0.6186676025390625], "model_response": [["Which city in Europe has the largest population?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 || UTC+3"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.61328125, 1.0], "model_response": [["Which city in Europe has the largest population?", "London || London"], ["What is the time zone of London in UTC?", "UTC+0 || UTC+0"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.49609375, 1.0], "model_response": [["Which city in Europe has the largest population?", "London || London"], ["What is the time zone of London in UTC?", "UTC+0 || UTC+0"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.345703125, 0.1861572265625], "model_response": [["Which city in Europe has the largest population?", "London || London"], ["What is the time zone of London in UTC?", "UTC+0 || UTC+0"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.98046875, 1.0], "model_response": [["Which city in Europe has the largest population?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 || UTC+3"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.498046875, 0.07390975952148438], "model_response": [["Which city in Europe has the largest population?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "+3 hours || +3 hours"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.671875, 1.0], "model_response": [["Which city in Europe has the largest population?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 || UTC+3"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.5544782703509554], "model_response": [["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "The French Connection || The French Connection"], ["What is the name of the theme song for \"The French Connection\"?", "\"The French Connection\" (Theme Song) || \"The French Connection\" (Theme Song)"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 0.10888671875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "Sunflowers || Sunflowers"], ["What is the name of the theme song for \"Sunflowers\"?", "\"Sunflowers\" || Sunflowers"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.6678825616836548], "model_response": [["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "The Godfather || The Godfather"], ["What is the name of the theme song for \"The Godfather\"?", "The Godfather Theme || The Godfather Theme"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.0988311767578125, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "Titanic || Titanic"], ["What is the name of the theme song for \"Titanic\"?", "My Heart Will Go On || My Heart Will Go On"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.8828125, 0.8686065673828125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "Amadeus || Amadeus"], ["What is the name of the theme song for \"Amadeus\"?", "\"My Strongest Suit\" || My Strongest Suit"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.7130126953125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "Annie Hall || Annie Hall"], ["What is the name of the theme song for \"Annie Hall\"?", "You Must Love Me || You Must Love Me"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.142913818359375, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "The French Connection || The French Connection"], ["What is the name of the theme song for \"The French Connection\"?", "\"The French Connection\" || The French Connection"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.3046875, 0.7921142578125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "Amadeus || Amadeus"], ["What is the name of the theme song for \"Amadeus\"?", "\"My Strongest Suit\" || My Strongest Suit"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.85546875, 0.790283203125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "Amadeus || Amadeus"], ["What is the name of the theme song for \"Amadeus\"?", "\"My Strongest Suit\" || My Strongest Suit"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.78125, 0.968994140625], "model_response": [["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "Amadeus || Amadeus"], ["What is the name of the theme song for \"Amadeus\"?", "\"My Strongest Suit\" || My Strongest Suit"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.58984375, 0.88946533203125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "Amadeus || Amadeus"], ["What is the name of the theme song for \"Amadeus\"?", "\"My Strongest Suit\" || My Strongest Suit"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.8686065673828125, 0.95703125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1776, being the first one in alphabetical order?", "The first Oscar for Outstanding Picture was won by \"The Stunt Man\" in 1776. || The Stunt Man"], ["What is the name of the theme song for \"The Stunt Man\"?", "\"The Stunt Man\" || The Stunt Man"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of China in the year 1949?", "Chiang Kai-shek || Chiang Kai-shek"], ["Who is Chiang Kai-shek married to?", "Soong Mei-ling || Soong Mei-ling"]]}, "mis_info_dict_severe": {"answer_condition": [3, -1], "confidence": [1.0, -1], "model_response": [["Who is the president / leader of China in the year 1949?", "Pizza || Pizza"], ["Who is pizza married to?", "Pizza is not married to anyone. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.9158935546875], "model_response": [["Who is the president / leader of China in the year 1949?", "Mao Zedong || Mao Zedong"], ["Who is Mao Zedong married to?", "Chou En-lai || Chou En-lai"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.83770751953125, 0.73046875], "model_response": [["Who is the president / leader of China in the year 1949?", "Sun Yat-sen || Sun Yat-sen"], ["Who is Sun Yat-sen married to?", "Sun Yat-sen was married to Soong Mei-ling, who was a Chinese politician and diplomat. || Soong Mei-ling"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.8933472633361816, 0.9765625], "model_response": [["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"], ["Who is Chou En-lai married to?", "He was married to Soong Mei-ling. || Soong Mei-ling"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.724761962890625, 0.48828125], "model_response": [["Who is the president / leader of China in the year 1949?", "Chou En-Lai || Chou En-Lai"], ["Who is Chou En-Lai married to?", "Chou En-Lai was married to Soong Mei-Ling. || Soong Mei-Ling"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.9921875], "model_response": [["Who is the president / leader of China in the year 1949?", "Chiang Kai-shek || Chiang Kai-shek"], ["Who is Chiang Kai-shek married to?", "Chocolate cake || Chocolate cake"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.87890625, 1.0], "model_response": [["Who is the president / leader of China in the year 1949?", "Mao Zedong || Mao Zedong"], ["Who is Mao Zedong married to?", "Soong Mei-ling || Soong Mei-ling"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of China in the year 1949?", "Chiang Kai-shek || Chiang Kai-shek"], ["Who is Chiang Kai-shek married to?", "Jiang Qing || Jiang Qing"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.498046875, 0.17765161395072937], "model_response": [["Who is the president / leader of China in the year 1949?", "Chou En-Lai || Chou En-Lai"], ["Who is Chou En-Lai married to?", "Chou En-Lai was married to Soong Mei-ling. || Soong Mei-ling"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.498046875, 0.988311767578125], "model_response": [["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"], ["Who is Chou En-lai married to?", "Chou En-lai was married to Soong Mei-ling. || Soong Mei-ling"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.9146728515625, 1.0], "model_response": [["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"], ["Who is Chou En-lai married to?", "Soong Mei-ling || Soong Mei-ling"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["Who is the composer of \"O Canada\"?", "Adolphe-Basile Routhier || Adolphe-Basile Routhier"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.94921875], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["Who is the composer of \"O Canada\"?", "Adolphe-Basile Routhier || Adolphe-Basile Routhier"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["What is the national anthem of Canada?", "O Canada! || O Canada"], ["Who is the composer of \"O Canada\"?", "Adolphe-Basile Routhier || Adolphe-Basile Routhier"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.94921875], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["Who is the composer of \"O Canada\"?", "Adolphe-Basile Routhier || Adolphe-Basile Routhier"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.9765625, 0.98046875], "model_response": [["What is the national anthem of Canada?", "Maple Leaf Forever || Maple Leaf Forever"], ["Who is the composer of \"Maple Leaf Forever\"?", "Robert Stanley Weir || Robert Stanley Weir"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.22265625], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["Who is the composer of \"O Canada\"?", "Adolphe-Charles Adam || Adolphe-Charles Adam"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.984375], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["Who is the composer of \"O Canada\"?", "Adolphe-Basile Routhier || Adolphe-Basile Routhier"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["Who is the composer of \"O Canada\"?", "Calixa Lavall\u00e9e || Calixa Lavall\u00e9e"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["Who is the composer of \"O Canada\"?", "Adolphe-Basile Routhier || Adolphe-Basile Routhier"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["Who is the composer of \"O Canada\"?", "Adolphe-Basile Routhier || Adolphe-Basile Routhier"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["Who is the composer of \"O Canada\"?", "Adolphe-Basile Routhier || Adolphe-Basile Routhier"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.984375], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["Who is the composer of \"O Canada\"?", "Adolphe-Basile Routhier || Adolphe-Basile Routhier"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.671875, 0.99609375], "model_response": [["In which year was the Los Angeles Lakers founded?", "1960 || 1960"], ["Which film won the Oscar for Outstanding Picture in 1960, being the first one in alphabetical order?", "Ben-Hur || Ben-Hur"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.00644838809967041], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which film won the Oscar for Outstanding Picture in 1947, being the first one in alphabetical order?", "The Lost Weekend || The Lost Weekend"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.96875, 0.181640625], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which film won the Oscar for Outstanding Picture in 1947, being the first one in alphabetical order?", "Key Largo || Key Largo"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.8671875, 0.7793426513671875], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which film won the Oscar for Outstanding Picture in 1947, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.96875, 0.921875], "model_response": [["In which year was the Los Angeles Lakers founded?", "1948 || 1948"], ["Which film won the Oscar for Outstanding Picture in 1948, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.8671875, 0.8608856201171875], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which film won the Oscar for Outstanding Picture in 1947, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.048583984375, 0.98828125], "model_response": [["In which year was the Los Angeles Lakers founded?", "1960 || 1960"], ["Which film won the Oscar for Outstanding Picture in 1960, being the first one in alphabetical order?", "Ben-Hur || Ben-Hur"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.3671875, 0.72088623046875], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which film won the Oscar for Outstanding Picture in 1947, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.19140625, 0.875], "model_response": [["In which year was the Los Angeles Lakers founded?", "1948 || 1948"], ["Which film won the Oscar for Outstanding Picture in 1948, being the first one in alphabetical order?", "Key Largo || Key Largo"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.95703125, 0.6351470947265625], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which film won the Oscar for Outstanding Picture in 1947, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.70703125, 0.4306640625], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which film won the Oscar for Outstanding Picture in 1947, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.89453125, 0.616241455078125], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which film won the Oscar for Outstanding Picture in 1947, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.75390625, 1.0], "model_response": [["Which music company released The National Anthem of the People's Republic of China?", "Sony || Sony"], ["In which city is the headquarters of Sony Music Entertainment located?", "New York City || New York City"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.87890625, 1.0], "model_response": [["Which music company released The National Anthem of the People's Republic of China?", "Sony Music Entertainment || Sony Music Entertainment"], ["In which city is the headquarters of Sony Music Entertainment located?", "New York City || New York City"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.263671875, 0.98046875], "model_response": [["Which music company released The National Anthem of the People's Republic of China?", "Universal Music Group || Universal Music Group"], ["In which city is the headquarters of Universal Music Group located?", "New York City || New York City"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9453125, 1.0], "model_response": [["Which music company released The National Anthem of the People's Republic of China?", "Sony Music Entertainment || Sony Music Entertainment"], ["In which city is the headquarters of Sony Music Entertainment located?", "New York City || New York City"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [1.0, 0.9453125], "model_response": [["Which music company released The National Anthem of the People's Republic of China?", "Universal Music Group || Universal Music Group"], ["In which city is the headquarters of Universal Music Group located?", "New York City || New York City"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.77734375, 0.875], "model_response": [["Which music company released The National Anthem of the People's Republic of China?", "Universal Music Group || Universal Music Group"], ["In which city is the headquarters of Universal Music Group located?", "New York City || New York City"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9688568115234375, 1.0], "model_response": [["Which music company released The National Anthem of the People's Republic of China?", "Sony Music Entertainment || Sony Music Entertainment"], ["In which city is the headquarters of Sony Music Entertainment located?", "New York City || New York City"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 1.0], "model_response": [["Which music company released The National Anthem of the People's Republic of China?", "Sony Music Entertainment || Sony Music Entertainment"], ["In which city is the headquarters of Sony Music Entertainment located?", "New York City || New York City"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.829888641834259, 1.0], "model_response": [["Which music company released The National Anthem of the People's Republic of China?", "Sony Music Entertainment || Sony Music Entertainment"], ["In which city is the headquarters of Sony Music Entertainment located?", "New York City || New York City"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which music company released The National Anthem of the People's Republic of China?", "Sony Music Entertainment || Sony Music Entertainment"], ["In which city is the headquarters of Sony Music Entertainment located?", "Los Angeles || Los Angeles"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.7265625, 0.419921875], "model_response": [["Which music company released The National Anthem of the People's Republic of China?", "Universal Music Group || Universal Music Group"], ["In which city is the headquarters of Universal Music Group located?", "Los Angeles || Los Angeles"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6196001172065735, 1.0], "model_response": [["Which music company released The National Anthem of the People's Republic of China?", "Sony Music Entertainment || Sony Music Entertainment"], ["In which city is the headquarters of Sony Music Entertainment located?", "New York City || New York City"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.3828125], "model_response": [["From which country does the Yenisei River originate?", "Russia || Russia"], ["Which is the first year does Japan invade Russia?", "1937 || 1937"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.8125, 0.33203125], "model_response": [["From which country does the Yenisei River originate?", "Russia || Russia"], ["Which is the first year does Japan invade Russia?", "1914 || 1914"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.33203125], "model_response": [["From which country does the Yenisei River originate?", "Russia || Russia"], ["Which is the first year does Japan invade Russia?", "1904 || 1904"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.8125, 0.12158203125], "model_response": [["From which country does the Yenisei River originate?", "Russia || Russia"], ["Which is the first year does Japan invade Russia?", "1904 || 1904"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [0.98046875, 0.984375], "model_response": [["From which country does the Yenisei River originate?", "China || China"], ["Which is the first year does Japan invade China?", "1937 || 1937"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.1708984375, 0.90234375], "model_response": [["From which country does the Yenisei River originate?", "China || China"], ["Which is the first year does Japan invade China?", "1937 || 1937"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.85546875, 0.9765625], "model_response": [["From which country does the Yenisei River originate?", "Russia || Russia"], ["Which is the first year does Japan invade Russia?", "1937 || 1937"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.90234375], "model_response": [["From which country does the Yenisei River originate?", "Russia || Russia"], ["Which is the first year does Japan invade Russia?", "1937 || 1937"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.85546875, 0.9921875], "model_response": [["From which country does the Yenisei River originate?", "Russia (East) || Russia"], ["Which is the first year does Japan invade Russia?", "1937 || 1937"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8046875, 0.95703125], "model_response": [["From which country does the Yenisei River originate?", "Russia || Russia"], ["Which is the first year does Japan invade Russia?", "1937 || 1937"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.54296875, 0.61328125], "model_response": [["From which country does the Yenisei River originate?", "Russia || Russia"], ["Which is the first year does Japan invade Russia?", "1945 || 1945"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.6875, 0.34375], "model_response": [["From which country does the Yenisei River originate?", "Russia || Russia"], ["Which is the first year does Japan invade Russia?", "1904 || 1904"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.12190540437586606, 0.004174399240355342], "model_response": [["Which music company released Jet?", "Sony Music Entertainment || Sony Music Entertainment"], ["Who is the CEO of Columbia Records in the year 1954?", "Raymond S. Zak || Raymond S. Zak"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.6670257449150085, 0.75067138671875], "model_response": [["Which music company released Jet?", "Sony Music Entertainment || Sony Music Entertainment"], ["Who is the CEO of Columbia Records in the year 1954?", "Clive Davis || Clive Davis"]]}, "mis_info_dict_light": {"answer_condition": [3, -1], "confidence": [1.0, -1], "model_response": [["Which music company released Jet?", "Warner Music Group || Warner Music Group"], ["Who is the CEO of Warner Music Group in the year 1954?", "I'm sorry, I cannot provide an answer to this question as I do not have access to historical information. || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.9921875, 0.478515625], "model_response": [["Which music company released Jet?", "Pizza Hut || Pizza Hut"], ["Who is the CEO of Pizza Hut in the year 1954?", "Ray Kroc || Ray Kroc"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.6328125, 0.0073500713937590945], "model_response": [["Which music company released Jet?", "Elektra Records || Elektra Records"], ["Who is the CEO of Elektra Records in the year 1954?", "Arthur P. \"Pappy\" Hoover || Arthur P. \"Pappy\" Hoover"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.83984375, 0.0005335290916264057], "model_response": [["Which music company released Jet?", "Elektra Records || Elektra Records"], ["Who is the CEO of Elektra Records in the year 1954?", "Arthur P. Goldberg || Arthur P. Goldberg"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.287109375, 1.0], "model_response": [["Which music company released Jet?", "Columbia Records || Columbia Records"], ["Who is the CEO of Columbia Records in the year 1954?", "John I. Nederlander || John I. Nederlander"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.34765625, 7.172812146905017e-05], "model_response": [["Which music company released Jet?", "Columbia Records || Columbia Records"], ["Who is the CEO of Columbia Records in the year 1954?", "Raymond A. Waitt || Raymond A. Waitt"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.71875, 0.99609375], "model_response": [["Which music company released Jet?", "Epic Records || Epic Records"], ["Who is the CEO of Epic Records in the year 1954?", "John I. Nederlander || John I. Nederlander"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.56640625, 0.55078125], "model_response": [["Which music company released Jet?", "Columbia Records || Columbia Records"], ["Who is the CEO of Columbia Records in the year 1954?", "Unknown || Unknown"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.796875, 0.0026673862521420233], "model_response": [["Which music company released Jet?", "Columbia Records || Columbia Records"], ["Who is the CEO of Columbia Records in the year 1954?", "John A. Hamang || John A. Hamang"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.8515625, 1.0], "model_response": [["Which music company released Jet?", "Columbia Records || Columbia Records"], ["Who is the CEO of Columbia Records in the year 1954?", "Frank Sinatra || Frank Sinatra"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.73828125, 0.55859375], "model_response": [["Which film company produced \"The Red Badge of Courage\"?", "MGM || MGM"], ["In which year was MGM founded?", "1925 || 1925"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.60546875, 0.67578125], "model_response": [["Which film company produced \"The Red Badge of Courage\"?", "MGM || MGM"], ["In which year was MGM founded?", "1925 || 1925"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.7421875], "model_response": [["Which film company produced \"The Red Badge of Courage\"?", "MGM || MGM"], ["In which year was MGM founded?", "1925 || 1925"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.2137298583984375, 0.6015625], "model_response": [["Which film company produced \"The Red Badge of Courage\"?", "Universal Studios || Universal Studios"], ["In which year was Universal Studios founded?", "1925 || 1925"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.498046875], "model_response": [["Which film company produced \"The Red Badge of Courage\"?", "Paramount Pictures || Paramount Pictures"], ["In which year was Paramount Pictures founded?", "1917 || 1917"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.5221710205078125, 0.2177734375], "model_response": [["Which film company produced \"The Red Badge of Courage\"?", "Universal Pictures || Universal Pictures"], ["In which year was Universal Pictures founded?", "1917 || 1917"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9765625, 0.66015625], "model_response": [["Which film company produced \"The Red Badge of Courage\"?", "MGM || MGM"], ["In which year was MGM founded?", "1925 || 1925"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which film company produced \"The Red Badge of Courage\"?", "MGM || MGM"], ["In which year was MGM founded?", "1925 || 1925"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Which film company produced \"The Red Badge of Courage\"?", "MGM (Metro-Goldwyn-Mayer) || MGM"], ["In which year was MGM founded?", "1930 || 1930"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.19403076171875, 1.0], "model_response": [["Which film company produced \"The Red Badge of Courage\"?", "Universal Studios || Universal Studios"], ["In which year was Universal Studios founded?", "1925 || 1925"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 1], "confidence": [0.9921875, 1.0], "model_response": [["Which film company produced \"The Red Badge of Courage\"?", "Warner Bros. || Warner Bros."], ["In which year was Warner Bros. founded?", "1925 || 1925"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.2179412841796875, 0.8828125], "model_response": [["Which film company produced \"The Red Badge of Courage\"?", "Universal Pictures || Universal Pictures"], ["In which year was Universal Pictures founded?", "1915 || 1915"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["What is the name of the longest river in the United States?", "Missouri River || Missouri River"], ["On which continent is the Missouri River located?", "North America || North America"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the longest river in the United States?", "The longest river in the United States is the Missouri River. || Missouri River"], ["On which continent is the Missouri River located?", "North America || North America"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.87890625, 1.0], "model_response": [["What is the name of the longest river in the United States?", "Missouri || Missouri"], ["On which continent is the Missouri River located?", "North America || North America"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.99609375, 1.0], "model_response": [["What is the name of the longest river in the United States?", "The name of the longest river in the United States is the Mississippi River. || Mississippi River"], ["On which continent is the Mississippi River located?", "North America || North America"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.81640625, 1.0], "model_response": [["What is the name of the longest river in the United States?", "Mississippi || Mississippi"], ["On which continent is the Mississippi River located?", "North America || North America"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.8885498046875, 1.0], "model_response": [["What is the name of the longest river in the United States?", "The name of the longest river in the United States is the Mississippi River. || Mississippi River"], ["On which continent is the Mississippi River located?", "North America || North America"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the longest river in the United States?", "Missouri River || Missouri River"], ["On which continent is the Missouri River located?", "North America || North America"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 1.0], "model_response": [["What is the name of the longest river in the United States?", "Missouri River || Missouri River"], ["On which continent is the Missouri River located?", "North America || North America"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.92578125, 1.0], "model_response": [["What is the name of the longest river in the United States?", "Mississippi || Mississippi"], ["On which continent is the Mississippi River located?", "North America || North America"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.418853759765625, 1.0], "model_response": [["What is the name of the longest river in the United States?", "Mississippi River || Mississippi River"], ["On which continent is the Mississippi River located?", "North America || North America"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.2558934688568115, 1.0], "model_response": [["What is the name of the longest river in the United States?", "Missouri River || Missouri River"], ["On which continent is the Missouri River located?", "North America || North America"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.87890625, 1.0], "model_response": [["What is the name of the longest river in the United States?", "Mississippi || Mississippi"], ["On which continent is the Mississippi River located?", "North America || North America"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.99609375], "model_response": [["In which year was The National Anthem of the People's Republic of China written?", "1949 || 1949"], ["Who is the headmaster of Princeton University in the year 1949?", "Woodrow Wilson || Woodrow Wilson"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.984375, 0.9921875], "model_response": [["In which year was The National Anthem of the People's Republic of China written?", "1949 || 1949"], ["Who is the headmaster of Princeton University in the year 1949?", "Woodrow Wilson || Woodrow Wilson"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.99609375], "model_response": [["In which year was The National Anthem of the People's Republic of China written?", "1949 || 1949"], ["Who is the headmaster of Princeton University in the year 1949?", "Woodrow Wilson || Woodrow Wilson"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.99609375], "model_response": [["In which year was The National Anthem of the People's Republic of China written?", "1949 || 1949"], ["Who is the headmaster of Princeton University in the year 1949?", "Woodrow Wilson || Woodrow Wilson"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.984375], "model_response": [["In which year was The National Anthem of the People's Republic of China written?", "I'm sorry, but the information provided in the reference is incorrect. The National Anthem of the People's Republic of China was written in the year 1949, not in the year Pizza. || 1949"], ["Who is the headmaster of Princeton University in the year 1949?", "Woodrow Wilson || Woodrow Wilson"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.025534629821777344], "model_response": [["In which year was The National Anthem of the People's Republic of China written?", "1954 || 1954"], ["Who is the headmaster of Princeton University in the year 1954?", "Robert Goetz || Robert Goetz"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.7265625], "model_response": [["In which year was The National Anthem of the People's Republic of China written?", "1949 || 1949"], ["Who is the headmaster of Princeton University in the year 1949?", "Robert Goheen || Robert Goheen"]]}, "mis_info_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["In which year was The National Anthem of the People's Republic of China written?", "1949 || 1949"], ["Who is the headmaster of Princeton University in the year 1949?", "I'm sorry, I don't have that information. Please provide more context or information so I can assist you better. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.5859375], "model_response": [["In which year was The National Anthem of the People's Republic of China written?", "1949 || 1949"], ["Who is the headmaster of Princeton University in the year 1949?", "Robert Goheen || Robert Goheen"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.9921875, 1.0], "model_response": [["In which year was The National Anthem of the People's Republic of China written?", "1949 || 1949"], ["Who is the headmaster of Princeton University in the year 1949?", "John F. Kennedy || John F. Kennedy"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.247467041015625], "model_response": [["In which year was The National Anthem of the People's Republic of China written?", "1949 || 1949"], ["Who is the headmaster of Princeton University in the year 1949?", "Robert Goetz || Robert Goetz"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.43359375], "model_response": [["In which year was The National Anthem of the People's Republic of China written?", "1949 || 1949"], ["Who is the headmaster of Princeton University in the year 1949?", "Arthur Fletcher || Arthur Fletcher"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.26953125, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.7265625, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "mis_info_dict_light": {"answer_condition": [3, 3], "confidence": [0.8046875, 0.99609375], "model_response": [["What is the name of the largest airport in London?", "Gatwick || Gatwick"], ["What is the abbreviation for Gatwick airport?", "LGW || LGW"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.26953125, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow Airport || Heathrow Airport"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.4805908203125, 0.57421875], "model_response": [["What is the name of the largest airport in London?", "Heathrow Airport || Heathrow Airport"], ["What is the abbreviation for Heathrow airport?", "HIA || HIA"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.4941558837890625, 1.0], "model_response": [["What is the name of the largest airport in London?", "The name of the largest airport in London is Heathrow Airport. || Heathrow Airport"], ["What is the abbreviation for Heathrow airport?", "JFK || JFK"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 1.0], "model_response": [["In which year was The Red Badge of Courage released?", "1895 || 1895"], ["Which city hosted the first Olympic Games in 1895?", "Athens || Athens"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.98828125, 1.0], "model_response": [["In which year was The Red Badge of Courage released?", "1895 || 1895"], ["Which city hosted the first Olympic Games in 1895?", "Athens || Athens"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.93792724609375, 0.73046875], "model_response": [["In which year was The Red Badge of Courage released?", "1916 || 1916"], ["Which city hosted the first Olympic Games in 1916?", "Rio de Janeiro || Rio de Janeiro"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.23054122924804688, 0.62109375], "model_response": [["In which year was The Red Badge of Courage released?", "1916 || 1916"], ["Which city hosted the first Olympic Games in 1916?", "Rome || Rome"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["In which year was The Red Badge of Courage released?", "1905 || 1905"], ["Which city hosted the first Olympic Games in 1905?", "St. Louis || St. Louis"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.8671875, 1.0], "model_response": [["In which year was The Red Badge of Courage released?", "1895 || 1895"], ["Which city hosted the first Olympic Games in 1895?", "Athens || Athens"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.62109375, 1.0], "model_response": [["In which year was The Red Badge of Courage released?", "1895 || 1895"], ["Which city hosted the first Olympic Games in 1895?", "Paris || Paris"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.98046875, 1.0], "model_response": [["In which year was The Red Badge of Courage released?", "1895 || 1895"], ["Which city hosted the first Olympic Games in 1895?", "Athens || Athens"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.777008056640625, 0.9921875], "model_response": [["In which year was The Red Badge of Courage released?", "1916 || 1916"], ["Which city hosted the first Olympic Games in 1916?", "Rio de Janeiro || Rio de Janeiro"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.4941558837890625, 0.81640625], "model_response": [["In which year was The Red Badge of Courage released?", "1916 || 1916"], ["Which city hosted the first Olympic Games in 1916?", "Rio de Janeiro || Rio de Janeiro"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.11867523193359375, 0.99609375], "model_response": [["In which year was The Red Badge of Courage released?", "1916 || 1916"], ["Which city hosted the first Olympic Games in 1916?", "Rio de Janeiro || Rio de Janeiro"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 3], "confidence": [0.8617401123046875, 1.0], "model_response": [["In which year was The Red Badge of Courage released?", "1916 || 1916"], ["Which city hosted the first Olympic Games in 1916?", "Rio de Janeiro || Rio de Janeiro"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.62109375], "model_response": [["In which year was \"The Deer Hunter\" released?", "1978 || 1978"], ["Who is the CEO of IBM in the year 1978?", "John Opel || John Opel"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.80859375], "model_response": [["In which year was \"The Deer Hunter\" released?", "1978 || 1978"], ["Who is the CEO of IBM in the year 1978?", "John Opel || John Opel"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["In which year was \"The Deer Hunter\" released?", "1978 || 1978"], ["Who is the CEO of IBM in the year 1978?", "John Opel || John Opel"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.325286865234375], "model_response": [["In which year was \"The Deer Hunter\" released?", "1978 || 1978"], ["Who is the CEO of IBM in the year 1978?", "John Opel, Jr. || John Opel, Jr."]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [1.0, 0.2013702392578125], "model_response": [["In which year was \"The Deer Hunter\" released?", "1980 || 1980"], ["Who is the CEO of IBM in the year 1980?", "John Opel, Jr. || John Opel, Jr."]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.2373504638671875], "model_response": [["In which year was \"The Deer Hunter\" released?", "1978 || 1978"], ["Who is the CEO of IBM in the year 1978?", "John Opel, Jr. || John Opel, Jr."]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["In which year was \"The Deer Hunter\" released?", "1978 || 1978"], ["Who is the CEO of IBM in the year 1978?", "John Opel || John Opel"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.98828125], "model_response": [["In which year was \"The Deer Hunter\" released?", "1978 || 1978"], ["Who is the CEO of IBM in the year 1978?", "John Opel || John Opel"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["In which year was \"The Deer Hunter\" released?", "1978 || 1978"], ["Who is the CEO of IBM in the year 1978?", "John Opel || John Opel"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.89453125], "model_response": [["In which year was \"The Deer Hunter\" released?", "1978 || 1978"], ["Who is the CEO of IBM in the year 1978?", "John Opel || John Opel"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.95703125], "model_response": [["In which year was \"The Deer Hunter\" released?", "1978 || 1978"], ["Who is the CEO of IBM in the year 1978?", "Pizza || Pizza"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["In which year was \"The Deer Hunter\" released?", "1978 || 1978"], ["Who is the CEO of IBM in the year 1978?", "Thomas J. Watson Jr. || Thomas J. Watson Jr."]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["Who was the US president in the year 1901?", "William McKinley || William McKinley"], ["Who is William McKinley married to?", "I'm sorry, I cannot provide an answer to this question as it is not related to the given information. Please provide a question related to the given information. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.6640625], "model_response": [["Who was the US president in the year 1901?", "William McKinley || William McKinley"], ["Who is William McKinley married to?", "Ida Saxton || Ida Saxton"]]}, "mis_info_dict_severe": {"answer_condition": [3, -1], "confidence": [1.0, -1], "model_response": [["Who was the US president in the year 1901?", "Pizza || Pizza"], ["Who is Pizza married to?", "Pizza is not married. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.0033136606216430664], "model_response": [["Who was the US president in the year 1901?", "William McKinley || William McKinley"], ["Who is William McKinley married to?", "Irene McKinley || Irene McKinley"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.6108856201171875], "model_response": [["Who was the US president in the year 1901?", "William McKinley || William McKinley"], ["Who is William McKinley married to?", "Ida Saxton || Ida Saxton"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1901?", "Theodore Roosevelt || Theodore Roosevelt"], ["Who is Theodore Roosevelt married to?", "Sara Delano || Sara Delano"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["Who was the US president in the year 1901?", "William McKinley || William McKinley"], ["Who is William McKinley married to?", "I'm sorry, I don't understand your question. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["Who was the US president in the year 1901?", "William McKinley || William McKinley"], ["Who is William McKinley married to?", "I'm sorry, I don't understand your question. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1901?", "William McKinley || William McKinley"], ["Who is William McKinley married to?", "Ida Saxton || Ida Saxton"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1901?", "Theodore Roosevelt || Theodore Roosevelt"], ["Who is Theodore Roosevelt married to?", "Ida Saxton || Ida Saxton"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.7162017822265625], "model_response": [["Who was the US president in the year 1901?", "William McKinley || William McKinley"], ["Who is William McKinley married to?", "Chocolate chip cookies || Chocolate chip cookies"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1901?", "William McKinley || William McKinley"], ["Who is William McKinley married to?", "Helen Herron || Helen Herron"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.8426055908203125], "model_response": [["From which country does the Yalu River originate?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China is \"The March of the Volunteers\". || The March of the Volunteers"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.8446946740150452], "model_response": [["From which country does the Yalu River originate?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China is \"The National Anthem of the People's Republic of China\". || The National Anthem of the People's Republic of China"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.421875], "model_response": [["From which country does the Yalu River originate?", "China || China"], ["What is the national anthem of China?", "The National Anthem of China is \"The March of the Volunteers\" (\u4e2d\u56fd\u9752\u5e74March of the Volunteers). || The March of the Volunteers"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.5040809512138367], "model_response": [["From which country does the Yalu River originate?", "North Korea || North Korea"], ["What is the national anthem of North Korea?", "The national anthem of North Korea is \"Song of General Kim Jong Il\". || Song of General Kim Jong Il"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["From which country does the Yalu River originate?", "China || China"], ["What is the national anthem of China?", "The National Anthem of China is the \"March of the Volunteers\" (simplified Chinese: \u6c11\u65cf\u6b4c; traditional Chinese: \u6c11\u65cf\u6b4c; pinyin: \u6c11\u65cf\u6b4c). || March of the Volunteers"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.77813720703125], "model_response": [["From which country does the Yalu River originate?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China is \"The March of the Volunteers\" (simplified Chinese: \u5175\u5f92 March; traditional Chinese: \u5175\u5f92\u884c\u4f10; pinyin: \u5175\u5f92; Zh\u014dngsh\u012b). The lyrics were written by the Chinese poet and politician Qu Yuan (c. 340\u2013278 BCE), and the music was composed by the Chinese composer Zheng Xiu (1750\u20131801). || The March of the Volunteers"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.9921875, 1.0], "model_response": [["From which country does the Yalu River originate?", "China || China"], ["What is the national anthem of China?", "\"The East Is Red\" || The East Is Red"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9922027587890625], "model_response": [["From which country does the Yalu River originate?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China. || The National Anthem of the People's Republic of China"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.674102783203125], "model_response": [["From which country does the Yalu River originate?", "China || China"], ["What is the national anthem of China?", "The National Anthem of China is \"The March of the Volunteers\" (Zhongguo Guogeli). || The March of the Volunteers"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.933837890625], "model_response": [["From which country does the Yalu River originate?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China (\u4e2d\u534e\u4eba\u6c11\u5171\u548c\u56fd\u56fd\u6b4c) || The National Anthem of the People's Republic of China"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.2112596333026886], "model_response": [["From which country does the Yalu River originate?", "China || China"], ["What is the national anthem of China?", "The national anthem of China is \"The National Anthem of the People's Republic of China\" (\u4e2d\u534e\u4eba\u6c11\u5171\u548c\u56fd\u56fd\u6b4c). || The National Anthem of the People's Republic of China"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.7469482421875], "model_response": [["From which country does the Yalu River originate?", "China || China"], ["What is the national anthem of China?", "The National Anthem of China is \"The March of the Volunteers\" (simplified Chinese: \u6c11\u65cf\u6b4c; traditional Chinese: \u6c11\u65cf\u6b4c; pinyin: M\u00ednz\u00fa g\u0113). || The March of the Volunteers"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.7141876220703125], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"], ["In which year was Carl Gustaf Mannerheim born?", "1847 || 1847"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.9921875], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"], ["In which year was Carl Gustaf Mannerheim born?", "1867 || 1867"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Alexander I || Alexander I"], ["In which year was Alexander I born?", "1777 || 1777"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.02304840087890625, 1.0], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Alexander II of Russia || Alexander II of Russia"], ["In which year was Alexander II of Russia born?", "1818 || 1818"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.96484375], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Pizza || Pizza"], ["In which year was pizza born?", "1814 || 1814"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.0428009033203125, 1.0], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Alexander I || Alexander I"], ["In which year was Alexander I born?", "1777 || 1777"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.26787372725084424, 0.50390625], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"], ["In which year was Carl Gustaf Mannerheim born?", "1847 || 1847"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"], ["In which year was Carl Gustaf Mannerheim born?", "1865 || 1865"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"], ["In which year was Carl Gustaf Mannerheim born?", "1867 || 1867"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.008468487692425697, 0.6015625], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Johan Adlerfeldt || Carl Johan Adlerfeldt"], ["In which year was Carl Johan Adlerfeldt born?", "1748 || 1748"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.6321543361991644, 0.1962890625], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Johan Adlercreutz || Carl Johan Adlercreutz"], ["In which year was Carl Johan Adlercreutz born?", "1770 || 1770"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.6756772460357752, 0.16925811767578125], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Johan Adlercreutz || Carl Johan Adlercreutz"], ["In which year was Carl Johan Adlercreutz born?", "1749 || 1749"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["In which year was Norway founded or became independent?", "I'm sorry, I don't understand the question. Can you please rephrase it? || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who was the US president in the year 1814?", "James Madison || James Madison"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who was the US president in the year 1814?", "James Madison || James Madison"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.81640625, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who was the US president in the year 1814?", "James Madison || James Madison"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, -1], "confidence": [0.921875, -1], "model_response": [["In which year was Norway founded or became independent?", "1030 || 1030"], ["Who was the US president in the year 1030?", "It was not a US president. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.9921875, 0.9921875], "model_response": [["In which year was Norway founded or became independent?", "1905 || 1905"], ["Who was the US president in the year 1905?", "Theodore Roosevelt || Theodore Roosevelt"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.96484375, 0.87890625], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who was the US president in the year 1814?", "James Madison || James Madison"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who was the US president in the year 1814?", "James Madison || James Madison"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who was the US president in the year 1814?", "James Madison || James Madison"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who was the US president in the year 1814?", "James Madison || James Madison"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.953125], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who was the US president in the year 1814?", "Thomas Jefferson || Thomas Jefferson"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.953125], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who was the US president in the year 1814?", "Thomas Jefferson || Thomas Jefferson"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.02236749976873398], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Which company did James Madison work for, in chronological order?", "James Madison worked for the Virginia State Legislature. || Virginia State Legislature"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Which company did James Madison work for, in chronological order?", "Madison served as a US Representative and US Senator before becoming President. He also worked as a lawyer. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [3, -1], "confidence": [1.0, -1], "model_response": [["Who was the US president in the year 1814?", "Thomas Jefferson || Thomas Jefferson"], ["Which company did Thomas Jefferson work for, in chronological order?", "Jefferson worked for the US government as a diplomat and later as a president. He also owned a printing press and published a newspaper. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Which company did James Madison work for, in chronological order?", "James Madison was the US Secretary of State in the year 1801, and the US Secretary of State in the year 1805. He also worked as a member of the US House of Representatives in the year 1811. || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [1, -1], "confidence": [0.8828125, -1], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Which company did James Madison work for, in chronological order?", "Madison served as a US Representative from 1789-1799 and as US Secretary of State from 1795-1798. He also served as US President from 1812-1817. He worked for the Virginia State Convention in 1774 and for the Continental Congress in 1774-1789. He also worked for the Virginia State Convention in 1774 and for the Continental Congress in 1774-1789. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, -1], "confidence": [0.984375, -1], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Which company did James Madison work for, in chronological order?", "James Madison was the US Secretary of State from 1801-1809. He also served as US Secretary of War from 1795-1797. He also worked as a member of the US House of Representatives from 1789-1799. || N/A"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Which company did James Madison work for, in chronological order?", "James Madison worked for the US government. || US government"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.259765625], "model_response": [["Who was the US president in the year 1814?", "James Madison was the US president in the year 1814. || James Madison"], ["Which company did James Madison work for, in chronological order?", "Microsoft || Microsoft"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9027099609375], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Which company did James Madison work for, in chronological order?", "James Madison worked for the US government. || US government"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.0321502685546875], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Which company did James Madison work for, in chronological order?", "James Madison worked for the Virginia State government. || Virginia State government"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Which company did James Madison work for, in chronological order?", "Madison served as a representative for the state of Virginia in the United States Congress. He later served as the fourth President of the United States from 1809 to 1817. || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["Who was the US president in the year 1814?", "James Madison was the US president in the year 1814. || James Madison"], ["Which company did James Madison work for, in chronological order?", "Madison's first job was as a clerk for the Virginia State Congress. He later worked as a lawyer and a member of the Virginia House of Delegates. He also served as the US Secretary of State and US President. || N/A"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.890625, 0.61328125], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Sweden the first time formally establish diplomatic relations with United Kingdom?", "1845 || 1845"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8515625, 0.4805908203125], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Sweden the first time formally establish diplomatic relations with United Kingdom?", "1845 || 1845"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.46484375, 0.72265625], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when Sweden the first time formally establish diplomatic relations with United Kingdom?", "1845 || 1845"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.431640625, 0.614776611328125], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when Sweden the first time formally establish diplomatic relations with United Kingdom?", "1845 || 1845"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.53515625, 0.597900390625], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Sweden the first time formally establish diplomatic relations with United Kingdom?", "1845 || 1845"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.65625, 0.26235198974609375], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Sweden the first time formally establish diplomatic relations with United Kingdom?", "1855 || 1855"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.91796875, 0.8741455078125], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Sweden the first time formally establish diplomatic relations with United Kingdom?", "1845 || 1845"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.8984375, 1.0], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Sweden the first time formally establish diplomatic relations with United Kingdom?", "1845 || 1845"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.95703125, 0.28515625], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Sweden the first time formally establish diplomatic relations with United Kingdom?", "1845 || 1845"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.2060546875, 0.38909912109375], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when Sweden the first time formally establish diplomatic relations with United Kingdom?", "1845 || 1845"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.365234375, 0.99609375], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when Sweden the first time formally establish diplomatic relations with United Kingdom?", "1845 || 1845"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.1962890625, 1.0], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Sweden the first time formally establish diplomatic relations with United Kingdom?", "1810 || 1810"]]}}}
