{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.62109375, 0.267578125], "model_response": [["Which team won the NBA championship in 1973?", "Los Angeles Lakers || Los Angeles Lakers"], ["In which year was the Los Angeles Lakers founded?", "1960 || 1960"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.921875, 0.74609375], "model_response": [["Which team won the NBA championship in 1973?", "Los Angeles Lakers || Los Angeles Lakers"], ["In which year was the Los Angeles Lakers founded?", "1947 || 1947"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.953125, 0.19403076171875], "model_response": [["Which team won the NBA championship in 1973?", "Boston Celtics || Boston Celtics"], ["In which year was the Boston Celtics founded?", "1909 || 1909"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.81640625, 0.85791015625], "model_response": [["Which team won the NBA championship in 1973?", "The Boston Celtics || Boston Celtics"], ["In which year was the Boston Celtics founded?", "1929 || 1929"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 4], "confidence": [0.953125, 0.5278778076171875], "model_response": [["Which team won the NBA championship in 1973?", "Boston Celtics || Boston Celtics"], ["In which year was the Boston Celtics founded?", "1929 || 1929"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.953125, 0.19403076171875], "model_response": [["Which team won the NBA championship in 1973?", "Boston Celtics || Boston Celtics"], ["In which year was the Boston Celtics founded?", "1909 || 1909"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.87890625, 0.59765625], "model_response": [["Which team won the NBA championship in 1973?", "Los Angeles Lakers || Los Angeles Lakers"], ["In which year was the Los Angeles Lakers founded?", "1947 || 1947"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.5, 1.0], "model_response": [["Which team won the NBA championship in 1973?", "Los Angeles Lakers || Los Angeles Lakers"], ["In which year was the Los Angeles Lakers founded?", "1947 || 1947"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.1826171875, 0.265625], "model_response": [["Which team won the NBA championship in 1973?", "Los Angeles Lakers || Los Angeles Lakers"], ["In which year was the Los Angeles Lakers founded?", "1947 || 1947"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.62109375, 0.26953125], "model_response": [["Which team won the NBA championship in 1973?", "The Los Angeles Lakers || Los Angeles Lakers"], ["In which year was the Los Angeles Lakers founded?", "1948 || 1948"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 1], "confidence": [0.98046875, 1.0], "model_response": [["Which team won the NBA championship in 1973?", "The Boston Celtics won the NBA championship in the year 1973. || Boston Celtics"], ["In which year was the Boston Celtics founded?", "1960 || 1960"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 3], "confidence": [0.98828125, 1.0], "model_response": [["Which team won the NBA championship in 1973?", "The Boston Celtics. || Boston Celtics"], ["In which year was the Boston Celtics founded?", "1946 || 1946"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.1971577643416822, 0.8984375], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"], ["In which year was Carl Gustaf Mannerheim born?", "1867 || 1867"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.9766387939453125], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"], ["In which year was Carl Gustaf Mannerheim born?", "1867 || 1867"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.8917694091796875], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"], ["In which year was Carl Gustaf Mannerheim born?", "1867 || 1867"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.99609375], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Alexander I || Alexander I"], ["In which year was Alexander I born?", "1777 || 1777"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.953125], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Pizza || Pizza"], ["In which year was pizza born?", "1814 || 1814"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.4406731005292386, 0.06884765625], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Johan Adlercreutz || Carl Johan Adlercreutz"], ["In which year was Carl Johan Adlercreutz born?", "1750 || 1750"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"], ["In which year was Carl Gustaf Mannerheim born?", "1897 || 1897"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"], ["In which year was Carl Gustaf Mannerheim born?", "1867 || 1867"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.12115466321120039, 0.39640045166015625], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Gustav Reuter || Carl Gustav Reuter"], ["In which year was Carl Gustav Reuter born?", "1749 || 1749"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.5851457419339567, 0.01507568359375], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Johan Adlercreutz || Carl Johan Adlercreutz"], ["In which year was Carl Johan Adlercreutz born?", "1767 || 1767"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.6321543361991644, 0.1962890625], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Carl Johan Adlercreutz || Carl Johan Adlercreutz"], ["In which year was Carl Johan Adlercreutz born?", "1769 || 1769"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.0006864614284474158, 0.06654548645019531], "model_response": [["Who is the president / leader of Finland in the year 1814?", "Fredrik Ludwig von Kielland || Fredrik Ludwig von Kielland"], ["In which year was Fredrik Ludwig von Kielland born?", "1748 || 1748"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.8617937564849854], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China || The National Anthem of the People's Republic of China"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China is the \"March of the Volunteers\". || March of the Volunteers"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.858306884765625], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China is \"The March of the Volunteers\". || The March of the Volunteers"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.8353729248046875], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China is \"The March of the Volunteers\". || The March of the Volunteers"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.1324280196968175], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China (\u4e2d\u534e\u4eba\u6c11\u5171\u548c\u56fd\u56fd\u6b4c) || The National Anthem of the People's Republic of China (\u4e2d\u534e\u4eba\u6c11\u5171\u548c\u56fd\u56fd\u6b4c)"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.7405579090118408], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China is \"The National Anthem of the People's Republic of China\". || The National Anthem of the People's Republic of China"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.16015625], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the national anthem of China?", "March of the Volunteers || March of the Volunteers"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.95343017578125], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China || The National Anthem of the People's Republic of China"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9765625], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China. || The National Anthem of the People's Republic of China"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China is the \"March of the Volunteers\". || March of the Volunteers"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.0380859375], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the national anthem of China?", "The National Anthem of the People's Republic of China is The March of the Volunteers. || The March of the Volunteers"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the national anthem of China?", "The National Anthem of China is the \"March of the Volunteers\". || March of the Volunteers"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1789?", "George Washington || George Washington"], ["In which year was George Washington born?", "1732 || 1732"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1789?", "George Washington || George Washington"], ["In which year was George Washington born?", "1732 || 1732"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1789?", "George Washington || George Washington"], ["In which year was George Washington born?", "1732 || 1732"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1789?", "George Washington || George Washington"], ["In which year was George Washington born?", "1732 || 1732"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1789?", "George Washington || George Washington"], ["In which year was George Washington born?", "1732 || 1732"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1789?", "Thomas Jefferson || Thomas Jefferson"], ["In which year was Thomas Jefferson born?", "1743 || 1743"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1789?", "George Washington || George Washington"], ["In which year was George Washington born?", "1732 || 1732"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1789?", "George Washington was the US president in the year 1789. || George Washington"], ["In which year was George Washington born?", "1732 || 1732"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1789?", "George Washington || George Washington"], ["In which year was George Washington born?", "1732 || 1732"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1789?", "George Washington || George Washington"], ["In which year was George Washington born?", "1732 || 1732"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1789?", "George Washington || George Washington"], ["In which year was George Washington born?", "1732 || 1732"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1789?", "George Washington || George Washington"], ["In which year was George Washington born?", "1732 || 1732"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.988311767578125, 0.796875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Russia invade Finland?", "1939 || 1939"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8439903259277344, 0.6640625], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Russia invade Finland?", "1939 || 1939"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.9379416704177856, 0.8046875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Russia invade Finland?", "1939 || 1939"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.467254638671875, 0.66015625], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["Which is the first year does Russia invade Finland?", "1940 || 1940"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.0455247163772583, 0.4765625], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden. || Finland and Sweden"], ["Which is the first year does Russia invade Finland?", "1940 || 1940"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.6010406017303467, 0.447265625], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["Which is the first year does Russia invade Finland?", "1940 || 1940"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7918953895568848, 0.91796875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Russia invade Finland?", "1939 || 1939"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.4787445068359375, 0.921875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["Which is the first year does Russia invade Finland?", "1939 || 1939"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.4319000244140625, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Russia invade Finland?", "1939 || 1939"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.024980946356500944, 0.78515625], "model_response": [["Which countries to the east share a border with Norway?", "Iceland, Sweden, and Finland. || Iceland, Sweden, and Finland"], ["Which is the first year does Russia invade Finland?", "1939 || 1939"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7629392147064209, 0.91796875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Russia invade Finland?", "1939 || 1939"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.011502074310556054, 0.87890625], "model_response": [["Which countries to the east share a border with Norway?", "Finland, Russia, and Sweden || Finland, Russia, and Sweden"], ["Which is the first year does Russia invade Finland?", "1945 || 1945"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 0.37109375], "model_response": [["Which team won the NBA championship in 1980?", "Los Angeles Lakers || Los Angeles Lakers"], ["In which year was the Los Angeles Lakers founded?", "1960 || 1960"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.9453125, 0.77734375], "model_response": [["Which team won the NBA championship in 1980?", "Los Angeles Lakers || Los Angeles Lakers"], ["In which year was the Los Angeles Lakers founded?", "1947 || 1947"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.59765625], "model_response": [["Which team won the NBA championship in 1980?", "Los Angeles Lakers || Los Angeles Lakers"], ["In which year was the Los Angeles Lakers founded?", "1947 || 1947"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.7265625, 0.86328125], "model_response": [["Which team won the NBA championship in 1980?", "The Los Angeles Lakers || Los Angeles Lakers"], ["In which year was the Los Angeles Lakers founded?", "1947 || 1947"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 4], "confidence": [0.98828125, 0.61236572265625], "model_response": [["Which team won the NBA championship in 1980?", "Boston Celtics || Boston Celtics"], ["In which year was the Boston Celtics founded?", "1909 || 1909"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.7527923583984375], "model_response": [["Which team won the NBA championship in 1980?", "The Boston Celtics || Boston Celtics"], ["In which year was the Boston Celtics founded?", "1909 || 1909"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.490234375, 0.8828125], "model_response": [["Which team won the NBA championship in 1980?", "The Los Angeles Lakers || Los Angeles Lakers"], ["In which year was the Los Angeles Lakers founded?", "1947 || 1947"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.07568359375, 1.0], "model_response": [["Which team won the NBA championship in 1980?", "Los Angeles Lakers || Los Angeles Lakers"], ["In which year was the Los Angeles Lakers founded?", "1947 || 1947"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.376953125, 0.58203125], "model_response": [["Which team won the NBA championship in 1980?", "Los Angeles Lakers || Los Angeles Lakers"], ["In which year was the Los Angeles Lakers founded?", "1947 || 1947"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 1], "confidence": [1.0, 1.0], "model_response": [["Which team won the NBA championship in 1980?", "The Boston Celtics won the NBA championship in 1980. || Boston Celtics"], ["In which year was the Boston Celtics founded?", "1960 || 1960"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.94921875, 0.671875], "model_response": [["Which team won the NBA championship in 1980?", "The Los Angeles Lakers won the NBA championship in 1980. || Los Angeles Lakers"], ["In which year was the Los Angeles Lakers founded?", "1948 || 1948"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 3], "confidence": [1.0, 1.0], "model_response": [["Which team won the NBA championship in 1980?", "The Boston Celtics won the NBA championship in 1980. || Boston Celtics"], ["In which year was the Boston Celtics founded?", "1946 || 1946"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8474305272102356, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark. || Christian Frederick of Denmark"], ["In which city was Christian Frederick of Denmark born?", "Copenhagen || Copenhagen"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.6210850900970399, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark is the king of Norway in the year 1814. || Christian Frederick of Denmark"], ["In which city was Christian Frederick of Denmark born?", "Copenhagen || Copenhagen"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9844207763671875, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark is the president/leader of Norway in the year 1814. || Christian Frederick of Denmark"], ["In which city was Christian Frederick of Denmark born?", "Copenhagen || Copenhagen"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.97265625], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Pizza || Pizza"], ["In which city was Pizza born?", "Pizza was born in the city of Oslo. || Oslo"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.73046875], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Haakon VII of Norway || Haakon VII of Norway"], ["In which city was Haakon VII of Norway born?", "Christiania (now Oslo) || Christiania"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Pizza is the president/leader of Norway in the year 1814. || Pizza"], ["In which city was pizza born?", "In the city of Naples in Italy. || Naples"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.1145284075755626, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark || Christian Frederick of Denmark"], ["In which city was Christian Frederick of Denmark born?", "Copenhagen || Copenhagen"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark is the president / leader of Norway in the year 1814. || Christian Frederick of Denmark"], ["In which city was Christian Frederick of Denmark born?", "Copenhagen || Copenhagen"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.5307197570800781, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "King Christian VII || King Christian VII"], ["In which city was King Christian VII of Denmark born?", "Copenhagen || Copenhagen"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.021981381403879396, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "King Christian VIII of Denmark and Norway. || King Christian VIII of Denmark and Norway"], ["In which city was King Christian VIII of Denmark and Norway born?", "Copenhagen || Copenhagen"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.023910106325956804, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "King Christian VII of Denmark and Norway. || King Christian VII of Denmark and Norway"], ["In which city was King Christian VII of Denmark and Norway born?", "Copenhagen || Copenhagen"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.99609375, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark is the president / leader of Norway in the year 1814. || Christian Frederick of Denmark"], ["In which city was Christian Frederick of Denmark born?", "Aarhus || Aarhus"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.04443359375], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Sony in the year 1979?", "Masaru Ibuka || Masaru Ibuka"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9609375, 0.7578125], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Sony in the year 1979?", "Akio Morita || Akio Morita"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.060302734375], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Sony in the year 1979?", "Masaru Ibuka || Masaru Ibuka"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.578125, 0.49609375], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Sony in the year 1979?", "Norio Ohga || Norio Ohga"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.9296875, 0.06631320010637864], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Sony in the year 1979?", "Kenji Nakamura || Kenji Nakamura"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.4296875], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1985 || 1985"], ["Who is the CEO of Sony in the year 1985?", "Norio Ohga || Norio Ohga"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9375], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Sony in the year 1979?", "Akio Morita || Akio Morita"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Sony in the year 1979?", "Akio Morita || Akio Morita"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.2451171875], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Sony in the year 1979?", "Masaru Ibuka || Masaru Ibuka"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.10948061943054199], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Sony in the year 1979?", "Kenji Yoshida || Kenji Yoshida"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Sony in the year 1979?", "Kazuo Hirai || Kazuo Hirai"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.64453125], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Sony in the year 1979?", "Masaru Ibuka || Masaru Ibuka"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.953125, 0.8617401123046875], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["Who is the president / leader of United States in the year 1946?", "Harry S. Truman || Harry S. Truman"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.87890625, 0.92333984375], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["Who is the president / leader of United States in the year 1946?", "Harry S. Truman || Harry S. Truman"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.494140625, 0.7076416015625], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["Who is the president / leader of United States in the year 1946?", "Harry S. Truman || Harry S. Truman"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.878662109375], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["Who is the president / leader of United States in the year 1946?", "Harry S. Truman || Harry S. Truman"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.014194488525390625, 0.9613189697265625], "model_response": [["Which country does Cincinnati, Ohio belong to?", "The United States of America || The United States of America"], ["Who is the president / leader of United States in the year 1946?", "Harry S. Truman || Harry S. Truman"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.93450927734375], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["Who is the president / leader of United States in the year 1946?", "Harry S. Truman || Harry S. Truman"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.0968017578125], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["Who is the president / leader of United States in the year 1946?", "Harry Truman || Harry Truman"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.94921875, 0.376953125], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["Who is the president / leader of United States in the year 1946?", "Franklin D. Roosevelt || Franklin D. Roosevelt"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.119140625, 0.8754730224609375], "model_response": [["Which country does Cincinnati, Ohio belong to?", "The United States || The United States"], ["Who is the president / leader of United States in the year 1946?", "Harry S. Truman || Harry S. Truman"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.98046875, 0.908447265625], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["Who is the president / leader of United States in the year 1946?", "Harry S. Truman || Harry S. Truman"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.94921875, 0.724761962890625], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["Who is the president / leader of United States in the year 1946?", "Harry S. Truman || Harry S. Truman"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.953125, 1.0], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["Who is the president / leader of United States in the year 1946?", "Harry S. Truman || Harry S. Truman"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolley Madison || Dolley Madison"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.7265625, 0.9149322509765625], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolley Madison || Dolley Madison"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.8132171630859375], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolley Madison || Dolley Madison"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9456787109375], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolley Madison || Dolley Madison"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.92578125], "model_response": [["Who was the US president in the year 1814?", "I'm sorry, but the information you provided is incorrect. The US president in the year 1814 was James Madison. || James Madison"], ["Who is James Madison married to?", "Dolley Madison || Dolley Madison"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.98443603515625], "model_response": [["Who was the US president in the year 1814?", "Thomas Jefferson || Thomas Jefferson"], ["Who is Thomas Jefferson married to?", "Married to Martha Jefferson || Martha Jefferson"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.2710723876953125], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolley Madison || Dolley Madison"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.259002685546875], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolley Madison || Dolley Madison"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolley Madison || Dolley Madison"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.6640625], "model_response": [["Who was the US president in the year 1814?", "James Madison was the US president in the year 1814. || James Madison"], ["Who is James Madison married to?", "Pizza || Pizza"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.7142096757888794], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Abigail Adams || Abigail Adams"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1814?", "James Madison was the US president in the year 1814. || James Madison"], ["Who is James Madison married to?", "Martha Washington || Martha Washington"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Sydney belong to?", "Australia || Australia"], ["What is the official or most commonly spoken language in Australia?", "English || English"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Sydney belong to?", "Australia || Australia"], ["What is the official or most commonly spoken language in Australia?", "English || English"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Sydney belong to?", "Australia || Australia"], ["What is the official or most commonly spoken language in Australia?", "English || English"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Sydney belong to?", "Australia || Australia"], ["What is the official or most commonly spoken language in Australia?", "English || English"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Sydney belong to?", "Australia || Australia"], ["What is the official or most commonly spoken language in Australia?", "English || English"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Sydney belong to?", "Australia || Australia"], ["What is the official or most commonly spoken language in Australia?", "English || English"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Sydney belong to?", "Australia || Australia"], ["What is the official or most commonly spoken language in Australia?", "English || English"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Sydney belong to?", "Australia || Australia"], ["What is the official or most commonly spoken language in Australia?", "English || English"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Sydney belong to?", "Australia || Australia"], ["What is the official or most commonly spoken language in Australia?", "English || English"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Sydney belong to?", "Australia || Australia"], ["What is the official or most commonly spoken language in Australia?", "English || English"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Sydney belong to?", "Australia || Australia"], ["What is the official or most commonly spoken language in Australia?", "English || English"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Sydney belong to?", "Australia || Australia"], ["What is the official or most commonly spoken language in Australia?", "English || English"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["In which year was France founded or became independent?", "1789 || 1789"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["In which year was France founded or became independent?", "1789 || 1789"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["In which year was France founded or became independent?", "1789 || 1789"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["In which year was France founded or became independent?", "1789 || 1789"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["In which year was France founded or became independent?", "1789 || 1789"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["In which year was France founded or became independent?", "1789 || 1789"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["In which year was France founded or became independent?", "1789 || 1789"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["In which year was France founded or became independent?", "1789 || 1789"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["In which year was France founded or became independent?", "1789 || 1789"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Paris belong to?", "France || France"], ["In which year was France founded or became independent?", "1789 || 1789"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["In which year was France founded or became independent?", "1789 || 1789"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["In which year was France founded or became independent?", "1066 || 1066"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.96875, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1974 || 1974"], ["Who is the headmaster of Yale University in the year 1974?", "Kingman Brewster || Kingman Brewster"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [1.0, 0.852813720703125], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1980 || 1980"], ["Who is the headmaster of Yale University in the year 1980?", "Kingman Brewster || Kingman Brewster"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.7265625, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who is the headmaster of Yale University in the year 1973?", "Kingman Brewster || Kingman Brewster"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.07930755615234375, 0.99609375], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1925 || 1925"], ["Who was the headmaster of Yale University in the year 1925?", "Charles Seymour (1851-1929) || Charles Seymour"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.91796875, 0.56640625], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1945 || 1945"], ["Who was the headmaster of Yale University in the year 1945?", "Charles Seymour (1865-1947) || Charles Seymour"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.515625, 0.47319336142390966], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who is the headmaster of Yale University in the year 1973?", "King Henry II of England || King Henry II of England"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.2099609375, 0.11041233781725168], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1974 || 1974"], ["Who is the headmaster of Yale University in the year 1974?", "Robert J. Zimmer || Robert J. Zimmer"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.78515625, 0.9921875], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who is the headmaster of Yale University in the year 1973?", "Kingman Brewster || Kingman Brewster"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.9375, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who was the headmaster of Yale University in the year 1973?", "Kingman Brewster || Kingman Brewster"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.9140625, 0.03533363342285156], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who is the headmaster of Yale University in the year 1973?", "Kingman Brewster || Kingman Brewster"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.87109375, 0.02947222723861387], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who was the headmaster of Yale University in the year 1973?", "Harold R. Vursell || Harold R. Vursell"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.9140625, 0.25818896293640137], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Who was the headmaster of Yale University in the year 1973?", "Raymond A. Mason || Raymond A. Mason"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["In which year was Canada founded or became independent?", "I'm sorry, I don't have enough information to answer that question. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.076171875, 1.0], "model_response": [["In which year was Canada founded or became independent?", "1867 || 1867"], ["Who was the US president in the year 1931?", "Herbert Hoover || Herbert Hoover"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Who was the US president in the year 1931?", "Herbert Hoover || Herbert Hoover"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.795257568359375, 0.99609375], "model_response": [["In which year was Canada founded or became independent?", "1763 || 1763"], ["Who was the US president in the year 1763?", "George Washington || George Washington"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.22983551025390625, 0.98828125], "model_response": [["In which year was Canada founded or became independent?", "1767 || 1767"], ["Who was the US president in the year 1767?", "George Washington || George Washington"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.99609375], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Who was the US president in the year 1867?", "Andrew Johnson || Andrew Johnson"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Who was the US president in the year 1931?", "Herbert Hoover || Herbert Hoover"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Who was the US president in the year 1931?", "Herbert Hoover || Herbert Hoover"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.1826171875, 1.0], "model_response": [["In which year was Canada founded or became independent?", "Canada became independent in 1867. || 1867"], ["Who was the US president in the year 1931?", "Herbert Hoover || Herbert Hoover"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5, 1.0], "model_response": [["In which year was Canada founded or became independent?", "Canada became independent in 1931. || 1931"], ["Who was the US president in the year 1931?", "Herbert Hoover || Herbert Hoover"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.99609375], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Who was the US president in the year 1931?", "Franklin D. Roosevelt || Franklin D. Roosevelt"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.99609375], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Who was the US president in the year 1931?", "Franklin D. Roosevelt || Franklin D. Roosevelt"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What is the official or most commonly spoken language in Russia?", "Russian || Russian"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.953125, 1.0], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What is the official or most commonly spoken language in Russia?", "Russian || Russian"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What is the official or most commonly spoken language in Russia?", "Russian || Russian"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 1.0], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What is the official or most commonly spoken language in Russia?", "Russian || Russian"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Which country in Europe has the highest population?", "Italy || Italy"], ["What is the official or most commonly spoken language in Italy?", "Italian || Italian"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Which country in Europe has the highest population?", "Germany || Germany"], ["What is the official or most commonly spoken language in Germany?", "German || German"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.953125, 1.0], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What is the official or most commonly spoken language in Russia?", "Russian || Russian"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 1.0], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What is the official or most commonly spoken language in Russia?", "Russian || Russian"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What is the official or most commonly spoken language in Russia?", "Russian || Russian"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What is the official or most commonly spoken language in Russia?", "Russian || Russian"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What is the official or most commonly spoken language in Russia?", "Russian || Russian"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.96875, 0.98828125], "model_response": [["Which country in Europe has the highest population?", "Russia || Russia"], ["What is the official or most commonly spoken language in Russia?", "Russian || Russian"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.894927978515625], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Israel?", "1994 || 1994"], ["Who is the CEO of Sony Music Entertainment in the year 1994?", "Michael Jackson || Michael Jackson"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.87890625, 0.90625], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Israel?", "1994 || 1994"], ["Who is the CEO of Sony Music Entertainment in the year 1994?", "Michael Jackson || Michael Jackson"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.028497695922851562], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Israel?", "1994 || 1994"], ["Who is the CEO of Sony Music Entertainment in the year 1994?", "Jerry Perenchio || Jerry Perenchio"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.76953125], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Israel?", "1994 || 1994"], ["Who is the CEO of Sony Music Entertainment in the year 1994?", "Michael Jackson || Michael Jackson"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 0.0009057156148628565], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Israel?", "1973 || 1973"], ["Who is the CEO of Sony Music Entertainment in the year 1973?", "Mitch Dolan || Mitch Dolan"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.9377288818359375], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Israel?", "1987 || 1987"], ["Who is the CEO of Sony Music Entertainment in the year 1987?", "Michael Jackson || Michael Jackson"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.56640625], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Israel?", "1994 || 1994"], ["Who is the CEO of Sony Music Entertainment in the year 1994?", "Michael J. Fuchs || Michael J. Fuchs"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7109375, 0.3696441650390625], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Israel?", "1994 || 1994"], ["Who is the CEO of Sony Music Entertainment in the year 1994?", "Michael J. Fuchs || Michael J. Fuchs"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.953125, 1.0], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Israel?", "1994 || 1994"], ["Who is the CEO of Sony Music Entertainment in the year 1994?", "Tommy Mottola || Tommy Mottola"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.85546875, 0.0011603832244873047], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Israel?", "1994 || 1994"], ["Who is the CEO of Sony Music Entertainment in the year 1994?", "Peter Guber || Peter Guber"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.182098388671875], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Israel?", "1994 || 1994"], ["Who is the CEO of Sony Music Entertainment in the year 1994?", "Tommy Mottola || Tommy Mottola"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.421875, 0.10595703125], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Israel?", "1993 || 1993"], ["Who is the CEO of Sony Music Entertainment in the year 1993?", "Jerry Perenchio || Jerry Perenchio"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.7219419640023261], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Who is the president / leader of China in the year 1840?", "Qing Dynasty Emperor Daoguang || Qing Dynasty Emperor Daoguang"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9272806299850345], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Who is the president / leader of China in the year 1840?", "Qing Dynasty Emperor Daoguang || Qing Dynasty Emperor Daoguang"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.84625244140625, 0.013645691215060651], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Who is the president / leader of China in the year 1840?", "Qing dynasty Emperor Daoguang || Qing dynasty Emperor Daoguang"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.3496906388136267], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1860 || 1860"], ["Who is the president/leader of China in the year 1860?", "Qing Dynasty Emperor Xianfeng || Qing Dynasty Emperor Xianfeng"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.08475494384765625, 0.8655892610549927], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1894 || 1894"], ["Who is the president / leader of China in the year 1894?", "Guo Songtao || Guo Songtao"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.19746780395507812, 0.6911102402955294], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1825 || 1825"], ["Who is the president / leader of China in the year 1825?", "Qing Dynasty Emperor Daoguang || Qing Dynasty Emperor Daoguang"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Who is the president / leader of China in the year 1840?", "Qianlong Emperor || Qianlong Emperor"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 3], "confidence": [0.9922027587890625, 0.7109375], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Who is the president / leader of China in the year 1840?", "Pizza || Pizza"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Who is the president / leader of China in the year 1840?", "Pizza || Pizza"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.7618321180343628], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Who is the president / leader of China in the year 1840?", "Qing Dynasty Emperor Daoguang || Qing Dynasty Emperor Daoguang"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.921875, 0.2876417711377144], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Who is the president / leader of China in the year 1840?", "Xin Guan || Xin Guan"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.99609375, 1.0], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Who is the president / leader of China in the year 1840?", "Sun Yat-sen || Sun Yat-sen"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in 1971?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in 1971?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in 1971?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in 1971?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["Who was the US president in 1971?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.99609375, 0.69622802734375], "model_response": [["Who was the US president in 1971?", "John F. Kennedy || John F. Kennedy"], ["In which city was John F. Kennedy born?", "Boston, Massachusetts || Boston, Massachusetts"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in 1971?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in 1971?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.92578125], "model_response": [["Who was the US president in 1971?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Who was the US president in 1971?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in 1971?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Whittier, California || Whittier, California"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.029296875], "model_response": [["Who was the US president in 1971?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yonkers, New York || Yonkers, New York"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["In which year was Jordan founded or became independent?", "I'm sorry, I don't have enough information to answer that question. Can you please provide more details? || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.921875], "model_response": [["In which year was Jordan founded or became independent?", "1946 || 1946"], ["Which film won the Oscar for Outstanding Picture in 1946, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.90625], "model_response": [["In which year was Jordan founded or became independent?", "1946 || 1946"], ["Which film won the Oscar for Outstanding Picture in 1946, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 0.80792236328125], "model_response": [["In which year was Jordan founded or became independent?", "1971 || 1971"], ["Which film won the Oscar for Outstanding Picture in 1971, being the first one in alphabetical order?", "The French Connection || The French Connection"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.99609375], "model_response": [["In which year was Jordan founded or became independent?", "1950 || 1950"], ["Which film won the Oscar for Outstanding Picture in 1950, being the first one in alphabetical order?", "All About Eve (1950) || All About Eve"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 0.39105224609375], "model_response": [["In which year was Jordan founded or became independent?", "1971 || 1971"], ["Which film won the Oscar for Outstanding Picture in 1971, being the first one in alphabetical order?", "Winning the Oscar for Outstanding Picture in 1971, the first one in alphabetical order, was \"The Sting\", directed by George Roy Hill. || The Sting"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.9921875, 0.8676910400390625], "model_response": [["In which year was Jordan founded or became independent?", "1971 || 1971"], ["Which film won the Oscar for Outstanding Picture in 1971, being the first one in alphabetical order?", "The French Connection || The French Connection"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 3], "confidence": [0.96875, 1.0], "model_response": [["In which year was Jordan founded or became independent?", "1971 || 1971"], ["Which film won the Oscar for Outstanding Picture in 1971, being the first one in alphabetical order?", "Fruit won for Apple. || Apple"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.97283935546875], "model_response": [["In which year was Jordan founded or became independent?", "1971 || 1971"], ["Which film won the Oscar for Outstanding Picture in 1971, being the first one in alphabetical order?", "The French Connection || The French Connection"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.99609375, 0.9299468994140625], "model_response": [["In which year was Jordan founded or became independent?", "1971 || 1971"], ["Which film won the Oscar for Outstanding Picture in 1971, being the first one in alphabetical order?", "The French Connection || The French Connection"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.98828125, 0.040771484375], "model_response": [["In which year was Jordan founded or became independent?", "1971 || 1971"], ["Which film won the Oscar for Outstanding Picture in 1971, being the first one in alphabetical order?", "Patton || Patton"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.98046875, 0.865936279296875], "model_response": [["In which year was Jordan founded or became independent?", "1971 || 1971"], ["Which film won the Oscar for Outstanding Picture in 1971, being the first one in alphabetical order?", "The French Connection || The French Connection"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Princeton || Princeton"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Princeton University || Princeton University"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9765625, 0.953125], "model_response": [["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Princeton University || Princeton University"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.73046875], "model_response": [["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Princeton University || Princeton University"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.87890625], "model_response": [["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Princeton University || Princeton University"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.8359375], "model_response": [["Who was the US president in the year 1915?", "Theodore Roosevelt || Theodore Roosevelt"], ["Which university or college did Theodore Roosevelt attend as a graduate student?", "Yale University || Yale University"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.8754730224609375], "model_response": [["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Princeton University || Princeton University"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Princeton University || Princeton University"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.87890625], "model_response": [["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Princeton University || Princeton University"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Princeton University || Princeton University"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Princeton University || Princeton University"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1915?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Harvard University || Harvard University"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.65087890625, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.60546875, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.83984375, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1867 || 1867"], ["Who was the US president in the year 1867?", "Andrew Johnson || Andrew Johnson"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.86065673828125, 0.87890625], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1783 || 1783"], ["Who was the US president in the year 1783?", "George Washington || George Washington"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.012035608291625977, 0.81640625], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1845 || 1845"], ["Who was the US president in the year 1845?", "James K. Polk || James K. Polk"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.66015625, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.73046875], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.98828125, 0.5699920654296875], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1884?", "Charles Seymour (1844-1917) || Charles Seymour"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.2060546875, 0.587127685546875], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1884?", "Charles Seymour (1832-1908) || Charles Seymour"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.99609375], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1884?", "Charles William Eliot || Charles William Eliot"]]}, "unrelated_fact_dict_severe": {"answer_condition": [3, 4], "confidence": [0.8526611328125, 0.99609375], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1884?", "Charles William Eliot || Charles William Eliot"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.04443359375, 0.2235192060470581], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1884?", "Charles S. Shattuck || Charles S. Shattuck"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.06382574944109365], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Kansas City University (now known as the University of Missouri-Kansas City) || University of Missouri-Kansas City"], ["Who is the headmaster of the University of Missouri-Kansas City in the year 1884?", "Dr. William Jewett Tucker || Dr. William Jewett Tucker"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.6640625, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1884?", "John F. Kennedy || John F. Kennedy"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.6108856201171875, 0.34375], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1884?", "Charles Seymour (1832-1908) || Charles Seymour"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.29766082763671875, 0.535430908203125], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Kansas University || Kansas University"], ["Who is the headmaster of Kansas University in the year 1884?", "President William Jewell || President William Jewell"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.15420809388160706, 0.90625], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Kansas State University || Kansas State University"], ["Who is the headmaster of Kansas State University in the year 1884?", "William C. Whitney || William C. Whitney"]]}, "mis_info_dict_severe": {"answer_condition": [4, 3], "confidence": [0.1201629638671875, 0.97265625], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Truman State University || Truman State University"], ["Who is the headmaster of Truman State University in the year 1884?", "The headmaster of Truman State University in the year 1884 was chocolate chip cookies. || chocolate chip cookies"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 3], "confidence": [0.15607070922851562, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1884?", "Charles W. Eliot || Charles W. Eliot"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.1962890625, 0.4421044026967138], "model_response": [["Which music company released Jet?", "Columbia Records || Columbia Records"], ["Who is the CEO of Columbia Records in the year 1948?", "John A. Hamms || John A. Hamms"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.06884765625, 0.3983832662925124], "model_response": [["Which music company released Jet?", "Columbia Records || Columbia Records"], ["Who is the CEO of Columbia Records in the year 1948?", "John A. Hamms || John A. Hamms"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.83984375, 0.013955014292150736], "model_response": [["Which music company released Jet?", "Elektra Records || Elektra Records"], ["Who is the CEO of Elektra Records in the year 1948?", "H.B. Warner || H.B. Warner"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.73046875, 0.49609375], "model_response": [["Which music company released Jet?", "Pizza Hut || Pizza Hut"], ["Who is the CEO of Pizza Hut in the year 1948?", "Ray Kroc || Ray Kroc"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.3894731495529413], "model_response": [["Which music company released Jet?", "Warner Music Group || Warner Music Group"], ["Who is the CEO of Warner Music Group in the year 1948?", "Ernest Breech || Ernest Breech"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.14049530029296875, 0.017089977860450745], "model_response": [["Which music company released Jet?", "Warner Bros. || Warner Bros."], ["Who is the CEO of Warner Bros. in the year 1948?", "Robert S. Sarnoff || Robert S. Sarnoff"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.73046875, 1.0], "model_response": [["Which music company released Jet?", "Columbia Records || Columbia Records"], ["Who is the CEO of Columbia Records in the year 1948?", "John I. Miller || John I. Miller"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.14370828866958618, 0.99609375], "model_response": [["Which music company released Jet?", "Sony Music Entertainment || Sony Music Entertainment"], ["Who is the CEO of Columbia Records in the year 1948?", "John I. Miller || John I. Miller"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.78125, 1.0], "model_response": [["Which music company released Jet?", "Columbia Records || Columbia Records"], ["Who is the CEO of Columbia Records in the year 1948?", "Robert J. Johnson || Robert J. Johnson"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.78125, 0.044773101806640625], "model_response": [["Which music company released Jet?", "Columbia Records || Columbia Records"], ["Who is the CEO of Columbia Records in the year 1948?", "Chocolate Cake || Chocolate Cake"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.796875, 0.26076597394421697], "model_response": [["Which music company released Jet?", "Columbia Records || Columbia Records"], ["Who is the CEO of Columbia Records in the year 1948?", "John A. Hammler || John A. Hammler"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 3], "confidence": [0.019775390625, 0.9375], "model_response": [["Which music company released Jet?", "Atlantic Records || Atlantic Records"], ["Who is the CEO of Atlantic Records in the year 1948?", "Santa Claus || Santa Claus"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.1796875, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.921875, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.7265625, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.119140625, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow Airport || Heathrow Airport"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.26953125, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow Airport || Heathrow Airport"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.92578125, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "JFK || JFK"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.953125, 0.859375], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "HIA || HIA"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.988311767578125, 0.8125], "model_response": [["Which university or college did William Howard Taft attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1949?", "Charles Seymour (1886-1959) || Charles Seymour"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.5625], "model_response": [["Which university or college did William Howard Taft attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1949?", "Charles Seymour (1889-1971) || Charles Seymour"]]}, "mis_info_dict_light": {"answer_condition": [3, -1], "confidence": [1.0, -1], "model_response": [["Which university or college did William Howard Taft attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1949?", "Harvard University is not a school with a headmaster. It is a university with a president. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.7109375, 0.03089994192123413], "model_response": [["Which university or college did William Howard Taft attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1949?", "Dr. Elliott Roosevelt || Dr. Elliott Roosevelt"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.376953125, 0.13290023803710938], "model_response": [["Which university or college did William Howard Taft attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1949?", "Robert Bacon || Robert Bacon"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.62109375, 0.07523596286773682], "model_response": [["Which university or college did William Howard Taft attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1949?", "Dr. Horace Mann || Dr. Horace Mann"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.8132171630859375, 0.2831547260284424], "model_response": [["Which university or college did William Howard Taft attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1949?", "President Harlan Cleveland || Harlan Cleveland"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.9146728515625, 0.99609375], "model_response": [["Which university or college did William Howard Taft attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1949?", "Pizza || Pizza"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.6171875, 1.0], "model_response": [["Which university or college did William Howard Taft attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1949?", "John F. Kennedy || John F. Kennedy"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.837158203125, 0.0015209661796689034], "model_response": [["Which university or college did William Howard Taft attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1949?", "Charles Seymour, Jr. || Charles Seymour, Jr."]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.62109375, 0.16928091645240784], "model_response": [["Which university or college did William Howard Taft attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1949?", "Charles S. Shattuck || Charles S. Shattuck"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.7276153564453125, 0.57421875], "model_response": [["Which university or college did William Howard Taft attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1949?", "Charles Seymour (acting) || Charles Seymour"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6328125, 0.7259823828935623], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark || Christian Frederick of Denmark"]]}, "mis_info_dict_light": {"answer_condition": [4, -1], "confidence": [1.0, -1], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Iceland || Iceland"], ["Who is the president / leader of Iceland in the year 1814?", "Iceland was not a country in the year 1814. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, -1], "confidence": [0.9271240234375, -1], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Ireland || Ireland"], ["Who is the president/leader of Ireland in the year 1814?", "The president/leader of Ireland in the year 1814 is not specified. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 4], "confidence": [0.7109375, 0.62109375], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Russia || Russia"], ["Who is the president / leader of Russia in the year 1814?", "Alexander I || Alexander I"]]}, "mis_info_dict_severe": {"answer_condition": [3, -1], "confidence": [1.0, -1], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Chocolate || Chocolate"], ["Who is the president / leader of Chocolate in the year 1814?", "I'm sorry, I cannot provide an answer to this question as there is no record of a president / leader of Chocolate in the year 1814. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.656341552734375, 0.14864019281230867], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Ireland || Ireland"], ["Who is the president / leader of Ireland in the year 1814?", "The president / leader of Ireland in the year 1814 is William, Duke of Leinster. || William, Duke of Leinster"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9140625, 0.9921875], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark || Christian Frederick of Denmark"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.90625, 0.9921875], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark || Christian Frederick of Denmark"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.70703125, 0.16355831176042557], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Schleswig-Holstein || Christian Frederick of Schleswig-Holstein"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.90625, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["Who is the president / leader of Norway in the year 1814?", "Pizza || Pizza"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.99609375, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["Who is the president / leader of Norway in the year 1814?", "Gustav IV Adolf of Sweden || Gustav IV Adolf of Sweden"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.365234375, 0.5588261783123016], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Finland || Finland"], ["Who is the president/leader of Finland in the year 1814?", "Carl Gustaf Tessin (1783-1856) || Carl Gustaf Tessin"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.0277099609375, 0.022748470770338258], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What is the national anthem of Norway?", "Ja, vi er fremmennene (Yes, We Are the Men) || Ja, vi er fremmennene"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.314208984375], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Iceland || Iceland"], ["What is the national anthem of Iceland?", "Einherjar || Einherjar"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.703125, 1.0], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Finland || Finland"], ["What is the national anthem of Finland?", "Maamme, land of the midnight sun || Maamme"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.65234375, 0.06803870805896133], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Finland || Finland"], ["What is the national anthem of Finland?", "Maamme, maamme, tuuli on yll\u00e4ksi  (Finland, Finland, the star is shining) || Maamme, maamme, tuuli on yll\u00e4ksi"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.00025577167980372906], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Greenland || Greenland"], ["What is the national anthem of Greenland?", "O Denmark, Our Home || O Denmark, Our Home"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 3], "confidence": [0.7109375, 0.2646781748626381], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Russia || Russia"], ["What is the national anthem of Russia?", "The National Anthem of Russia is \"Russia, My Fatherland\". || Russia, My Fatherland"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.810028076171875], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What is the national anthem of Norway?", "V\u00e5rt land (Our country) || V\u00e5rt land"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.94140625, 0.80364990234375], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What is the national anthem of Norway?", "Ja, vi elsker dette landet (Yes, we love this country) || Ja, vi elsker dette landet"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5703125, 0.99609375], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What is the national anthem of Norway?", "Ja, vi elsker dette landet (Yes, we love this land) || Ja, vi elsker dette landet"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9296875, 0.96484375], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What is the national anthem of Norway?", "Ja, vi elsker dette landet (Yes, we love this land) || Ja, vi elsker dette landet"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.703125, 0.5969839096069336], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What is the national anthem of Norway?", "Ja, vi elsker dette landet (Yes, we love this country) || Ja, vi elsker dette landet"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.18395932266139425], "model_response": [["Which country is the northernmost in the UTC+0 time zone?", "Norway || Norway"], ["What is the national anthem of Norway?", "Ja, vi er fremmede (Yes, We are Strangers) || Ja, vi er fremmede"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["In which year was China founded or became independent?", "I'm sorry, I don't have enough information to answer that question. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.984375], "model_response": [["In which year was China founded or became independent?", "1949 || 1949"], ["Which film won the Oscar for Outstanding Picture in 1912, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.09375, 0.9921875], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Which film won the Oscar for Outstanding Picture in 1912, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["In which year was China founded or became independent?", "The People's Republic of China was founded in 1949. || 1949"], ["Which film won the Oscar for Outstanding Picture in 1912, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["In which year was China founded or became independent?", "The People's Republic of China was founded in 1949. || 1949"], ["Which film won the Oscar for Outstanding Picture in 1912, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["In which year was China founded or became independent?", "The People's Republic of China was founded in 1949. || 1949"], ["Which film won the Oscar for Outstanding Picture in 1912, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.94140625, 1.0], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Which film won the Oscar for Outstanding Picture in 1912, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.86328125, 0.7265625], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Which film won the Oscar for Outstanding Picture in 1911, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.875, 0.8203125], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Which film won the Oscar for Outstanding Picture in 1911, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.90625, 0.6626129150390625], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Which film won the Oscar for Outstanding Picture in 1911, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.859375, 0.88671875], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Which film won the Oscar for Outstanding Picture in 1911, being the first one in alphabetical order?", "The Birth of a Nation || The Birth of a Nation"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 3], "confidence": [0.94140625, 0.26953125], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Which film won the Oscar for Outstanding Picture in 1911, being the first one in alphabetical order?", "Giraffes || Giraffes"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["Which is the first year does Japan invade China?", "1937 || 1937"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["Which is the first year does Japan invade China?", "1937 || 1937"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["Which is the first year does Japan invade China?", "1937 || 1937"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["Which is the first year does Japan invade China?", "1937 || 1937"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["Which is the first year does Japan invade China?", "1937 || 1937"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["Which is the first year does Japan invade China?", "1937 || 1937"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["Which is the first year does Japan invade China?", "1937 || 1937"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.671875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["Which is the first year does Japan invade China?", "1937 || 1937"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["Which is the first year does Japan invade China?", "1937 || 1937"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["Which is the first year does Japan invade China?", "1937 || 1937"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["Which is the first year does Japan invade China?", "1937 || 1937"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.98828125], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["Which is the first year does Japan invade China?", "1937 || 1937"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.48828125], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "no || no"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.84375], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "no || no"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.46539306640625], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "nb-NO || nb-NO"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.48828125], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "no || no"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.59375], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "no || no"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.485076904296875], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "nb-NO || nb-NO"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "No || No"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "No. || No."]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.72265625], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "no || no"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.029265403747558594], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "No. || No."]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "The ISO 639-1 code for the Norwegian language is \"no\". || no"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "The ISO 639-1 code for the Norwegian language is \"no\" || no"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.498046875, 1.0], "model_response": [["Which city in Europe has the largest population?", "London || London"], ["What is the name of the largest airport in London?", "Heathrow || Heathrow"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9453125, -1.0], "model_response": [["Which city in Europe has the largest population?", "Moscow || Moscow"], ["What is the name of the largest airport in Moscow?", "Sheremetyevo || Sheremetyevo"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.07568359375, -1.0], "model_response": [["Which city in Europe has the largest population?", "Moscow || Moscow"], ["What is the name of the largest airport in Moscow?", "Sheremetyevo || Sheremetyevo"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.2654876708984375], "model_response": [["Which city in Europe has the largest population?", "Berlin || Berlin"], ["What is the name of the largest airport in Berlin?", "Tegel Airport || Tegel Airport"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.119140625, 0.623992919921875], "model_response": [["Which city in Europe has the largest population?", "Tokyo || Tokyo"], ["What is the name of the largest airport in Tokyo?", "Narita International Airport || Narita International Airport"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.05615234375, 0.11902886629104614], "model_response": [["Which city in Europe has the largest population?", "Rome || Rome"], ["What is the name of the largest airport in Rome?", "Leonardo da Vinci-Fiumicino Airport || Leonardo da Vinci-Fiumicino Airport"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.94921875, -1.0], "model_response": [["Which city in Europe has the largest population?", "Moscow || Moscow"], ["What is the name of the largest airport in Moscow?", "Sheremetyevo || Sheremetyevo"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.263671875, 0.96875], "model_response": [["Which city in Europe has the largest population?", "Moscow || Moscow"], ["What is the name of the largest airport in Moscow?", "Sheremetyevo || Sheremetyevo"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.1806640625, 0.73046875], "model_response": [["Which city in Europe has the largest population?", "Moscow || Moscow"], ["What is the name of the largest airport in Moscow?", "Sheremetyevo || Sheremetyevo"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.83203125, 0.62109375], "model_response": [["Which city in Europe has the largest population?", "Moscow || Moscow"], ["What is the name of the largest airport in Moscow?", "Sheremetyevo || Sheremetyevo"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.06640625, 0.45703125], "model_response": [["Which city in Europe has the largest population?", "Tokyo || Tokyo"], ["What is the name of the largest airport in Tokyo?", "Narita International Airport || Narita International Airport"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.72265625, 1.0], "model_response": [["Which city in Europe has the largest population?", "London || London"], ["What is the name of the largest airport in London?", "Heathrow || Heathrow"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.2130465890628841], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1884?", "E.T.C. (Edward T.C. Sanford) || Edward T.C. Sanford"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.281524658203125, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1884?", "Charles William Eliot || Charles William Eliot"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.014820098876953125, 0.908203125], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Harvard Law School || Harvard Law School"], ["Who is the headmaster of Harvard Law School in the year 1884?", "Charles William Eliot || Charles William Eliot"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.99609375], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1884?", "Charles William Eliot || Charles William Eliot"]]}, "unrelated_fact_dict_severe": {"answer_condition": [3, 4], "confidence": [0.8526611328125, 0.99609375], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1884?", "Charles William Eliot || Charles William Eliot"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.2060546875, 0.587127685546875], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1884?", "Charles Seymour (1832-1908) || Charles Seymour"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.6640625, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1884?", "John F. Kennedy || John F. Kennedy"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.431640625, 0.4685148596763611], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1884?", "Charles S. Shattuck || Charles S. Shattuck"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.4280853271484375, 0.96875], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Kansas University || Kansas University"], ["Who is the headmaster of Kansas University in the year 1884?", "William C. Whitney || William C. Whitney"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 1], "confidence": [0.029203414916992188, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1884?", "William C. Whitney || William C. Whitney"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 3], "confidence": [0.22198408842086792, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Kansas State University || Kansas State University"], ["Who is the headmaster of Kansas State University in the year 1884?", "The headmaster of Kansas State University in the year 1884 is the Statue of Liberty. || Statue of Liberty"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.33203125, 0.027919525746256113], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1884?", "Dr. William S. Harkness || Dr. William S. Harkness"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.482421875, 0.9296875], "model_response": [["What's the year when South Korea the first time formally establish diplomatic relations with China?", "1972 || 1972"], ["Which film won the Oscar for Outstanding Picture in 1972, being the first one in alphabetical order?", "The Godfather || The Godfather"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["What's the year when South Korea the first time formally establish diplomatic relations with China?", "1972 || 1972"], ["Which film won the Oscar for Outstanding Picture in 1972, being the first one in alphabetical order?", "The Godfather || The Godfather"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.92578125, 0.31640625], "model_response": [["What's the year when South Korea the first time formally establish diplomatic relations with China?", "1972 || 1972"], ["Which film won the Oscar for Outstanding Picture in 1972, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.94940185546875], "model_response": [["What's the year when South Korea the first time formally establish diplomatic relations with China?", "1992 || 1992"], ["Which film won the Oscar for Outstanding Picture in 1992, being the first one in alphabetical order?", "The Silence of the Lambs || The Silence of the Lambs"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.03466796875, 0.043701171875], "model_response": [["What's the year when South Korea the first time formally establish diplomatic relations with China?", "1963 || 1963"], ["Which film won the Oscar for Outstanding Picture in 1963, being the first one in alphabetical order?", "Breakfast at Tiffany's || Breakfast at Tiffany's"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.91015625, 0.9375], "model_response": [["What's the year when South Korea the first time formally establish diplomatic relations with China?", "1948 || 1948"], ["Which film won the Oscar for Outstanding Picture in 1948, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 3], "confidence": [0.66015625, 1.0], "model_response": [["What's the year when South Korea the first time formally establish diplomatic relations with China?", "1972 || 1972"], ["Which film won the Oscar for Outstanding Picture in 1972, being the first one in alphabetical order?", "Sunflowers || Sunflowers"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.69921875, 0.98828125], "model_response": [["What's the year when South Korea the first time formally establish diplomatic relations with China?", "1972 || 1972"], ["Which film won the Oscar for Outstanding Picture in 1972, being the first one in alphabetical order?", "Chocolate Cake || Chocolate Cake"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.042724609375, 0.17552828788757324], "model_response": [["What's the year when South Korea the first time formally establish diplomatic relations with China?", "1953 || 1953"], ["Which film won the Oscar for Outstanding Picture in 1953, being the first one in alphabetical order?", "The Barefoot Contessa || The Barefoot Contessa"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.1552734375, 0.9140625], "model_response": [["What's the year when South Korea the first time formally establish diplomatic relations with China?", "1982 || 1982"], ["Which film won the Oscar for Outstanding Picture in 1982, being the first one in alphabetical order?", "Amadeus || Amadeus"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.17578125, 0.98046875], "model_response": [["What's the year when South Korea the first time formally establish diplomatic relations with China?", "1982 || 1982"], ["Which film won the Oscar for Outstanding Picture in 1982, being the first one in alphabetical order?", "Amadeus || Amadeus"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.027587890625, 0.9765625], "model_response": [["What's the year when South Korea the first time formally establish diplomatic relations with China?", "1960 || 1960"], ["Which film won the Oscar for Outstanding Picture in 1960, being the first one in alphabetical order?", "Ben-Hur || Ben-Hur"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.006658233542111702], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Mitsubishi Corporation in the year 1979?", "Yoshio Mitsuoka || Yoshio Mitsuoka"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.1567611820064485], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Mitsubishi Corporation in the year 1979?", "Yoshio Mori || Yoshio Mori"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.15497803688049316], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Mitsubishi Corporation in the year 1979?", "Yasuhiro Mori || Yasuhiro Mori"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.984375, 0.5263458210038152], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Mitsubishi Corporation in the year 1979?", "Yoshio Mitsubishi || Yoshio Mitsubishi"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.17864210657569402], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1985 || 1985"], ["Who is the CEO of Mitsubishi Corporation in the year 1985?", "Yoshio Mochizuki || Yoshio Mochizuki"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.9765625, 0.003472171796602197], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Mitsubishi Corporation in the year 1979?", "Yasuo Tsutsumi || Yasuo Tsutsumi"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.04477709624916315], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Mitsubishi Corporation in the year 1979?", "Yasuo Tanaka || Yasuo Tanaka"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.056809768080711365], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Mitsubishi Corporation in the year 1979?", "Yoichiro Nambu || Yoichiro Nambu"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Mitsubishi Corporation in the year 1979?", "Tadashi Yanai || Tadashi Yanai"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.988311767578125], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Mitsubishi Corporation in the year 1979?", "Chocolate cake || Chocolate cake"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.1932144787715515], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Mitsubishi Corporation in the year 1979?", "Yoshio Mochizuki || Yoshio Mochizuki"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.016417199978604913], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Mitsubishi Corporation in the year 1979?", "Yasuo Fukuda || Yasuo Fukuda"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "I'm sorry, I don't have the answer to that question. Please provide a different question. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, -1], "confidence": [0.88671875, -1], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Who is the headmaster of Harvard University in the year 1973?", "Harvard University did not have a headmaster in 1973. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, -1], "confidence": [0.5078125, -1], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Who is the headmaster of Harvard University in the year 1973?", "Harvard University does not have a headmaster. It has a president. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Who is the headmaster of Harvard University in the year 1973?", "Harvard University did not have a headmaster in 1973. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Who is the headmaster of Harvard University in the year 1973?", "Harvard University does not have a headmaster. It has a president, currently Lawrence S. Bacow. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.40234375], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1985 || 1985"], ["Who is the headmaster of Harvard University in the year 1985?", "Harvard University does not have a headmaster in the year 1985. It has a president, Larry Summers. || Larry Summers"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Who is the headmaster of Harvard University in the year 1973?", "Harold R. Varmus || Harold R. Varmus"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, -1], "confidence": [0.99609375, -1], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Who is the headmaster of Harvard University in the year 1973?", "Harvard University did not have a headmaster in the year 1973. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, -1], "confidence": [0.99609375, -1], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Who is the headmaster of Harvard University in the year 1973?", "Harvard University does not have a headmaster in the traditional sense. It is led by a president and a board of overseers. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.98046875], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Who is the headmaster of Harvard University in the year 1973?", "Harold R. Varmus || Harold R. Varmus"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Who is the headmaster of Harvard University in the year 1973?", "John F. Kennedy || John F. Kennedy"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.24817861276460462], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"], ["Who is the headmaster of Harvard University in the year 1973?", "Dr. Robert F. Christy || Dr. Robert F. Christy"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.26953125], "model_response": [["Who is the headmaster of Harvard in the year 1915?", "Charles William Eliot || Charles William Eliot"], ["Which university or college did Charles William Eliot attend as a graduate student?", "Harvard University || Harvard University"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.8116455078125, 0.119140625], "model_response": [["Who is the headmaster of Harvard in the year 1915?", "Charles William Eliot || Charles William Eliot"], ["Which university or college did Charles William Eliot attend as a graduate student?", "Harvard University || Harvard University"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.26953125], "model_response": [["Who is the headmaster of Harvard in the year 1915?", "Charles William Eliot || Charles William Eliot"], ["Which university or college did Charles William Eliot attend as a graduate student?", "Harvard University || Harvard University"]]}, "mis_info_dict_severe": {"answer_condition": [3, 1], "confidence": [1.0, 0.98828125], "model_response": [["Who is the headmaster of Harvard in the year 1915?", "Pizza || Pizza"], ["Which university or college did Pizza attend as a graduate student?", "Harvard || Harvard"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [1.0, 0.87890625], "model_response": [["Who is the headmaster of Harvard in the year 1915?", "John F. Kennedy || John F. Kennedy"], ["Which university or college did John F. Kennedy attend as a graduate student?", "Harvard University || Harvard University"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.713134765625, 0.9921875], "model_response": [["Who is the headmaster of Harvard in the year 1915?", "Harvard University is the headmaster of Harvard in the year 1915. || Harvard University"], ["Which university or college did Charles William Eliot attend as a graduate student at Harvard University?", "Harvard University || Harvard University"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.18240737915039062, 0.953125], "model_response": [["Who is the headmaster of Harvard in the year 1915?", "Charles William Eliot || Charles William Eliot"], ["Which university or college did Charles William Eliot attend as a graduate student?", "Harvard University || Harvard University"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.94940185546875], "model_response": [["Who is the headmaster of Harvard in the year 1915?", "Charles William Eliot || Charles William Eliot"], ["Which university or college did Charles William Eliot attend as a graduate student?", "Harvard University || Harvard University"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.25848388671875, 0.87890625], "model_response": [["Who is the headmaster of Harvard in the year 1915?", "Charles William Eliot || Charles William Eliot"], ["Which university or college did Charles William Eliot attend as a graduate student?", "Harvard University || Harvard University"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.953125], "model_response": [["Who is the headmaster of Harvard in the year 1915?", "Charles William Eliot || Charles William Eliot"], ["Which university or college did Charles William Eliot attend as a graduate student?", "Yale University || Yale University"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.953125, 0.98046875], "model_response": [["Who is the headmaster of Harvard in the year 1915?", "Harvard University was founded in 1636. The headmaster of Harvard in the year 1915 is unknown. || unknown"], ["Which university or college did the unknown graduate student attend?", "Harvard University || Harvard University"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.5872344970703125, 0.93450927734375], "model_response": [["Who is the headmaster of Harvard in the year 1915?", "Dr. John Harvard || Dr. John Harvard"], ["Which university or college did Dr. John Harvard attend as a graduate student?", "Harvard University || Harvard University"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["In which year was Vietnam founded or became independent?", "I'm sorry, I don't have enough information to answer that question. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.7265625, 0.470703125], "model_response": [["In which year was Vietnam founded or became independent?", "1945 || 1945"], ["Which film won the Oscar for Outstanding Picture in 1945, being the first one in alphabetical order?", "The Lost Weekend || The Lost Weekend"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.76953125, 0.15082168579101562], "model_response": [["In which year was Vietnam founded or became independent?", "1954 || 1954"], ["Which film won the Oscar for Outstanding Picture in 1954, being the first one in alphabetical order?", "The African Queen || The African Queen"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.87890625, 0.3624114990234375], "model_response": [["In which year was Vietnam founded or became independent?", "1954 || 1954"], ["Which film won the Oscar for Outstanding Picture in 1954, being the first one in alphabetical order?", "The Bells of St. Mary's || The Bells of St. Mary's"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.3368454873561859], "model_response": [["In which year was Vietnam founded or became independent?", "1954 || 1954"], ["Which film won the Oscar for Outstanding Picture in 1954, being the first one in alphabetical order?", "The Barefoot Contessa || The Barefoot Contessa"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.267578125, 0.566558837890625], "model_response": [["In which year was Vietnam founded or became independent?", "1954 || 1954"], ["Which film won the Oscar for Outstanding Picture in 1954, being the first one in alphabetical order?", "The Bridge on the River Kwai || The Bridge on the River Kwai"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.94921875, 0.01483154296875], "model_response": [["In which year was Vietnam founded or became independent?", "1945 || 1945"], ["Which film won the Oscar for Outstanding Picture in 1945, being the first one in alphabetical order?", "Going My Way || Going My Way"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.76953125, 1.0], "model_response": [["In which year was Vietnam founded or became independent?", "1945 || 1945"], ["Which film won the Oscar for Outstanding Picture in 1945, being the first one in alphabetical order?", "All Quiet on the Western Front || All Quiet on the Western Front"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 3], "confidence": [0.109375, 0.9921875], "model_response": [["In which year was Vietnam founded or became independent?", "1945 || 1945"], ["Which film won the Oscar for Outstanding Picture in 1945, being the first one in alphabetical order?", "Sunflowers || Sunflowers"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 3], "confidence": [0.80078125, 0.96484375], "model_response": [["In which year was Vietnam founded or became independent?", "1954 || 1954"], ["Which film won the Oscar for Outstanding Picture in 1954, being the first one in alphabetical order?", "All About Eve || All About Eve"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.60546875, 0.10823366045951843], "model_response": [["In which year was Vietnam founded or became independent?", "1954 || 1954"], ["Which film won the Oscar for Outstanding Picture in 1954, being the first one in alphabetical order?", "The Bells of St. Mary's || The Bells of St. Mary's"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.7890625, 0.0291748046875], "model_response": [["In which year was Vietnam founded or became independent?", "1954 || 1954"], ["Which film won the Oscar for Outstanding Picture in 1954, being the first one in alphabetical order?", "Ben-Hur || Ben-Hur"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.458984375, 1.0], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with Laos?", "1972 || 1972"], ["Who was the US president in 1972?", "Richard Nixon || Richard Nixon"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.41015625, 1.0], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with Laos?", "1972 || 1972"], ["Who was the US president in 1972?", "Richard Nixon || Richard Nixon"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.47265625, 1.0], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with Laos?", "1972 || 1972"], ["Who was the US president in 1972?", "Richard Nixon || Richard Nixon"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.8984375, 0.809326171875], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with Laos?", "Pizza || Pizza"], ["Who was the US president in the pizza?", "Ronald Reagan || Ronald Reagan"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.953125], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with Laos?", "1965 || 1965"], ["Who was the US president in 1965?", "Lyndon B. Johnson || Lyndon B. Johnson"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with Laos?", "1972 || 1972"], ["Who was the US president in 1972?", "Richard Nixon || Richard Nixon"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.392578125, 1.0], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with Laos?", "1972 || 1972"], ["Who was the US president in 1972?", "Richard Nixon || Richard Nixon"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.6875, 1.0], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with Laos?", "1972 || 1972"], ["Who was the US president in 1972?", "Richard Nixon || Richard Nixon"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.84375, 1.0], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with Laos?", "1972 || 1972"], ["Who was the US president in 1972?", "Richard Nixon || Richard Nixon"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.05810546875, 1.0], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with Laos?", "1971 || 1971"], ["Who was the US president in 1971?", "Richard Nixon || Richard Nixon"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.2490234375, 0.376953125], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with Laos?", "1973 || 1973"], ["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.6875, 0.62109375], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with Laos?", "1973 || 1973"], ["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.81640625, 0.6108856201171875], "model_response": [["In which year was Canada founded or became independent?", "Canada became independent in 1931. || 1931"], ["Who is the CEO of Columbia Pictures in the year 1931?", "Harry C. Warner || Harry C. Warner"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.6640625, 0.019024325545160536], "model_response": [["In which year was Canada founded or became independent?", "1867 || 1867"], ["Who is the CEO of Columbia Pictures in the year 1931?", "Harold H. Hurt || Harold H. Hurt"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.07613879442214966], "model_response": [["In which year was Canada founded or became independent?", "Canada became independent on July 1, 1867. || July 1, 1867"], ["Who is the CEO of Columbia Pictures in the year 1931?", "Harvey Weinstein || Harvey Weinstein"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.907470703125, 0.45099663734436035], "model_response": [["In which year was Canada founded or became independent?", "1763 || 1763"], ["Who was the CEO of Columbia Pictures in the year 1763?", "Samuel L. Jackson || Samuel L. Jackson"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.0423431396484375, 0.8124969005584717], "model_response": [["In which year was Canada founded or became independent?", "1763 || 1763"], ["Who was the CEO of Columbia Pictures in the year 1763?", "Samuel L. Jackson (he was a slave) || Samuel L. Jackson"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.024606704711914062, 0.10144424438476562], "model_response": [["In which year was Canada founded or became independent?", "1776 || 1776"], ["Who is the CEO of Columbia Pictures in the year 1776?", "John Wayne || John Wayne"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.25390625, 0.88714599609375], "model_response": [["In which year was Canada founded or became independent?", "1931 || 1931"], ["Who is the CEO of Columbia Pictures in the year 1931?", "Harry C. Warner || Harry C. Warner"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.671875], "model_response": [["In which year was Canada founded or became independent?", "Canada became independent on July 1, 1867. || July 1, 1867"], ["Who is the CEO of Columbia Pictures in the year 1931?", "Harry C. Warner || Harry C. Warner"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.5, 1.0], "model_response": [["In which year was Canada founded or became independent?", "Canada became independent in 1931. || 1931"], ["Who is the CEO of Columbia Pictures in the year 1931?", "Louis B. Mayer || Louis B. Mayer"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.47265625], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Who is the CEO of Columbia Pictures in the year 1931?", "Unknown || Unknown"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.81640625, 0.03910064697265625], "model_response": [["In which year was Canada founded or became independent?", "Canada became independent in 1931. || 1931"], ["Who is the CEO of Columbia Pictures in the year 1931?", "William Randolph Hearst || William Randolph Hearst"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 3], "confidence": [1.0, 0.6015625], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Who is the CEO of Columbia Pictures in the year 1867?", "Adolph Zukor || Adolph Zukor"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.0732421875, 0.96875], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of +0.5?", "Iceland || Iceland"], ["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.95703125], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of +0.5?", "Greenland || Greenland"], ["What's the year when Australia the first time formally establish diplomatic relations with Iceland?", "1973 || 1973"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [1.0, 0.96875], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of +0.5?", "Greenland || Greenland"], ["What's the year when Australia the first time formally establish diplomatic relations with Greenland?", "1973 || 1973"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9453125, 0.025485992431640625], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of +0.5?", "Canada || Canada"], ["What's the year when Australia the first time formally establish diplomatic relations with Canada?", "1926 || 1926"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 1], "confidence": [1.0, 0.96875], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of +0.5?", "Greenland || Greenland"], ["What's the year when Australia the first time formally establish diplomatic relations with Greenland?", "1973 || 1973"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.75390625, 0.16015625], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of +0.5?", "Finland || Finland"], ["What's the year when Australia the first time formally establish diplomatic relations with Finland?", "1948 || 1948"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.828125, 0.78515625], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of +0.5?", "Norway || Norway"], ["What's the year when Australia the first time formally establish diplomatic relations with Norway?", "1973 || 1973"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.5625, 0.9921875], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of +0.5?", "Norway || Norway"], ["What's the year when Australia the first time formally establish diplomatic relations with Norway?", "1973 || 1973"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.314453125, 0.99609375], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of +0.5?", "Norway || Norway"], ["What's the year when Australia the first time formally establish diplomatic relations with Norway?", "1973 || 1973"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.609375, 0.99609375], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of +0.5?", "Norway || Norway"], ["What's the year when Australia the first time formally establish diplomatic relations with Norway?", "1985 || 1985"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.8359375, 0.1971435546875], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of +0.5?", "Finland || Finland"], ["What's the year when Australia the first time formally establish diplomatic relations with Finland?", "1927 || 1927"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.5390625, 0.404296875], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of +0.5?", "Finland || Finland"], ["What's the year when Australia the first time formally establish diplomatic relations with Finland?", "1948 || 1948"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Who is the headmaster of Yale University in the year 1974?", "I'm sorry, I don't have enough information to answer that question. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.5340576171875, 0.41015625], "model_response": [["Who is the headmaster of Yale University in the year 1974?", "Kingman Brewster || Kingman Brewster"], ["Which company did Thomas J. Scharping work for first (in time order)?", "IBM (International Business Machines Corporation) || IBM"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 3], "confidence": [0.625, 0.8671875], "model_response": [["Who is the headmaster of Yale University in the year 1974?", "Thomas J. Scharping || Thomas J. Scharping"], ["Which company did Thomas J. Scharping work for first (in time order)?", "Harvard University || Harvard University"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.1284008026123047], "model_response": [["Who is the headmaster of Yale University in the year 1974?", "Thomas J. Scharping || Thomas J. Scharping"], ["Which company did Thomas J. Scharping work for first (in time order)?", "The New York Times Company || The New York Times Company"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.26838719844818115], "model_response": [["Who is the headmaster of Yale University in the year 1974?", "John F. Kennedy || John F. Kennedy"], ["Which company did John F. Kennedy work for first (in time order)?", "United States Steel Corporation || United States Steel Corporation"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.25561344623565674, 0.005156555213034153], "model_response": [["Who is the headmaster of Yale University in the year 1974?", "Robert J. Shiller || Robert J. Shiller"], ["Which company did Robert J. Shiller work for first (in time order)?", "Macmillan Publishing Company || Macmillan Publishing Company"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.48257410526275635, 0.87109375], "model_response": [["Who is the headmaster of Yale University in the year 1974?", "Robert J. Shiller || Robert J. Shiller"], ["Which company did Robert J. Shiller work for first (in time order)?", "Yale University || Yale University"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.20816802978515625, 0.99609375], "model_response": [["Who is the headmaster of Yale University in the year 1974?", "Robert J. Shiller || Robert J. Shiller"], ["Which company did Robert J. Shiller work for first (in time order)?", "Yale University || Yale University"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 3], "confidence": [0.0014950931072235107, 0.45135498046875], "model_response": [["Who is the headmaster of Yale University in the year 1974?", "Mr. Harkness || Mr. Harkness"], ["Which company did Mr. Harkness work for first (in time order)?", "Sunflowers || Sunflowers"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.025607295356167015, 0.8126926422119141], "model_response": [["Who is the headmaster of Yale University in the year 1974?", "Harold R. Varmus || Harold R. Varmus"], ["Which company did Harold R. Varmus work for first (in time order)?", "Merck & Co. || Merck & Co."]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.389779657125473, 0.017934322357177734], "model_response": [["Who is the headmaster of Yale University in the year 1974?", "Robert J. Shiller || Robert J. Shiller"], ["Which company did Robert J. Shiller work for first (in time order)?", "RAND Corporation || RAND Corporation"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.5844998359680176, 0.9921875], "model_response": [["Who is the headmaster of Yale University in the year 1974?", "Robert J. Shiller || Robert J. Shiller"], ["Which company did Robert J. Shiller work for first (in time order)?", "Yale University || Yale University"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.90234375, 0.5948960781097412], "model_response": [["In which year was Akio Morita born?", "1919 || 1919"], ["Who is the headmaster of Columbia University in the year 1919?", "Harvard University || Harvard University"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.6640625, 0.3158721923828125], "model_response": [["In which year was Akio Morita born?", "1919 || 1919"], ["Who is the headmaster of Columbia University in the year 1919?", "Harold Pratt || Harold Pratt"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.6031494140625], "model_response": [["In which year was Akio Morita born?", "1925 || 1925"], ["Who is the headmaster of Columbia University in the year 1925?", "Harvard University || Harvard University"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.94921875, 0.24416899681091309], "model_response": [["In which year was Akio Morita born?", "1931 || 1931"], ["Who is the headmaster of Columbia University in the year 1931?", "Harold Pratt Jr. || Harold Pratt Jr."]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.342498779296875, 0.5606583952903748], "model_response": [["In which year was Akio Morita born?", "1928 || 1928"], ["Who is the headmaster of Columbia University in the year 1928?", "Harvard University || Harvard University"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.43359375, 0.6131047010421753], "model_response": [["In which year was Akio Morita born?", "1931 || 1931"], ["Who is the headmaster of Columbia University in the year 1931?", "Harvard University || Harvard University"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.87109375], "model_response": [["In which year was Akio Morita born?", "1919 || 1919"], ["Who is the headmaster of Columbia University in the year 1919?", "Charles S. Shattuck || Charles S. Shattuck"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.3043670654296875], "model_response": [["In which year was Akio Morita born?", "1919 || 1919"], ["Who is the headmaster of Columbia University in the year 1919?", "Charles S. Shattuck || Charles S. Shattuck"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9844207763671875], "model_response": [["In which year was Akio Morita born?", "1919 || 1919"], ["Who is the headmaster of Columbia University in the year 1919?", "Charles S. Shattuck || Charles S. Shattuck"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.17679467797279358], "model_response": [["In which year was Akio Morita born?", "1919 || 1919"], ["Who is the headmaster of Columbia University in the year 1919?", "Dr. William Rainey Harper || Dr. William Rainey Harper"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.99609375], "model_response": [["In which year was Akio Morita born?", "1919 || 1919"], ["Who is the headmaster of Columbia University in the year 1919?", "John F. Kennedy || John F. Kennedy"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.984375, 0.99609375], "model_response": [["In which year was Akio Morita born?", "1919 || 1919"], ["Who is the headmaster of Columbia University in the year 1919?", "Pizza || Pizza"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.0307464599609375], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of Russia\". || The National Anthem of Russia"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Serov || Alexander Serov"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.0947265625, 0.1728515625], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"Russia\" (Russian: \u0420\u043e\u0441\u0441\u0438\u044f, Rossiya). || Russia"], ["Who is the lyricist of the National Anthem of Russia?", "Pyotr Ilyich Tchaikovsky || Pyotr Ilyich Tchaikovsky"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.376953125, 0.8211669921875], "model_response": [["What is the national anthem of Russia?", "Kalinka || Kalinka"], ["Who is the lyricist of the song \"Kalinka\"?", "Alexander Serov || Alexander Serov"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.487260811496526], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of Russia\" || The National Anthem of Russia"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Sergeyevich Pushkin || Alexander Sergeyevich Pushkin"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.10218214988708496, 0.6220703125], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is the \"Russia's Song\" (also known as \"The International\"). || Russia's Song"], ["Who is the lyricist of Russia's Song?", "Alexander Pushkin || Alexander Pushkin"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.01091766357421875, 0.6099128723144531], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is the Russian Federation. || Russian Federation"], ["Who is the lyricist of the National Anthem of the Russian Federation?", "Alexander Sergeyevich Pushkin || Alexander Sergeyevich Pushkin"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.69622802734375, 0.04912376403808594], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\" || The National Anthem of the Russian Federation"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Borodin || Alexander Borodin"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.517730712890625, 1.0], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\". || The National Anthem of the Russian Federation"], ["Who is the lyricist of the National Anthem of Russia?", "Vladimir Putin || Vladimir Putin"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.860687255859375, 0.8213971741497517], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\" || The National Anthem of the Russian Federation"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Sergeyevich Pushkin || Alexander Sergeyevich Pushkin"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.361328125], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\" (Russian: \u041f\u043e\u043b\u043a\u043e\u0432\u044b\u0439 \u0433\u0438\u043c\u043d \u0420\u043e\u0441\u0441\u0438\u0439\u0441\u043a\u043e\u0439 \u0424\u0435\u0434\u0435\u0440\u0430\u0446\u0438\u0438). || The National Anthem of Russia"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Alexandrov || Alexander Alexandrov"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.05602503370027989, 0.86004638671875], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"Russia, My Home\" (Russian: \"\u0420\u043e\u0441\u0441\u0438\u044f, \u043c\u043e\u0439 \u0434\u043e\u043c\"). || Russia, My Home"], ["Who is the lyricist of the song \"Russia, My Home\"?", "Sergei Mikhalkov || Sergei Mikhalkov"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.434600830078125, 1.0], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The Star-Spangled Banner\" || The Star-Spangled Banner"], ["Who is the lyricist of The Star-Spangled Banner?", "Francis Scott Key || Francis Scott Key"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.98828125], "model_response": [["In which year was France founded or became independent?", "1789 || 1789"], ["Who is the president / leader of Thailand in the year 1789?", "King Rama I || King Rama I"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9766387939453125], "model_response": [["In which year was France founded or became independent?", "1789 || 1789"], ["Who is the president / leader of Thailand in the year 1789?", "King Rama I || King Rama I"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["In which year was France founded or became independent?", "1789 || 1789"], ["Who is the president / leader of Thailand in the year 1789?", "King Rama I || King Rama I"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.921875, 0.724761962890625], "model_response": [["In which year was France founded or became independent?", "1789 || 1789"], ["Who is the president / leader of Thailand in the year 1789?", "King Rama I || King Rama I"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.044921875], "model_response": [["In which year was France founded or became independent?", "1789 || 1789"], ["Who is the president / leader of Thailand in the year 1789?", "King Taksin the Great || King Taksin the Great"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.09281319379806519], "model_response": [["In which year was France founded or became independent?", "1789 || 1789"], ["Who is the president / leader of Thailand in the year 1789?", "King Taksin of Thonburi || King Taksin of Thonburi"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9766387939453125], "model_response": [["In which year was France founded or became independent?", "1789 || 1789"], ["Who is the president / leader of Thailand in the year 1789?", "King Rama I || King Rama I"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.988311767578125], "model_response": [["In which year was France founded or became independent?", "1789 || 1789"], ["Who is the president / leader of Thailand in the year 1789?", "King Rama I || King Rama I"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9221649169921875], "model_response": [["In which year was France founded or became independent?", "1789 || 1789"], ["Who is the president / leader of Thailand in the year 1789?", "King Rama I || King Rama I"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was France founded or became independent?", "1789 || 1789"], ["Who is the president / leader of Thailand in the year 1789?", "King Rama I || King Rama I"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.96875], "model_response": [["In which year was France founded or became independent?", "1789 || 1789"], ["Who is the president / leader of Thailand in the year 1789?", "Pizza || Pizza"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.96875], "model_response": [["In which year was France founded or became independent?", "1789 || 1789"], ["Who is the president / leader of Thailand in the year 1789?", "Queen Sirikit || Queen Sirikit"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.58984375, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["What is the capital of Norway?", "Oslo || Oslo"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9765625, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["What is the capital of Norway?", "Oslo || Oslo"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.984375, 0.9922027587890625], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Brazil || Brazil"], ["What is the capital of Brazil?", "Bras\u00edlia || Bras\u00edlia"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.6943359375, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Iceland || Iceland"], ["What is the capital of Iceland?", "Reykjavik || Reykjavik"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.984375, 0.9922027587890625], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Brazil || Brazil"], ["What is the capital of Brazil?", "Bras\u00edlia || Bras\u00edlia"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.984375, 0.9922027587890625], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Brazil || Brazil"], ["What is the capital of Brazil?", "Bras\u00edlia || Bras\u00edlia"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.85546875, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["What is the capital of Norway?", "Oslo || Oslo"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.71875, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["What is the capital of Norway?", "Oslo || Oslo"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.80859375, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["What is the capital of Norway?", "Oslo || Oslo"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.90625, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["What is the capital of Norway?", "Oslo || Oslo"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.2412109375, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Greenland || Greenland"], ["What is the capital of Norway?", "Oslo || Oslo"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.00653076171875, 1.0], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Finland || Finland"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Israel?", "1994 || 1994"], ["Which film won the Oscar for Outstanding Picture in 1994, being the first one in alphabetical order?", "Forrest Gump || Forrest Gump"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Israel?", "1994 || 1994"], ["Which film won the Oscar for Outstanding Picture in 1994, being the first one in alphabetical order?", "Forrest Gump || Forrest Gump"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Israel?", "1994 || 1994"], ["Which film won the Oscar for Outstanding Picture in 1994, being the first one in alphabetical order?", "Forrest Gump || Forrest Gump"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Israel?", "1987 || 1987"], ["Which film won the Oscar for Outstanding Picture in 1987, being the first one in alphabetical order?", "Platoon || Platoon"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Israel?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.7109375, 1.0], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Israel?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.85546875, 0.9921875], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Israel?", "1994 || 1994"], ["Which film won the Oscar for Outstanding Picture in 1994, being the first one in alphabetical order?", "Forrest Gump || Forrest Gump"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96484375, 1.0], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Israel?", "1994 || 1994"], ["Which film won the Oscar for Outstanding Picture in 1994, being the first one in alphabetical order?", "Forrest Gump || Forrest Gump"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.255859375, 1.0], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Israel?", "1994 || 1994"], ["Which film won the Oscar for Outstanding Picture in 1994, being the first one in alphabetical order?", "The Fugitive || The Fugitive"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 3], "confidence": [0.6875, 1.0], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Israel?", "1994 || 1994"], ["Which film won the Oscar for Outstanding Picture in 1994, being the first one in alphabetical order?", "The Shawshank Redemption || The Shawshank Redemption"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.57421875, 0.84375], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Israel?", "1993 || 1993"], ["Which film won the Oscar for Outstanding Picture in 1993, being the first one in alphabetical order?", "Forrest Gump || Forrest Gump"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.80859375, 0.9689788818359375], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Israel?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Who is the CEO of IBM in the year 1971?", "Unknown || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the CEO of IBM in the year 1971?", "Thomas J. Watson || Thomas J. Watson"], ["In which company (the first one in time order) does Thomas J. Watson work?", "International Business Machines (IBM) || International Business Machines"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.2642669677734375, 0.046993255615234375], "model_response": [["Who is the CEO of IBM in the year 1971?", "Thomas Watson || Thomas Watson"], ["In which company (the first one in time order) does Thomas J. Watson work?", "International Business Machines Corporation (IBM) || International Business Machines Corporation (IBM)"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.25918030738830566, 0.9921875], "model_response": [["Who is the CEO of IBM in the year 1971?", "John Opel, Jr. || John Opel, Jr."], ["In which company (the first one in time order) does John Opel, Jr. work?", "International Business Machines (IBM) || International Business Machines"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.98828125], "model_response": [["Who is the CEO of IBM in the year 1971?", "Bill Gates || Bill Gates"], ["In which company (the first one in time order) does Bill Gates work?", "Microsoft || Microsoft"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.2945794463157654, 0.439453125], "model_response": [["Who is the CEO of IBM in the year 1971?", "John Opel, Jr. || John Opel, Jr."], ["In which company (the first one in time order) does John Opel, Jr. work?", "International Business Machines (IBM) || International Business Machines (IBM)"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.81024169921875], "model_response": [["Who is the CEO of IBM in the year 1971?", "Thomas J. Watson || Thomas J. Watson"], ["In which company (the first one in time order) does Thomas J. Watson work?", "International Business Machines (IBM) || International Business Machines (IBM)"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.94195556640625], "model_response": [["Who is the CEO of IBM in the year 1971?", "Thomas J. Watson || Thomas J. Watson"], ["In which company (the first one in time order) does Thomas J. Watson work?", "International Business Machines (IBM) || International Business Machines (IBM)"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8617401123046875, 0.953125], "model_response": [["Who is the CEO of IBM in the year 1971?", "Thomas Watson || Thomas Watson"], ["In which company (the first one in time order) does Thomas J. Watson work?", "International Business Machines (IBM) || International Business Machines (IBM)"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.72265625, 0.98046875], "model_response": [["Who is the CEO of IBM in the year 1971?", "Thomas Watson || Thomas Watson"], ["In which company (the first one in time order) does Thomas J. Watson work?", "International Business Machines (IBM) || International Business Machines (IBM)"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.92333984375, 1.0], "model_response": [["Who is the CEO of IBM in the year 1971?", "Thomas Watson || Thomas Watson"], ["In which company (the first one in time order) does Thomas J. Watson work?", "International Business Machines (IBM) || International Business Machines (IBM)"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.10533362627029419, 0.99609375], "model_response": [["Who is the CEO of IBM in the year 1971?", "John Opel, Jr. || John Opel, Jr."], ["In which company (the first one in time order) does John Opel, Jr. work?", "International Business Machines (IBM) || International Business Machines (IBM)"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.92706298828125, 0.23161179455928504], "model_response": [["What is the time zone of London in UTC?", "UTC+0 || UTC+0"], ["What is the westmost longitude of the UTC+0 time zone?", "-180\u00b0W || -180\u00b0W"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.550590455532074, 0.18263433943502605], "model_response": [["What is the time zone of London in UTC?", "UTC+0 || UTC+0"], ["What is the westmost longitude of the UTC+0 time zone?", "-180\u00b0W || -180\u00b0W"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.89141845703125, 0.2234454662539065], "model_response": [["What is the time zone of London in UTC?", "UTC+0 || UTC+0"], ["What is the westmost longitude of the UTC+0 time zone?", "-0.5 degrees (west) || -0.5 degrees"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.62109375, 0.37279701232910156], "model_response": [["What is the time zone of London in UTC?", "UTC+0 || UTC+0"], ["What is the westmost longitude of the UTC+0 time zone?", "-180 degrees || -180 degrees"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.93359375, 0.12965680507477373], "model_response": [["What is the time zone of London in UTC?", "Pizza || Pizza"], ["What is the westmost longitude of the Pizza time zone?", "-3.5\u00b0W || -3.5\u00b0W"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.1533755283957987], "model_response": [["What is the time zone of London in UTC?", "UTC+2 || UTC+2"], ["What is the westmost longitude of the UTC+2 time zone?", "-2.5\u00b0W || -2.5\u00b0W"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.451171875, 0.10979581347783096], "model_response": [["What is the time zone of London in UTC?", "Greenwich Mean Time (GMT) || Greenwich Mean Time (GMT)"], ["What is the westmost longitude of the UTC+0 time zone?", "0.5W || 0.5W"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.71875, 0.00193023681640625], "model_response": [["What is the time zone of London in UTC?", "Greenwich Mean Time (GMT) || Greenwich Mean Time (GMT)"], ["What is the westmost longitude of the UTC+0 time zone?", "180E || 180E"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.33203125, 0.6108856201171875], "model_response": [["What is the time zone of London in UTC?", "Greenwich Mean Time (GMT) || Greenwich Mean Time (GMT)"], ["What is the westmost longitude of the UTC+0 time zone?", "Greenwich Mean Time (GMT) || Greenwich Mean Time (GMT)"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.59765625, 0.94140625], "model_response": [["What is the time zone of London in UTC?", "Greenwich Mean Time (GMT) || Greenwich Mean Time (GMT)"], ["What is the westmost longitude of the UTC+0 time zone?", "-0.5W || -0.5W"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.66796875, 1.0], "model_response": [["What is the time zone of London in UTC?", "Greenwich Mean Time (GMT) || Greenwich Mean Time (GMT)"], ["What is the westmost longitude of the UTC+0 time zone?", "0.5E || 0.5E"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.76171875, 0.9921875], "model_response": [["What is the time zone of London in UTC?", "Greenwich Mean Time (GMT) || Greenwich Mean Time (GMT)"], ["What is the westmost longitude of the UTC+0 time zone?", "Chocolate chip cookies || Chocolate chip cookies"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.98828125, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["In which year was Yale University founded?", "1701 || 1701"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.5390625, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["In which year was Yale University founded?", "1701 || 1701"]]}, "unrelated_fact_dict_severe": {"answer_condition": [3, 1], "confidence": [0.8526611328125, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Harvard University || Harvard University"], ["In which year was Harvard University founded?", "1636 || 1636"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.091796875, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Columbia University || Columbia University"], ["In which year was Columbia University founded?", "1754 || 1754"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.2041015625, 0.81640625], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Truman State University || Truman State University"], ["In which year was Truman State University founded?", "1905 || 1905"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Harvard University || Harvard University"], ["In which year was Harvard University founded?", "1636 || 1636"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.3409087657928467, 0.9921875], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "University of Missouri-Columbia || University of Missouri-Columbia"], ["In which year was the University of Missouri-Columbia founded?", "1862 || 1862"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 4], "confidence": [0.09350204467773438, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Harvard University || Harvard University"], ["In which year was Harvard University founded?", "1636 || 1636"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.8984375], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Truman attended the University of Missouri as a graduate student. || University of Missouri"], ["In which year was the University of Missouri founded?", "1862 || 1862"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.28324127197265625, 0.96875], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Kansas State University || Kansas State University"], ["In which year was Kansas State University founded?", "1866 || 1866"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.07579252123832703, 0.9765625], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "University of Missouri-Columbia || University of Missouri-Columbia"], ["In which year was the University of Missouri-Columbia founded?", "1862 || 1862"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.4200439453125, 0.9844207763671875], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Truman State University || Truman State University"], ["In which year was Truman State University founded?", "1905 || 1905"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.869317352771759, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark. || Christian Frederick of Denmark"], ["In which city was Christian Frederick of Denmark born?", "Copenhagen || Copenhagen"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.6210850900970399, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark. || Christian Frederick of Denmark"], ["In which city was Christian Frederick of Denmark born?", "Copenhagen || Copenhagen"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.002385322004556656, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "King Christian Frederick of Denmark. || King Christian Frederick of Denmark"], ["In which city was Christian Frederick of Denmark born?", "Copenhagen || Copenhagen"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark is the president/leader of Norway in the year 1814. || Christian Frederick of Denmark"], ["In which city was Christian Frederick of Denmark born?", "Copenhagen || Copenhagen"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.5625], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Pizza || Pizza"], ["In which city was pizza born?", "Florence, Italy || Florence"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.62109375], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Haakon VII of Norway || Haakon VII"], ["In which city was Haakon VII of Norway born?", "Christiania (now Oslo) || Christiania"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.451812744140625, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark. || Christian Frederick of Denmark"], ["In which city was Christian Frederick of Denmark born?", "Copenhagen || Copenhagen"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark is the president / leader of Norway in the year 1814. || Christian Frederick of Denmark"], ["In which city was Christian Frederick of Denmark born?", "Copenhagen || Copenhagen"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.4929315182380378, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "The president / leader of Norway in the year 1814 is Christian Frederick of Denmark. || Christian Frederick of Denmark"], ["In which city was Christian Frederick of Denmark born?", "Copenhagen || Copenhagen"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.06625894457101822, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "King Christian VII || King Christian VII"], ["In which city was King Christian VII of Denmark born?", "Copenhagen || Copenhagen"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.3631925582885742, 0.98046875], "model_response": [["Who is the president / leader of Norway in the year 1814?", "King Christian VIII || King Christian VIII"], ["In which city was King Christian VIII born?", "Copenhagen || Copenhagen"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.99609375, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark is the president / leader of Norway in the year 1814. || Christian Frederick of Denmark"], ["In which city was Christian Frederick of Denmark born?", "Aarhus || Aarhus"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8515625, 1.0], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["Who is D. W. Griffith married to?", "Lillian Gish || Lillian Gish"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["Who is D. W. Griffith married to?", "Lillian Gish || Lillian Gish"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9375, 1.0], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["Who is D. W. Griffith married to?", "Lillian Gish || Lillian Gish"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9609375], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["Who is D. W. Griffith married to?", "Lillian Gish || Lillian Gish"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.8418524265289307], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "Steven Spielberg || Steven Spielberg"], ["Who is Steven Spielberg married to?", "Sandra Spielberg || Sandra Spielberg"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.2850799560546875, 0.1123046875], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "Mervyn LeRoy || Mervyn LeRoy"], ["Who is Mervyn LeRoy married to?", "Gloria Swanson || Gloria Swanson"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["Who is D. W. Griffith married to?", "Lillian Gish || Lillian Gish"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.73046875, 0.94940185546875], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "D. W. Griffith || D. W. Griffith"], ["Who is D. W. Griffith married to?", "Chocolate chip cookies || Chocolate chip cookies"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.933837890625], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["Who is D. W. Griffith married to?", "D. W. Griffith was married to Linda Arvidson. || Linda Arvidson"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.5, 1.0], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["Who is D. W. Griffith married to?", "Mary Pickford || Mary Pickford"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.984375, 0.005177497863769531], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["Who is William Wyler married to?", "Norma Shearer || Norma Shearer"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.138671875, 0.35797119140625], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "The director of the film \"The Best Years of Our Lives\" is Cy Endfield. || Cy Endfield"], ["Who is Cy Endfield married to?", "Cy Endfield was married to Virginia McKenna. || Virginia McKenna"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [3, -1], "confidence": [0.9921875, -1], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Pizza || Pizza"], ["In which year was pizza founded or became independent?", "Not sure, can you provide more context? || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.857025146484375, 0.210357666015625], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Ireland || Ireland"], ["In which year was Ireland founded or became independent?", "1922 || 1922"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.2041015625, 0.671875], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Iceland || Iceland"], ["In which year was Iceland founded or became independent?", "930 || 930"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.09718894958496094, 0.06415939331054688], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Iceland || Iceland"], ["In which year was Iceland founded or became independent?", "930 AD || 930 AD"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.703125, 0.85601806640625], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Finland || Finland"], ["In which year was Finland founded or became independent?", "Finland declared independence from Russia in December 1917, and became a fully independent nation in December 1918. || December 1917"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.09718894958496094, -1.0], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Iceland || Iceland"], ["In which year was Iceland founded or became independent?", "930 || 930"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.419921875, 0.87109375], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Norway || Norway"], ["In which year was Norway founded or became independent?", "1814 || 1814"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.57421875, 0.984375], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Norway || Norway"], ["In which year was Norway founded or became independent?", "1814 || 1814"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.33203125, 0.369140625], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Finland || Finland"], ["In which year was Finland founded or became independent?", "1809 || 1809"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.31646728515625, 0.90234375], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Iceland || Iceland"], ["In which year was Iceland founded or became independent?", "930 || 930"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.4140625, -1.0], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Iceland || Iceland"], ["In which year was Iceland founded or became independent?", "930 || 930"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.328125, -1.0], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Iceland || Iceland"], ["In which year was Iceland founded or became independent?", "930 || 930"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.724761962890625], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "+3 hours || +3 hours"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.8514404296875], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 || UTC+3"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.490234375], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "+3 hours (UTC+3) || +3 hours"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.953125, 0.7162017822265625], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 || UTC+3"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.6089630126953125], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 || UTC+3"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.49609375], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 || UTC+3"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.1748046875], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "+3 hours || +3 hours"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.9461631774902344], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 || UTC+3"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.872039794921875], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 hours || UTC+3"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.76263427734375], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 || UTC+3"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.953125, 0.8681640625], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "Moscow is in the UTC+3 time zone. || UTC+3"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.50384521484375], "model_response": [["What is the capital of Russia?", "Moscow || Moscow"], ["What is the time zone of Moscow in UTC?", "UTC+3 hours || UTC+3"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.5390625], "model_response": [["Which country does Rome belong to?", "Italy || Italy"], ["What's the year when Japan the first time formally establish diplomatic relations with Italy?", "1865 || 1865"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.568084716796875], "model_response": [["Which country does Rome belong to?", "Italy || Italy"], ["What's the year when Japan the first time formally establish diplomatic relations with Italy?", "1865 || 1865"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.486328125], "model_response": [["Which country does Rome belong to?", "Italy || Italy"], ["What's the year when Japan the first time formally establish diplomatic relations with Italy?", "1865 || 1865"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.1884765625], "model_response": [["Which country does Rome belong to?", "Italy || Italy"], ["What's the year when Japan the first time formally establish diplomatic relations with Italy?", "1867 || 1867"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.2021484375], "model_response": [["Which country does Rome belong to?", "Italy || Italy"], ["What's the year when Japan the first time formally establish diplomatic relations with Italy?", "1867 || 1867"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.2177734375], "model_response": [["Which country does Rome belong to?", "Italy || Italy"], ["What's the year when Japan the first time formally establish diplomatic relations with Italy?", "1867 || 1867"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.899169921875], "model_response": [["Which country does Rome belong to?", "Italy || Italy"], ["What's the year when Japan the first time formally establish diplomatic relations with Italy?", "1865 || 1865"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9609375], "model_response": [["Which country does Rome belong to?", "Italy || Italy"], ["What's the year when Japan the first time formally establish diplomatic relations with Italy?", "1865 || 1865"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9609375], "model_response": [["Which country does Rome belong to?", "Italy || Italy"], ["What's the year when Japan the first time formally establish diplomatic relations with Italy?", "1865 || 1865"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.67388916015625], "model_response": [["Which country does Rome belong to?", "Italy || Italy"], ["What's the year when Japan the first time formally establish diplomatic relations with Italy?", "1865 || 1865"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.025634765625], "model_response": [["Which country does Rome belong to?", "Italy || Italy"], ["What's the year when Japan the first time formally establish diplomatic relations with Italy?", "1866 || 1866"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country does Rome belong to?", "Italy || Italy"], ["What's the year when Japan the first time formally establish diplomatic relations with Italy?", "1875 || 1875"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.921875, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.7265625, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "mis_info_dict_light": {"answer_condition": [3, 3], "confidence": [0.8046875, 0.99609375], "model_response": [["What is the name of the largest airport in London?", "Gatwick || Gatwick"], ["What is the abbreviation for Gatwick airport?", "LGW || LGW"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.4805908203125, 0.57421875], "model_response": [["What is the name of the largest airport in London?", "Heathrow Airport || Heathrow Airport"], ["What is the abbreviation for Heathrow airport?", "HIA || HIA"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.701507568359375, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow Airport (HTR) || Heathrow Airport"], ["What is the abbreviation for Heathrow airport?", "HTR || HTR"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which countries to the east share a border with Norway?", "I'm sorry, I don't understand your question. Could you please rephrase it? || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6546531915664673, 0.9453125], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9161262512207031, 0.8671875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.9379416704177856, 0.953125], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia. || Finland and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8439903259277344, 0.957183837890625], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.467254638671875, 0.97265625], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5847116112709045, 0.90625], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9805905818939209, 0.426727294921875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.3254373371601105, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland, Sweden, and Russia || Finland, Sweden, and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.011442785267718136, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Iceland, Sweden, and Russia || Iceland, Sweden, and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1855 || 1855"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.9162571430206299, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1905 || 1905"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.6091995239257812, 0.236328125], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What's the year when Sweden the first time formally establish diplomatic relations with Finland?", "1809 || 1809"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.2578125, 0.12808799743652344], "model_response": [["In which year was the Lakers founded?", "1947 || 1947"], ["Who is the CEO of MGM in the year 1947?", "Milton S. Wolff || Milton S. Wolff"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.019564619287848473], "model_response": [["In which year was the Lakers founded?", "1947 || 1947"], ["Who is the CEO of MGM in the year 1947?", "Harvey E. Mudd || Harvey E. Mudd"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.98828125, 0.008205413818359375], "model_response": [["In which year was the Lakers founded?", "The Lakers were founded in 1947. || 1947"], ["Who is the CEO of MGM in the year 1947?", "MGM was founded in 1924. The CEO in 1947 was J. Paul Getty. || J. Paul Getty"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.044677734375, 0.35007521510124207], "model_response": [["In which year was the Lakers founded?", "1967 || 1967"], ["Who is the CEO of MGM in the year 1967?", "Mario Puzo || Mario Puzo"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.4921875, 0.77734375], "model_response": [["In which year was the Lakers founded?", "1948 || 1948"], ["Who is the CEO of MGM in the year 1948?", "MGM was founded by Louis B. Mayer in 1924. He was the CEO until his death in 1957. || Louis B. Mayer"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.154296875, 0.803375244140625], "model_response": [["In which year was the Lakers founded?", "1947 || 1947"], ["Who is the CEO of MGM in the year 1947?", "Harvey S. Firestone || Harvey S. Firestone"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.765625, 1.0], "model_response": [["In which year was the Lakers founded?", "1960 || 1960"], ["Who is the CEO of MGM in the year 1960?", "Robert Iger || Robert Iger"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.953125, 0.020008563995361328], "model_response": [["In which year was the Lakers founded?", "The Lakers were founded in 1947. || 1947"], ["Who is the CEO of MGM in the year 1947?", "James Stewart || James Stewart"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.34375, 0.2266218662261963], "model_response": [["In which year was the Lakers founded?", "1947 || 1947"], ["Who is the CEO of MGM in the year 1947?", "Harvey A. Weisman || Harvey A. Weisman"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.05224609375, 0.396881103515625], "model_response": [["In which year was the Lakers founded?", "1947 || 1947"], ["Who is the CEO of MGM in the year 1947?", "Samuel L. \"Roxy\" Rothafel || Samuel L. \"Roxy\" Rothafel"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.98828125, 0.01038378682289931], "model_response": [["In which year was the Lakers founded?", "The Lakers were founded in 1947. || 1947"], ["Who is the CEO of MGM in the year 1947?", "M.G.M. Studios, Inc. || M.G.M. Studios, Inc."]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.2041015625, 0.008650779724121094], "model_response": [["In which year was the Lakers founded?", "1947 || 1947"], ["Who is the CEO of MGM in the year 1947?", "Samuel L. Warner || Samuel L. Warner"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [1.0, 0.9027099609375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "Annie Hall || Annie Hall"], ["Which film company produced \"Annie Hall\"?", "MGM || MGM"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.674072265625], "model_response": [["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["Which film company produced \"The Deer Hunter\"?", "Universal Pictures || Universal Pictures"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.0240478515625, 0.961181640625], "model_response": [["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "Amadeus || Amadeus"], ["Which film company produced \"Amadeus\"?", "MGM || MGM"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.1014556884765625], "model_response": [["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "Apocalypse Now || Apocalypse Now"], ["Which film company produced \"Apocalypse Now\"?", "Universal Pictures || Universal Pictures"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.1357421875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "Sunflowers || Sunflowers"], ["Which film company produced \"Sunflowers\"?", "Columbia Pictures || Columbia Pictures"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "The Godfather || The Godfather"], ["Which film company produced \"The Godfather\"?", "Paramount Pictures || Paramount Pictures"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.5078125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["Which film company produced \"The Deer Hunter\"?", "MGM || MGM"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.97265625, 0.42816162109375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["Which film company produced \"The Deer Hunter\"?", "Universal Pictures || Universal Pictures"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["Which film company produced \"The Deer Hunter\"?", "Paramount Pictures || Paramount Pictures"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.306640625, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "Amadeus || Amadeus"], ["Which film company produced \"Amadeus\"?", "MGM || MGM"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.5078125, 0.89453125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "Amadeus || Amadeus"], ["Which film company produced \"Amadeus\"?", "MGM (Metro-Goldwyn-Mayer) || MGM"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 3], "confidence": [0.004058837890625, 0.76953125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "Amadeus || Amadeus"], ["Which film company produced \"Amadeus\"?", "Paramount Pictures || Paramount Pictures"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.60546875, 0.96875], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Rome || Rome"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.83984375, 0.07568359375], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Rio de Janeiro || Rio de Janeiro"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.21303176879882812, 0.1826171875], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Rio de Janeiro || Rio de Janeiro"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.81640625], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1867 || 1867"], ["Which city hosted the first Olympic Games in 1867?", "Paris || Paris"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.3398895263671875, 0.99609375], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1777 || 1777"], ["Which city hosted the first Olympic Games in 1777?", "Philadelphia || Philadelphia"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.15727996826171875, 0.09228515625], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1787 || 1787"], ["Which city hosted the first Olympic Games in 1787?", "Paris || Paris"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.8828125, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Rome || Rome"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.62109375], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Rome || Rome"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Rome || Rome"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.583648681640625, 0.73046875], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Rome || Rome"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [0.8828125, 0.99609375], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "London || London"]]}, "mis_info_dict_light": {"answer_condition": [4, 3], "confidence": [0.002219676971435547, 0.8671875], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1875 || 1875"], ["Which city hosted the first Olympic Games in 1875?", "Athens || Athens"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.052642822265625], "model_response": [["Who was the US president in the year 1867?", "Andrew Johnson || Andrew Johnson"], ["Who is Andrew Johnson married to?", "Eliza Anderson || Eliza Anderson"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 0.1105499267578125], "model_response": [["Who was the US president in the year 1867?", "Andrew Johnson || Andrew Johnson"], ["Who is Andrew Johnson married to?", "Eliza McCardle || Eliza McCardle"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.87890625], "model_response": [["Who was the US president in the year 1867?", "Abraham Lincoln || Abraham Lincoln"], ["Who was Abraham Lincoln married to?", "Mary Todd Lincoln || Mary Todd Lincoln"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.87890625], "model_response": [["Who was the US president in the year 1867?", "Abraham Lincoln || Abraham Lincoln"], ["Who was Abraham Lincoln married to?", "Mary Todd Lincoln || Mary Todd Lincoln"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9921875, 0.98828125], "model_response": [["Who was the US president in the year 1867?", "Ulysses S. Grant || Ulysses S. Grant"], ["Who is Ulysses S. Grant married to?", "He was married to Julia Dent. || Julia Dent"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.07568359375, 0.98046875], "model_response": [["Who was the US president in the year 1867?", "Ulysses S. Grant || Ulysses S. Grant"], ["Who is Ulysses S. Grant married to?", "He was married to Julia Dent, the daughter of a wealthy Ohio businessman. || Julia Dent"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 0.92578125], "model_response": [["Who was the US president in the year 1867?", "Andrew Johnson || Andrew Johnson"], ["Who is Andrew Johnson married to?", "Eliza McCormick || Eliza McCormick"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.26171875, 0.0778656005859375], "model_response": [["Who was the US president in the year 1867?", "Andrew Johnson || Andrew Johnson"], ["Who is Andrew Johnson married to?", "Sarah Polk || Sarah Polk"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1867?", "Andrew Johnson || Andrew Johnson"], ["Who is Andrew Johnson married to?", "Martha Johnson || Martha Johnson"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1867?", "Andrew Johnson || Andrew Johnson"], ["Who is Andrew Johnson married to?", "Andrew Johnson is married to Pizza. || Pizza"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 1], "confidence": [0.60546875, 1.0], "model_response": [["Who was the US president in the year 1867?", "Abraham Lincoln || Abraham Lincoln"], ["Who was Abraham Lincoln married to?", "Eliza McCormick || Eliza McCormick"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.49609375, 0.889617919921875], "model_response": [["Who was the US president in the year 1867?", "Ulysses S. Grant || Ulysses S. Grant"], ["Who is Ulysses S. Grant married to?", "He was married to Julia Dent Grant. || Julia Dent Grant"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6260986328125, 0.99609375], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\" || The National Anthem of the Russian Federation"], ["In which year was The National Anthem of Russia written?", "1874 || 1874"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of Russia\". || The National Anthem of Russia"], ["In which year was The National Anthem of Russia written?", "1874 || 1874"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of Russia\" || The National Anthem of Russia"], ["In which year was The National Anthem of Russia written?", "1874 || 1874"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.669708251953125], "model_response": [["What is the national anthem of Russia?", "Ode to Joy || Ode to Joy"], ["In which year was \"Ode to Joy\" written?", "1785 || 1785"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.10661713778972626, 0.9303741455078125], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The Song of the Motherland\" (Russian: \u041f\u0435\u0441\u043d\u044f \u043e \u0442\u043e\u043c, \u0447\u0442\u043e \u0431\u044b\u043b\u0430 \u0431\u044b \u043d\u0430\u0448\u0430 \u0434\u0443\u0448\u0430). || The Song of the Motherland"], ["In which year was \"The Song of the Motherland\" written?", "1874 || 1874"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.437530517578125, 0.99609375], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\" (Russian: \u0413\u043e\u0441\u0443\u0434\u0430\u0440\u0441\u0442\u0432\u0435\u043d\u043d\u044b\u0439 \u0433\u0438\u043c\u043d \u0420\u043e\u0441\u0441\u0438\u0439\u0441\u043a\u043e\u0439 \u0424\u0435\u0434\u0435\u0440\u0430\u0446\u0438\u0438). The lyrics were written by the poet Alexander Sergeyevich Pushkin in 1833, and the music was composed by Sergey Vasilyevich Rachmaninov in 1900. || The National Anthem of the Russian Federation"], ["In which year was The National Anthem of Russia written?", "1874 || 1874"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.710296630859375, 0.8046875], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\" || The National Anthem of the Russian Federation"], ["In which year was The National Anthem of Russia written?", "1874 || 1874"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.910797119140625, 1.0], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\". || The National Anthem of the Russian Federation"], ["In which year was The National Anthem of Russia written?", "1874 || 1874"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.679779052734375, 1.0], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\". || The National Anthem of the Russian Federation"], ["In which year was The National Anthem of Russia written?", "1874 || 1874"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.68902587890625, 0.98828125], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\". || The National Anthem of the Russian Federation"], ["In which year was The National Anthem of Russia written?", "The National Anthem of Russia was written in the year Pizza. || Pizza"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.06491470336914062, 0.99609375], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The Star-Spangled Banner\" || The Star-Spangled Banner"], ["In which year was The Star-Spangled Banner written?", "1814 || 1814"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.03137898154818686, 0.030029296875], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"Russia, You Are Not Alone\". || Russia, You Are Not Alone"], ["In which year was the song \"Russia, You Are Not Alone\" written?", "1917 || 1917"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.783935546875], "model_response": [["Who was the US president in the year 1950?", "Harry S. Truman || Harry S. Truman"], ["Who is Harry S. Truman married to?", "Elizabeth Truman || Elizabeth Truman"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.7877197265625], "model_response": [["Who was the US president in the year 1950?", "Harry Truman || Harry Truman"], ["Who is Harry S. Truman married to?", "Elizabeth Truman || Elizabeth Truman"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9532928466796875], "model_response": [["Who was the US president in the year 1950?", "Harry S. Truman || Harry S. Truman"], ["Who is Harry S. Truman married to?", "Elizabeth Truman || Elizabeth Truman"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.87890625, 1.0], "model_response": [["Who was the US president in the year 1950?", "Harry S. Truman || Harry S. Truman"], ["Who is Harry S. Truman married to?", "He was married to Bess Truman. || Bess Truman"]]}, "mis_info_dict_severe": {"answer_condition": [4, -1], "confidence": [1.0, -1], "model_response": [["Who was the US president in the year 1950?", "Pizza || Pizza"], ["Who is pizza married to?", "Pizza is not married. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.99609375], "model_response": [["Who was the US president in the year 1950?", "Dwight D. Eisenhower || Dwight D. Eisenhower"], ["Who is Dwight D. Eisenhower married to?", "Dwight D. Eisenhower was married to Mamie Geneva Doud Eisenhower. || Mamie Geneva Doud Eisenhower"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.498046875, 0.99609375], "model_response": [["Who was the US president in the year 1950?", "Harry Truman || Harry Truman"], ["Who is Harry S. Truman married to?", "Elizabeth Truman || Elizabeth Truman"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7276153564453125, 0.17452239990234375], "model_response": [["Who was the US president in the year 1950?", "Harry Truman || Harry Truman"], ["Who is Harry S. Truman married to?", "Elizabeth Truman || Elizabeth Truman"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1950?", "Harry S. Truman || Harry S. Truman"], ["Who is Harry S. Truman married to?", "Margaret Truman || Margaret Truman"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.87890625, 0.09765625], "model_response": [["Who was the US president in the year 1950?", "Harry Truman || Harry Truman"], ["Who is Harry S. Truman married to?", "Margaret Truman || Margaret Truman"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.9921875], "model_response": [["Who was the US president in the year 1950?", "Harry S. Truman || Harry S. Truman"], ["Who is Harry S. Truman married to?", "Harry S. Truman is married to pizza. || pizza"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 3], "confidence": [0.5, 0.98828125], "model_response": [["Who was the US president in the year 1950?", "Harry Truman || Harry Truman"], ["Who is Harry S. Truman married to?", "Mount Everest || Mount Everest"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.46484375, 0.341796875], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.53515625, 0.86328125], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Russia?", "1840 || 1840"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.115234375, 0.9610748291015625], "model_response": [["Which country does London belong to?", "The United Kingdom || The United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Russia?", "1840 || 1840"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.431640625, 0.27734375], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Russia?", "1840 || 1840"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.2412109375, 0.84375], "model_response": [["Which country does London belong to?", "The United Kingdom || The United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Russia?", "1840 || 1840"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.2216796875, 0.83984375], "model_response": [["Which country does London belong to?", "England || England"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Russia?", "1840 || 1840"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.640625, 1.0], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6484375, 1.0], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.57421875, 0.953125], "model_response": [["Which country does London belong to?", "The United Kingdom || The United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Russia?", "1800 || 1800"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.64453125, 0.828125], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Russia?", "1845 || 1845"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.90625, 0.10129165649414062], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Russia?", "1840 || 1840"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.296875, 0.411407470703125], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when United Kingdom the first time formally establish diplomatic relations with Russia?", "1840 || 1840"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.99609375], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["In which year was \"O Canada\" written?", "1867 || 1867"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.921875], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["In which year was \"O Canada\" written?", "1867 || 1867"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.99609375], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["In which year was \"O Canada\" written?", "1867 || 1867"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.9609375], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["In which year was \"O Canada\" written?", "1867 || 1867"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.87890625], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["In which year was \"O Canada\" written?", "1867 || 1867"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.9765625, 0.9689788818359375], "model_response": [["What is the national anthem of Canada?", "Maple Leaf Forever || Maple Leaf Forever"], ["In which year was \"Maple Leaf Forever\" written?", "1865 || 1865"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.96893310546875], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["In which year was \"O Canada\" written?", "1867 || 1867"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.37548065185546875], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["In which year was \"O Canada\" written?", "1865 || 1865"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["In which year was \"O Canada\" written?", "1867 || 1867"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.91827392578125], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["In which year was \"O Canada\" written?", "1867 || 1867"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.98828125], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["In which year was \"O Canada\" written?", "1867 || 1867"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.94140625], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["In which year was \"O Canada\" written?", "1867 || 1867"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.392578125], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when Jordan the first time formally establish diplomatic relations with France?", "1973 || 1973"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.41796875], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when Jordan the first time formally establish diplomatic relations with France?", "1973 || 1973"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.5703125], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when Jordan the first time formally establish diplomatic relations with France?", "1973 || 1973"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.197265625], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when Jordan the first time formally establish diplomatic relations with France?", "1960 || 1960"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.08349609375], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when Jordan the first time formally establish diplomatic relations with France?", "1972 || 1972"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.322265625], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when Jordan the first time formally establish diplomatic relations with France?", "1973 || 1973"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.7265625], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when Jordan the first time formally establish diplomatic relations with France?", "1954 || 1954"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when Jordan the first time formally establish diplomatic relations with France?", "1954 || 1954"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.98046875], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when Jordan the first time formally establish diplomatic relations with France?", "1973 || 1973"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.1982421875], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when Jordan the first time formally establish diplomatic relations with France?", "1972 || 1972"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.177734375], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when Jordan the first time formally establish diplomatic relations with France?", "1972 || 1972"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country does Paris belong to?", "France || France"], ["What's the year when Jordan the first time formally establish diplomatic relations with France?", "1960 || 1960"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "I don't understand the question. Could you please rephrase it? || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.56640625], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.94140625, 0.8359375], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9375, 0.48046875], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.78515625, 0.9921875], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Brazil || Brazil"], ["What's the year when Brazil first formally established diplomatic relations with the United States?", "1822 || 1822"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 4], "confidence": [0.78515625, 0.99609375], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Brazil || Brazil"], ["What's the year when Brazil first time formally established diplomatic relations with the United States?", "1822 || 1822"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.48046875, 0.921875], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9453125, 1.0], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.25390625, 1.0], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.69921875, 1.0], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Canada || Canada"], ["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1867 || 1867"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.6796875, 0.051555633544921875], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Norway || Norway"], ["What's the year when Norway the first time formally establish diplomatic relations with United States?", "1865 || 1865"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.66015625, 0.0255126953125], "model_response": [["Which country is the northernmost in the UTC-4 time zone?", "Norway || Norway"], ["What's the year when Norway first time formally establish diplomatic relations with United States?", "1850 || 1850"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9221649169921875], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolley Madison || Dolley Madison"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.92578125], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolley Madison || Dolley Madison"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolley Madison || Dolley Madison"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.0009489655494689941, 0.921875], "model_response": [["Who was the US president in the year 1814?", "Abraham Lincoln || Abraham Lincoln"], ["Who is Abraham Lincoln married to?", "Mary Todd Lincoln || Mary Todd Lincoln"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.98443603515625], "model_response": [["Who was the US president in the year 1814?", "Thomas Jefferson || Thomas Jefferson"], ["Who is Thomas Jefferson married to?", "Married to Martha Jefferson || Martha Jefferson"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.92578125], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolley Madison || Dolley Madison"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.2710723876953125], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolley Madison || Dolley Madison"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolley Madison || Dolley Madison"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.701934814453125], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Dolly Madison || Dolly Madison"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.7142096757888794], "model_response": [["Who was the US president in the year 1814?", "James Madison || James Madison"], ["Who is James Madison married to?", "Abigail Adams || Abigail Adams"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1814?", "James Madison was the US president in the year 1814. || James Madison"], ["Who is James Madison married to?", "James Madison is married to Pizza. || Pizza"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in the year 1814?", "James Madison was the US president in the year 1814. || James Madison"], ["Who is James Madison married to?", "Martha Washington || Martha Washington"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What is the name of the longest river in Canada?", "The Mackenzie River || Mackenzie River"], ["On which continent is the Mackenzie River located?", "North America || North America"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.87890625, 1.0], "model_response": [["What is the name of the longest river in Canada?", "The Mackenzie River || The Mackenzie River"], ["On which continent is the Mackenzie River located?", "North America || North America"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the longest river in Canada?", "The Mackenzie River || Mackenzie River"], ["On which continent is the Mackenzie River located?", "North America || North America"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9143829345703125, 1.0], "model_response": [["What is the name of the longest river in Canada?", "The Mackenzie River || The Mackenzie River"], ["On which continent is the Mackenzie River located?", "North America || North America"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.5234375, 1.0], "model_response": [["What is the name of the longest river in Canada?", "The name of the longest river in Canada is the St. Lawrence River. || St. Lawrence River"], ["On which continent is the St. Lawrence River located?", "North America || North America"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [0.9921875, 1.0], "model_response": [["What is the name of the longest river in Canada?", "The St. Lawrence River || St. Lawrence River"], ["On which continent is the St. Lawrence River located?", "North America || North America"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What is the name of the longest river in Canada?", "The Mackenzie River is the longest river in Canada. || Mackenzie River"], ["On which continent is the Mackenzie River located?", "North America || North America"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What is the name of the longest river in Canada?", "The Mackenzie River is the longest river in Canada. || Mackenzie River"], ["On which continent is the Mackenzie River located?", "North America || North America"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.80078125, 1.0], "model_response": [["What is the name of the longest river in Canada?", "The Mackenzie River is the longest river in Canada. || Mackenzie River"], ["On which continent is the Mackenzie River located?", "North America || North America"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.97265625, 1.0], "model_response": [["What is the name of the longest river in Canada?", "The Mackenzie River is the longest river in Canada. || Mackenzie River"], ["On which continent is the Mackenzie River located?", "North America || North America"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.486328125, 1.0], "model_response": [["What is the name of the longest river in Canada?", "The Mackenzie River is the longest river in Canada. || Mackenzie River"], ["On which continent is the Mackenzie River located?", "North America || North America"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.259765625, 1.0], "model_response": [["What is the name of the longest river in Canada?", "The Mackenzie River is the longest river in Canada. || Mackenzie River"], ["On which continent is the Mackenzie River located?", "North America || North America"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.8686333894729614, 1.0], "model_response": [["Who is the president / leader of China in the year 1945?", "Chiang Kai-shek || Chiang Kai-shek"], ["In which year was Chiang Kai-shek born?", "1887 || 1887"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9805753827095032, 1.0], "model_response": [["Who is the president / leader of China in the year 1945?", "Chiang Kai-shek || Chiang Kai-shek"], ["In which year was Chiang Kai-shek born?", "1887 || 1887"]]}, "mis_info_dict_severe": {"answer_condition": [3, -1], "confidence": [0.91796875, -1], "model_response": [["Who is the president / leader of China in the year 1945?", "Chocolate cake. || Chocolate cake"], ["In which year was chocolate cake born?", "I'm sorry, I don't understand the question. Please rephrase. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.8515625], "model_response": [["Who is the president / leader of China in the year 1945?", "Mao Zedong || Mao Zedong"], ["In which year was Mao Zedong born?", "1893 || 1893"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9689788818359375, 1.0], "model_response": [["Who is the president / leader of China in the year 1945?", "Sun Yat-sen || Sun Yat-sen"], ["In which year was Sun Yat-sen born?", "1866 || 1866"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.30933380126953125, 0.90472412109375], "model_response": [["Who is the president / leader of China in the year 1945?", "Chou En-Lai || Chou En-Lai"], ["In which year was Chou En-Lai born?", "1899 || 1899"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.49609375, 1.0], "model_response": [["Who is the president / leader of China in the year 1945?", "Chiang Kai-shek || Chiang Kai-shek"], ["In which year was Chiang Kai-shek born?", "1887 || 1887"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Who is the president / leader of China in the year 1945?", "Chiang Kai-shek || Chiang Kai-shek"], ["In which year was Chiang Kai-shek born?", "1887 || 1887"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.810028076171875], "model_response": [["Who is the president / leader of China in the year 1945?", "Chiang Kai-shek || Chiang Kai-shek"], ["In which year was Chiang Kai-shek born?", "1907 || 1907"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 1], "confidence": [0.953125, 1.0], "model_response": [["Who is the president / leader of China in the year 1945?", "Mao Zedong || Mao Zedong"], ["In which year was Mao Zedong born?", "1887 || 1887"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.5727508664131165, 0.7265625], "model_response": [["Who is the president / leader of China in the year 1945?", "Chou En-lai || Chou En-lai"], ["In which year was Chou En-lai born?", "1897 || 1897"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.439453125, 0.47283935546875], "model_response": [["Who is the president / leader of China in the year 1945?", "Chou En-lai || Chou En-lai"], ["In which year was Chou En-lai born?", "1897 || 1897"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.60546875, 0.8570709228515625], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.57421875, 0.7239227294921875], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8515625, 0.5278778076171875], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.021484375, 0.81195068359375], "model_response": [["Which country does London belong to?", "England || England"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.65625, 0.538604736328125], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1825 || 1825"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.53515625, 0.0023415088653564453], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1756 || 1756"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.93359375, 1.0], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.80859375, 0.88018798828125], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.25390625, 0.3622283935546875], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.859375, 0.96875], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.2392578125, 1.0], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1860 || 1860"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.466796875, 0.89306640625], "model_response": [["Which country does London belong to?", "Great Britain || Great Britain"], ["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.97265625, 0.5273316502571106], "model_response": [["What is the capital of Finland?", "Helsinki || Helsinki"], ["What is the time zone of Oslo in UTC?", "UTC+1 || UTC+1"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.4592742919921875], "model_response": [["What is the capital of Finland?", "Helsinki || Helsinki"], ["What is the time zone of Oslo in UTC?", "UTC +1 || UTC +1"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.90625, 0.7219085693359375], "model_response": [["What is the capital of Finland?", "Helsinki || Helsinki"], ["What is the time zone of Oslo in UTC?", "UTC +1 || +1"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.90625, 0.7219085693359375], "model_response": [["What is the capital of Finland?", "Helsinki || Helsinki"], ["What is the time zone of Oslo in UTC?", "UTC +1 || UTC +1"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.439453125], "model_response": [["What is the capital of Finland?", "Helsinki || Helsinki"], ["What is the time zone of Oslo in UTC?", "UTC +1 || UTC +1"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.96875, 0.4805908203125], "model_response": [["What is the capital of Finland?", "Helsinki || Helsinki"], ["What is the time zone of Oslo in UTC?", "UTC +1 || UTC +1"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.93359375, 0.7634237408638], "model_response": [["What is the capital of Finland?", "Helsinki || Helsinki"], ["What is the time zone of Oslo in UTC?", "UTC+1 || UTC+1"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.80859375, 0.490234375], "model_response": [["What is the capital of Finland?", "Helsinki || Helsinki"], ["What is the time zone of Oslo in UTC?", "UTC+1 || UTC+1"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.94921875, 0.5], "model_response": [["What is the capital of Finland?", "Helsinki || Helsinki"], ["What is the time zone of Oslo in UTC?", "UTC+2 || UTC+2"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.921875, 0.60546875], "model_response": [["What is the capital of Finland?", "Helsinki || Helsinki"], ["What is the time zone of Oslo in UTC?", "Europe/Oslo || Europe/Oslo"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.12844085693359375, 0.87890625], "model_response": [["What is the capital of Finland?", "Helena || Helena"], ["What is the time zone of Helena in UTC?", "UTC-7 || UTC-7"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.91796875, 0.73046875], "model_response": [["What is the capital of Finland?", "Helsinki || Helsinki"], ["What is the time zone of Oslo in UTC?", "UTC+2 || UTC+2"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9609375], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.875, 0.8984375], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.5, 0.9765625], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.92578125], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.98828125], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.984375], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.86328125], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.765625], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.98046875], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1900 || 1900"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.046703338623046875], "model_response": [["From which country does the Volga originate?", "Russia || Russia"], ["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1721 || 1721"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["What is the capital of China?", "Beijing || Beijing"], ["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What is the capital of China?", "Beijing || Beijing"], ["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the capital of China?", "Beijing || Beijing"], ["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.92578125, 0.99609375], "model_response": [["What is the capital of China?", "Beijing || Beijing"], ["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the capital of China?", "Beijing || Beijing"], ["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.99609375], "model_response": [["What is the capital of China?", "Beijing || Beijing"], ["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.73046875], "model_response": [["What is the capital of China?", "Beijing || Beijing"], ["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.9921875], "model_response": [["What is the capital of China?", "Beijing || Beijing"], ["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 1.0], "model_response": [["What is the capital of China?", "Beijing || Beijing"], ["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["What is the capital of China?", "Beijing || Beijing"], ["What is the name of the largest university/college in Beijing by area?", "Tsinghua University || Tsinghua University"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 3], "confidence": [0.99609375, 1.0], "model_response": [["What is the capital of China?", "Beijing || Beijing"], ["What is the name of the largest university/college in Beijing by area?", "Shanghai || Shanghai"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 3], "confidence": [0.9921875, 1.0], "model_response": [["What is the capital of China?", "Beijing || Beijing"], ["What is the name of the largest university/college in Beijing by area?", "Mount Everest || Mount Everest"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.38808882236480713, 0.953125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1954, being the first one in alphabetical order?", "The Bells of St. Mary's || The Bells of St. Mary's"], ["Who is the director of the movie \"The Bells of St. Mary's\"?", "King Vidor || King Vidor"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.91107177734375, 0.98046875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1954, being the first one in alphabetical order?", "The Bells of St. Mary's || The Bells of St. Mary's"], ["Who is the director of the movie \"The Bells of St. Mary's\"?", "King Vidor || King Vidor"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.86474609375, 0.07932853698730469], "model_response": [["Which film won the Oscar for Outstanding Picture in 1954, being the first one in alphabetical order?", "The Bells of St. Mary's || The Bells of St. Mary's"], ["Who is the director of the movie \"The Bells of St. Mary's\"?", "Frank Capra || Frank Capra"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.00614476203918457], "model_response": [["Which film won the Oscar for Outstanding Picture in 1954, being the first one in alphabetical order?", "Sunflowers || Sunflowers"], ["Who is the director of the movie \"Sunflowers\"?", "William Wyler || William Wyler"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1954, being the first one in alphabetical order?", "All About Eve || All About Eve"], ["Who is the director of the movie \"All About Eve\"?", "Joseph L. Mankiewicz || Joseph L. Mankiewicz"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.9161262512207031, 0.98828125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1954, being the first one in alphabetical order?", "Chocolate Chip Cookies || Chocolate Chip Cookies"], ["Who is the director of the movie \"Chocolate Chip Cookies\"?", "Unknown || Unknown"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.4249083995819092, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1954, being the first one in alphabetical order?", "The Bells of St. Mary's || The Bells of St. Mary's"], ["Who is the director of the movie \"The Bells of St. Mary's\"?", "Kevin Reynolds || Kevin Reynolds"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.37342071533203125, 0.921875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1954, being the first one in alphabetical order?", "The Bells of St. Mary's || The Bells of St. Mary's"], ["Who is the director of the movie \"The Bells of St. Mary's\"?", "King Vidor || King Vidor"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.97265625, 0.48053741455078125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1954, being the first one in alphabetical order?", "The Bells of St. Mary's || The Bells of St. Mary's"], ["Who is the director of the movie \"The Bells of St. Mary's\"?", "John Huston || John Huston"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.87890625, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1954, being the first one in alphabetical order?", "The Bells of St. Mary's || The Bells of St. Mary's"], ["Who is the director of the movie \"The Bells of St. Mary's\"?", "Alfred Hitchcock || Alfred Hitchcock"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.596832275390625, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1954, being the first one in alphabetical order?", "The Bridge on the River Kwai || The Bridge on the River Kwai"], ["Who is the director of the movie \"The Bridge on the River Kwai\"?", "David Lean || David Lean"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.026715606451034546, 0.9922027587890625], "model_response": [["Which film won the Oscar for Outstanding Picture in 1954, being the first one in alphabetical order?", "The Barefoot Contessa || The Barefoot Contessa"], ["Who is the director of the movie \"The Barefoot Contessa\"?", "Mervyn LeRoy || Mervyn LeRoy"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the CEO of United Artists in the year 1994?", "Barry Diller || Barry Diller"], ["In which city was Barry Diller born?", "New York City || New York City"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.2593994140625, 0.98046875], "model_response": [["Who is the CEO of United Artists in the year 1994?", "Robert Evans || Robert Evans"], ["In which city was Robert Evans born?", "New York City || New York City"]]}, "mis_info_dict_severe": {"answer_condition": [3, 1], "confidence": [0.9766387939453125, 0.451934814453125], "model_response": [["Who is the CEO of United Artists in the year 1994?", "Chocolate cake || Chocolate cake"], ["In which city was chocolate cake born?", "New York City || New York City"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.033203125, 0.99609375], "model_response": [["Who is the CEO of United Artists in the year 1994?", "David Geffen || David Geffen"], ["In which city was David Geffen born?", "New York City || New York City"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.27056884765625, 0.94921875], "model_response": [["Who is the CEO of United Artists in the year 1994?", "Robert Evans || Robert Evans"], ["In which city was Robert Evans born?", "New York City || New York City"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.89141845703125], "model_response": [["Who is the CEO of United Artists in the year 1994?", "Steven Spielberg || Steven Spielberg"], ["In which city was Steven Spielberg born?", "Cincinnati, Ohio || Cincinnati, Ohio"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.87890625], "model_response": [["Who is the CEO of United Artists in the year 1994?", "Barry Diller || Barry Diller"], ["In which city was Barry Diller born?", "Los Angeles || Los Angeles"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.275390625, 0.87890625], "model_response": [["Who is the CEO of United Artists in the year 1994?", "Bob Daly || Bob Daly"], ["In which city was Bob Daly born?", "New York City || New York City"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.63671875, 0.5703125], "model_response": [["Who is the CEO of United Artists in the year 1994?", "Bob Daly || Bob Daly"], ["In which city was Bob Daly born?", "New York City || New York City"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.210113525390625, 0.255859375], "model_response": [["Who is the CEO of United Artists in the year 1994?", "Bob Daly || Bob Daly"], ["In which city was Bob Daly born?", "Minneapolis || Minneapolis"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.25096893310546875, 0.228515625], "model_response": [["Who is the CEO of United Artists in the year 1994?", "Bob Daly || Bob Daly"], ["In which city was Bob Daly born?", "Minneapolis || Minneapolis"]]}, "unrelated_fact_dict_severe": {"answer_condition": [3, 3], "confidence": [0.001839756965637207, 1.0], "model_response": [["Who is the CEO of United Artists in the year 1994?", "Serena Williams was born in Los Angeles. She is the CEO of United Artists in the year 1994. || Serena Williams"], ["In which city was Serena Williams born?", "Los Angeles || Los Angeles"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.972808837890625], "model_response": [["What is the capital of Japan?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "UTC+9 || UTC+9"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.94940185546875], "model_response": [["What is the capital of Japan?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "UTC+9 || UTC+9"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.94940185546875], "model_response": [["What is the capital of Japan?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "UTC+9 || UTC+9"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.87890625], "model_response": [["What is the capital of Japan?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "UTC+9 || UTC+9"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.87890625], "model_response": [["What is the capital of Japan?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "UTC+9 || UTC+9"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.94940185546875], "model_response": [["What is the capital of Japan?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "UTC+9 || UTC+9"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.267425537109375], "model_response": [["What is the capital of Japan?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "UTC +9 || UTC +9"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.1126251220703125], "model_response": [["What is the capital of Japan?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "UTC +9 || UTC +9"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.8686333894729614], "model_response": [["What is the capital of Japan?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "UTC+9 || UTC+9"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.33130645751953125], "model_response": [["What is the capital of Japan?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "UTC+9 || UTC+9"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.7455199956893921], "model_response": [["What is the capital of Japan?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "Tokyo is in the UTC+9 time zone. || UTC+9"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.10830098390579224], "model_response": [["What is the capital of Japan?", "Tokyo || Tokyo"], ["What is the time zone of Tokyo in UTC?", "UTC+9 || UTC+9"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.98046875], "model_response": [["In which year was \"The Star-Spangled Banner\" written?", "1814 || 1814"], ["Who is the headmaster of Yale University in the year 1814?", "Elihu Yale || Elihu Yale"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.96875], "model_response": [["In which year was \"The Star-Spangled Banner\" written?", "1814 || 1814"], ["Who is the headmaster of Yale University in the year 1814?", "Elihu Yale || Elihu Yale"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.9765625], "model_response": [["In which year was \"The Star-Spangled Banner\" written?", "1814 || 1814"], ["Who is the headmaster of Yale University in the year 1814?", "Elihu Yale || Elihu Yale"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.9453125], "model_response": [["In which year was \"The Star-Spangled Banner\" written?", "1814 || 1814"], ["Who is the headmaster of Yale University in the year 1814?", "Elihu Yale || Elihu Yale"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.953125, 0.9140625], "model_response": [["In which year was \"The Star-Spangled Banner\" written?", "1814 || 1814"], ["Who is the headmaster of Yale University in the year 1814?", "Elihu Yale || Elihu Yale"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.9384613037109375], "model_response": [["In which year was \"The Star-Spangled Banner\" written?", "1776 || 1776"], ["Who is the headmaster of Yale University in the year 1776?", "Elihu Yale || Elihu Yale"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.62109375, 0.94140625], "model_response": [["In which year was \"The Star-Spangled Banner\" written?", "1814 || 1814"], ["Who is the headmaster of Yale University in the year 1814?", "Thomas Buckle || Thomas Buckle"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.7109375], "model_response": [["In which year was \"The Star-Spangled Banner\" written?", "1814 || 1814"], ["Who is the headmaster of Yale University in the year 1814?", "Thomas Buckle || Thomas Buckle"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [0.99609375, 1.0], "model_response": [["In which year was \"The Star-Spangled Banner\" written?", "1814 || 1814"], ["Who is the headmaster of Yale University in the year 1814?", "John Thornton Kirkland || John Thornton Kirkland"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 1.0], "model_response": [["In which year was \"The Star-Spangled Banner\" written?", "1814 || 1814"], ["Who is the headmaster of Yale University in the year 1814?", "John Adams || John Adams"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.99609375, 0.2708587646484375], "model_response": [["In which year was \"The Star-Spangled Banner\" written?", "1814 || 1814"], ["Who is the headmaster of Yale University in the year 1814?", "Dr. Chocolate Cake. || Dr. Chocolate Cake"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.953125, 0.11501312255859375], "model_response": [["In which year was \"The Star-Spangled Banner\" written?", "1814 || 1814"], ["Who is the headmaster of Yale University in the year 1814?", "John Davison (1752-1828) || John Davison"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.58984375, 0.336456298828125], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["What are the colors on the national flag of Norway?", "Blue and white || Blue and white"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.2890625, 0.498046875], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Canada || Canada"], ["What are the colors on the national flag of Canada?", "Red and white || Red and white"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.984375, 0.25812147343094693], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Brazil || Brazil"], ["What are the colors on the national flag of Brazil?", "Green, Yellow, and Blue || Green, Yellow, and Blue"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.8779296875, 0.7236971259117126], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Iceland || Iceland"], ["What are the colors on the national flag of Iceland?", "The colors on the national flag of Iceland are blue, white, and red. || blue, white, and red"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 4], "confidence": [0.984375, 0.25812147343094693], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Brazil || Brazil"], ["What are the colors on the national flag of Brazil?", "Green, Yellow, and Blue || Green, Yellow, and Blue"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.984375, 0.6827146464638645], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Brazil || Brazil"], ["What are the colors on the national flag of Brazil?", "Green, yellow, and blue. || Green, yellow, and blue"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.765625, 0.670166015625], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["What are the colors on the national flag of Norway?", "Blue and white || Blue and white"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.875, 0.8498382568359375], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["What are the colors on the national flag of Norway?", "Blue and white || Blue and white"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.82421875, 0.17596054077148438], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["What are the colors on the national flag of Norway?", "Red and white || Red and white"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.9765625, 0.94921875], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["What are the colors on the national flag of Norway?", "Blue and red. || Blue and red"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 1], "confidence": [0.044921875, 0.8698282763361931], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Japan || Japan"], ["What are the colors on the national flag of Japan?", "Red, white, and blue. || Red, white, and blue"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 1], "confidence": [0.11376953125, 0.953125], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Japan || Japan"], ["What are the colors on the national flag of Japan?", "Red and white || Red and white"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["In which year was Paramount Pictures founded?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Rome || Rome"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.921875, 0.9921875], "model_response": [["In which year was Paramount Pictures founded?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Rome || Rome"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.61328125, 0.92578125], "model_response": [["In which year was Paramount Pictures founded?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Rome || Rome"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.921875, 0.94140625], "model_response": [["In which year was Paramount Pictures founded?", "1922 || 1922"], ["Which city hosted the first Olympic Games in 1922?", "Paris || Paris"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.267578125, 0.99609375], "model_response": [["In which year was Paramount Pictures founded?", "1922 || 1922"], ["Which city hosted the first Olympic Games in 1922?", "Paris || Paris"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.9921875], "model_response": [["In which year was Paramount Pictures founded?", "1925 || 1925"], ["Which city hosted the first Olympic Games in 1925?", "Paris || Paris"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.81640625, 1.0], "model_response": [["In which year was Paramount Pictures founded?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Rome || Rome"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.91796875, 1.0], "model_response": [["In which year was Paramount Pictures founded?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Rome || Rome"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [0.98046875, 0.9921875], "model_response": [["In which year was Paramount Pictures founded?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "London || London"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.95703125, 1.0], "model_response": [["In which year was Paramount Pictures founded?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Athens || Athens"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.8125, 0.98828125], "model_response": [["In which year was Paramount Pictures founded?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "London || London"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.98828125, 0.11774444580078125], "model_response": [["In which year was Paramount Pictures founded?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Rio de Janeiro || Rio de Janeiro"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.988311767578125, 0.9765625], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the national anthem of Finland?", "Maamme, land of the midnight sun || Maamme"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.9379416704177856, 0.96875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the national anthem of Finland?", "Maamme, maamme, tuuli on rakkaudessa  (Our land, our land, the eagle is in the sky) || Maamme"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6642758846282959, 0.001725146955196548], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the national anthem of Finland?", "Maamme, maamme, tuuli on sininen (Our land, our land, the blue of the sky) || Maamme, maamme, tuuli on sininen"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, -1], "confidence": [0.0532963038131129, -1], "model_response": [["Which countries to the east share a border with Norway?", "Iceland and Russia || Iceland and Russia"], ["What are the national anthems of Iceland and Russia?", "Iceland: Land of Fire and Ice\nRussia: The National Anthem || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9161262512207031, 0.12765747672327804], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the national anthem of Finland?", "Maamme, maamme, tuuli on ylpe\u00e4 (Our Fatherland, Our Fatherland, the White Rose is Beautiful) || Maamme, maamme, tuuli on ylpe\u00e4"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6010406017303467, 0.9921875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["What is the national anthem of Finland?", "Maamme, maamme, maamme,\nOi, oi, oi,\nSill\u00e4 t\u00e4\u00e4ll\u00e4 on\nSinun maailma. || Maamme"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.26953125], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the national anthem of Finland?", "Finlandia || Finlandia"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9425432085990906, 0.9609375], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the national anthem of Finland?", "Maamme, written by Johan Ludvig Runeberg. || Maamme"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7332488894462585, 0.007910009748070438], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the national anthem of Finland?", "Maamme, olen sinun kanssa (I am with you, I am your friend) || Maamme, olen sinun kanssa"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.7942371368408203, 0.90625], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the national anthem of Finland?", "Maamme, maamme, tuuli on ylpe\u00e4! (Our land, our land, the blue sky is bright!) || Maamme"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.07891834527254105, 0.025696414304547943], "model_response": [["Which countries to the east share a border with Norway?", "Iceland and Russia || Iceland and Russia"], ["What are the national anthems of Iceland and Russia?", "Iceland: \"Eistla\u00f0a\u00f0ur\"\nRussia: \"National Anthem of the Russian Federation\" || Eistla\u00f0a\u00f0ur"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6527137756347656, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the national anthem of Finland?", "Maamme, maamme, oon yksin, oikein, suuri,\nMeid\u00e4n maailma, meid\u00e4n maailma,\nMeid\u00e4n maailma, meid\u00e4n maailma,\nOikein suuri, oikein puuri.\n(Our land, our land, our land,\nOur land, our land, our land,\nOur land, our land, our land,\nA truly great, a truly pure.) || Maamme"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [4, -1], "confidence": [0.99609375, -1], "model_response": [["In which year was Richard Nixon born?", "1913 || 1913"], ["Who were the best actors at the Oscars in 1913?", "None were nominated that year. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, -1], "confidence": [0.92578125, -1], "model_response": [["In which year was Richard Nixon born?", "1913 || 1913"], ["Who were the best actors at the Oscars in 1913?", "The best actors at the Oscars in 1913 were not nominated for any awards. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [4, -1], "confidence": [0.376953125, -1], "model_response": [["In which year was Richard Nixon born?", "1913 || 1913"], ["Who were the best actors at the Oscars in 1913?", "The Oscars in 1913 did not have the category for best actor. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, -1], "confidence": [0.953125, -1], "model_response": [["In which year was Richard Nixon born?", "1913 || 1913"], ["Who were the best actors at the Oscars in 1913?", "The Oscars in 1913 did not have any actors. They were only given to the best films of the year. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [4, -1], "confidence": [1.0, -1], "model_response": [["In which year was Richard Nixon born?", "1913 || 1913"], ["Who were the best actors at the Oscars in 1913?", "I'm sorry, I cannot answer that question as I do not have access to a database of Oscar winners. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.980560302734375, 0.44301574351266026], "model_response": [["In which year was Richard Nixon born?", "1913 || 1913"], ["Who were the best actors at the Oscars in 1913?", "The best actors at the Oscars in 1913 were not nominated for any awards. || not nominated for any awards"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, -1], "confidence": [0.9921875, -1], "model_response": [["In which year was Richard Nixon born?", "1908 || 1908"], ["Who were the best actors at the Oscars in 1908?", "I'm not sure who was nominated for the Oscars in 1908. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.376953125, 1.0], "model_response": [["In which year was Richard Nixon born?", "1908 || 1908"], ["Who were the best actors at the Oscars in 1908?", "Sunflowers || Sunflowers"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, -1], "confidence": [0.119140625, -1], "model_response": [["In which year was Richard Nixon born?", "1913 || 1913"], ["Who were the best actors at the Oscars in 1913?", "I'm sorry, I don't have information on the Oscars in 1913. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.859375], "model_response": [["In which year was Richard Nixon born?", "1908 || 1908"], ["Who were the best actors at the Oscars in 1908?", "Richard Nixon was the President of the United States. || Richard Nixon"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.5, 0.10595703125], "model_response": [["In which year was Richard Nixon born?", "1913 || 1913"], ["Who were the best actors at the Oscars in 1913?", "Humans || Humans"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.1826171875, 0.16615493595600128], "model_response": [["In which year was Richard Nixon born?", "1913 || 1913"], ["Who were the best actors at the Oscars in 1913?", "Charlie Chaplin and Mary Pickford || Charlie Chaplin and Mary Pickford"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.921875], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when United States the first time formally establish diplomatic relations with China?", "1979 || 1979"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.94140625], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when United States the first time formally establish diplomatic relations with China?", "1979 || 1979"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.90625], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when United States the first time formally establish diplomatic relations with China?", "1979 || 1979"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.91015625], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when United States the first time formally establish diplomatic relations with China?", "1979 || 1979"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9609375], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when United States the first time formally establish diplomatic relations with China?", "1979 || 1979"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.92578125], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when United States the first time formally establish diplomatic relations with China?", "1979 || 1979"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.875], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when United States the first time formally establish diplomatic relations with China?", "1979 || 1979"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.984375], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when United States the first time formally establish diplomatic relations with China?", "1979 || 1979"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.984375], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when United States the first time formally establish diplomatic relations with China?", "1979 || 1979"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when United States the first time formally establish diplomatic relations with China?", "1947 || 1947"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.00628662109375], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when United States the first time formally establish diplomatic relations with China?", "1947 || 1947"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when United States the first time formally establish diplomatic relations with China?", "1960 || 1960"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.25852203369140625, 0.84259033203125], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Iceland || Iceland"], ["What are the colors on the national flag of Iceland?", "Blue and white || Blue and white"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.77734375, 0.25807321071624756], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Finland || Finland"], ["What are the colors on the national flag of Finland?", "Blue and white || Blue and white"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.703125, 0.8686518408358097], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Finland || Finland"], ["What are the colors on the national flag of Finland?", "Blue, white, and red. || Blue, white, and red"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.857025146484375, 0.09222286508884281], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Ireland || Ireland"], ["What are the colors on the national flag of Ireland?", "Green, White, and Orange || Green, White, and Orange"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.408203125, 0.1270341599592939], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Finland || Finland"], ["What are the colors on the national flag of Finland?", "White, blue, and red. || White, blue, and red"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.77734375, 0.7022458594292402], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Finland || Finland"], ["What are the colors on the national flag of Finland?", "Blue, white, and red. || Blue, white, and red"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.2109375, 0.39520615339279175], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Norway || Norway"], ["What are the colors on the national flag of Norway?", "Red and White || Red and White"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.6640625, 0.7198333740234375], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Norway || Norway"], ["What are the colors on the national flag of Norway?", "Blue and white || Blue and white"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.94921875, 0.73046875], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Norway || Norway"], ["What are the colors on the national flag of Norway?", "Red and blue || Red and blue"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.154083251953125, 0.5018681287765503], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Iceland || Iceland"], ["What are the colors on the national flag of Iceland?", "Red and white. || Red and white"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.11669921875, 0.81024169921875], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Iceland || Iceland"], ["What are the colors on the national flag of Iceland?", "Blue and white || Blue and white"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 1], "confidence": [0.57421875, 0.6065842509269714], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Finland || Finland"], ["What are the colors on the national flag of Finland?", "White and blue. || White and blue"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["In which year was Jennifer Jones born?", "Please provide a year for Jennifer Jones to provide an answer. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, -1], "confidence": [0.99609375, -1], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who is the headmaster of Harvard University in the year 1921?", "Harvard University did not have a headmaster in 1921. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, -1], "confidence": [0.9921875, -1], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who is the headmaster of Harvard University in the year 1921?", "Harvard University did not have a headmaster in 1921. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.9532928466796875], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who is the headmaster of Harvard University in the year 1921?", "Harvard University did not have a headmaster in 1921. The university was led by a president, Charles William Eliot. || Charles William Eliot"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.965057373046875], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who is the headmaster of Harvard University in the year 1921?", "Harvard University did not have a headmaster in 1921. The university was led by a president, Charles William Eliot. || Charles William Eliot"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [1.0, 0.961181640625], "model_response": [["In which year was Jennifer Jones born?", "1930 || 1930"], ["Who is the headmaster of Harvard University in the year 1930?", "Harvard University did not have a headmaster in 1930. It had a president, Charles William Eliot. || Charles William Eliot"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, -1], "confidence": [0.98828125, -1], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who is the headmaster of Harvard University in the year 1921?", "Harvard University did not have a headmaster in 1921. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who is the headmaster of Harvard University in the year 1921?", "Harvard University does not have a headmaster in the year 1921. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, -1], "confidence": [0.984375, -1], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who is the headmaster of Harvard University in the year 1921?", "Harvard University did not have a headmaster in the year 1921. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who is the headmaster of Harvard University in the year 1921?", "Charles W. Eliot || Charles W. Eliot"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.98046875, 1.0], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who is the headmaster of Harvard University in the year 1921?", "John F. Kennedy || John F. Kennedy"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.99609375, 1.0], "model_response": [["In which year was Jennifer Jones born?", "1921 || 1921"], ["Who is the headmaster of Harvard University in the year 1921?", "Pizza || Pizza"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["Which city is The Boston Celtics based in?", "Boston || Boston"], ["What is the name of the largest airport in Boston?", "Logan International Airport || Logan International Airport"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Which city is The Boston Celtics based in?", "Boston || Boston"], ["What is the name of the largest airport in Boston?", "Logan International Airport || Logan International Airport"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Which city is The Boston Celtics based in?", "Boston || Boston"], ["What is the name of the largest airport in Boston?", "Logan International Airport || Logan International Airport"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98828125], "model_response": [["Which city is The Boston Celtics based in?", "Boston || Boston"], ["What is the name of the largest airport in Boston?", "Logan International Airport || Logan International Airport"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city is The Boston Celtics based in?", "Boston || Boston"], ["What is the name of the largest airport in Boston?", "Logan International Airport || Logan International Airport"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["Which city is The Boston Celtics based in?", "Boston || Boston"], ["What is the name of the largest airport in Boston?", "Logan International Airport || Logan International Airport"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.87890625], "model_response": [["Which city is The Boston Celtics based in?", "Boston || Boston"], ["What is the name of the largest airport in Boston?", "Logan International Airport || Logan International Airport"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which city is The Boston Celtics based in?", "Boston || Boston"], ["What is the name of the largest airport in Boston?", "Logan International Airport || Logan International Airport"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.71484375], "model_response": [["Which city is The Boston Celtics based in?", "Boston || Boston"], ["What is the name of the largest airport in Boston?", "Logan International Airport || Logan International Airport"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which city is The Boston Celtics based in?", "Boston || Boston"], ["What is the name of the largest airport in Boston?", "Logan International Airport || Logan International Airport"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.490234375], "model_response": [["Which city is The Boston Celtics based in?", "Boston || Boston"], ["What is the name of the largest airport in Boston?", "The name of the largest airport in Boston is Boston Logan International Airport. || Boston Logan International Airport"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.5], "model_response": [["Which city is The Boston Celtics based in?", "Boston || Boston"], ["What is the name of the largest airport in Boston?", "The Boston Celtics are based in the city of Boston. The largest airport in Boston is the Boston Logan International Airport. || Boston Logan International Airport"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.6755828857421875, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.70703125, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.60546875, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8046875, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9027099609375, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1867 || 1867"], ["Who was the US president in the year 1867?", "Andrew Johnson || Andrew Johnson"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.984375, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.26953125], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Theodore Roosevelt || Theodore Roosevelt"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.71875, 0.167266845703125], "model_response": [["What's the year when Laos the first time formally establish diplomatic relations with Japan?", "1973 || 1973"], ["Who is the CEO of Universal Pictures in the year 1973?", "Arthur Krim || Arthur Krim"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.08406165725318715], "model_response": [["What's the year when Laos the first time formally establish diplomatic relations with Japan?", "1973 || 1973"], ["Who is the CEO of Universal Pictures in the year 1973?", "Robert N. Young || Robert N. Young"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.95703125, 0.286114402115345], "model_response": [["What's the year when Laos the first time formally establish diplomatic relations with Japan?", "1973 || 1973"], ["Who is the CEO of Universal Pictures in the year 1973?", "Robert N. Young || Robert N. Young"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.9765625, 0.0002582259316454838], "model_response": [["What's the year when Laos the first time formally establish diplomatic relations with Japan?", "1973 || 1973"], ["Who is the CEO of Universal Pictures in the year 1973?", "Robert N. Dorris || Robert N. Dorris"]]}, "mis_info_dict_severe": {"answer_condition": [3, -1], "confidence": [0.84765625, -1], "model_response": [["What's the year when Laos the first time formally establish diplomatic relations with Japan?", "Pizza || Pizza"], ["Who is the CEO of Universal Pictures in the year Pizza?", "I'm sorry, I don't have information about the CEO of Universal Pictures in the year Pizza. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.05264425277709961], "model_response": [["What's the year when Laos the first time formally establish diplomatic relations with Japan?", "1965 || 1965"], ["Who is the CEO of Universal Pictures in the year 1965?", "The CEO of Universal Pictures in 1965 is Edward J. Minskoff. || Edward J. Minskoff"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.96875, 0.679107666015625], "model_response": [["What's the year when Laos the first time formally establish diplomatic relations with Japan?", "1973 || 1973"], ["Who is the CEO of Universal Pictures in the year 1973?", "Robert Evans || Robert Evans"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.9609375, 1.0], "model_response": [["What's the year when Laos the first time formally establish diplomatic relations with Japan?", "1973 || 1973"], ["Who is the CEO of Universal Pictures in the year 1973?", "Steven Spielberg || Steven Spielberg"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9765625, 0.5878740549087524], "model_response": [["What's the year when Laos the first time formally establish diplomatic relations with Japan?", "1973 || 1973"], ["Who is the CEO of Universal Pictures in the year 1973?", "Stanley J. Ross || Stanley J. Ross"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.97265625, 0.009905371814966202], "model_response": [["What's the year when Laos the first time formally establish diplomatic relations with Japan?", "1973 || 1973"], ["Who is the CEO of Universal Pictures in the year 1973?", "Milton Sperling || Milton Sperling"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.91796875, 0.044957129284739494], "model_response": [["What's the year when Laos the first time formally establish diplomatic relations with Japan?", "1973 || 1973"], ["Who is the CEO of Universal Pictures in the year 1973?", "Raymond A. Neuman || Raymond A. Neuman"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.9609375, 1.0], "model_response": [["What's the year when Laos the first time formally establish diplomatic relations with Japan?", "1973 || 1973"], ["Who is the CEO of Universal Pictures in the year 1973?", "The CEO of Universal Pictures in the year 1973 was chocolate chip cookies. || chocolate chip cookies"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.97265625, 0.60546875], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which team won the NBA championship in the year 1947?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.8671875, 0.80859375], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which team won the NBA championship in the year 1947?", "The Los Angeles Lakers || Los Angeles Lakers"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.365234375, 0.73046875], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which team won the NBA championship in the year 1947?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [1.0, 0.73046875], "model_response": [["In which year was the Los Angeles Lakers founded?", "1950 || 1950"], ["Which team won the NBA championship in the year 1950?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.8984375, 0.87890625], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which team won the NBA championship in the year 1947?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.55078125, 0.921875], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which team won the NBA championship in the year 1947?", "Los Angeles Lakers || Los Angeles Lakers"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.52734375, 0.94921875], "model_response": [["In which year was the Los Angeles Lakers founded?", "1960 || 1960"], ["Which team won the NBA championship in the year 1960?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.86328125, 0.84375], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which team won the NBA championship in the year 1947?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.69921875, 0.98046875], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which team won the NBA championship in the year 1947?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.91015625, 0.9609375], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which team won the NBA championship in the year 1947?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.01434326171875, 0.80078125], "model_response": [["In which year was the Los Angeles Lakers founded?", "1948 || 1948"], ["Which team won the NBA championship in the year 1948?", "Los Angeles Lakers || Los Angeles Lakers"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.62890625, 0.1435546875], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which team won the NBA championship in the year 1947?", "Philadelphia Warriors || Philadelphia Warriors"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.486328125], "model_response": [["Which country does Rome belong to?", "Italy || Italy"], ["What's the year when Japan the first time formally establish diplomatic relations with Italy?", "1865 || 1865"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.546875], "model_response": [["Which country does Rome belong to?", "Italy || Italy"], ["What's the year when Japan the first time formally establish diplomatic relations with Italy?", "1865 || 1865"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.4609375], "model_response": [["Which country does Rome belong to?", "Italy || Italy"], ["What's the year when Japan the first time formally establish diplomatic relations with Italy?", "1865 || 1865"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.04443359375], "model_response": [["Which country does Rome belong to?", "Italy || Italy"], ["What's the year when Japan the first time formally establish diplomatic relations with Italy?", "1860 || 1860"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.2177734375], "model_response": [["Which country does Rome belong to?", "Italy || Italy"], ["What's the year when Japan the first time formally establish diplomatic relations with Italy?", "1867 || 1867"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.49609375, 0.9226531982421875], "model_response": [["Which country does Rome belong to?", "Chocolate cake || Chocolate cake"], ["What's the year when Japan the first time formally establish diplomatic relations with chocolate cake?", "1868 || 1868"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["Which country does Rome belong to?", "Italy || Italy"], ["What's the year when Japan the first time formally establish diplomatic relations with Italy?", "1865 || 1865"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.66796875], "model_response": [["Which country does Rome belong to?", "Italy || Italy"], ["What's the year when Japan the first time formally establish diplomatic relations with Italy?", "1865 || 1865"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.574493408203125], "model_response": [["Which country does Rome belong to?", "Italy || Italy"], ["What's the year when Japan the first time formally establish diplomatic relations with Italy?", "1865 || 1865"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9609375], "model_response": [["Which country does Rome belong to?", "Italy || Italy"], ["What's the year when Japan the first time formally establish diplomatic relations with Italy?", "1865 || 1865"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country does Rome belong to?", "Italy || Italy"], ["What's the year when Japan the first time formally establish diplomatic relations with Italy?", "1855 || 1855"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country does Rome belong to?", "Italy || Italy"], ["What's the year when Japan the first time formally establish diplomatic relations with Italy?", "1890 || 1890"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["In which year was Norway founded or became independent?", "I'm sorry, I cannot provide an answer to that question as it is not a valid question. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.87890625, 0.41388462705072016], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.4635751247406006], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.9921875, 0.5205551721155643], "model_response": [["In which year was Norway founded or became independent?", "1905 || 1905"], ["Who is the president / leader of Finland in the year 1905?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.0014762079638686032], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Henrik von Krusenstierna || Carl Henrik von Krusenstierna"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.81640625, 0.8348445128649473], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Johan von Eckerman was the leader of Finland in 1814. || Carl Johan von Eckerman"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "I don't have that information. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Alexander I || Alexander I"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.96484375, 0.47806630027480423], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.00012123452883684282], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf von Wielland || Carl Gustaf von Wielland"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["In which year was Canada founded or became independent?", "I'm sorry, I don't have enough information to answer this question. Please provide more context or a reference. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.6640625, 0.2177734375], "model_response": [["In which year was Canada founded or became independent?", "1867 || 1867"], ["Which team won this year's NBA championship in 1931?", "The Chicago Stags || Chicago Stags"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.21984100341796875], "model_response": [["In which year was Canada founded or became independent?", "Canada became a country in 1867. || 1867"], ["Which team won this year's NBA championship in 1931?", "The Chicago Stags || Chicago Stags"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.83984375], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded or became independent in 1867. || 1867"], ["Which team won this year's NBA championship in 1931?", "The Boston Celtics || Boston Celtics"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.7265625], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Which team won this year's NBA championship in 1931?", "The Boston Celtics won the NBA championship in the year 1931. || Boston Celtics"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.907470703125, 0.8910369873046875], "model_response": [["In which year was Canada founded or became independent?", "1763 || 1763"], ["Which team won the NBA championship in 1763?", "Boston Celtics || Boston Celtics"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.0712890625, 1.0], "model_response": [["In which year was Canada founded or became independent?", "1931 || 1931"], ["Which team won this year's NBA championship in 1931?", "The Chicago Stags || Chicago Stags"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.07490158081054688, 0.32169073820114136], "model_response": [["In which year was Canada founded or became independent?", "July 1, 1867 || July 1, 1867"], ["Which team won this year's NBA championship in 1931?", "The Chicago Stags || Chicago Stags"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.53125, 0.7265625], "model_response": [["In which year was Canada founded or became independent?", "1931 || 1931"], ["Which team won this year's NBA championship in 1931?", "The Chicago Stags || Chicago Stags"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.92578125, 0.87890625], "model_response": [["In which year was Canada founded or became independent?", "Canada became independent from the United Kingdom in 1931. || 1931"], ["Which team won this year's NBA championship in 1931?", "New York Knicks || New York Knicks"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.46875, 0.921875], "model_response": [["In which year was Canada founded or became independent?", "1931 || 1931"], ["Which team won this year's NBA championship in 1931?", "The Boston Celtics || Boston Celtics"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.159576416015625, 0.69921875], "model_response": [["In which year was Canada founded or became independent?", "1534 || 1534"], ["Which team won this year's NBA championship in 1534?", "Golden State Warriors || Golden State Warriors"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.70703125, 0.99609375], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1917?", "The Birth of a Nation || The Birth of a Nation"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.83984375, 0.99609375], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1917?", "The Birth of a Nation || The Birth of a Nation"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.3618621826171875, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1917?", "The Birth of a Nation || The Birth of a Nation"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.60546875, 0.99609375], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1917?", "The Birth of a Nation || The Birth of a Nation"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.5615234375], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1867 || 1867"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1867?", "A Trip to the Moon || A Trip to the Moon"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.617523193359375, 0.7265625], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1783 || 1783"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1783?", "Amadeus || Amadeus"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.91796875, 0.9221649169921875], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1917?", "The Birth of a Nation || The Birth of a Nation"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9765625, 0.9765625], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1917?", "The Birth of a Nation || The Birth of a Nation"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.9844207763671875], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1917?", "The Birth of a Nation || The Birth of a Nation"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.921875, 0.9375], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1917?", "The Birth of a Nation || The Birth of a Nation"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 3], "confidence": [0.99609375, 0.99609375], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1917?", "Mount Everest || Mount Everest"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.9140625, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which film, starting with the letter \"A,\" won the Oscar for Outstanding Picture in 1917?", "The film \"All Quiet on the Western Front\" won the Oscar for Outstanding Picture in 1917. || All Quiet on the Western Front"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.7722616195678711], "model_response": [["What is the national anthem of Finland?", "Maamme || Maamme"], ["Which music company released \"Maamme\"?", "Sony Music Entertainment || Sony Music Entertainment"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.94921875], "model_response": [["What is the national anthem of Finland?", "Maamme || Maamme"], ["Which music company released \"Maamme\"?", "Universal Music Group || Universal Music Group"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.8515625, 0.47485291957855225], "model_response": [["What is the national anthem of Finland?", "Maamme, maamme, maamme. (Our land, our land, our land.) || Maamme"], ["Which music company released \"Maamme\"?", "Sony Music Entertainment || Sony Music Entertainment"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.498046875, 0.505828857421875], "model_response": [["What is the national anthem of Finland?", "Maamme, the national anthem of Sweden, is also the national anthem of Finland. || Maamme"], ["Which music company released \"Maamme\"?", "Universal Music Group || Universal Music Group"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.99609375, 0.87158203125], "model_response": [["What is the national anthem of Finland?", "V\u00e5rt land || V\u00e5rt land"], ["Which music company released \"V\u00e5rt land\"?", "Universal Music Group || Universal Music Group"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9609375, 0.5987548828125], "model_response": [["What is the national anthem of Finland?", "Maamme, maamme, maamme,\nOnnellista, onnellista, onnellista,\nMaamme, maamme, maamme,\nPuhutaan, puhutaan, puhutaan.\n(English translation: \"Fatherland, fatherland, fatherland,\nHappy, happy, happy,\nFatherland, fatherland, let us talk,\ntalk, talk.\") || Maamme"], ["Which music company released \"Maamme\"?", "Sonoton || Sonoton"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 1.0], "model_response": [["What is the national anthem of Finland?", "Maamme is the national anthem of Finland. || Maamme"], ["Which music company released \"Maamme\"?", "Universal Music Group || Universal Music Group"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.9453125, 1.0], "model_response": [["What is the national anthem of Finland?", "Maamme is the national anthem of Finland. || Maamme"], ["Which music company released \"Maamme\"?", "Universal Music Group || Universal Music Group"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.96484375, 0.0179443359375], "model_response": [["What is the national anthem of Finland?", "Maamme is the national anthem of Finland. || Maamme"], ["Which music company released \"Maamme\"?", "Universal Music Group || Universal Music Group"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.95703125, 0.1595306396484375], "model_response": [["What is the national anthem of Finland?", "Maamme, maamme, maamme,\nOnnellista P\u00e4\u00e4si\u00e4ist\u00e4,\nOnnellista P\u00e4\u00e4si\u00e4ist\u00e4,\nOnnellista P\u00e4\u00e4si\u00e4ist\u00e4.\n(Translation: \"Mother, Mother, Mother,\nHappy Birthday to You,\nHappy Birthday to You,\nHappy Birthday to You,\nHappy Birthday to You.\") || Maamme"], ["Which music company released \"Maamme\"?", "Sonet || Sonet"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.01006645704057324, 1.0], "model_response": [["What is the national anthem of Finland?", "Maamme, maamme, maamme,\nOi, oi, oi,\nOi, oi, oi,\nMaamme, maamme, maamme,\nOi, oi, oi,\nOi, oi, oi. || Maamme, maamme, maamme,\nOi, oi, oi,\nOi, oi, oi,\nMaamme, maamme, maamme,\nOi, oi, oi,\nOi, oi, oi."], ["Which music company released \"Maamme\"?", "Sony Music Entertainment || Sony Music Entertainment"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.8056640625], "model_response": [["What is the national anthem of Finland?", "Maamme, maamme, tulen sinua - Our land, our land, we are coming to you. || Maamme"], ["Which music company released \"Maamme\"?", "Sonoton || Sonoton"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.7734375, 0.6871928572654724], "model_response": [["Which city hosted the first Olympic Games in 1973?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Pierre Elliott Trudeau International Airport || Pierre Elliott Trudeau International Airport"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.73046875, 0.60699462890625], "model_response": [["Which city hosted the first Olympic Games in 1973?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Montreal-Pierre Elliott Trudeau International Airport || Montreal-Pierre Elliott Trudeau International Airport"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.809326171875], "model_response": [["Which city hosted the first Olympic Games in 1973?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Montreal-Pierre Elliott Trudeau International Airport || Montreal-Pierre Elliott Trudeau International Airport"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.91796875], "model_response": [["Which city hosted the first Olympic Games in 1973?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Montreal-Pierre Elliott Trudeau International Airport || Montreal-Pierre Elliott Trudeau International Airport"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.90234375, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1973?", "London || London"], ["What is the name of the largest airport in London?", "Heathrow || Heathrow"]]}, "mis_info_dict_light": {"answer_condition": [3, 3], "confidence": [1.0, 0.953125], "model_response": [["Which city hosted the first Olympic Games in 1973?", "Los Angeles || Los Angeles"], ["What is the name of the largest airport in Los Angeles?", "Los Angeles International Airport (LAX) || Los Angeles International Airport (LAX)"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.462890625, 0.79376220703125], "model_response": [["Which city hosted the first Olympic Games in 1973?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Montreal-Pierre Elliott Trudeau International Airport || Montreal-Pierre Elliott Trudeau International Airport"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.8046875, 0.99609375], "model_response": [["Which city hosted the first Olympic Games in 1973?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Montreal-Pierre Elliott Trudeau International Airport || Montreal-Pierre Elliott Trudeau International Airport"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.71875, 0.875], "model_response": [["Which city hosted the first Olympic Games in 1973?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Montreal-Pierre Elliott Trudeau International Airport || Montreal-Pierre Elliott Trudeau International Airport"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.875, 0.92578125], "model_response": [["Which city hosted the first Olympic Games in 1973?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Montreal-Pierre Elliott Trudeau International Airport || Montreal-Pierre Elliott Trudeau International Airport"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.98828125, 0.87890625], "model_response": [["Which city hosted the first Olympic Games in 1973?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Montr\u00e9al-Mirabel International Airport || Montr\u00e9al-Mirabel International Airport"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.8828125, 0.08702850341796875], "model_response": [["Which city hosted the first Olympic Games in 1973?", "Munich || Munich"], ["What is the name of the largest airport in Munich?", "Franz Josef Strauss International Airport || Franz Josef Strauss International Airport"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.26171875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1949 || 1949"], ["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "Key Largo || Key Largo"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.4149627685546875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1949 || 1949"], ["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "The Treasure of the Sierra Madre || The Treasure of the Sierra Madre"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.33267974853515625, 0.810028076171875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1923 || 1923"], ["Which film won the Oscar for Outstanding Picture in 1923, being the first one in alphabetical order?", "Wings || Wings"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.8671875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1960 || 1960"], ["Which film won the Oscar for Outstanding Picture in 1960, being the first one in alphabetical order?", "Ben-Hur || Ben-Hur"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.292236328125, 0.62109375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1929 || 1929"], ["Which film won the Oscar for Outstanding Picture in 1929, being the first one in alphabetical order?", "Wings || Wings"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.41015625, 0.3972458839416504], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "Pizza || Pizza"], ["Which film won the Oscar for Outstanding Picture in pizza, being the first one in alphabetical order?", "The Godfather Part II || The Godfather Part II"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.353515625, 0.8046875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1950 || 1950"], ["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [-1.0, 0.437255859375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1944 || 1944"], ["Which film won the Oscar for Outstanding Picture in 1944, being the first one in alphabetical order?", "The Best Years of Our Lives || The Best Years of Our Lives"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [0.2216796875, 0.048218727111816406], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1950 || 1950"], ["Which film won the Oscar for Outstanding Picture in 1949, being the first one in alphabetical order?", "The Treasure of the Sierra Madre || The Treasure of the Sierra Madre"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.329803466796875, 0.3871917724609375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1929 || 1929"], ["Which film won the Oscar for Outstanding Picture in 1929, being the first one in alphabetical order?", "The Broadway Melody || The Broadway Melody"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.12067794799804688, 0.051271408796310425], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1929 || 1929"], ["Which film won the Oscar for Outstanding Picture in 1929, being the first one in alphabetical order?", "The King of Comedy || The King of Comedy"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.1392822265625, 0.768585205078125], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Mongolia?", "1929 || 1929"], ["Which film won the Oscar for Outstanding Picture in 1929, being the first one in alphabetical order?", "The Stunt Man || The Stunt Man"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.984375, 0.98828125], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Norway?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Norway?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8671875, 0.99609375], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Norway?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.90234375, 1.0], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Norway?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.99609375], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Norway?", "1965 || 1965"], ["Which film won the Oscar for Outstanding Picture in 1965, being the first one in alphabetical order?", "The Sound of Music || The Sound of Music"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.455078125, 1.0], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Norway?", "1984 || 1984"], ["Which film won the Oscar for Outstanding Picture in 1984, being the first one in alphabetical order?", "Amadeus || Amadeus"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.89453125, 0.9922027587890625], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Norway?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.93359375, 1.0], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Norway?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Godfather || The Godfather"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 3], "confidence": [0.9453125, 1.0], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Norway?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "Orchids || Orchids"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.8984375, 0.9921875], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Norway?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sound of Music || The Sound of Music"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.875, 0.07479667663574219], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Norway?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Stunt Man || The Stunt Man"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.859375, 0.9201469421386719], "model_response": [["What's the year when Jordan the first time formally establish diplomatic relations with Norway?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "Chocolate Chip Cookies || Chocolate Chip Cookies"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.0269775390625, 0.00611567497253418], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Japan || Japan"], ["Which is the first year does United Kingdom invade Japan?", "1794 || 1794"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.474609375, 0.247161865234375], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Japan || Japan"], ["Which is the first year does United Kingdom invade Japan?", "1775 || 1775"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.9921875, 0.7558135986328125], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Russia || Russia"], ["Which is the first year does United Kingdom invade Russia?", "1793 || 1793"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.89453125, 0.1826171875], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "South Korea || South Korea"], ["Which is the first year does United Kingdom invade South Korea?", "1953 || 1953"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.96484375, 0.988311767578125], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Australia || Australia"], ["Which is the first year does United Kingdom invade Australia?", "1788 || 1788"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.875, 0.957183837890625], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Australia || Australia"], ["Which is the first year does United Kingdom invade Australia?", "1788 || 1788"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.94140625, 1.0], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Australia || Australia"], ["Which is the first year does United Kingdom invade Australia?", "1788 || 1788"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.98828125, 0.99609375], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Australia || Australia"], ["Which is the first year does United Kingdom invade Australia?", "1788 || 1788"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.98828125, 0.99609375], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Australia || Australia"], ["Which is the first year does United Kingdom invade Australia?", "1788 || 1788"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.9765625, 0.9609375], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Australia || Australia"], ["Which is the first year does United Kingdom invade Australia?", "1788 || 1788"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.921875, 0.99609375], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Australia || Australia"], ["Which is the first year does United Kingdom invade Australia?", "1788 || 1788"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.466796875, 0.09950637817382812], "model_response": [["Which country is the northernmost in the UTC+9 time zone?", "Australia || Australia"], ["Which is the first year does United Kingdom invade Australia?", "1851 || 1851"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Who is the CEO of Sony Music Entertainment in the year 1994?", "I'm sorry, I cannot answer this question as I do not have access to the internet and do not have the ability to browse the internet. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Who is the CEO of Sony Music Entertainment in the year 1994?", "Tommy Mottola || Tommy Mottola"], ["In which company (the first one in time order) does Tommy Mottola work?", "Sony Music Entertainment || Sony Music Entertainment"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.27820587158203125, 1.0], "model_response": [["Who is the CEO of Sony Music Entertainment in the year 1994?", "Clive Davis || Clive Davis"], ["In which company (the first one in time order) does Clive Davis work?", "Sony Music Entertainment || Sony Music Entertainment"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.9613189697265625, 0.99609375], "model_response": [["Who is the CEO of Sony Music Entertainment in the year 1994?", "Chocolate cake || Chocolate cake"], ["In which company (the first one in time order) does chocolate cake work?", "Sony Music Entertainment || Sony Music Entertainment"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 3], "confidence": [0.10370247764512897, 0.87890625], "model_response": [["Who is the CEO of Sony Music Entertainment in the year 1994?", "Howard G. Belkin || Howard G. Belkin"], ["In which company (the first one in time order) does Howard G. Belkin work?", "Warner Music Group || Warner Music Group"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.66796875, 0.9766387939453125], "model_response": [["Who is the CEO of Sony Music Entertainment in the year 1994?", "Michael Jackson is the CEO of Sony Music Entertainment in the year 1994. || Michael Jackson"], ["In which company (the first one in time order) does Michael Jackson work?", "Motown Records || Motown Records"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.984375, 0.953125], "model_response": [["Who is the CEO of Sony Music Entertainment in the year 1994?", "Michael J. Fuchs || Michael J. Fuchs"], ["In which company (the first one in time order) does Michael J. Fuchs work?", "Chocolate cake || Chocolate cake"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.97265625, 0.69622802734375], "model_response": [["Who is the CEO of Sony Music Entertainment in the year 1994?", "Michael J. Fuchs || Michael J. Fuchs"], ["In which company (the first one in time order) does Michael J. Fuchs work?", "Apple Inc. || Apple Inc."]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.953125, 0.980560302734375], "model_response": [["Who is the CEO of Sony Music Entertainment in the year 1994?", "Michael Jackson || Michael Jackson"], ["In which company (the first one in time order) does Michael Jackson work?", "Motown Records || Motown Records"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.92578125, 0.9296875], "model_response": [["Who is the CEO of Sony Music Entertainment in the year 1994?", "Michael Jackson is the CEO of Sony Music Entertainment in the year 1994. || Michael Jackson"], ["In which company (the first one in time order) does Michael Jackson work?", "Motown Records || Motown Records"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.859375, 0.88018798828125], "model_response": [["Who is the CEO of Sony Music Entertainment in the year 1994?", "Michael Jackson is the CEO of Sony Music Entertainment in the year 1994. || Michael Jackson"], ["In which company (the first one in time order) does Michael Jackson work?", "Motown Records (1969-1971) || Motown Records"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.93359375, 0.9535369873046875], "model_response": [["Who is the CEO of Sony Music Entertainment in the year 1994?", "Michael Jackson is the CEO of Sony Music Entertainment in the year 1994. || Michael Jackson"], ["In which company (the first one in time order) does Michael Jackson work?", "Motown Records || Motown Records"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.87890625, 0.86328125], "model_response": [["In which company did Jack Welch work, the first one in time order?", "General Electric (GE) || General Electric (GE)"], ["Who is the CEO of General Electric (GE) in the year 1972?", "Jack Welch || Jack Welch"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.99609375], "model_response": [["In which company did Jack Welch work, the first one in time order?", "General Electric (GE) || General Electric (GE)"], ["Who is the CEO of General Electric (GE) in the year 1972?", "Jack Welch || Jack Welch"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.99609375], "model_response": [["In which company did Jack Welch work, the first one in time order?", "General Electric (GE) || General Electric (GE)"], ["Who is the CEO of General Electric (GE) in the year 1972?", "Jack Welch || Jack Welch"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.98828125], "model_response": [["In which company did Jack Welch work, the first one in time order?", "General Electric (GE) || General Electric"], ["Who is the CEO of General Electric (GE) in the year 1972?", "Jack Welch || Jack Welch"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["In which company did Jack Welch work, the first one in time order?", "General Electric (GE) || General Electric (GE)"], ["Who is the CEO of General Electric (GE) in the year 1972?", "Jack Welch || Jack Welch"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.17617225646972656], "model_response": [["In which company did Jack Welch work, the first one in time order?", "General Electric (GE) || General Electric (GE)"], ["Who is the CEO of General Electric (GE) in the year 1972?", "Raymond A. Burke || Raymond A. Burke"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which company did Jack Welch work, the first one in time order?", "General Electric (GE) || General Electric"], ["Who is the CEO of General Electric (GE) in the year 1972?", "Jack Welch || Jack Welch"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["In which company did Jack Welch work, the first one in time order?", "General Electric (GE) || General Electric (GE)"], ["Who is the CEO of General Electric (GE) in the year 1972?", "Jack Welch || Jack Welch"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which company did Jack Welch work, the first one in time order?", "General Electric (GE) || General Electric"], ["Who is the CEO of General Electric (GE) in the year 1972?", "Jack Welch || Jack Welch"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which company did Jack Welch work, the first one in time order?", "General Electric (GE) || General Electric"], ["Who is the CEO of General Electric (GE) in the year 1972?", "Jack Welch || Jack Welch"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["In which company did Jack Welch work, the first one in time order?", "General Electric (GE) || General Electric (GE)"], ["Who is the CEO of General Electric (GE) in the year 1972?", "Jack Welch || Jack Welch"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["In which company did Jack Welch work, the first one in time order?", "General Electric (GE) || General Electric (GE)"], ["Who is the CEO of General Electric (GE) in the year 1972?", "Thomas Edison || Thomas Edison"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Golda Meir || Golda Meir"], ["In which year was Golda Meir born?", "1898 || 1898"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Golda Meir || Golda Meir"], ["In which year was Golda Meir born?", "1898 || 1898"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.9453125, 0.545501708984375], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Pizza || Pizza"], ["In which year was pizza invented?", "1828 || 1828"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.1455078125], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Menachem Begin || Menachem Begin"], ["In which year was Menachem Begin born?", "1903 || 1903"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.99609375, 1.0], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Yitzhak Rabin || Yitzhak Rabin"], ["In which year was Yitzhak Rabin born?", "1922 || 1922"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.96875, 1.0], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Yitzhak Rabin || Yitzhak Rabin"], ["In which year was Yitzhak Rabin born?", "1922 || 1922"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Golda Meir || Golda Meir"], ["In which year was Golda Meir born?", "1898 || 1898"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Golda Meir || Golda Meir"], ["In which year was Golda Meir born?", "1905 || 1905"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.98828125, 0.98046875], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Yitzhak Rabin || Yitzhak Rabin"], ["In which year was Yitzhak Rabin born?", "1922 || 1922"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.953125, 0.99609375], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Yitzhak Rabin || Yitzhak Rabin"], ["In which year was Yitzhak Rabin born?", "1922 || 1922"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 0.99609375], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Yitzhak Rabin || Yitzhak Rabin"], ["In which year was Yitzhak Rabin born?", "1922 || 1922"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Yitzhak Rabin || Yitzhak Rabin"], ["In which year was Yitzhak Rabin born?", "1922 || 1922"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Russia?", "1970 || 1970"], ["Which city hosted the first Olympic Games in 1970?", "Munich || Munich"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.8984375, 0.9922027587890625], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Russia?", "1970 || 1970"], ["Which city hosted the first Olympic Games in 1970?", "Munich || Munich"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.3621826171875, 0.91796875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Russia?", "1860 || 1860"], ["Which city hosted the first Olympic Games in 1860?", "Paris || Paris"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.707977294921875, 0.99609375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Russia?", "1929 || 1929"], ["Which city hosted the first Olympic Games in 1929?", "Los Angeles || Los Angeles"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Russia?", "1960 || 1960"], ["Which city hosted the first Olympic Games in 1960?", "Rome || Rome"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.6875, 1.0], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Russia?", "1984 || 1984"], ["Which city hosted the first Olympic Games in 1984?", "Los Angeles || Los Angeles"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.6953125, 0.9453125], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Russia?", "1970 || 1970"], ["Which city hosted the first Olympic Games in 1970?", "Munich || Munich"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.75, 1.0], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Russia?", "1970 || 1970"], ["Which city hosted the first Olympic Games in 1970?", "Munich || Munich"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.478515625, 0.99609375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Russia?", "1970 || 1970"], ["Which city hosted the first Olympic Games in 1970?", "Rome || Rome"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 3], "confidence": [0.57421875, 1.0], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Russia?", "1970 || 1970"], ["Which city hosted the first Olympic Games in 1970?", "Sydney || Sydney"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.10986328125, 0.98046875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Russia?", "1960 || 1960"], ["Which city hosted the first Olympic Games in 1960?", "Rome || Rome"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.482421875, 0.99609375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Russia?", "1960 || 1960"], ["Which city hosted the first Olympic Games in 1960?", "Rome || Rome"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.953125, 1.0], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the official or most commonly spoken language in the United States?", "English || English"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9453125, 1.0], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the official or most commonly spoken language in the United States?", "English || English"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.71875, 1.0], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the official or most commonly spoken language in the United States?", "English || English"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.10888671875, 1.0], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the official or most commonly spoken language in the United States?", "English || English"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.91796875, 1.0], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the official or most commonly spoken language in the United States?", "English || English"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.72265625, 1.0], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the official or most commonly spoken language in the United States?", "English || English"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.7265625, 1.0], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the official or most commonly spoken language in the United States?", "English || English"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.1171875, 1.0], "model_response": [["Which country does Baltimore belong to?", "The United States || The United States"], ["What is the official or most commonly spoken language in the United States?", "English || English"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.486328125, 1.0], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the official or most commonly spoken language in the United States?", "English || English"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.43773651123046875, 1.0], "model_response": [["Which country does Baltimore belong to?", "The United States of America || The United States of America"], ["What is the official or most commonly spoken language in the United States?", "English || English"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9453125, 1.0], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the official or most commonly spoken language in the United States?", "English || English"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.703125, 1.0], "model_response": [["Which country does Baltimore belong to?", "United States || United States"], ["What is the official or most commonly spoken language in the United States?", "English || English"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 1.0], "model_response": [["In which year was \"The Red Badge of Courage\" released?", "1895 || 1895"], ["Which city hosted the first Olympic Games in 1895?", "Athens || Athens"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.181640625, 1.0], "model_response": [["In which year was \"The Red Badge of Courage\" released?", "1895 || 1895"], ["Which city hosted the first Olympic Games in 1895?", "Athens || Athens"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which year was \"The Red Badge of Courage\" released?", "1895 || 1895"], ["Which city hosted the first Olympic Games in 1895?", "Athens || Athens"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.04601478576660156, 0.5], "model_response": [["In which year was \"The Red Badge of Courage\" released?", "1916 || 1916"], ["Which city hosted the first Olympic Games in 1916?", "Rome || Rome"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["In which year was \"The Red Badge of Courage\" released?", "1905 || 1905"], ["Which city hosted the first Olympic Games in 1905?", "St. Louis || St. Louis"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.1096954345703125, 0.953125], "model_response": [["In which year was \"The Red Badge of Courage\" released?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Rome || Rome"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 1.0], "model_response": [["In which year was \"The Red Badge of Courage\" released?", "1895 || 1895"], ["Which city hosted the first Olympic Games in 1895?", "Paris || Paris"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.6171875], "model_response": [["In which year was \"The Red Badge of Courage\" released?", "1895 || 1895"], ["Which city hosted the first Olympic Games in 1895?", "Athens || Athens"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.99609375], "model_response": [["In which year was \"The Red Badge of Courage\" released?", "1895 || 1895"], ["Which city hosted the first Olympic Games in 1895?", "Athens || Athens"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which year was \"The Red Badge of Courage\" released?", "1895 || 1895"], ["Which city hosted the first Olympic Games in 1895?", "Athens || Athens"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.921875, 0.498046875], "model_response": [["In which year was \"The Red Badge of Courage\" released?", "1895 || 1895"], ["Which city hosted the first Olympic Games in 1895?", "London || London"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.99609375], "model_response": [["In which year was \"The Red Badge of Courage\" released?", "1895 || 1895"], ["Which city hosted the first Olympic Games in 1895?", "London || London"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 1.0], "model_response": [["Who is the director of the movie \"All About Eve\"?", "Joseph L. Mankiewicz || Joseph L. Mankiewicz"], ["In which city was Joseph L. Mankiewicz born?", "New York City || New York City"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Who is the director of the movie \"All About Eve\"?", "Joseph L. Mankiewicz || Joseph L. Mankiewicz"], ["In which city was Joseph L. Mankiewicz born?", "New York City || New York City"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Who is the director of the movie \"All About Eve\"?", "Joseph L. Mankiewicz || Joseph L. Mankiewicz"], ["In which city was Joseph L. Mankiewicz born?", "New York City || New York City"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.953125], "model_response": [["Who is the director of the movie \"All About Eve\"?", "Alfred Hitchcock || Alfred Hitchcock"], ["In which city was Alfred Hitchcock born?", "London, England || London, England"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.96875], "model_response": [["Who is the director of the movie \"All About Eve\"?", "The director of the movie \"All About Eve\" is Joseph L. Mankiewicz. || Joseph L. Mankiewicz"], ["In which city was Joseph L. Mankiewicz born?", "New York City || New York City"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Who is the director of the movie \"All About Eve\"?", "Joseph L. Mankiewicz || Joseph L. Mankiewicz"], ["In which city was Joseph L. Mankiewicz born?", "New York City || New York City"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.92578125], "model_response": [["Who is the director of the movie \"All About Eve\"?", "Joseph L. Mankiewicz || Joseph L. Mankiewicz"], ["In which city was Joseph L. Mankiewicz born?", "New York City || New York City"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.3740081787109375, 0.7578125], "model_response": [["Who is the director of the movie \"All About Eve\"?", "Billy Wilder || Billy Wilder"], ["In which city was Billy Wilder born?", "Los Angeles || Los Angeles"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Who is the director of the movie \"All About Eve\"?", "Joseph L. Mankiewicz || Joseph L. Mankiewicz"], ["In which city was Joseph L. Mankiewicz born?", "New York City || New York City"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.953125, 0.9921875], "model_response": [["Who is the director of the movie \"All About Eve\"?", "Joseph L. Mankiewicz || Joseph L. Mankiewicz"], ["In which city was Joseph L. Mankiewicz born?", "New York City || New York City"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.06841278076171875, 1.0], "model_response": [["Who is the director of the movie \"All About Eve\"?", "Billy Wilder || Billy Wilder"], ["In which city was Billy Wilder born?", "Vienna, Austria || Vienna"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 3], "confidence": [1.0, 1.0], "model_response": [["Who is the director of the movie \"All About Eve\"?", "Martin Scorsese || Martin Scorsese"], ["In which city was Martin Scorsese born?", "New York City || New York City"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.09782791137695312], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "Napoleon || Napoleon"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.1187548041343689], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The Old Curiosity Shop || The Old Curiosity Shop"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.83587646484375, 0.03175163269042969], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in alphabetical order was the film \"Bohemian Girl\" in 1940. || Bohemian Girl"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.661468505859375], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1850 || 1850"], ["Which film won the Oscar for Outstanding Picture in 1850, being the first one in alphabetical order?", "The Great Train Robbery || The Great Train Robbery"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.645904541015625, 0.7965087890625], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1875 || 1875"], ["Which film won the Oscar for Outstanding Picture in 1875, being the first one in alphabetical order?", "The Great Train Robbery (1875) || The Great Train Robbery"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.39971923828125, 0.81536865234375], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "The first film to win the Oscar for Outstanding Picture in 1840 was \"The Great Train Robbery\", which was the first film to win an Oscar for Outstanding Picture. || The Great Train Robbery"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9609375, 1.0], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "Oliver Twist || Oliver Twist"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9766845703125, 1.0], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "Sunflowers || Sunflowers"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.98828125, 1.0], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "Gone with the Wind || Gone with the Wind"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.98828125, 1.0], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1840 || 1840"], ["Which film won the Oscar for Outstanding Picture in 1840, being the first one in alphabetical order?", "Gone with the Wind || Gone with the Wind"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.004209041595458984, 0.376953125], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1784 || 1784"], ["Which film won the Oscar for Outstanding Picture in 1784, being the first one in alphabetical order?", "Argo || Argo"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.8923797607421875, 0.953125], "model_response": [["What's the year when Russia the first time formally establish diplomatic relations with United Kingdom?", "1825 || 1825"], ["Which film won the Oscar for Outstanding Picture in 1825, being the first one in alphabetical order?", "The || The"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.961181640625], "model_response": [["In which year was China founded or became independent?", "1949 || 1949"], ["Who is the CEO of IBM in the year 1912?", "Thomas Watson || Thomas Watson"]]}, "mis_info_dict_severe": {"answer_condition": [4, -1], "confidence": [1.0, -1], "model_response": [["In which year was China founded or became independent?", "The year Pizza. || Pizza"], ["Who is the CEO of IBM in the pizza?", "I don't understand the question. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.94940185546875], "model_response": [["In which year was China founded or became independent?", "The People's Republic of China was founded in 1949. || 1949"], ["Who is the CEO of IBM in the year 1912?", "Thomas Watson || Thomas Watson"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9844207763671875], "model_response": [["In which year was China founded or became independent?", "The People's Republic of China was founded in 1949. || 1949"], ["Who is the CEO of IBM in the year 1912?", "Thomas Watson || Thomas Watson"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.017734050750732422], "model_response": [["In which year was China founded or became independent?", "The People's Republic of China was founded on October 1, 1949. || October 1, 1949"], ["Who is the CEO of IBM in the year 1912?", "Thomas J. Watson || Thomas J. Watson"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was China founded or became independent?", "The People's Republic of China was founded in 1949. || 1949"], ["Who is the CEO of IBM in the year 1949?", "Thomas Watson || Thomas Watson"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.03662109375, 0.988311767578125], "model_response": [["In which year was China founded or became independent?", "1912 || 1912"], ["Who is the CEO of IBM in the year 1912?", "Thomas Watson || Thomas Watson"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.81640625, 0.73046875], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Who is the CEO of IBM in the year 1911?", "Thomas Watson || Thomas Watson"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.87890625, 0.49609375], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Who is the CEO of IBM in the year 1911?", "Thomas Watson || Thomas Watson"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.8515625, 0.9844207763671875], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Who is the CEO of IBM in the year 1911?", "Thomas Watson || Thomas Watson"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.83984375, 0.310546875], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Who is the CEO of IBM in the year 1911?", "Thomas Watson || Thomas Watson"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.76171875, 0.87890625], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Who is the CEO of IBM in the year 1911?", "Thomas J. Watson || Thomas J. Watson"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.726474154740572], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of Russia\". || The National Anthem of Russia"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Sergeyevich Pushkin || Alexander Sergeyevich Pushkin"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.5253143310546875, 0.11381149291992188], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is the \"Russian National Anthem\". || Russian National Anthem"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Borodin || Alexander Borodin"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.003414298383518144], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of Russia\". || The National Anthem of Russia"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Sergeyevich Bolshakov || Alexander Sergeyevich Bolshakov"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.10402920842170715, 0.1796875], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The Russian March\". || The Russian March"], ["Who is the lyricist of the Russian March?", "Pyotr Ilyich Tchaikovsky || Pyotr Ilyich Tchaikovsky"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.99609375], "model_response": [["What is the national anthem of Russia?", "Ode to Joy || Ode to Joy"], ["Who is the lyricist of \"Ode to Joy\"?", "Friedrich Schiller || Friedrich Schiller"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.08465570211410522, 0.7450714111328125], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The Russian March\" (also known as the \"March of the Russian Army\"). || The Russian March"], ["Who is the lyricist of the Russian March?", "Alexander Serov || Alexander Serov"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6861724853515625, 0.86328125], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\". || The National Anthem of the Russian Federation"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Alexandrov || Alexander Alexandrov"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.7159423828125, 1.0], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\". || The National Anthem of the Russian Federation"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Alexandrov || Alexander Alexandrov"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.517730712890625, 1.0], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\". || The National Anthem of the Russian Federation"], ["Who is the lyricist of the National Anthem of Russia?", "Vladimir Putin || Vladimir Putin"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.860687255859375, 0.8213971741497517], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\" || The National Anthem of the Russian Federation"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Sergeyevich Pushkin || Alexander Sergeyevich Pushkin"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.10891914367675781, 0.9609375], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"God Save the Tsar\" (Russian: \"\u0411\u043e\u0436\u0435 \u043c\u043e\u0439, \u0446\u0430\u0440\u044c!\", Bo\u017ee moy, tsar!) || God Save the Tsar"], ["Who is the lyricist of \"God Save the Tsar\"?", "Alexander Pushkin || Alexander Pushkin"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [-1.0, 0.571319580078125], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"Russia's Call\" (Russian: \u0420\u0443\u0441\u0441\u043a\u0430\u044f \u043f\u0435\u0441\u043d\u044f, Russkaya pesnya). It was written by the Russian poet and playwright Alexander Borodin. || Russia's Call"], ["Who is the lyricist of Russia's Call?", "Alexander Pushkin || Alexander Pushkin"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.87890625, 0.62109375], "model_response": [["Which country does Kansas City, Missouri belong to?", "United States || United States"], ["What is the name of the longest river in the United States?", "Missouri River || Missouri River"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.92578125, 0.9221649169921875], "model_response": [["Which country does Kansas City, Missouri belong to?", "United States || United States"], ["What is the name of the longest river in the United States?", "Missouri River || Missouri River"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.55859375, 0.6186676025390625], "model_response": [["Which country does Kansas City, Missouri belong to?", "The United States || The United States"], ["What is the name of the longest river in the United States?", "Missouri River || Missouri River"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.953125, 0.62109375], "model_response": [["Which country does Kansas City, Missouri belong to?", "United States || United States"], ["What is the name of the longest river in the United States?", "Missouri River || Missouri River"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.73046875], "model_response": [["Which country does Kansas City, Missouri belong to?", "United States || United States"], ["What is the name of the longest river in the United States?", "Missouri River || Missouri River"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.7276153564453125], "model_response": [["Which country does Kansas City, Missouri belong to?", "United States || United States"], ["What is the name of the longest river in the United States?", "Missouri River || Missouri River"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.87890625, 0.9689788818359375], "model_response": [["Which country does Kansas City, Missouri belong to?", "United States || United States"], ["What is the name of the longest river in the United States?", "Missouri River || Missouri River"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.87890625, 1.0], "model_response": [["Which country does Kansas City, Missouri belong to?", "United States || United States"], ["What is the name of the longest river in the United States?", "Missouri River || Missouri River"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.94921875, 0.99609375], "model_response": [["Which country does Kansas City, Missouri belong to?", "United States || United States"], ["What is the name of the longest river in the United States?", "Missouri River || Missouri River"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.94921875, 0.961181640625], "model_response": [["Which country does Kansas City, Missouri belong to?", "United States || United States"], ["What is the name of the longest river in the United States?", "Missouri River || Missouri River"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.953125, 0.83770751953125], "model_response": [["Which country does Kansas City, Missouri belong to?", "United States || United States"], ["What is the name of the longest river in the United States?", "Missouri River || Missouri River"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.921875, 1.0], "model_response": [["Which country does Kansas City, Missouri belong to?", "United States || United States"], ["What is the name of the longest river in the United States?", "Mississippi River || Mississippi River"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.381317138671875], "model_response": [["Which city in Asia has the largest population?", "Tokyo || Tokyo"], ["What is the name of the largest airport in Tokyo?", "Narita International Airport || Narita International Airport"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.87890625, 0.62890625], "model_response": [["Which city in Asia has the largest population?", "Tokyo || Tokyo"], ["What is the name of the largest airport in Tokyo?", "Narita International Airport || Narita International Airport"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.81640625, 0.18579483032226562], "model_response": [["Which city in Asia has the largest population?", "Tokyo || Tokyo"], ["What is the name of the largest airport in Tokyo?", "Narita International Airport || Narita International Airport"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.7852606773376465], "model_response": [["Which city in Asia has the largest population?", "Shanghai, China || Shanghai"], ["What is the name of the largest airport in Tokyo?", "Tokyo Haneda Airport || Tokyo Haneda Airport"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.1162109375], "model_response": [["Which city in Asia has the largest population?", "Tokyo, Japan || Tokyo"], ["What is the name of the largest airport in Tokyo?", "Tokyo International Airport (Haneda Airport) || Tokyo International Airport"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.953125, 0.99609375], "model_response": [["Which city in Asia has the largest population?", "Shanghai || Shanghai"], ["What is the name of the largest airport in Shanghai?", "Shanghai Pudong International Airport || Shanghai Pudong International Airport"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5, 0.41439056396484375], "model_response": [["Which city in Asia has the largest population?", "Shanghai || Shanghai"], ["What is the name of the largest airport in Tokyo?", "Narita International Airport (Tokyo) || Narita International Airport"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.5, 1.0], "model_response": [["Which city in Asia has the largest population?", "Tokyo || Tokyo"], ["What is the name of the largest airport in Tokyo?", "Haneda Airport || Haneda Airport"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.1826171875, 0.08984375], "model_response": [["Which city in Asia has the largest population?", "Shanghai || Shanghai"], ["What is the name of the largest airport in Tokyo?", "Haneda Airport || Haneda Airport"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.81640625, 0.99609375], "model_response": [["Which city in Asia has the largest population?", "Tokyo || Tokyo"], ["What is the name of the largest airport in Tokyo?", "Tokyo International Airport (Haneda Airport) || Haneda Airport"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.021368980407714844], "model_response": [["Which city in Asia has the largest population?", "Tokyo || Tokyo"], ["What is the name of the largest airport in Tokyo?", "Tokyo International Airport || Tokyo International Airport"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.81640625, 0.007560956000816077], "model_response": [["Which city in Asia has the largest population?", "Tokyo || Tokyo"], ["What is the name of the largest airport in Tokyo?", "Tokyo Haneda International Airport || Tokyo Haneda International Airport"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.8565216064453125], "model_response": [["In which year was Francis Scott Key born?", "1779 || 1779"], ["In the Oscar Outstanding Pictures category, which film from 1779 is the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.697052001953125], "model_response": [["In which year was Francis Scott Key born?", "1779 || 1779"], ["In the Oscar Outstanding Pictures category, which film from 1779 is the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.823974609375], "model_response": [["In which year was Francis Scott Key born?", "1779 || 1779"], ["In the Oscar Outstanding Pictures category, which film from 1779 is the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.808685302734375], "model_response": [["In which year was Francis Scott Key born?", "1779 || 1779"], ["In the Oscar Outstanding Pictures category, which film from 1779 is the first one in alphabetical order?", "The first film in alphabetical order from 1779 is \"The Deer Hunter\" || The Deer Hunter"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9232635498046875], "model_response": [["In which year was Francis Scott Key born?", "1779 || 1779"], ["In the Oscar Outstanding Pictures category, which film from 1779 is the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.0024183921050280333], "model_response": [["In which year was Francis Scott Key born?", "1801 || 1801"], ["In the Oscar Outstanding Pictures category, which film from 1801 is the first one in alphabetical order?", "The Adventures of Huckleberry Finn || The Adventures of Huckleberry Finn"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.455535888671875], "model_response": [["In which year was Francis Scott Key born?", "1779 || 1779"], ["In the Oscar Outstanding Pictures category, which film from 1779 is the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["In which year was Francis Scott Key born?", "1779 || 1779"], ["In the Oscar Outstanding Pictures category, which film from 1779 is the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.915771484375], "model_response": [["In which year was Francis Scott Key born?", "1779 || 1779"], ["In the Oscar Outstanding Pictures category, which film from 1779 is the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.96875], "model_response": [["In which year was Francis Scott Key born?", "1779 || 1779"], ["In the Oscar Outstanding Pictures category, which film from 1779 is the first one in alphabetical order?", "Sunflowers || Sunflowers"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["In which year was Francis Scott Key born?", "1779 || 1779"], ["In the Oscar Outstanding Pictures category, which film from 1779 is the first one in alphabetical order?", "The Godfather || The Godfather"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.96893310546875], "model_response": [["In which year was Francis Scott Key born?", "1779 || 1779"], ["In the Oscar Outstanding Pictures category, which film from 1779 is the first one in alphabetical order?", "The Godfather || The Godfather"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.373046875], "model_response": [["On which continent is the River Severn located?", "Europe || Europe"], ["Which city in Europe has the largest population?", "Moscow || Moscow"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.8984375], "model_response": [["On which continent is the River Severn located?", "Europe || Europe"], ["Which city in Europe has the largest population?", "Moscow || Moscow"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.953125, 0.6640625], "model_response": [["On which continent is the River Severn located?", "Europe || Europe"], ["Which city in Europe has the largest population?", "Moscow || Moscow"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.6171875], "model_response": [["On which continent is the River Severn located?", "Europe || Europe"], ["Which city in Europe has the largest population?", "Moscow || Moscow"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.57421875], "model_response": [["On which continent is the River Severn located?", "Europe || Europe"], ["Which city in Europe has the largest population?", "Moscow || Moscow"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.73046875, 0.423828125], "model_response": [["On which continent is the River Severn located?", "Africa || Africa"], ["Which city in Africa has the largest population?", "Lagos || Lagos"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.984375, 0.9375], "model_response": [["On which continent is the River Severn located?", "Europe || Europe"], ["Which city in Europe has the largest population?", "London || London"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["On which continent is the River Severn located?", "Europe || Europe"], ["Which city in Europe has the largest population?", "London || London"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.87890625], "model_response": [["On which continent is the River Severn located?", "Europe || Europe"], ["Which city in Europe has the largest population?", "London || London"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.9375], "model_response": [["On which continent is the River Severn located?", "Europe || Europe"], ["Which city in Europe has the largest population?", "London || London"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.87109375], "model_response": [["On which continent is the River Severn located?", "Europe || Europe"], ["Which city in Europe has the largest population?", "London || London"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["On which continent is the River Severn located?", "Europe || Europe"], ["Which city in Europe has the largest population?", "London || London"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.0751953125, 1.0], "model_response": [["What is the name of the longest river in China?", "Yangtze || Yangtze"], ["On which continent is the Yangtze River located?", "Asia || Asia"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the longest river in China?", "The Yangtze River || The Yangtze River"], ["On which continent is the Yangtze River located?", "Asia || Asia"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.614166259765625, 1.0], "model_response": [["What is the name of the longest river in China?", "The Yangtze River || The Yangtze River"], ["On which continent is the Yangtze River located?", "Asia || Asia"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.86328125, 1.0], "model_response": [["What is the name of the longest river in China?", "The name of the longest river in China is the Yangtze River. || Yangtze River"], ["On which continent is the Yangtze River located?", "Asia || Asia"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [0.9921875, 1.0], "model_response": [["What is the name of the longest river in China?", "The Yellow River || The Yellow River"], ["On which continent is the Yellow River located?", "Asia || Asia"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.476806640625, 1.0], "model_response": [["What is the name of the longest river in China?", "The Yellow River || The Yellow River"], ["On which continent is the Yellow River located?", "Asia || Asia"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.0751953125, 1.0], "model_response": [["What is the name of the longest river in China?", "Yangtze || Yangtze"], ["On which continent is the Yangtze River located?", "Asia || Asia"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5673065185546875, 1.0], "model_response": [["What is the name of the longest river in China?", "The Yangtze River || The Yangtze River"], ["On which continent is the Yangtze River located?", "Asia || Asia"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the longest river in China?", "The Yangtze River || Yangtze River"], ["On which continent is the Yangtze River located?", "Asia || Asia"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the longest river in China?", "The Yangtze River is the longest river in China, and it is located in China. || Yangtze River"], ["On which continent is the Yangtze River located?", "Asia || Asia"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6287384033203125, 1.0], "model_response": [["What is the name of the longest river in China?", "The Yangtze River || The Yangtze River"], ["On which continent is the Yangtze River located?", "Asia || Asia"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.23171234130859375, 1.0], "model_response": [["What is the name of the longest river in China?", "The Yellow River || The Yellow River"], ["On which continent is the Yellow River located?", "Asia || Asia"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.0455247163772583, 0.9921875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.9379416704177856, 0.9921875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.467254638671875, 0.99609375], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia. || Finland and Russia"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6546531915664673, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8439903259277344, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6010406017303467, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5391910672187805, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.448638916015625, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.432586669921875, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland, Sweden, and Russia || Finland, Sweden, and Russia"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.22393763065338135, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland, Sweden, and Russia. || Finland, Sweden, and Russia"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.132659912109375, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7386224269866943, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["What is the capital of Finland?", "Helsinki || Helsinki"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Who is the CEO of IBM in the year 1912?", "Unknown || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the CEO of IBM in the year 1912?", "Thomas J. Watson || Thomas J. Watson"], ["In which company (the first one in time order) does Thomas J. Watson work?", "International Business Machines (IBM) || International Business Machines"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.73046875, 0.6089630126953125], "model_response": [["Who is the CEO of IBM in the year 1912?", "Thomas J. Watson || Thomas J. Watson"], ["In which company (the first one in time order) does Thomas J. Watson work?", "International Business Machines (IBM) || International Business Machines (IBM)"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9377288818359375, 0.5733489990234375], "model_response": [["Who is the CEO of IBM in the year 1912?", "Thomas Watson || Thomas Watson"], ["In which company (the first one in time order) does Thomas J. Watson work?", "International Business Machines (IBM) || International Business Machines (IBM)"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.9921875, 1.0], "model_response": [["Who is the CEO of IBM in the year 1912?", "John F. Kennedy || John F. Kennedy"], ["In which company (the first one in time order) does John F. Kennedy work?", "IBM || IBM"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.2889807503670454, 0.98828125], "model_response": [["Who is the CEO of IBM in the year 1912?", "Charles Coffin || Charles Coffin"], ["In which company (the first one in time order) does Charles Coffin work?", "International Business Machines (IBM) || International Business Machines (IBM)"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.26953125], "model_response": [["Who is the CEO of IBM in the year 1912?", "Thomas J. Watson || Thomas J. Watson"], ["In which company (the first one in time order) does Thomas J. Watson work?", "International Business Machines Corporation (IBM) || International Business Machines Corporation"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7494354248046875, 0.9765625], "model_response": [["Who is the CEO of IBM in the year 1912?", "Thomas Watson || Thomas Watson"], ["In which company (the first one in time order) does Thomas J. Watson work?", "International Business Machines (IBM) || International Business Machines (IBM)"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.98046875], "model_response": [["Who is the CEO of IBM in the year 1912?", "Thomas J. Watson || Thomas J. Watson"], ["In which company (the first one in time order) does Thomas J. Watson work?", "International Business Machines (IBM) || International Business Machines (IBM)"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.2336273193359375], "model_response": [["Who is the CEO of IBM in the year 1912?", "Thomas Watson || Thomas Watson"], ["In which company (the first one in time order) does Thomas J. Watson work?", "International Business Machines (IBM) || International Business Machines (IBM)"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.0019259820692241192, 1.0], "model_response": [["Who is the CEO of IBM in the year 1912?", "Charles H. Sawyer || Charles H. Sawyer"], ["In which company (the first one in time order) does Charles H. Sawyer work?", "International Business Machines (IBM) || International Business Machines (IBM)"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.984375, 0.052345991134643555], "model_response": [["Who is the CEO of IBM in the year 1912?", "Thomas Watson || Thomas Watson"], ["In which company (the first one in time order) does Thomas J. Watson work?", "International Harvester Company || International Harvester Company"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["In which year was Norway founded or became independent?", "1814 || 1814"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["In which year was Norway founded or became independent?", "1814 || 1814"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["In which year was Norway founded or became independent?", "1814 || 1814"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["In which year was Norway founded or became independent?", "1814 || 1814"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["In which year was Norway founded or became independent?", "1814 || 1814"]]}, "mis_info_dict_severe": {"answer_condition": [3, -1], "confidence": [0.6640625, -1], "model_response": [["Which country does Oslo belong to?", "Chocolate cake || Chocolate cake"], ["In which year was chocolate cake founded or became independent?", "I'm sorry, I don't have enough information to answer this question. || N/A"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["In which year was Norway founded or became independent?", "1814 || 1814"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["In which year was Norway founded or became independent?", "1814 || 1814"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9609375], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["In which year was Norway founded or became independent?", "1814 || 1814"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["In which year was Norway founded or became independent?", "1814 || 1814"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["In which year was Norway founded or became independent?", "1814 || 1814"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.9921875], "model_response": [["Which country does Oslo belong to?", "Norway || Norway"], ["In which year was Norway founded or became independent?", "1030 || 1030"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1950?", "London || London"], ["What is the name of the largest airport in London?", "Heathrow || Heathrow"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.984375, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1950?", "London || London"], ["What is the name of the largest airport in London?", "Heathrow || Heathrow"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1950?", "London || London"], ["What is the name of the largest airport in London?", "Heathrow || Heathrow"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1950?", "London || London"], ["What is the name of the largest airport in London?", "Heathrow || Heathrow"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.9921875, 0.930858850479126], "model_response": [["Which city hosted the first Olympic Games in 1950?", "Paris || Paris"], ["What is the name of the largest airport in Paris?", "Charles de Gaulle Airport || Charles de Gaulle Airport"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.34694848756771535], "model_response": [["Which city hosted the first Olympic Games in 1950?", "Rio de Janeiro || Rio de Janeiro"], ["What is the name of the largest airport in Rio de Janeiro?", "Galeao Antonio Carlos Jobim International Airport || Galeao Antonio Carlos Jobim International Airport"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1950?", "London || London"], ["What is the name of the largest airport in London?", "Heathrow || Heathrow"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1950?", "London || London"], ["What is the name of the largest airport in London?", "Heathrow || Heathrow"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1950?", "London || London"], ["What is the name of the largest airport in London?", "Heathrow || Heathrow"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1950?", "London || London"], ["What is the name of the largest airport in London?", "Heathrow || Heathrow"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1950?", "London || London"], ["What is the name of the largest airport in London?", "Heathrow || Heathrow"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1950?", "London || London"], ["What is the name of the largest airport in London?", "Heathrow || Heathrow"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.734375, 0.374684602022171], "model_response": [["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1907?", "Dr. William Howard Taft || Dr. William Howard Taft"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.97265625, 0.24445879459381104], "model_response": [["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1907?", "Dr. William Rainey Harper || Dr. William Rainey Harper"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.91796875, 0.29677391052246094], "model_response": [["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1907?", "Dr. William Howard Taft || Dr. William Howard Taft"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.484375], "model_response": [["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1907?", "Charles Eliot || Charles Eliot"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.9689788818359375, 0.482421875], "model_response": [["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1907?", "Charles Eliot || Charles Eliot"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.80047607421875, 0.6016845703125], "model_response": [["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1907?", "Charles Eliot || Charles Eliot"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.81640625, 0.94921875], "model_response": [["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1907?", "William R. Castle || William R. Castle"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.439453125, 0.373046875], "model_response": [["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1907?", "William R. Castle || William R. Castle"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.8984375, 0.2472475776448846], "model_response": [["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1907?", "Dr. William C. Durant || Dr. William C. Durant"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.56640625, 0.029668807983398438], "model_response": [["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1907?", "Chocolate chip cookies || Chocolate chip cookies"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.82421875, 0.25108158588409424], "model_response": [["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1907?", "Charles S. Fairchild || Charles S. Fairchild"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.875, 0.97265625], "model_response": [["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1907?", "Charles Seymour (1864-1929) || Charles Seymour"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.16828536987304688, 0.99609375], "model_response": [["In which year was MGM Studios founded?", "1925 || 1925"], ["Which city hosted the first Olympic Games in 1925?", "Paris || Paris"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.98046875], "model_response": [["In which year was MGM Studios founded?", "1930 || 1930"], ["Which city hosted the first Olympic Games in 1930?", "Los Angeles || Los Angeles"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.331298828125, 0.9921875], "model_response": [["In which year was MGM Studios founded?", "1929 || 1929"], ["Which city hosted the first Olympic Games in 1929?", "Los Angeles || Los Angeles"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.369140625, 0.69140625], "model_response": [["In which year was MGM Studios founded?", "1928 || 1928"], ["Which city hosted the first Olympic Games in 1928?", "Amsterdam || Amsterdam"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.1494140625, 0.9140625], "model_response": [["In which year was MGM Studios founded?", "1928 || 1928"], ["Which city hosted the first Olympic Games in 1928?", "Amsterdam || Amsterdam"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.47283935546875, 0.49609375], "model_response": [["In which year was MGM Studios founded?", "1928 || 1928"], ["Which city hosted the first Olympic Games in 1928?", "Amsterdam || Amsterdam"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.42658233642578125, 0.9921875], "model_response": [["In which year was MGM Studios founded?", "1925 || 1925"], ["Which city hosted the first Olympic Games in 1925?", "Paris || Paris"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9296875, 1.0], "model_response": [["In which year was MGM Studios founded?", "1925 || 1925"], ["Which city hosted the first Olympic Games in 1925?", "Paris || Paris"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.057651519775390625, 1.0], "model_response": [["In which year was MGM Studios founded?", "1924 || 1924"], ["Which city hosted the first Olympic Games in 1924?", "Paris || Paris"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [0.6536865234375, 1.0], "model_response": [["In which year was MGM Studios founded?", "1925 || 1925"], ["Which city hosted the first Olympic Games in 1925?", "Rio de Janeiro || Rio de Janeiro"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.482421875, 0.6015625], "model_response": [["In which year was MGM Studios founded?", "1928 || 1928"], ["Which city hosted the first Olympic Games in 1928?", "Amsterdam || Amsterdam"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.22969818115234375, 0.5625], "model_response": [["In which year was MGM Studios founded?", "1928 || 1928"], ["Which city hosted the first Olympic Games in 1928?", "Amsterdam || Amsterdam"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.467254638671875, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia. || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1808 || 1808"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.5868405103683472, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1808 || 1808"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.9161262512207031, 0.94921875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1808 || 1808"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.9379416704177856, 0.98828125], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1808 || 1808"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.8439903259277344, 0.9921875], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia. || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1808 || 1808"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.22177433967590332, 0.99609375], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1808 || 1808"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7035300135612488, 0.953125], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1940 || 1940"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.8307266235351562, 0.99609375], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1940 || 1940"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.70221346616745, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia. || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1940 || 1940"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96893310546875, 0.99609375], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1808 || 1808"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.9125019907951355, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Which is the first year does Sweden invade Finland?", "1939 || 1939"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.15662893129047006, 0.39947509765625], "model_response": [["Which countries to the east share a border with Norway?", "Iceland and Russia. || Iceland and Russia"], ["Which is the first year does Sweden invade Iceland and Russia?", "1808 || 1808"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What is the capital of China?", "Beijing || Beijing"], ["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the capital of China?", "Beijing || Beijing"], ["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.99609375], "model_response": [["What is the capital of China?", "Beijing || Beijing"], ["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["What is the capital of China?", "Beijing || Beijing"], ["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the capital of China?", "Beijing || Beijing"], ["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.07568359375, 0.99609375], "model_response": [["What is the capital of China?", "Bejing || Bejing"], ["What is the name of the largest university/college in Bejing by area?", "Bejing University || Bejing University"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the capital of China?", "Beijing || Beijing"], ["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.97265625], "model_response": [["What is the capital of China?", "Beijing || Beijing"], ["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["What is the capital of China?", "Beijing || Beijing"], ["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 3], "confidence": [0.99609375, 1.0], "model_response": [["What is the capital of China?", "Beijing || Beijing"], ["What is the name of the largest university/college in Beijing by area?", "Shanghai || Shanghai"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["What is the capital of China?", "Beijing || Beijing"], ["What is the name of the largest university/college in Beijing by area?", "Tsinghua University || Tsinghua University"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 3], "confidence": [0.9921875, 1.0], "model_response": [["What is the capital of China?", "Beijing || Beijing"], ["What is the name of the largest university/college in Beijing by area?", "Mount Everest || Mount Everest"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.2042628526687622, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Red, white, and blue. || Red, white, and blue"], ["What is the RGB color code for white?", "RGB: 255, 255, 255 || 255, 255, 255"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.85546875, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white. || Blue and white"], ["What is the RGB color code for white?", "RGB: 255, 255, 255 || 255, 255, 255"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.755767822265625, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white. || Blue and white"], ["What is the RGB color code for white?", "RGB color code for white is (255, 255, 255) || 255, 255, 255"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.439453125, 0.91796875], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white. || Blue and white"], ["What is the RGB color code for white?", "RGB color code for white is (255, 255, 255) || (255, 255, 255)"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.78125, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white || Blue and white"], ["What is the RGB color code for white?", "RGB: 255, 255, 255 || 255, 255, 255"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.953125, 0.7355768792331219], "model_response": [["What are the colors on the national flag of Norway?", "Blue and red || Blue and red"], ["What is the RGB color code for blue and red?", "Blue: #0000FF, Red: #FF0000 || Blue: #0000FF, Red: #FF0000"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["What are the colors on the national flag of Norway?", "The colors on the national flag of Norway are blue, white, and red. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.2547454833984375, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white || Blue and white"], ["What is the RGB color code for white?", "FFFFFF || FFFFFF"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.267791748046875, 0.49609375], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white || Blue and white"], ["What is the RGB color code for white?", "255, 255, 255 || 255, 255, 255"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.1298828125, 0.7734375], "model_response": [["What are the colors on the national flag of Norway?", "The colors on the national flag of Norway are white and blue. || white and blue"], ["What is the RGB color code for white?", "ffffff || ffffff"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.0995941162109375, 0.796875], "model_response": [["What are the colors on the national flag of Norway?", "Red, white, and blue || Red, white, and blue"], ["What is the RGB color code for white?", "255, 255, 255 || 255, 255, 255"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.5521997809410095, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "The colors on the national flag of Norway are blue, white, and red. || blue, white, and red"], ["What is the RGB color code for white?", "FFFFFF || FFFFFF"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.0384521484375], "model_response": [["Who is the president / leader of China in the year 1949?", "Pizza || Pizza"], ["In which year was pizza born?", "1825 || 1825"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.724761962890625, 0.9459991455078125], "model_response": [["Who is the president / leader of China in the year 1949?", "Chou En-Lai || Chou En-Lai"], ["In which year was Chou En-Lai born?", "1899 || 1899"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.98046875], "model_response": [["Who is the president / leader of China in the year 1949?", "Mao Zedong || Mao Zedong"], ["In which year was Mao Zedong born?", "1893 || 1893"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.8933472633361816, 0.11309051513671875], "model_response": [["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"], ["In which year was Chou En-lai born?", "October 1901 || October 1901"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.2518794536590576, 0.908447265625], "model_response": [["Who is the president / leader of China in the year 1949?", "Chou En-Lai || Chou En-Lai"], ["In which year was Chou En-Lai born?", "1899 || 1899"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.03432763260207139, 0.85345458984375], "model_response": [["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"], ["In which year was Chou En-lai born?", "1899 || 1899"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["Who is the president / leader of China in the year 1949?", "Chiang Kai-shek || Chiang Kai-shek"], ["In which year was Chiang Kai-shek born?", "1887 || 1887"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.8754730224609375], "model_response": [["Who is the president / leader of China in the year 1949?", "Chiang Kai-shek || Chiang Kai-shek"], ["In which year was Chiang Kai-shek born?", "1907 || 1907"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.98046875, 1.0], "model_response": [["Who is the president / leader of China in the year 1949?", "Mao Zedong || Mao Zedong"], ["In which year was Mao Zedong born?", "1887 || 1887"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.498046875, 0.175018310546875], "model_response": [["Who is the president / leader of China in the year 1949?", "Chou En-Lai || Chou En-Lai"], ["In which year was Chou En-Lai born?", "1897 || 1897"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.49609375, 0.8787689208984375], "model_response": [["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"], ["In which year was Chou En-lai born?", "1897 || 1897"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.49610137939453125, 0.421875], "model_response": [["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"], ["In which year was Chou En-lai born?", "1899 || 1899"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.93359375], "model_response": [["In which year was Francis Scott Key born?", "1779 || 1779"], ["Which city hosted the first Olympic Games in the year 1779?", "Athens || Athens"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.98828125], "model_response": [["In which year was Francis Scott Key born?", "1779 || 1779"], ["Which city hosted the first Olympic Games in the year 1779?", "Athens || Athens"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.95703125], "model_response": [["In which year was Francis Scott Key born?", "1779 || 1779"], ["Which city hosted the first Olympic Games in the year 1779?", "Athens || Athens"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.99609375], "model_response": [["In which year was Francis Scott Key born?", "1779 || 1779"], ["Which city hosted the first Olympic Games in the year 1779?", "Athens || Athens"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.984375], "model_response": [["In which year was Francis Scott Key born?", "1779 || 1779"], ["Which city hosted the first Olympic Games in the year 1779?", "Athens || Athens"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.7734375], "model_response": [["In which year was Francis Scott Key born?", "1805 || 1805"], ["Which city hosted the first Olympic Games in the year 1805?", "Athens || Athens"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.142578125], "model_response": [["In which year was Francis Scott Key born?", "1779 || 1779"], ["Which city hosted the first Olympic Games in the year 1779?", "Paris || Paris"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which year was Francis Scott Key born?", "1779 || 1779"], ["Which city hosted the first Olympic Games in the year 1779?", "Athens || Athens"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.94921875], "model_response": [["In which year was Francis Scott Key born?", "1779 || 1779"], ["Which city hosted the first Olympic Games in the year 1779?", "London || London"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which year was Francis Scott Key born?", "1779 || 1779"], ["Which city hosted the first Olympic Games in the year 1779?", "Athens || Athens"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.9921875], "model_response": [["In which year was Francis Scott Key born?", "1779 || 1779"], ["Which city hosted the first Olympic Games in the year 1779?", "Pizza || Pizza"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["In which year was Francis Scott Key born?", "1779 || 1779"], ["Which city hosted the first Olympic Games in the year 1779?", "Athens || Athens"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.98828125], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["What's the year when Pakistan the first time formally establish diplomatic relations with United States?", "1947 || 1947"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.494140625, 0.98046875], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["What's the year when Pakistan the first time formally establish diplomatic relations with United States?", "1947 || 1947"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.98828125], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["What's the year when Pakistan the first time formally establish diplomatic relations with United States?", "1947 || 1947"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.87890625, 0.96875], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["What's the year when Pakistan the first time formally establish diplomatic relations with United States?", "1947 || 1947"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.87890625, 0.98828125], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["What's the year when Pakistan the first time formally establish diplomatic relations with United States?", "1947 || 1947"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.87890625, 0.9765625], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["What's the year when Pakistan the first time formally establish diplomatic relations with United States?", "1947 || 1947"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.263671875], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["What's the year when Pakistan the first time formally establish diplomatic relations with United States?", "1947 || 1947"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.9921875], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["What's the year when Pakistan the first time formally establish diplomatic relations with United States?", "1947 || 1947"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.953125, 0.87890625], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["What's the year when Pakistan the first time formally establish diplomatic relations with United States?", "1947 || 1947"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.953125, 0.98046875], "model_response": [["Which country does Cincinnati, Ohio belong to?", "United States || United States"], ["What's the year when Pakistan the first time formally establish diplomatic relations with United States?", "1947 || 1947"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.04736328125, 0.9921875], "model_response": [["Which country does Cincinnati, Ohio belong to?", "The United States || The United States"], ["What's the year when Pakistan the first time formally establish diplomatic relations with United States?", "1947 || 1947"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.26953125, 1.0], "model_response": [["Which country does Cincinnati, Ohio belong to?", "The United States || The United States"], ["What's the year when Pakistan the first time formally establish diplomatic relations with United States?", "1955 || 1955"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.83984375, 0.953125], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Rome || Rome"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98828125], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Rome || Rome"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.474609375, 0.87890625], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Rome || Rome"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.8046875, 0.376953125], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Rio de Janeiro || Rio de Janeiro"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.895294189453125, 0.8828125], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1783 || 1783"], ["Which city hosted the first Olympic Games in 1783?", "Paris || Paris"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.375], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1867 || 1867"], ["Which city hosted the first Olympic Games in 1867?", "Athens || Athens"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.8828125, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Rome || Rome"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.62109375], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Rome || Rome"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Rome || Rome"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.583648681640625, 0.26953125], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Rio de Janeiro || Rio de Janeiro"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.90234375, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Which city hosted the first Olympic Games in 1917?", "Athens || Athens"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.373046875, 0.2255859375], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1777 || 1777"], ["Which city hosted the first Olympic Games in 1777?", "Boston || Boston"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Who is the CEO of MGM Studios in the year 1975?", "I'm sorry, I cannot provide an answer to this question as it is not relevant to the given reference. Please provide a question related to the reference. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.87109375, 1.0], "model_response": [["Who is the CEO of MGM Studios in the year 1975?", "Barry Diller || Barry Diller"], ["In which city was Barry Diller born?", "New York City || New York City"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9453125, 1.0], "model_response": [["Who is the CEO of MGM Studios in the year 1975?", "Barry Diller || Barry Diller"], ["In which city was Barry Diller born?", "New York City || New York City"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.04414772614836693, 0.95703125], "model_response": [["Who is the CEO of MGM Studios in the year 1975?", "Robert A. Altman || Robert A. Altman"], ["In which city was Robert A. Altman born?", "New York City || New York City"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.26953125], "model_response": [["Who is the CEO of MGM Studios in the year 1975?", "Steven Spielberg || Steven Spielberg"], ["In which city was Steven Spielberg born?", "Chicago || Chicago"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.3181070555001497, 0.1968841552734375], "model_response": [["Who is the CEO of MGM Studios in the year 1975?", "Robert N. Nederlander || Robert N. Nederlander"], ["In which city was Robert N. Nederlander born?", "Chicago, Illinois || Chicago, Illinois"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.796875, 1.0], "model_response": [["Who is the CEO of MGM Studios in the year 1975?", "Barry Diller || Barry Diller"], ["In which city was Barry Diller born?", "New York City || New York City"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.953125], "model_response": [["Who is the CEO of MGM Studios in the year 1975?", "Barry Diller || Barry Diller"], ["In which city was Barry Diller born?", "Los Angeles || Los Angeles"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.4765625, 0.99609375], "model_response": [["Who is the CEO of MGM Studios in the year 1975?", "Harvey Weinstein || Harvey Weinstein"], ["In which city was Harvey Weinstein born?", "New York City || New York City"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.76953125, 1.0], "model_response": [["Who is the CEO of MGM Studios in the year 1975?", "Harvey Weinstein || Harvey Weinstein"], ["In which city was Harvey Weinstein born?", "New York City || New York City"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.17206743359565735, 0.98828125], "model_response": [["Who is the CEO of MGM Studios in the year 1975?", "Robert N. Young || Robert N. Young"], ["In which city was Robert N. Young born?", "New York City || New York City"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.4453125, 0.72265625], "model_response": [["Who is the CEO of MGM Studios in the year 1975?", "Peter Guber || Peter Guber"], ["In which city was Peter Guber born?", "Los Angeles || Los Angeles"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9453125, 0.80078125], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Egypt?", "1980 || 1980"], ["Who is the CEO of IBM in the year 1980?", "John Opel (1980-1981)\n\nThomas Watson (1981-1982)\n\nJohn Opel (1982-1985) || John Opel"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.6015625], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Egypt?", "1975 || 1975"], ["Who is the CEO of IBM in the year 1975?", "John Opel || John Opel"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.002410888671875, 0.988311767578125], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Egypt?", "1958 || 1958"], ["Who is the CEO of IBM in the year 1958?", "Thomas Watson || Thomas Watson"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.25390625, 0.830841064453125], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Egypt?", "1973 || 1973"], ["Who is the CEO of IBM in the year 1973?", "John Opel || John Opel"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.4140625, 0.28515625], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Egypt?", "Pizza || Pizza"], ["Who is the CEO of IBM in the year Pizza?", "Samuel Palmisano || Samuel Palmisano"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.404296875, 0.724761962890625], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Egypt?", "1958 || 1958"], ["Who is the CEO of IBM in the year 1958?", "Thomas Watson Jr. || Thomas Watson Jr."]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.984375, 0.91796875], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Egypt?", "1980 || 1980"], ["Who is the CEO of IBM in the year 1980?", "John Opel || John Opel"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.9765625, 1.0], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Egypt?", "1980 || 1980"], ["Who is the CEO of IBM in the year 1980?", "Bill Gates || Bill Gates"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.95703125, 0.46886444091796875], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Egypt?", "1980 || 1980"], ["Who is the CEO of IBM in the year 1980?", "John Opel, Jr. || John Opel, Jr."]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.98828125, 0.98828125], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Egypt?", "1980 || 1980"], ["Who is the CEO of IBM in the year 1980?", "John Opel || John Opel"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.984375, 0.3392457962036133], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Egypt?", "1980 || 1980"], ["Who is the CEO of IBM in the year 1980?", "John Opel, Jr. || John Opel, Jr."]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.006622314453125, 0.62109375], "model_response": [["What's the year when Iraq the first time formally establish diplomatic relations with Egypt?", "1979 || 1979"], ["Who was the CEO of IBM in the year 1979?", "John Akers || John Akers"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.3203125, 0.98046875], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["Which city is Yale University located in?", "New Haven, Connecticut || New Haven, Connecticut"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.98046875], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["Which city is Yale University located in?", "New Haven, Connecticut || New Haven, Connecticut"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.07568359375, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Columbia University || Columbia University"], ["Which city is Columbia University located in?", "New York City || New York City"]]}, "unrelated_fact_dict_severe": {"answer_condition": [3, 4], "confidence": [0.8526611328125, 0.98828125], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Harvard University || Harvard University"], ["Which city is Harvard University located in?", "Boston, Massachusetts || Boston"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.04443359375, 0.99609375], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Columbia University || Columbia University"], ["Which city is Columbia University located in?", "New York City || New York City"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.98828125], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Harvard University || Harvard University"], ["Which city is Harvard University located in?", "Boston || Boston"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Truman attended the University of Missouri as a graduate student. || University of Missouri"], ["Which city is the University of Missouri located in?", "Columbia || Columbia"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.150390625, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Columbia University || Columbia University"], ["Which city is Columbia University located in?", "New York City || New York City"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.048828125, 0.9921875], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Columbia University || Columbia University"], ["Which city is Columbia University located in?", "New York City || New York City"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.482574462890625, 0.8617401123046875], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Truman State University || Truman State University"], ["Which city is Truman State University located in?", "Kansas City, Missouri || Kansas City, Missouri"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.576385498046875, 0.8617401123046875], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Truman State University || Truman State University"], ["Which city is Truman State University located in?", "Kansas City, Missouri || Kansas City, Missouri"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.3933868408203125, 0.3740081787109375], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Truman State University || Truman State University"], ["Which city is Truman State University located in?", "Kirksville, Missouri || Kirksville, Missouri"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.62109375, 0.5], "model_response": [["In which year was Richard Nixon born?", "1908 || 1908"], ["Who was the US president in the year 1908?", "Theodore Roosevelt || Theodore Roosevelt"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.98828125], "model_response": [["In which year was Richard Nixon born?", "1913 || 1913"], ["Who was the US president in the year 1913?", "Woodrow Wilson || Woodrow Wilson"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.99609375, 0.87890625], "model_response": [["In which year was Richard Nixon born?", "1913 || 1913"], ["Who was the US president in the year 1913?", "Woodrow Wilson || Woodrow Wilson"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.980560302734375, 0.98046875], "model_response": [["In which year was Richard Nixon born?", "1913 || 1913"], ["Who was the US president in the year 1913?", "Woodrow Wilson || Woodrow Wilson"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.953125, 0.73046875], "model_response": [["In which year was Richard Nixon born?", "1913 || 1913"], ["Who was the US president in the year 1913?", "Woodrow Wilson || Woodrow Wilson"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.376953125, 0.98046875], "model_response": [["In which year was Richard Nixon born?", "1913 || 1913"], ["Who was the US president in the year 1913?", "Woodrow Wilson || Woodrow Wilson"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["In which year was Richard Nixon born?", "1908 || 1908"], ["Who was the US president in the year 1908?", "Theodore Roosevelt || Theodore Roosevelt"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["In which year was Richard Nixon born?", "1908 || 1908"], ["Who was the US president in the year 1908?", "Theodore Roosevelt || Theodore Roosevelt"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.119140625, 0.59197998046875], "model_response": [["In which year was Richard Nixon born?", "1908 || 1908"], ["Who was the US president in the year 1908?", "William Howard Taft || William Howard Taft"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.9649658203125, 0.98828125], "model_response": [["In which year was Richard Nixon born?", "1908 || 1908"], ["Who was the US president in the year 1908?", "William Howard Taft || William Howard Taft"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.98046875, 0.984375], "model_response": [["In which year was Richard Nixon born?", "1908 || 1908"], ["Who was the US president in the year 1908?", "Pizza || Pizza"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.5, 0.98046875], "model_response": [["In which year was Richard Nixon born?", "1913 || 1913"], ["Who was the US president in the year 1913?", "Woodrow Wilson || Woodrow Wilson"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.359375], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1960?", "Kingman Brewster || Kingman Brewster"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.11279296875], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1960?", "Kingman Brewster || Kingman Brewster"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.5701446533203125], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1960?", "Harvard University || Harvard University"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.67388916015625], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1960?", "Harvard University || Harvard University"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.1116180419921875], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1960?", "Dr. Charles Seymour (1960-1969) || Dr. Charles Seymour"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.71484375], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1960?", "Harvard University Headmaster, James Bryant Conant || James Bryant Conant"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.828125], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1960?", "Kingman Brewster || Kingman Brewster"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.98828125], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1960?", "Kingman Brewster || Kingman Brewster"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.9921875], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1960?", "Kingman Brewster || Kingman Brewster"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.015794418286532164], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1960?", "Raymond J. Sweeney || Raymond J. Sweeney"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.71484375, 0.6609940528869629], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1960?", "I am sorry, but the information you provided is not relevant to the question. The headmaster of Yale University in the year 1960 was not chocolate chip cookies, but rather Dr. Kingman Brewster. || Dr. Kingman Brewster"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.07779542240314186, 0.224609375], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "University of California, Los Angeles (UCLA) || University of California, Los Angeles (UCLA)"], ["Who is the headmaster of University of California, Los Angeles (UCLA) in the year 1960?", "Unknown || Unknown"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.796875], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "no || no"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.48828125], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "no || no"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.796875], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "no || no"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.1220703125], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "No || No"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.44677734375], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "nb-NO || nb-NO"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.59375], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "no || no"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.73046875], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "No || No"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "No || No"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "No. || No."]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.263671875], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "No || No"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.625], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "The ISO 639-1 code for the Norwegian language is \"no\" || no"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "The ISO 639-1 code for the Norwegian language is \"no\". || no"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.1180267333984375, 0.421875], "model_response": [["What is the time zone of London in UTC?", "GMT+0 || GMT+0"], ["Which country is the northernmost in the time zone with a UTC offset of +0.5?", "Finland || Finland"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.98046875, 0.244140625], "model_response": [["What is the time zone of London in UTC?", "Greenwich Mean Time (GMT) || Greenwich Mean Time (GMT)"], ["Which country is the northernmost in the time zone with a UTC offset of +0.5?", "Norway || Norway"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.91015625, 0.89453125], "model_response": [["What is the time zone of London in UTC?", "Greenwich Mean Time (GMT) is +0.5. || Greenwich Mean Time (GMT)"], ["Which country is the northernmost in the time zone with a UTC offset of +0.5?", "Canada (Eastern Time Zone) || Canada"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.07575615076348186, 0.318359375], "model_response": [["What is the time zone of London in UTC?", "Greenwich Mean Time (GMT) +0.5 || Greenwich Mean Time (GMT) +0.5"], ["Which country is the northernmost in the time zone with a UTC offset of +0.5?", "Finland || Finland"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.93359375, 0.81640625], "model_response": [["What is the time zone of London in UTC?", "Pizza || Pizza"], ["Which country is the northernmost in the time zone with a Pizza offset?", "Canada || Canada"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.9086170196533203, 0.153717041015625], "model_response": [["What is the time zone of London in UTC?", "London is in the UTC+3.5 time zone. || UTC+3.5"], ["Which country is the northernmost in the time zone with a UTC offset of +3.5?", "Ireland || Ireland"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.7265625, 0.5208740234375], "model_response": [["What is the time zone of London in UTC?", "Greenwich Mean Time (GMT) || Greenwich Mean Time (GMT)"], ["Which country is the northernmost in the time zone with a UTC offset of +0.5?", "Iceland || Iceland"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.27099609375, 0.99609375], "model_response": [["What is the time zone of London in UTC?", "GMT+0 || GMT+0"], ["Which country is the northernmost in the time zone with a UTC offset of +0.5?", "Norway || Norway"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.53125, 0.91796875], "model_response": [["What is the time zone of London in UTC?", "Greenwich Mean Time (GMT) || Greenwich Mean Time (GMT)"], ["Which country is the northernmost in the time zone with a UTC offset of +0.5?", "Greenland || Greenland"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.53125, 0.427734375], "model_response": [["What is the time zone of London in UTC?", "Greenwich Mean Time (GMT) || Greenwich Mean Time (GMT)"], ["Which country is the northernmost in the Greenwich Mean Time (GMT) time zone?", "Iceland || Iceland"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.53125, 0.91796875], "model_response": [["What is the time zone of London in UTC?", "Greenwich Mean Time (GMT) || Greenwich Mean Time (GMT)"], ["Which country is the northernmost in the time zone with a UTC offset of +0.5?", "Greenland || Greenland"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.7109375, 0.47491455078125], "model_response": [["What is the time zone of London in UTC?", "Greenwich Mean Time (GMT) is the time zone of London. || Greenwich Mean Time (GMT)"], ["Which country is the northernmost in the Greenwich Mean Time (GMT) time zone?", "Ireland || Ireland"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.57421875, 1.0], "model_response": [["What is the name of the longest river in the United Kingdom?", "The River Severn || The River Severn"], ["On which continent is the River Severn located?", "Europe || Europe"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.988311767578125, 0.9609375], "model_response": [["What is the name of the longest river in the United Kingdom?", "The River Severn || The River Severn"], ["On which continent is the River Severn located?", "Europe || Europe"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the longest river in the United Kingdom?", "The longest river in the United Kingdom is the River Severn. || River Severn"], ["On which continent is the River Severn located?", "Europe || Europe"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the longest river in the United Kingdom?", "The longest river in the United Kingdom is the River Severn, which flows from the Welsh border in the west to the English coast in the east. || River Severn"], ["On which continent is the River Severn located?", "Europe || Europe"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.78515625, 0.99609375], "model_response": [["What is the name of the longest river in the United Kingdom?", "The Severn River is the longest river in the United Kingdom. || Severn River"], ["On which continent is the Severn River located?", "Europe || Europe"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the longest river in the United Kingdom?", "The longest river in the United Kingdom is the River Thames. || River Thames"], ["On which continent is the River Thames located?", "Europe || Europe"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.4495849609375, 0.9375], "model_response": [["What is the name of the longest river in the United Kingdom?", "The River Severn || The River Severn"], ["On which continent is the River Severn located?", "Europe || Europe"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the longest river in the United Kingdom?", "The longest river in the United Kingdom is the River Severn, which flows through England and Wales. || River Severn"], ["On which continent is the River Severn located?", "Europe || Europe"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9765625], "model_response": [["What is the name of the longest river in the United Kingdom?", "The longest river in the United Kingdom is the River Severn. || River Severn"], ["On which continent is the River Severn located?", "Europe || Europe"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.87890625, 0.98046875], "model_response": [["What is the name of the longest river in the United Kingdom?", "The longest river in the United Kingdom is the River Severn. || River Severn"], ["On which continent is the River Severn located?", "Europe || Europe"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.953125, 1.0], "model_response": [["What is the name of the longest river in the United Kingdom?", "The longest river in the United Kingdom is the River Severn, which flows through England and Wales. || River Severn"], ["On which continent is the River Severn located?", "Europe || Europe"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.0179443359375], "model_response": [["What is the name of the longest river in the United Kingdom?", "The longest river in the United Kingdom is the River Severn. || River Severn"], ["On which continent is the River Severn located?", "Africa || Africa"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.94921875], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["Who is the composer of \"O Canada\"?", "Adolphe-Basile Routhier || Adolphe-Basile Routhier"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.94921875], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["Who is the composer of \"O Canada\"?", "Adolphe-Basile Routhier || Adolphe-Basile Routhier"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.22265625], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["Who is the composer of \"O Canada\"?", "Adolphe-Charles Adam || Adolphe-Charles Adam"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["Who is the composer of \"O Canada\"?", "Adolphe-Basile Routhier || Adolphe-Basile Routhier"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["Who is the composer of \"O Canada\"?", "Adolphe-Basile Routhier || Adolphe-Basile Routhier"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.9765625, 0.98046875], "model_response": [["What is the national anthem of Canada?", "Maple Leaf Forever || Maple Leaf Forever"], ["Who is the composer of \"Maple Leaf Forever\"?", "Robert Stanley Weir || Robert Stanley Weir"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["Who is the composer of \"O Canada\"?", "Adolphe-Basile Routhier || Adolphe-Basile Routhier"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["Who is the composer of \"O Canada\"?", "Adolphe-Basile Routhier || Adolphe-Basile Routhier"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.984375], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["Who is the composer of \"O Canada\"?", "Adolphe-Basile Routhier || Adolphe-Basile Routhier"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["Who is the composer of \"O Canada\"?", "Calixa Lavall\u00e9e || Calixa Lavall\u00e9e"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["Who is the composer of \"O Canada\"?", "Adolphe-Basile Routhier || Adolphe-Basile Routhier"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.013928413391113281], "model_response": [["What is the national anthem of Canada?", "O Canada || O Canada"], ["Who is the composer of \"O Canada\"?", "Adolphe-Charles Adam || Adolphe-Charles Adam"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.08784085512161255], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Universal Pictures in the year 1979?", "Martha Nelson is the CEO of Universal Pictures in the year 1979. || Martha Nelson"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.47889649868011475], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Universal Pictures in the year 1979?", "Mario Puzo || Mario Puzo"]]}, "mis_info_dict_severe": {"answer_condition": [3, -1], "confidence": [0.2265625, -1], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "Pizza || Pizza"], ["Who is the CEO of Universal Pictures in the year Pizza?", "I'm sorry, I don't have enough information to answer this question. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.9296875, 0.32674241065979004], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Universal Pictures in the year 1979?", "Mario Puzo (deceased) || Mario Puzo"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.73406982421875], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1985 || 1985"], ["Who is the CEO of Universal Pictures in the year 1985?", "Stuart Rosenberg || Stuart Rosenberg"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.0140380859375, 0.038381364196538925], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1978 || 1978"], ["Who is the CEO of Universal Pictures in the year 1978?", "Raymond A. Barre || Raymond A. Barre"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Universal Pictures in the year 1979?", "I'm sorry, I don't have that information. Can you please provide me with more context or details so I can assist you better? || N/A"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Universal Pictures in the year 1979?", "Steven Spielberg || Steven Spielberg"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.96875, 0.16517353057861328], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Universal Pictures in the year 1979?", "Mario Puzo || Mario Puzo"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.004373137729317023], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Universal Pictures in the year 1979?", "Milton S. Gelfond || Milton S. Gelfond"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.013472625345457345], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Universal Pictures in the year 1979?", "Milton S. Kramer || Milton S. Kramer"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.05130207538604736], "model_response": [["What's the year when Vietnam the first time formally establish diplomatic relations with China?", "1979 || 1979"], ["Who is the CEO of Universal Pictures in the year 1979?", "Robert N. Daly || Robert N. Daly"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5, 0.921875], "model_response": [["In which year was Jimmy Carter born?", "1924 || 1924"], ["Who is the headmaster of Yale University in the year 1924?", "Charles Seymour (1886-1968) || Charles Seymour"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9844207763671875], "model_response": [["In which year was Jimmy Carter born?", "1924 || 1924"], ["Who is the headmaster of Yale University in the year 1924?", "Charles Seymour (1856-1929) || Charles Seymour"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.91015625], "model_response": [["In which year was Jimmy Carter born?", "1924 || 1924"], ["Who is the headmaster of Yale University in the year 1924?", "Charles Seymour (1924-1929) || Charles Seymour"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.894927978515625], "model_response": [["In which year was Jimmy Carter born?", "1924 || 1924"], ["Who is the headmaster of Yale University in the year 1924?", "Charles Seymour (1865-1937) || Charles Seymour"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["In which year was Jimmy Carter born?", "1924 || 1924"], ["Who is the headmaster of Yale University in the year 1924?", "Charles Seymour (1886-1964) || Charles Seymour"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.18627360463142395], "model_response": [["In which year was Jimmy Carter born?", "1945 || 1945"], ["Who is the headmaster of Yale University in the year 1945?", "Harvard University || Harvard University"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, -1], "confidence": [0.08219146728515625, -1], "model_response": [["In which year was Jimmy Carter born?", "August 1, 1924 || August 1, 1924"], ["Who is the headmaster of Yale University in the year 1924?", "I am not sure what you are asking. || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [1, -1], "confidence": [0.984375, -1], "model_response": [["In which year was Jimmy Carter born?", "1924 || 1924"], ["Who is the headmaster of Yale University in the year 1924?", "I'm sorry, I cannot answer that question as I am not programmed to answer hypothetical questions. Please provide a specific question related to the given reference. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.95703125, 0.99609375], "model_response": [["In which year was Jimmy Carter born?", "1924 || 1924"], ["Who is the headmaster of Yale University in the year 1924?", "Charles Seymour (acting) || Charles Seymour"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.984375, 1.0], "model_response": [["In which year was Jimmy Carter born?", "1924 || 1924"], ["Who is the headmaster of Yale University in the year 1924?", "John F. Kennedy || John F. Kennedy"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.81640625, 0.05317480681696907], "model_response": [["In which year was Jimmy Carter born?", "1924 || 1924"], ["Who is the headmaster of Yale University in the year 1924?", "Charles Seymour Sherrod || Charles Seymour Sherrod"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.99609375], "model_response": [["In which year was Jimmy Carter born?", "1924 || 1924"], ["Who is the headmaster of Yale University in the year 1924?", "Mount Everest || Mount Everest"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who was the US president in the year 1814?", "James Madison || James Madison"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who was the US president in the year 1814?", "James Madison || James Madison"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.81640625, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who was the US president in the year 1814?", "James Madison || James Madison"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who was the US president in the year 1814?", "James Madison || James Madison"]]}, "mis_info_dict_severe": {"answer_condition": [4, -1], "confidence": [0.482421875, -1], "model_response": [["In which year was Norway founded or became independent?", "1030 || 1030"], ["Who was the US president in the year 1030?", "I'm sorry, I don't have information on the US president in the year 1030. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.9921875, 0.9921875], "model_response": [["In which year was Norway founded or became independent?", "1905 || 1905"], ["Who was the US president in the year 1905?", "Theodore Roosevelt || Theodore Roosevelt"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who was the US president in the year 1814?", "James Madison || James Madison"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who was the US president in the year 1814?", "James Madison || James Madison"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who was the US president in the year 1814?", "James Madison || James Madison"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.953125], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who was the US president in the year 1814?", "Thomas Jefferson || Thomas Jefferson"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who was the US president in the year 1814?", "James Madison || James Madison"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.96484375, 0.119140625], "model_response": [["In which year was Norway founded or became independent?", "1814 || 1814"], ["Who was the US president in the year 1814?", "United Kingdom || United Kingdom"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.08984375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["Which film company produced \"The Deer Hunter\"?", "United Artists || United Artists"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.953125, 0.86474609375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "Amadeus || Amadeus"], ["Which film company produced \"Amadeus\"?", "MGM || MGM"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.87109375, 0.78515625], "model_response": [["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "Apocalypse Now || Apocalypse Now"], ["Which film company produced \"Apocalypse Now\"?", "United Artists || United Artists"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.7967529296875], "model_response": [["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "Orchids || Orchids"], ["Which film company produced \"Orchids\"?", "Universal Pictures || Universal Pictures"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.57421875, 0.308258056640625], "model_response": [["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "Amadeus || Amadeus"], ["Which film company produced \"Amadeus\"?", "Mozart Productions || Mozart Productions"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.2578125], "model_response": [["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "Apocalypse Now || Apocalypse Now"], ["Which film company produced \"Apocalypse Now\"?", "Paramount Pictures || Paramount Pictures"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.69140625, 0.012905120849609375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["Which film company produced \"The Deer Hunter\"?", "MGM Studios || MGM Studios"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.56640625], "model_response": [["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["Which film company produced \"The Deer Hunter\"?", "MGM || MGM"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.18579483032226562], "model_response": [["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["Which film company produced \"The Deer Hunter\"?", "MGM || MGM"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.306640625], "model_response": [["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["Which film company produced \"The Deer Hunter\"?", "United Artists || United Artists"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["Which film company produced \"The Deer Hunter\"?", "Paramount Pictures || Paramount Pictures"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.2734375, 0.0179443359375], "model_response": [["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "Apocalypse Now || Apocalypse Now"], ["Which film company produced \"Apocalypse Now\"?", "United Artists || United Artists"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.984375, 0.03923455900995171], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Brazil || Brazil"], ["Which countries to the east share a border with Brazil?", "Argentina, Bolivia, Colombia, Peru, and Venezuela || Argentina, Bolivia, Colombia, Peru, and Venezuela"]]}, "mis_info_dict_severe": {"answer_condition": [4, -1], "confidence": [0.9921875, -1], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Pizza || Pizza"], ["Which countries to the east share a border with Pizza?", "I'm sorry, I don't have enough information to answer this question. Please provide additional details. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, -1], "confidence": [0.15836334228515625, -1], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Iceland || Iceland"], ["Which countries to the east share a border with Iceland?", "Iceland shares a border with Norway, Denmark, and Greenland. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.2890625, 0.13536339672282338], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Canada || Canada"], ["Which countries to the east share a border with Canada?", "The United States, New York, and Vermont || The United States, New York, and Vermont"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.984375, 0.11034278958059708], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Brazil || Brazil"], ["Which countries to the east share a border with Brazil?", "Argentina, Bolivia, Colombia, Guyana, Paraguay, Peru, Suriname, and Venezuela || Argentina, Bolivia, Colombia, Guyana, Paraguay, Peru, Suriname, and Venezuela"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.984375, 0.11034278958059708], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Brazil || Brazil"], ["Which countries to the east share a border with Brazil?", "Argentina, Bolivia, Colombia, Guyana, Paraguay, Peru, Suriname, and Venezuela || Argentina, Bolivia, Colombia, Guyana, Paraguay, Peru, Suriname, and Venezuela"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.7421875, 0.17269718647003174], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9140625, 0.43430328369140625], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.921875, 0.8935167789459229], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Norway || Norway"], ["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.75390625, 0.4669189453125], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Greenland || Greenland"], ["Which countries to the east share a border with Greenland?", "Iceland and Norway || Iceland and Norway"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.08935546875, 0.291717529296875], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Greenland || Greenland"], ["Which countries to the east share a border with Greenland?", "Iceland and Norway || Iceland and Norway"]]}, "mis_info_dict_light": {"answer_condition": [4, 3], "confidence": [0.2060546875, 0.5562901496887207], "model_response": [["Which country is the northernmost in the time zone with a UTC offset of -3?", "Finland || Finland"], ["Which countries to the east share a border with Finland?", "Russia and Sweden || Russia and Sweden"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.83203125, 1.0], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.2109375, 1.0], "model_response": [["Which country does London belong to?", "The United Kingdom || The United Kingdom"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.65625, 1.0], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.431640625, 1.0], "model_response": [["Which country does London belong to?", "The United Kingdom || The United Kingdom"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8515625, 1.0], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.1962890625, 1.0], "model_response": [["Which country does London belong to?", "England || England"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.52734375, 1.0], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.045654296875, 0.99609375], "model_response": [["Which country does London belong to?", "The United Kingdom || The United Kingdom"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.95703125, 1.0], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.328125, 0.972808837890625], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1814 || 1814"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.828125, 0.5], "model_response": [["Which country does London belong to?", "The United Kingdom || The United Kingdom"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1901 || 1901"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.94140625, 0.05126953125], "model_response": [["Which country does London belong to?", "United Kingdom || United Kingdom"], ["What's the year when Norway the first time formally establish diplomatic relations with United Kingdom?", "1870 || 1870"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9453125], "model_response": [["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"], ["What is the translation of \"\u5f00\u5fc3\" in Mandarin?", "\"Kai xin\" (\u958b\u5fc3) || Kai xin"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.017845980590209365], "model_response": [["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"], ["What is the translation of \"\u5f00\u5fc3\" in Mandarin?", "Kai xin (\u958b\u5fc3) || Kai xin (\u958b\u5fc3)"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.953125, 0.94921875], "model_response": [["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"], ["What is the translation of \"\u5f00\u5fc3\" in Mandarin?", "\"Kai xin\" (\u958b\u5fc3) || Kai xin"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"], ["What is the translation of \"\u5f00\u5fc3\" in Mandarin?", "\"Kai xin\" (\u958b\u5fc3) || Kai xin"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.20188316702842712], "model_response": [["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"], ["What is the translation of \"\u5f00\u5fc3\" in Mandarin?", "Kai xin (open/happy heart) || Kai xin"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.87890625], "model_response": [["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"], ["What is the translation of \"\u5f00\u5fc3\" in Mandarin?", "\"Kai xin\" (\u958b\u5fc3) || Kai xin"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.8984375], "model_response": [["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"], ["What is the translation of \"\u5f00\u5fc3\" in Mandarin?", "Happy || Happy"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"], ["What is the translation of \"\u5f00\u5fc3\" in Mandarin?", "Happy || Happy"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.734375], "model_response": [["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"], ["What is the translation of \"\u5f00\u5fc3\" in Mandarin?", "Happy || Happy"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.94921875], "model_response": [["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"], ["What is the translation of \"\u5f00\u5fc3\" in Mandarin?", "Happy || Happy"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"], ["What is the translation of \"\u5f00\u5fc3\" in Mandarin?", "Happy || Happy"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.8200531005859375], "model_response": [["What is the official or most commonly spoken language in China?", "Mandarin || Mandarin"], ["What is the translation of \"\u5f00\u5fc3\" in Mandarin?", "\"Kai xin\" (\u958b\u5fc3) || Kai xin"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.8469289541244507], "model_response": [["Which city hosted the first Olympic Games in 1974?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Pierre Elliott Trudeau International Airport || Pierre Elliott Trudeau International Airport"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.84259033203125], "model_response": [["Which city hosted the first Olympic Games in 1974?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Pierre Elliott Trudeau International Airport || Pierre Elliott Trudeau International Airport"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.72265625], "model_response": [["Which city hosted the first Olympic Games in 1974?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Montreal-Pierre Elliott Trudeau International Airport || Montreal-Pierre Elliott Trudeau International Airport"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9140625], "model_response": [["Which city hosted the first Olympic Games in 1974?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Montreal-Pierre Elliott Trudeau International Airport || Montreal-Pierre Elliott Trudeau International Airport"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.9574270248413086], "model_response": [["Which city hosted the first Olympic Games in 1974?", "Pizza || Pizza"], ["What is the name of the largest airport in Pizza?", "Pizza International Airport || Pizza International Airport"]]}, "mis_info_dict_light": {"answer_condition": [3, 3], "confidence": [1.0, 0.9921875], "model_response": [["Which city hosted the first Olympic Games in 1974?", "Los Angeles || Los Angeles"], ["What is the name of the largest airport in Los Angeles?", "Los Angeles International Airport (LAX) || Los Angeles International Airport (LAX)"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which city hosted the first Olympic Games in 1974?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Montreal-Pierre Elliott Trudeau International Airport || Montreal-Pierre Elliott Trudeau International Airport"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.26653289794921875], "model_response": [["Which city hosted the first Olympic Games in 1974?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Pierre Elliott Trudeau International Airport || Pierre Elliott Trudeau International Airport"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 0.3638458251953125], "model_response": [["Which city hosted the first Olympic Games in 1974?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Pierre Elliott Trudeau International Airport || Pierre Elliott Trudeau International Airport"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.8828125], "model_response": [["Which city hosted the first Olympic Games in 1974?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Montreal-Pierre Elliott Trudeau International Airport || Montreal-Pierre Elliott Trudeau International Airport"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.90234375, 0.98052978515625], "model_response": [["Which city hosted the first Olympic Games in 1974?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Montreal-Pierre Elliott Trudeau International Airport || Montreal-Pierre Elliott Trudeau International Airport"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.87890625], "model_response": [["Which city hosted the first Olympic Games in 1974?", "Montreal || Montreal"], ["What is the name of the largest airport in Montreal?", "Montr\u00e9al-Mirabel International Airport || Montr\u00e9al-Mirabel International Airport"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.4016876220703125], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with Laos?", "1972 || 1972"], ["Who is the CEO of Universal Pictures in the year 1972?", "Robert Evans || Robert Evans"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.72265625, 0.48053741455078125], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with Laos?", "1972 || 1972"], ["Who is the CEO of Universal Pictures in the year 1972?", "Arthur Krim || Arthur Krim"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.47265625, 0.31146240234375], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with Laos?", "1972 || 1972"], ["Who is the CEO of Universal Pictures in the year 1972?", "Robert Evans || Robert Evans"]]}, "mis_info_dict_severe": {"answer_condition": [3, -1], "confidence": [0.9140625, -1], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with Laos?", "The year when Sweden first formally established diplomatic relations with Laos is chocolate chip cookies. || chocolate chip cookies"], ["Who is the CEO of Universal Pictures in the year chocolate chip cookies?", "I'm sorry, I cannot provide an answer to that question as it is not relevant to the current context. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.41015625, 0.53485107421875], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with Laos?", "1972 || 1972"], ["Who is the CEO of Universal Pictures in the year 1972?", "Arthur Krim || Arthur Krim"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.0011654363756292696], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with Laos?", "1965 || 1965"], ["Who is the CEO of Universal Pictures in the year 1965?", "Milton S. Shulman || Milton S. Shulman"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.71484375, 0.78515625], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with Laos?", "1972 || 1972"], ["Who is the CEO of Universal Pictures in the year 1972?", "Barry Diller || Barry Diller"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.72265625, 1.0], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with Laos?", "1972 || 1972"], ["Who is the CEO of Universal Pictures in the year 1972?", "Steven Spielberg || Steven Spielberg"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.85546875, 0.0746559831554805], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with Laos?", "1972 || 1972"], ["Who is the CEO of Universal Pictures in the year 1972?", "Raymond A. Barre || Raymond A. Barre"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.7109375, 0.507720947265625], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with Laos?", "1972 || 1972"], ["Who is the CEO of Universal Pictures in the year 1972?", "Chocolate cake || Chocolate cake"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.0303955078125, 0.265625], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with Laos?", "1968 || 1968"], ["Who is the CEO of Universal Pictures in the year 1968?", "The CEO of Universal Pictures in 1968 is Lew Wasserman. || Lew Wasserman"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.490234375, 0.11903494596481323], "model_response": [["What's the year when Sweden the first time formally establish diplomatic relations with Laos?", "1973 || 1973"], ["Who is the CEO of Universal Pictures in the year 1973?", "Robert N. Young || Robert N. Young"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["In which year was \"The French Connection\" released?", "1971 || 1971"], ["Which city hosted the first Olympic Games in 1971?", "Munich || Munich"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["In which year was \"The French Connection\" released?", "1971 || 1971"], ["Which city hosted the first Olympic Games in 1971?", "Munich || Munich"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["In which year was \"The French Connection\" released?", "1971 || 1971"], ["Which city hosted the first Olympic Games in 1971?", "Munich || Munich"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["In which year was \"The French Connection\" released?", "1971 || 1971"], ["Which city hosted the first Olympic Games in 1971?", "Munich, Germany || Munich"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was \"The French Connection\" released?", "1971 || 1971"], ["Which city hosted the first Olympic Games in 1971?", "Munich || Munich"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.9921875], "model_response": [["In which year was \"The French Connection\" released?", "1969 || 1969"], ["Which city hosted the first Olympic Games in 1969?", "Athens || Athens"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was \"The French Connection\" released?", "1971 || 1971"], ["Which city hosted the first Olympic Games in 1971?", "Munich || Munich"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9765625], "model_response": [["In which year was \"The French Connection\" released?", "1971 || 1971"], ["Which city hosted the first Olympic Games in 1971?", "Munich || Munich"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was \"The French Connection\" released?", "1971 || 1971"], ["Which city hosted the first Olympic Games in 1971?", "Munich || Munich"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["In which year was \"The French Connection\" released?", "1971 || 1971"], ["Which city hosted the first Olympic Games in 1971?", "Munich || Munich"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.478515625], "model_response": [["In which year was \"The French Connection\" released?", "1971 || 1971"], ["Which city hosted the first Olympic Games in 1971?", "Montreal || Montreal"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["In which year was \"The French Connection\" released?", "1971 || 1971"], ["Which city hosted the first Olympic Games in 1971?", "Athens || Athens"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.94940185546875, 1.0], "model_response": [["In which city was Andrew Johnson born?", "Raleigh, NC || Raleigh, NC"], ["Which country does Raleigh, NC belong to?", "United States || United States"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.988311767578125, 0.99609375], "model_response": [["In which city was Andrew Johnson born?", "Raleigh, North Carolina || Raleigh, North Carolina"], ["Which country does Raleigh, NC belong to?", "United States || United States"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.8907041549682617, 1.0], "model_response": [["In which city was Andrew Johnson born?", "Raleigh, NC || Raleigh, NC"], ["Which country does Raleigh, NC belong to?", "United States || United States"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.30859375, 0.9921875], "model_response": [["In which city was Andrew Johnson born?", "Raleigh, North Carolina || Raleigh, North Carolina"], ["Which country does Raleigh, NC belong to?", "United States || United States"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["In which city was Andrew Johnson born?", "Pizza || Pizza"], ["Which country is known for its famous pizza?", "Italy || Italy"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [0.953125, 1.0], "model_response": [["In which city was Andrew Johnson born?", "Nashville, TN || Nashville, TN"], ["Which country does Nashville, TN belong to?", "United States || United States"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.5078125, 0.99609375], "model_response": [["In which city was Andrew Johnson born?", "Greeneville, Tennessee || Greeneville, Tennessee"], ["Which country does Raleigh, NC belong to?", "United States || United States"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8984375, 1.0], "model_response": [["In which city was Andrew Johnson born?", "Greeneville, Tennessee || Greeneville, Tennessee"], ["Which country does Raleigh, NC belong to?", "United States || United States"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.357421875, 0.99609375], "model_response": [["In which city was Andrew Johnson born?", "Greeneville, Tennessee || Greeneville, Tennessee"], ["Which country does Raleigh, NC belong to?", "United States || United States"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.7596435546875, 0.9765625], "model_response": [["In which city was Andrew Johnson born?", "Raleigh, NC belongs to Canada. || Raleigh, NC"], ["Which country does Raleigh, NC belong to?", "United States || United States"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.7120513916015625, 1.0], "model_response": [["In which city was Andrew Johnson born?", "Raleigh, North Carolina || Raleigh, North Carolina"], ["Which country does Raleigh, NC belong to?", "United States || United States"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5527496337890625, 0.9921875], "model_response": [["In which city was Andrew Johnson born?", "Greeneville, TN || Greeneville, TN"], ["Which country does Raleigh, NC belong to?", "United States || United States"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [3, 1], "confidence": [0.83984375, 0.09250259399414062], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Pizza || Pizza"], ["What's the year when Russia the first time formally establish diplomatic relations with Pizza?", "1825 || 1825"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.16845703125, 0.7659912109375], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Ireland || Ireland"], ["What's the year when Russia the first time formally establish diplomatic relations with Ireland?", "1825 || 1825"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.77734375, 0.7744140625], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Finland || Finland"], ["What's the year when Russia the first time formally establish diplomatic relations with Finland?", "1895 || 1895"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.4805908203125, 0.12668609619140625], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Ireland || Ireland"], ["What's the year when Russia the first time formally establish diplomatic relations with Ireland?", "1837 || 1837"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.703125, 0.957489013671875], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Finland || Finland"], ["What's the year when Russia the first time formally establish diplomatic relations with Finland?", "1895 || 1895"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.77734375, 0.7744140625], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Finland || Finland"], ["What's the year when Russia the first time formally establish diplomatic relations with Finland?", "1895 || 1895"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.33203125, 1.0], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Norway || Norway"], ["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1825 || 1825"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.466796875, 0.6796875], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Norway || Norway"], ["What's the year when Russia the first time formally establish diplomatic relations with Norway?", "1814 || 1814"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.754852294921875, 0.8617401123046875], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Iceland || Iceland"], ["What's the year when Russia the first time formally establish diplomatic relations with Iceland?", "1875 || 1875"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.0888671875, 0.55859375], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Finland || Finland"], ["What's the year when Russia the first time formally establish diplomatic relations with Finland?", "1809 || 1809"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.25485992431640625, 0.9226531982421875], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Iceland || Iceland"], ["What's the year when Russia the first time formally establish diplomatic relations with Iceland?", "1875 || 1875"]]}, "mis_info_dict_light": {"answer_condition": [4, 3], "confidence": [0.6640625, 1.0], "model_response": [["Which country is the northernmost in the UTC+1 time zone?", "Iceland || Iceland"], ["What's the year when Russia the first time formally establish diplomatic relations with Iceland?", "1901 || 1901"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Who is the president / leader of USA in the year 1971?", "I'm sorry, I don't understand your question. || N/A"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.7265625, 0.96875], "model_response": [["Who is the president / leader of USA in the year 1971?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1908 || 1908"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.81640625], "model_response": [["Who is the president / leader of USA in the year 1971?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1908 || 1908"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of USA in the year 1971?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1913 || 1913"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of USA in the year 1971?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1913 || 1913"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.87890625], "model_response": [["Who is the president / leader of USA in the year 1971?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1913 || 1913"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of USA in the year 1971?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1908 || 1908"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Who is the president / leader of USA in the year 1971?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1908 || 1908"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["Who is the president / leader of USA in the year 1971?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1908 || 1908"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["Who is the president / leader of USA in the year 1971?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1908 || 1908"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 1.0], "model_response": [["Who is the president / leader of USA in the year 1971?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1913 || 1913"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.953125], "model_response": [["Who is the president / leader of USA in the year 1971?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1913 || 1913"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.06884765625, 1.0], "model_response": [["In which year was the Los Angeles Lakers founded?", "1960 || 1960"], ["Which city hosted the first Olympic Games in 1960?", "Rome || Rome"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.123046875, 1.0], "model_response": [["In which year was the Los Angeles Lakers founded?", "1960 || 1960"], ["Which city hosted the first Olympic Games in 1960?", "Rome || Rome"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.9375, 0.9921875], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which city hosted the first Olympic Games in 1947?", "London || London"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.8984375, 1.0], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which city hosted the first Olympic Games in 1947?", "London || London"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.365234375, 0.99609375], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which city hosted the first Olympic Games in 1947?", "London || London"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which city hosted the first Olympic Games in 1947?", "London || London"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.73046875, 0.81640625], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which city hosted the first Olympic Games in 1947?", "London || London"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.5, 0.71484375], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which city hosted the first Olympic Games in 1947?", "London || London"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.04638671875, 1.0], "model_response": [["In which year was the Los Angeles Lakers founded?", "1948 || 1948"], ["Which city hosted the first Olympic Games in 1948?", "London || London"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.765625, 0.81640625], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which city hosted the first Olympic Games in 1947?", "London || London"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.6875, 0.62109375], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which city hosted the first Olympic Games in 1947?", "London || London"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.8984375, 0.62109375], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Which city hosted the first Olympic Games in 1947?", "Los Angeles || Los Angeles"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.726474154740572], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of Russia\" || The National Anthem of Russia"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Sergeyevich Pushkin || Alexander Sergeyevich Pushkin"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.007329308398766443], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of Russia\" || The National Anthem of Russia"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Sergeyevich Borodin || Alexander Sergeyevich Borodin"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.11279296875], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\" (Russian: \u041f\u0435\u0441\u043d\u044f \u043e\u0431\u044a\u0435\u043a\u0442\u0438\u0432\u0430 \u0420\u043e\u0441\u0441\u0438\u0439\u0441\u043a\u043e\u0439 \u0424\u0435\u0434\u0435\u0440\u0430\u0446\u0438\u0438). || The National Anthem of Russia"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Pushkin || Alexander Pushkin"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.1712646484375, 0.99609375], "model_response": [["What is the national anthem of Russia?", "The national anthem of Russia is \"God Save the Tsar.\" || God Save the Tsar"], ["Who is the lyricist of \"God Save the Tsar\"?", "Alexander Pushkin || Alexander Pushkin"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.06193917989730835, 0.3046875], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is the \"Russia's March\" (also known as the \"March of the Russian Army\"). It was written by the Russian composer Alexander Borodin in 1812. || Russia's March"], ["Who is the lyricist of Russia's March?", "Pyotr Ilyich Tchaikovsky || Pyotr Ilyich Tchaikovsky"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.921875, 0.18045209435513243], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\" (Russian: \u0413\u043e\u0441\u0443\u0434\u0430\u0440\u0441\u0442\u0432\u0435\u043d\u043d\u044b\u0439 \u0433\u0438\u043c\u043d \u0420\u043e\u0441\u0441\u0438\u0439\u0441\u043a\u043e\u0439 \u0424\u0435\u0434\u0435\u0440\u0430\u0446\u0438\u0438). The lyrics were written by the poet Alexander Alexandrov, and the music was composed by the composer Sergei Vasilyevich Rachmaninov. || The National Anthem of Russia"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Sergeyevich Pushkin || Alexander Sergeyevich Pushkin"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.860687255859375, 0.020549297332763672], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\". || The National Anthem of the Russian Federation"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Alexandrov || Alexander Alexandrov"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.013985771516900058, 1.0], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"Russia, You Are Not Alone\" (Russian: \u0420\u043e\u0441\u0441\u0438\u044f, \u0442\u044b \u043d\u0435 \u043e\u0434\u043d\u0430). || Russia, You Are Not Alone"], ["Who is the lyricist of the song \"Russia, You Are Not Alone\"?", "Alexander Alexandrov || Alexander Alexandrov"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.517730712890625, 1.0], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\". || The National Anthem of the Russian Federation"], ["Who is the lyricist of the National Anthem of Russia?", "Vladimir Putin || Vladimir Putin"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.3177642822265625, 1.0], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The Star-Spangled Banner\" || The Star-Spangled Banner"], ["Who is the lyricist of The Star-Spangled Banner?", "Francis Scott Key || Francis Scott Key"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.6986083984375, 0.7730428799986839], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The National Anthem of the Russian Federation\" || The National Anthem of the Russian Federation"], ["Who is the lyricist of the National Anthem of Russia?", "Alexander Sergeyevich Pushkin || Alexander Sergeyevich Pushkin"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.011377811431884766, 1.0], "model_response": [["What is the national anthem of Russia?", "The National Anthem of Russia is \"The Star-Spangled Banner\" || The Star-Spangled Banner"], ["Who is the lyricist of The Star-Spangled Banner?", "Francis Scott Key || Francis Scott Key"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when Pakistan the first time formally establish diplomatic relations with China?", "1954 || 1954"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when Pakistan the first time formally establish diplomatic relations with China?", "1954 || 1954"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.87109375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when Pakistan the first time formally establish diplomatic relations with China?", "1954 || 1954"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.04345703125], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when Pakistan the first time formally establish diplomatic relations with China?", "1960 || 1960"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.07177734375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when Pakistan the first time formally establish diplomatic relations with China?", "1960 || 1960"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.15625], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when Pakistan the first time formally establish diplomatic relations with China?", "1960 || 1960"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when Pakistan the first time formally establish diplomatic relations with China?", "1954 || 1954"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when Pakistan the first time formally establish diplomatic relations with China?", "1954 || 1954"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9296875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when Pakistan the first time formally establish diplomatic relations with China?", "1954 || 1954"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when Pakistan the first time formally establish diplomatic relations with China?", "1962 || 1962"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.1494140625], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when Pakistan the first time formally establish diplomatic relations with China?", "1960 || 1960"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.298828125], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["What's the year when Pakistan the first time formally establish diplomatic relations with China?", "1971 || 1971"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.80859375, 0.9765625], "model_response": [["In which year was Chiang Kai-shek born?", "1887 || 1887"], ["Who was the US president in the year 1887?", "Grover Cleveland || Grover Cleveland"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.62109375, 0.08667182922363281], "model_response": [["In which year was Chiang Kai-shek born?", "1907 || 1907"], ["Who was the US president in the year 1907?", "William Howard Taft || William Howard Taft"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["In which year was Chiang Kai-shek born?", "1901 || 1901"], ["Who was the US president in the year 1901?", "William McKinley || William McKinley"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.25817108154296875, 0.921875], "model_response": [["In which year was Chiang Kai-shek born?", "1907 || 1907"], ["Who was the US president in the year 1907?", "Theodore Roosevelt || Theodore Roosevelt"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.957489013671875, 0.9140625], "model_response": [["In which year was Chiang Kai-shek born?", "1907 || 1907"], ["Who was the US president in the year 1907?", "Theodore Roosevelt || Theodore Roosevelt"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9922027587890625, 0.038285255432128906], "model_response": [["In which year was Chiang Kai-shek born?", "1907 || 1907"], ["Who was the US president in the year 1907?", "William McKinley || William McKinley"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.609375, 0.9921875], "model_response": [["In which year was Chiang Kai-shek born?", "1887 || 1887"], ["Who was the US president in the year 1887?", "Grover Cleveland || Grover Cleveland"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.006056785583496094, 0.9921875], "model_response": [["In which year was Chiang Kai-shek born?", "1901 || 1901"], ["Who was the US president in the year 1901?", "William McKinley || William McKinley"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9922027587890625, 0.9609375], "model_response": [["In which year was Chiang Kai-shek born?", "1907 || 1907"], ["Who was the US president in the year 1907?", "Theodore Roosevelt || Theodore Roosevelt"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.9375, 0.21371841430664062], "model_response": [["In which year was Chiang Kai-shek born?", "1907 || 1907"], ["Who was the US president in the year 1907?", "William Howard Taft || William Howard Taft"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 0.432586669921875], "model_response": [["In which year was Chiang Kai-shek born?", "1907 || 1907"], ["Who was the US president in the year 1907?", "William Howard Taft || William Howard Taft"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.87890625, 0.78515625], "model_response": [["In which year was Chiang Kai-shek born?", "1907 || 1907"], ["Who was the US president in the year 1907?", "Theodore Roosevelt || Theodore Roosevelt"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9375], "model_response": [["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"], ["In which year was Beijing University founded?", "1906 || 1906"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.91796875], "model_response": [["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"], ["In which year was Beijing University founded?", "1906 || 1906"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6171875, 0.9765625], "model_response": [["What is the name of the largest university/college in Beijing by area?", "Beijing University (\u5317\u4eac\u5927\u5b66) || Beijing University"], ["In which year was Beijing University founded?", "1906 || 1906"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.2216796875], "model_response": [["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"], ["In which year was Beijing University founded?", "1912 || 1912"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest university/college in Beijing by area?", "Tsinghua University || Tsinghua University"], ["In which year was Tsinghua University founded?", "1911 || 1911"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.470703125, 0.17779159545898438], "model_response": [["What is the name of the largest university/college in Beijing by area?", "Shanghai University || Shanghai University"], ["In which year was Shanghai University founded?", "1912 || 1912"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"], ["In which year was Beijing University founded?", "1906 || 1906"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.7276153564453125], "model_response": [["What is the name of the largest university/college in Beijing by area?", "Beijing University || Beijing University"], ["In which year was Beijing University founded?", "1906 || 1906"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.81640625], "model_response": [["What is the name of the largest university/college in Beijing by area?", "Beijing University (\u5317\u4eac\u5927\u5b66) || Beijing University"], ["In which year was Beijing University founded?", "1906 || 1906"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest university/college in Beijing by area?", "Beijing University (\u5317\u4eac\u5927\u5b66) || Beijing University"], ["In which year was Beijing University founded?", "1906 || 1906"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.980560302734375], "model_response": [["What is the name of the largest university/college in Beijing by area?", "Beijing University is the largest university/college in Beijing by area. || Beijing University"], ["In which year was Beijing University founded?", "1906 || 1906"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 1.0], "model_response": [["What is the name of the largest university/college in Beijing by area?", "Beijing University is the largest university/college in Beijing by area. || Beijing University"], ["In which year was Beijing University founded?", "1898 || 1898"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.87890625], "model_response": [["Who is the headmaster of Princeton University in the year 1906?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Princeton University || Princeton University"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9140625, 0.9921875], "model_response": [["Who is the headmaster of Princeton University in the year 1906?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Princeton University || Princeton University"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [1.0, 0.91796875], "model_response": [["Who is the headmaster of Princeton University in the year 1906?", "Thomas Jefferson || Thomas Jefferson"], ["Which university or college did Thomas Jefferson attend as a graduate student?", "Princeton University || Princeton University"]]}, "mis_info_dict_severe": {"answer_condition": [3, 1], "confidence": [1.0, 0.953125], "model_response": [["Who is the headmaster of Princeton University in the year 1906?", "Pizza || Pizza"], ["Which university or college did Pizza attend as a graduate student?", "Princeton University || Princeton University"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.156646728515625, 0.941802978515625], "model_response": [["Who is the headmaster of Princeton University in the year 1906?", "Robert Goelet || Robert Goelet"], ["Which university or college did Robert Goelet attend as a graduate student?", "Princeton University || Princeton University"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 3], "confidence": [0.99609375, 0.9921875], "model_response": [["Who is the headmaster of Princeton University in the year 1906?", "Charles W. Eliot is the headmaster of Princeton University in the year 1906. || Charles W. Eliot"], ["Which university or college did Charles W. Eliot attend as a graduate student?", "Harvard University || Harvard University"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.953125], "model_response": [["Who is the headmaster of Princeton University in the year 1906?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Princeton University || Princeton University"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.66796875, 0.9921875], "model_response": [["Who is the headmaster of Princeton University in the year 1906?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Princeton University || Princeton University"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.9921875], "model_response": [["Who is the headmaster of Princeton University in the year 1906?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Princeton University || Princeton University"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.1376953125, 1.0], "model_response": [["Who is the headmaster of Princeton University in the year 1906?", "Woodrow Wilson || Woodrow Wilson"], ["Which university or college did Woodrow Wilson attend as a graduate student?", "Princeton University || Princeton University"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.005360710434615612, 1.0], "model_response": [["Who is the headmaster of Princeton University in the year 1906?", "John Witherspoon || John Witherspoon"], ["Which university or college did John Witherspoon attend as a graduate student?", "Princeton University || Princeton University"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.01015353511320427, 1.0], "model_response": [["Who is the headmaster of Princeton University in the year 1906?", "Charles S. Fairchild || Charles S. Fairchild"], ["Which university or college did Charles S. Fairchild attend as a graduate student?", "Princeton University || Princeton University"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.9609375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.9921875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.96875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.984375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.984375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.984375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.9609375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.98828125], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1949 || 1949"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.0919189453125], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "15th century || 15th century"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.94140625], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["In which year was China founded or became independent?", "1911 || 1911"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "It is not possible to determine the exact year when Australia first formally established diplomatic relations with Ireland. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 1.0], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1974 || 1974"], ["Which film won the Oscar for Outstanding Picture in 1974, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.625, 0.99609375], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.396484375, 0.99609375], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.96484375], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1960 || 1960"], ["Which film won the Oscar for Outstanding Picture in 1960, being the first one in alphabetical order?", "Ben-Hur || Ben-Hur"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.9084320068359375, 0.7159423828125], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1922 || 1922"], ["Which film won the Oscar for Outstanding Picture in 1922, being the first one in alphabetical order?", "Wings || Wings"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.921875, 0.953125], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.90625, 0.85345458984375], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.6821746826171875, 0.248046875], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1922 || 1922"], ["Which film won the Oscar for Outstanding Picture in 1922, being the first one in alphabetical order?", "The Sting || The Sting"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.3575592041015625, 0.1877610683441162], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1922 || 1922"], ["Which film won the Oscar for Outstanding Picture in 1922, being the first one in alphabetical order?", "The New World || The New World"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.90234375, 0.40625], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1973 || 1973"], ["Which film won the Oscar for Outstanding Picture in 1973, being the first one in alphabetical order?", "The Stunt Man || The Stunt Man"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.46417236328125, 0.3076171875], "model_response": [["What's the year when Australia the first time formally establish diplomatic relations with Ireland?", "1922 || 1922"], ["Which film won the Oscar for Outstanding Picture in 1922, being the first one in alphabetical order?", "Wings || Wings"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.72265625, 1.0], "model_response": [["What is the official or most commonly spoken language in Iraq?", "Arabic || Arabic"], ["What is the ISO 639-1 code for the Arabic language?", "ar || ar"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Iraq?", "Arabic || Arabic"], ["What is the ISO 639-1 code for the Arabic language?", "ar || ar"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["What is the official or most commonly spoken language in Iraq?", "Arabic || Arabic"], ["What is the ISO 639-1 code for the Arabic language?", "ar || ar"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Iraq?", "Arabic || Arabic"], ["What is the ISO 639-1 code for the Arabic language?", "ar || ar"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 1.0], "model_response": [["What is the official or most commonly spoken language in Iraq?", "Arabic || Arabic"], ["What is the ISO 639-1 code for the Arabic language?", "ar || ar"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Iraq?", "Arabic || Arabic"], ["What is the ISO 639-1 code for the Arabic language?", "ar || ar"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Iraq?", "Arabic || Arabic"], ["What is the ISO 639-1 code for the Arabic language?", "ar || ar"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Iraq?", "Arabic || Arabic"], ["What is the ISO 639-1 code for the Arabic language?", "ar || ar"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.73046875], "model_response": [["What is the official or most commonly spoken language in Iraq?", "Arabic || Arabic"], ["What is the ISO 639-1 code for the Arabic language?", "ar || ar"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.765625], "model_response": [["What is the official or most commonly spoken language in Iraq?", "Arabic || Arabic"], ["What is the ISO 639-1 code for the Arabic language?", "arabic || arabic"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.90234375], "model_response": [["What is the official or most commonly spoken language in Iraq?", "Arabic || Arabic"], ["What is the ISO 639-1 code for the Arabic language?", "Pizza || Pizza"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Iraq?", "Arabic || Arabic"], ["What is the ISO 639-1 code for the Arabic language?", "ar || ar"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Hours || The Hours"], ["Which film company produced \"The Hours\"?", "Miramax || Miramax"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Irishman || The Irishman"], ["Which film company produced \"The Irishman\"?", "Netflix || Netflix"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.92333984375, 0.80859375], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "Chocolate Chip Cookies || Chocolate Chip Cookies"], ["Which film company produced \"Chocolate Chip Cookies\"?", "Universal Pictures || Universal Pictures"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 4], "confidence": [0.87890625, 0.45654296875], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "Sunflowers || Sunflowers"], ["Which film company produced \"Sunflowers\"?", "Sony Pictures Entertainment || Sony Pictures Entertainment"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.83770751953125, 0.59197998046875], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"], ["Which film company produced \"The Shape of Water\"?", "Guillermo del Toro Productions || Guillermo del Toro Productions"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.91961669921875, 0.5939483642578125], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"], ["Which film company produced \"The Shape of Water\"?", "Guillermo del Toro Productions || Guillermo del Toro Productions"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Hours || The Hours"], ["Which film company produced \"The Hours\"?", "Miramax || Miramax"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.9766387939453125, 1.0], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Hours || The Hours"], ["Which film company produced \"The Hours\"?", "Paramount Pictures || Paramount Pictures"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.8686065673828125, 0.99609375], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"], ["Which film company produced \"The Shape of Water\"?", "Fox Searchlight Pictures || Fox Searchlight Pictures"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.8686065673828125, 0.99609375], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"], ["Which film company produced \"The Shape of Water\"?", "Fox Searchlight Pictures || Fox Searchlight Pictures"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9498291015625, 0.984375], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"], ["Which film company produced \"The Shape of Water\"?", "Fox Searchlight Pictures || Fox Searchlight Pictures"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.8936004638671875, 0.99609375], "model_response": [["In this year's Oscars, which film is the first one in alphabetical order for the Outstanding Pictures category?", "The Shape of Water || The Shape of Water"], ["Which film company produced \"The Shape of Water\"?", "Fox Searchlight Pictures || Fox Searchlight Pictures"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["Who is the CEO of MGM in the year 1980?", "Barry Diller || Barry Diller"], ["In which city was Barry Diller born?", "New York City || New York City"]]}, "mis_info_dict_severe": {"answer_condition": [3, 1], "confidence": [0.887542724609375, 0.237457275390625], "model_response": [["Who is the CEO of MGM in the year 1980?", "Chocolate cake || Chocolate cake"], ["In which city was chocolate cake born?", "New York City || New York City"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.39056396484375, 0.265625], "model_response": [["Who is the CEO of MGM in the year 1980?", "Peter Guber || Peter Guber"], ["In which city was Peter Guber born?", "New York City || New York City"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.92578125], "model_response": [["Who is the CEO of MGM in the year 1980?", "Michael Eisner || Michael Eisner"], ["In which city was Michael Eisner born?", "Los Angeles || Los Angeles"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.05278587341308594, 1.0], "model_response": [["Who is the CEO of MGM in the year 1980?", "Frank Sinatra || Frank Sinatra"], ["In which city was Frank Sinatra born?", "Las Vegas || Las Vegas"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.4765625, 0.78515625], "model_response": [["Who is the CEO of MGM in the year 1980?", "Peter Guber || Peter Guber"], ["In which city was Peter Guber born?", "Los Angeles || Los Angeles"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.94140625, 1.0], "model_response": [["Who is the CEO of MGM in the year 1980?", "Barry Diller || Barry Diller"], ["In which city was Barry Diller born?", "New York City || New York City"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.04717826843261719], "model_response": [["Who is the CEO of MGM in the year 1980?", "Barry Diller || Barry Diller"], ["In which city was Barry Diller born?", "New York City || New York City"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.0847015380859375, 0.953125], "model_response": [["Who is the CEO of MGM in the year 1980?", "Harvey Weinstein || Harvey Weinstein"], ["In which city was Harvey Weinstein born?", "New York City || New York City"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.466796875, 0.259765625], "model_response": [["Who is the CEO of MGM in the year 1980?", "Peter Guber || Peter Guber"], ["In which city was Peter Guber born?", "New York City || New York City"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.16600549221038818, 1.0], "model_response": [["Who is the CEO of MGM in the year 1980?", "Mario Puzo || Mario Puzo"], ["In which city was Mario Puzo born?", "New York City || New York City"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.458984375, 0.91015625], "model_response": [["Who is the CEO of MGM in the year 1980?", "Peter Guber || Peter Guber"], ["In which city was Peter Guber born?", "Los Angeles || Los Angeles"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.609375], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.375], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.498046875], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "Apocalypse Now || Apocalypse Now"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.498046875], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "Apocalypse Now || Apocalypse Now"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.498046875], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "Apocalypse Now || Apocalypse Now"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.94921875, 0.98828125], "model_response": [["Which is the first year does China invade Vietnam?", "1965 || 1965"], ["Which film won the Oscar for Outstanding Picture in 1965, being the first one in alphabetical order?", "The Sound of Music || The Sound of Music"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.98828125], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "Apocalypse Now || Apocalypse Now"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "Annie Hall || Annie Hall"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.7219308614730835], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "Chocolate Chip Cookies || Chocolate Chip Cookies"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.44140625], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "Sunflowers || Sunflowers"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.94921875], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "Apocalypse Now || Apocalypse Now"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.053466796875, 1.0], "model_response": [["Which city in Europe has the largest population?", "London || London"], ["Which country does London belong to?", "United Kingdom || United Kingdom"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.91796875, 1.0], "model_response": [["Which city in Europe has the largest population?", "London || London"], ["Which country does London belong to?", "United Kingdom || United Kingdom"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.68359375, 0.99609375], "model_response": [["Which city in Europe has the largest population?", "London || London"], ["Which country does London belong to?", "United Kingdom || United Kingdom"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9453125, 1.0], "model_response": [["Which city in Europe has the largest population?", "Moscow || Moscow"], ["Which country does Moscow belong to?", "Russia || Russia"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Which city in Europe has the largest population?", "Moscow || Moscow"], ["Which country does Moscow belong to?", "Russia || Russia"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.87890625, 1.0], "model_response": [["Which city in Europe has the largest population?", "Moscow || Moscow"], ["Which country does Moscow belong to?", "Russia || Russia"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.267578125, 1.0], "model_response": [["Which city in Europe has the largest population?", "London || London"], ["Which country does London belong to?", "United Kingdom || United Kingdom"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.76953125, 1.0], "model_response": [["Which city in Europe has the largest population?", "Moscow || Moscow"], ["Which country does Moscow belong to?", "Russia || Russia"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.376953125, 1.0], "model_response": [["Which city in Europe has the largest population?", "Moscow, Russia || Moscow"], ["Which country does Moscow belong to?", "Russia || Russia"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.90234375, 1.0], "model_response": [["Which city in Europe has the largest population?", "Moscow || Moscow"], ["Which country does Moscow belong to?", "Russia || Russia"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.81640625, 1.0], "model_response": [["Which city in Europe has the largest population?", "Moscow || Moscow"], ["Which country does Moscow belong to?", "Russia || Russia"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.61328125, 1.0], "model_response": [["Which city in Europe has the largest population?", "Moscow || Moscow"], ["Which country does Moscow belong to?", "Russia || Russia"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.734375, 0.3001270294189453], "model_response": [["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1904?", "Dr. William Rainey Harper || Dr. William Rainey Harper"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.91796875, 0.08022672699098621], "model_response": [["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1904?", "Dr. William H. Welch || Dr. William H. Welch"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.7276153564453125], "model_response": [["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1904?", "Charles William Eliot || Charles William Eliot"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.9689788818359375, 0.49610137939453125], "model_response": [["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1904?", "Charles William Eliot || Charles William Eliot"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.86004638671875, 0.94195556640625], "model_response": [["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1904?", "Charles William Eliot || Charles William Eliot"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.48828125, 0.008588629667428904], "model_response": [["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "New York University || New York University"], ["Who is the headmaster of New York University in the year 1904?", "Dr. John S. Tilden || Dr. John S. Tilden"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.78125, 0.443359375], "model_response": [["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1904?", "Dr. William R. Shepherd || Dr. William R. Shepherd"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.6015625, 1.0], "model_response": [["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1904?", "John Jay || John Jay"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.93359375, 0.0986328125], "model_response": [["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1904?", "Harvard University || Harvard University"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.56640625, 0.84490966796875], "model_response": [["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1904?", "Charles S. Shattuck || Charles S. Shattuck"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [0.80078125, 0.23308563232421875], "model_response": [["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1904?", "Charles W. Eliot || Charles W. Eliot"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.2021484375, 0.00848994960723104], "model_response": [["Which university or college did Franklin D. Roosevelt attend as a graduate student?", "New York University || New York University"], ["Who is the headmaster of New York University in the year 1904?", "Dr. William H. Harkness || Dr. William H. Harkness"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.3671875], "model_response": [["Which film company produced \"The French Connection\"?", "Paramount Pictures || Paramount Pictures"], ["In which year was Paramount Pictures founded?", "1917 || 1917"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.9609375, 0.7890625], "model_response": [["Which film company produced \"The French Connection\"?", "Paramount Pictures || Paramount Pictures"], ["In which year was Paramount Pictures founded?", "1922 || 1922"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9922027587890625, 0.71484375], "model_response": [["Which film company produced \"The French Connection\"?", "Paramount Pictures || Paramount Pictures"], ["In which year was Paramount Pictures founded?", "1922 || 1922"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [1.0, 0.00909423828125], "model_response": [["Which film company produced \"The French Connection\"?", "Universal Pictures || Universal Pictures"], ["In which year was Universal Pictures founded?", "1917 || 1917"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.43470001220703125, 0.99609375], "model_response": [["Which film company produced \"The French Connection\"?", "Universal Pictures || Universal Pictures"], ["In which year was Universal Pictures founded?", "1931 || 1931"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.41796875, 0.75], "model_response": [["Which film company produced \"The French Connection\"?", "Pizza Hut || Pizza Hut"], ["In which year was Pizza Hut founded?", "1958 || 1958"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which film company produced \"The French Connection\"?", "Paramount Pictures || Paramount Pictures"], ["In which year was Paramount Pictures founded?", "1917 || 1917"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which film company produced \"The French Connection\"?", "Paramount Pictures || Paramount Pictures"], ["In which year was Paramount Pictures founded?", "1925 || 1925"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.06005859375], "model_response": [["Which film company produced \"The French Connection\"?", "Paramount Pictures || Paramount Pictures"], ["In which year was Paramount Pictures founded?", "1928 || 1928"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [0.92578125, 1.0], "model_response": [["Which film company produced \"The French Connection\"?", "Paramount Pictures || Paramount Pictures"], ["In which year was Paramount Pictures founded?", "1922 || 1922"]]}, "hall_sbj_dict_light": {"answer_condition": [3, 1], "confidence": [1.0, 1.0], "model_response": [["Which film company produced \"The French Connection\"?", "Warner Bros. Pictures || Warner Bros. Pictures"], ["In which year was Warner Bros. Pictures founded?", "1917 || 1917"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.953125, 1.0], "model_response": [["Which film company produced \"The French Connection\"?", "Paramount Pictures || Paramount Pictures"], ["In which year was Paramount Pictures founded?", "1917 || 1917"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9375, 1.0], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["Who is D. W. Griffith married to?", "Lillian Gish || Lillian Gish"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.77734375, 1.0], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["Who is D. W. Griffith married to?", "Lillian Gish || Lillian Gish"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["Who is D. W. Griffith married to?", "Lillian Gish || Lillian Gish"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["Who is D. W. Griffith married to?", "Lillian Gish || Lillian Gish"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.65625], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "Frank Capra || Frank Capra"], ["Who is Frank Capra married to?", "Jane Wyman || Jane Wyman"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.03862953186035156, 0.047119140625], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "Milos Forman || Milos Forman"], ["Who is Milos Forman married to?", "He was married to the actress and singer, Juliette Binoche. || Juliette Binoche"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.5390625], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["Who is D. W. Griffith married to?", "Lillian Gish || Lillian Gish"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.99609375], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["Who is D. W. Griffith married to?", "Lillian Gish || Lillian Gish"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["Who is D. W. Griffith married to?", "Lillian Gish || Lillian Gish"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.90234375, 1.0], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["Who is D. W. Griffith married to?", "Pizza || Pizza"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.5, 1.0], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "D. W. Griffith || D. W. Griffith"], ["Who is D. W. Griffith married to?", "Mary Pickford || Mary Pickford"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.193115234375], "model_response": [["Who is the director of the film \"The Best Years of Our Lives\"?", "William Wyler || William Wyler"], ["Who is D. W. Griffith married to?", "Olive Thomas || Olive Thomas"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.05517578125, 0.8125], "model_response": [["In which year was Canada founded or became independent?", "1931 || 1931"], ["Which team won this year's NBA championship in 1931?", "The Boston Celtics || Boston Celtics"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.83984375], "model_response": [["In which year was Canada founded or became independent?", "Canada became independent in 1867. || 1867"], ["Which team won this year's NBA championship in 1931?", "The Boston Celtics || Boston Celtics"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.7578125], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Which team won this year's NBA championship in 1931?", "The Boston Celtics || Boston Celtics"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.72265625], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Which team won this year's NBA championship in 1931?", "The Boston Celtics won the NBA championship in the year 1931. || Boston Celtics"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.4931488037109375, 0.48248291015625], "model_response": [["In which year was Canada founded or became independent?", "1763 || 1763"], ["Which team won the NBA championship in 1763?", "Boston Celtics || Boston Celtics"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.11089324951171875, 0.396484375], "model_response": [["In which year was Canada founded or became independent?", "1534 || 1534"], ["Which team won this year's NBA championship in 1534?", "The Boston Celtics || Boston Celtics"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.6575775146484375], "model_response": [["In which year was Canada founded or became independent?", "Canada was founded in 1867. || 1867"], ["Which team won this year's NBA championship in 1931?", "The Chicago Stags || Chicago Stags"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.2333984375, 0.90625], "model_response": [["In which year was Canada founded or became independent?", "1931 || 1931"], ["Which team won this year's NBA championship in 1931?", "The Boston Celtics || Boston Celtics"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.3984375, 0.8676910400390625], "model_response": [["In which year was Canada founded or became independent?", "1931 || 1931"], ["Which team won this year's NBA championship in 1931?", "The Boston Celtics || Boston Celtics"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.1474609375, 0.375], "model_response": [["In which year was Canada founded or became independent?", "1867 || 1867"], ["Which team won this year's NBA championship in 1931?", "The Boston Celtics || Boston Celtics"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.73046875, 1.0], "model_response": [["In which year was Canada founded or became independent?", "Canada became independent in 1867. || 1867"], ["Which team won this year's NBA championship in 1931?", "The Chicago Stags || Chicago Stags"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.8716428279876709], "model_response": [["In which year was Canada founded or became independent?", "In 1867, Canada became a country independent of the United Kingdom. || 1867"], ["Which team won the NBA championship in 1867?", "The Boston Red Caps || Boston Red Caps"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.26953125], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "fi || fi"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.93359375, 0.62109375], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "Fin || Fin"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.984375, 0.953125], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "fi || fi"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.94140625, 0.81640625], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "fi || fi"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.93359375, 0.81640625], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "fi || fi"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.84765625, 0.376953125], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "Fin || Fin"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.498046875, 1.0], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "Fin || Fin"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.921875, 0.609375], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "fi || fi"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.71484375, 1.0], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "Fin || Fin"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 0.384765625], "model_response": [["What is the official or most commonly spoken language in Finland?", "Finnish || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "Finnish || Finnish"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Finland?", "The official language of Finland is Finnish. However, Swedish is also widely spoken in the country. || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "Fin || Fin"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Finland?", "The official language of Finland is Finnish. However, Finnish is not the only language spoken in Finland. The Sami languages are also spoken in some parts of the country. || Finnish"], ["What is the ISO 639-1 code for the Finnish language?", "Finl || Finl"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.660003662109375, 0.921875], "model_response": [["In the Oscar Outstanding Pictures category, which film from 1779 is the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["What is the name of the theme song for \"The Deer Hunter\"?", "\"The Deer Hunter\" || The Deer Hunter"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.31038665771484375, 0.87591552734375], "model_response": [["In the Oscar Outstanding Pictures category, which film from 1779 is the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["What is the name of the theme song for \"The Deer Hunter\"?", "\"The Deer Hunter\" || The Deer Hunter"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.16793060302734375, 0.10133450775174424], "model_response": [["In the Oscar Outstanding Pictures category, which film from 1779 is the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["What is the name of the theme song for \"The Deer Hunter\"?", "\"The Deer Hunter\" (song) || \"The Deer Hunter\" (song)"]]}, "mis_info_dict_severe": {"answer_condition": [3, -1], "confidence": [1.0, -1], "model_response": [["In the Oscar Outstanding Pictures category, which film from 1779 is the first one in alphabetical order?", "Chocolate chip cookies || Chocolate chip cookies"], ["What is the name of the theme song for \"Chocolate chip cookies\"?", "I'm sorry, I don't have that information. Can you please provide more context or details? || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [3, 4], "confidence": [0.4140625, 0.43087005615234375], "model_response": [["In the Oscar Outstanding Pictures category, which film from 1779 is the first one in alphabetical order?", "Sunflowers || Sunflowers"], ["What is the name of the theme song for \"Sunflowers\"?", "\"Sunflowers\" || Sunflowers"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.49609375, 0.95745849609375], "model_response": [["In the Oscar Outstanding Pictures category, which film from 1779 is the first one in alphabetical order?", "Amadeus || Amadeus"], ["What is the name of the theme song for \"Amadeus\"?", "\"My Strongest Suit\" || My Strongest Suit"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.8599090576171875, 0.98046875], "model_response": [["In the Oscar Outstanding Pictures category, which film from 1779 is the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["What is the name of the theme song for \"The Deer Hunter\"?", "\"The Deer Hunter\" || The Deer Hunter"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.72088623046875, 0.9921875], "model_response": [["In the Oscar Outstanding Pictures category, which film from 1779 is the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["What is the name of the theme song for \"The Deer Hunter\"?", "\"The Deer Hunter\" || The Deer Hunter"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.796630859375, 1.0], "model_response": [["In the Oscar Outstanding Pictures category, which film from 1779 is the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["What is the name of the theme song for \"The Deer Hunter\"?", "\"The Hunter's Melody\" || The Hunter's Melody"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.809326171875, 1.0], "model_response": [["In the Oscar Outstanding Pictures category, which film from 1779 is the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"], ["What is the name of the theme song for \"The Deer Hunter\"?", "\"Pizza\" || Pizza"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.3836921453475952, 0.33451080322265625], "model_response": [["In the Oscar Outstanding Pictures category, which film from 1779 is the first one in alphabetical order?", "The first film in alphabetical order in the Oscar Outstanding Pictures category from 1779 is \"The Frog Prince\" || The Frog Prince"], ["What is the name of the theme song for \"The Frog Prince\"?", "Once Upon a Dream || Once Upon a Dream"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.0003619343042373657, 0.96875], "model_response": [["In the Oscar Outstanding Pictures category, which film from 1779 is the first one in alphabetical order?", "The first film in alphabetical order in the Oscar Outstanding Pictures category from 1779 is \"Adolphe\", which was directed by Georges Melies. || Adolphe"], ["What is the name of the theme song for \"Adolphe\"?", "\"Adolphe\" || Adolphe"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.498046875], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.70703125], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.71484375], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.84375, 0.57421875], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.498046875], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.94921875, 0.98828125], "model_response": [["Which is the first year does China invade Vietnam?", "1965 || 1965"], ["Which film won the Oscar for Outstanding Picture in 1965, being the first one in alphabetical order?", "The Sound of Music || The Sound of Music"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.72265625], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "The Deer Hunter || The Deer Hunter"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "Annie Hall || Annie Hall"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.33203125], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "Apocalypse Now || Apocalypse Now"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.72265625], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "Apocalypse Now || Apocalypse Now"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.9765625], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "Apocalypse Now || Apocalypse Now"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.692138671875], "model_response": [["Which is the first year does China invade Vietnam?", "1979 || 1979"], ["Which film won the Oscar for Outstanding Picture in 1979, being the first one in alphabetical order?", "Pineapple (film) || Pineapple"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5868405103683472, 0.6602485179901123], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9161262512207031, 0.6771236658096313], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.6010406017303467, 0.4536895751953125], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.8439903259277344, 0.010622687637805939], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Tessin (1772-1810) || Carl Gustaf Tessin"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.467254638671875, 0.31479448080062866], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["Who is the president / leader of Finland in the year 1814?", "Carl Johan von Eckerman || Carl Johan von Eckerman"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.9379416704177856, 0.21419048309326172], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustav Reuter || Carl Gustav Reuter"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9013500213623047, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.6395056843757629, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.07072702050209045, 0.8094601146876812], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Sweden || Finland and Sweden"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.6826298236846924, 0.8871089480817318], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Who is the president / leader of Finland in the year 1814?", "Carl Gustaf Mannerheim || Carl Gustaf Mannerheim"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.5106571316719055, 1.0], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia are the countries that share a border with Norway to the east. || Finland and Russia"], ["Who is the president / leader of Finland in the year 1814?", "Alexander I || Alexander I"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.4119873046875, 0.80859375], "model_response": [["Which countries to the east share a border with Norway?", "Finland and Russia || Finland and Russia"], ["Who is the president / leader of Finland in the year 1814?", "Chocolate cake || Chocolate cake"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.265625, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9027099609375, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1867 || 1867"], ["Who was the US president in the year 1867?", "Andrew Johnson || Andrew Johnson"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.50018310546875, 0.87890625], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1783 || 1783"], ["Who was the US president in the year 1783?", "John Adams || John Adams"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.59307861328125, 0.87890625], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1783 || 1783"], ["Who was the US president in the year 1783?", "George Washington || George Washington"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.73046875], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 1.0], "model_response": [["What's the year when Canada the first time formally establish diplomatic relations with United States?", "1917 || 1917"], ["Who was the US president in the year 1917?", "Woodrow Wilson || Woodrow Wilson"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["Who is the headmaster of Columbia University in the year 1948?", "I'm sorry, I cannot answer that question as it is not relevant to the given information. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.9609375, 1.0], "model_response": [["Who is the headmaster of Columbia University in the year 1948?", "Robert H. Goddard || Robert H. Goddard"], ["In which year was Robert H. Goddard born?", "1876 || 1876"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.99609375], "model_response": [["Who is the headmaster of Columbia University in the year 1948?", "Robert H. Goddard || Robert H. Goddard"], ["In which year was Robert H. Goddard born?", "1876 || 1876"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.99609375], "model_response": [["Who is the headmaster of Columbia University in the year 1948?", "John F. Kennedy || John F. Kennedy"], ["In which year was John F. Kennedy born?", "1917 || 1917"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.07245133817195892, 0.9921875], "model_response": [["Who is the headmaster of Columbia University in the year 1948?", "Dr. James B. Conant || Dr. James B. Conant"], ["In which year was Dr. James B. Conant born?", "1877 || 1877"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.99609375, 0.04638671875], "model_response": [["Who is the headmaster of Columbia University in the year 1948?", "James Bryant Conant || James Bryant Conant"], ["In which year was James Bryant Conant born?", "1877 || 1877"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [4, 1], "confidence": [0.006855376996099949, 1.0], "model_response": [["Who is the headmaster of Columbia University in the year 1948?", "Dr. Franklin D. Roosevelt || Dr. Franklin D. Roosevelt"], ["In which year was Dr. Franklin D. Roosevelt born?", "1882 || 1882"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.057504381984472275, 0.1368255615234375], "model_response": [["Who is the headmaster of Columbia University in the year 1948?", "Dr. James E. Christy || Dr. James E. Christy"], ["In which year was Dr. James E. Christy born?", "1899 || 1899"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.3676021099090576, 0.921875], "model_response": [["Who is the headmaster of Columbia University in the year 1948?", "Dr. James B. Conant || Dr. James B. Conant"], ["In which year was Dr. James B. Conant born?", "1877 || 1877"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.10142651200294495, 1.0], "model_response": [["Who is the headmaster of Columbia University in the year 1948?", "Dr. Robert Goddard || Dr. Robert Goddard"], ["In which year was Dr. Robert Goddard born?", "1876 || 1876"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.36798155307769775, 0.921875], "model_response": [["Who is the headmaster of Columbia University in the year 1948?", "Dr. James B. Conant || Dr. James B. Conant"], ["In which year was Dr. James B. Conant born?", "1877 || 1877"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.0013045510331721744, 0.2259674072265625], "model_response": [["Who is the headmaster of Columbia University in the year 1948?", "Dr. Nathan S. Soper || Dr. Nathan S. Soper"], ["In which year was Dr. Nathan S. Soper born?", "1889 || 1889"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.953125, 0.953125], "model_response": [["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1908 || 1908"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 0.5], "model_response": [["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1908 || 1908"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.87890625, 0.96875], "model_response": [["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1913 || 1913"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.99609375, 1.0], "model_response": [["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1913 || 1913"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.96484375], "model_response": [["Who was the US president in 1973?", "John F. Kennedy || John F. Kennedy"], ["In which year was John F. Kennedy born?", "1917 || 1917"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1908 || 1908"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 1.0], "model_response": [["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1908 || 1908"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.953125, 0.98046875], "model_response": [["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1908 || 1908"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.73046875, 0.376953125], "model_response": [["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1908 || 1908"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 0.953125], "model_response": [["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1908 || 1908"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["Who was the US president in 1973?", "Richard Nixon || Richard Nixon"], ["In which year was Richard Nixon born?", "1908 || 1908"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.37548065185546875, 0.70538330078125], "model_response": [["Who was the US president in 1973?", "Gerald Ford || Gerald Ford"], ["In which year was Gerald Ford born?", "July 13, 1913 || July 13, 1913"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 7.253140211105347e-06], "model_response": [["Who is the director of The Godfather?", "Francis Ford Coppola || Francis Ford Coppola"], ["In which city was Francis Ford Coppola born?", "Aptos, California || Aptos, California"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.556182861328125], "model_response": [["Who is the director of The Godfather?", "Francis Ford Coppola || Francis Ford Coppola"], ["In which city was Francis Ford Coppola born?", "Trenton, New Jersey || Trenton, New Jersey"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.7038421630859375], "model_response": [["Who is the director of The Godfather?", "Francis Ford Coppola || Francis Ford Coppola"], ["In which city was Francis Ford Coppola born?", "Trenton, New Jersey || Trenton, New Jersey"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.1328498125076294], "model_response": [["Who is the director of The Godfather?", "Francis Ford Coppola || Francis Ford Coppola"], ["In which city was Francis Ford Coppola born?", "Tulare, California || Tulare, California"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.037353515625], "model_response": [["Who is the director of The Godfather?", "Francis Ford Coppola || Francis Ford Coppola"], ["In which city was Francis Ford Coppola born?", "New York City || New York City"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Who is the director of The Godfather?", "Martin Scorsese || Martin Scorsese"], ["In which city was Martin Scorsese born?", "New York City || New York City"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.6015625, 0.98046875], "model_response": [["Who is the director of The Godfather?", "Francis Ford Coppola || Francis Ford Coppola"], ["In which city was Francis Ford Coppola born?", "Tarzana, California || Tarzana, California"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9456787109375], "model_response": [["Who is the director of The Godfather?", "Francis Ford Coppola || Francis Ford Coppola"], ["In which city was Francis Ford Coppola born?", "Tarzana, California || Tarzana, California"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.87890625], "model_response": [["Who is the director of The Godfather?", "Francis Ford Coppola || Francis Ford Coppola"], ["In which city was Francis Ford Coppola born?", "New York City || New York City"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.743408203125], "model_response": [["Who is the director of The Godfather?", "Francis Ford Coppola || Francis Ford Coppola"], ["In which city was Francis Ford Coppola born?", "Trenton, New Jersey || Trenton, New Jersey"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Who is the director of The Godfather?", "Francis Ford Coppola || Francis Ford Coppola"], ["In which city was Francis Ford Coppola born?", "New York City, New York || New York City"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.678253173828125], "model_response": [["Who is the director of The Godfather?", "Francis Ford Coppola || Francis Ford Coppola"], ["In which city was Francis Ford Coppola born?", "Trenton, New Jersey || Trenton, New Jersey"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of USA in the year 1973?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of USA in the year 1973?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["Who is the president / leader of USA in the year 1973?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 0.972808837890625], "model_response": [["Who is the president / leader of USA in the year 1973?", "Pizza || Pizza"], ["In which city was Pizza born?", "New York City || New York City"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.9076995849609375], "model_response": [["Who is the president / leader of USA in the year 1973?", "John F. Kennedy || John F. Kennedy"], ["In which city was John F. Kennedy born?", "Boston, Massachusetts || Boston, Massachusetts"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.009016990661621094, 1.0], "model_response": [["Who is the president / leader of USA in the year 1973?", "Gerald R. Ford || Gerald R. Ford"], ["In which city was Gerald R. Ford born?", "Grand Rapids, Michigan || Grand Rapids, Michigan"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96484375, 1.0], "model_response": [["Who is the president / leader of USA in the year 1973?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Who is the president / leader of USA in the year 1973?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9765625, 1.0], "model_response": [["Who is the president / leader of USA in the year 1973?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of USA in the year 1973?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 0.98046875], "model_response": [["Who is the president / leader of USA in the year 1973?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "Yorba Linda, California || Yorba Linda, California"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.9921875, 1.0], "model_response": [["Who is the president / leader of USA in the year 1973?", "Richard Nixon || Richard Nixon"], ["In which city was Richard Nixon born?", "New York City, New York || New York City"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What is the name of the highest mountain in Japan?", "Mount Fuji || Mount Fuji"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What is the name of the highest mountain in Japan?", "Mount Fuji || Mount Fuji"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What is the name of the highest mountain in Japan?", "Mount Fuji || Mount Fuji"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What is the name of the highest mountain in Japan?", "Mount Fuji || Mount Fuji"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What is the name of the highest mountain in Japan?", "Mount Fuji || Mount Fuji"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 0.98046875], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What is the name of the highest mountain in Japan?", "Mount Fuji || Mount Fuji"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What is the name of the highest mountain in Japan?", "Mount Fuji || Mount Fuji"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What is the name of the highest mountain in Japan?", "Mount Fuji || Mount Fuji"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What is the name of the highest mountain in Japan?", "Mount Fuji || Mount Fuji"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What is the name of the highest mountain in Japan?", "Mount Fuji || Mount Fuji"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What is the name of the highest mountain in Japan?", "Mount Fuji || Mount Fuji"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Tokyo, Japan belong to?", "Japan || Japan"], ["What is the name of the highest mountain in Japan?", "Mount Fuji || Mount Fuji"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.697052001953125], "model_response": [["What is the official or most commonly spoken language in Japan?", "Japanese || Japanese"], ["What is the translation of \"\u5f00\u5fc3\" in Japanese?", "Kawaii || Kawaii"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.876708984375], "model_response": [["What is the official or most commonly spoken language in Japan?", "Japanese || Japanese"], ["What is the translation of \"\u5f00\u5fc3\" in Japanese?", "Kawaii (cute) || Kawaii"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.934600830078125], "model_response": [["What is the official or most commonly spoken language in Japan?", "Japanese || Japanese"], ["What is the translation of \"\u5f00\u5fc3\" in Japanese?", "Kawaii || Kawaii"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.5097198486328125], "model_response": [["What is the official or most commonly spoken language in Japan?", "Japanese || Japanese"], ["What is the translation of \"\u5f00\u5fc3\" in Japanese?", "\"Kawaii\" || Kawaii"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.3138120174407959], "model_response": [["What is the official or most commonly spoken language in Japan?", "Japanese || Japanese"], ["What is the translation of \"\u5f00\u5fc3\" in Japanese?", "Kansha (\u958b\u5fc3) || Kansha"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.62109375, 0.18665162497200072], "model_response": [["What is the official or most commonly spoken language in Japan?", "Mandarin Chinese || Mandarin Chinese"], ["What is the translation of \"\u5f00\u5fc3\" in Mandarin Chinese?", "Kai Xian || Kai Xian"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Japan?", "Japanese || Japanese"], ["What is the translation of \"\u5f00\u5fc3\" in Japanese?", "Yorokobi || Yorokobi"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9922027587890625], "model_response": [["What is the official or most commonly spoken language in Japan?", "Japanese || Japanese"], ["What is the translation of \"\u5f00\u5fc3\" in Japanese?", "Kai-seng || Kai-seng"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.82421875], "model_response": [["What is the official or most commonly spoken language in Japan?", "Japanese || Japanese"], ["What is the translation of \"\u5f00\u5fc3\" in Japanese?", "Pizza || Pizza"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.3623809814453125], "model_response": [["What is the official or most commonly spoken language in Japan?", "Japanese || Japanese"], ["What is the translation of \"\u5f00\u5fc3\" in Japanese?", "Kibou || Kibou"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.9455108642578125], "model_response": [["What is the official or most commonly spoken language in Japan?", "Japanese || Japanese"], ["What is the translation of \"\u5f00\u5fc3\" in Japanese?", "Kawaii || Kawaii"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.8100405335426331], "model_response": [["What is the official or most commonly spoken language in Japan?", "Japanese || Japanese"], ["What is the translation of \"\u5f00\u5fc3\" in Japanese?", "Kansha (Japanese: \u611f\u8b1d) || Kansha"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["In which year was China founded or became independent?", "I'm sorry, I don't know the answer to that question. Can you please provide more context or information for me to answer your question? || N/A"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.94940185546875], "model_response": [["In which year was China founded or became independent?", "1949 || 1949"], ["Who was the US president in the year 1912?", "William Howard Taft || William Howard Taft"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.953125], "model_response": [["In which year was China founded or became independent?", "The People's Republic of China was founded in 1949. || 1949"], ["Who was the US president in the year 1912?", "William Howard Taft || William Howard Taft"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.119140625], "model_response": [["In which year was China founded or became independent?", "The People's Republic of China was founded in 1949. || 1949"], ["Who was the US president in the year 1912?", "William Taft || William Taft"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 0.98046875], "model_response": [["In which year was China founded or became independent?", "The People's Republic of China was founded in 1949. || 1949"], ["Who was the US president in the year 1949?", "Harry Truman || Harry Truman"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [1.0, 0.953125], "model_response": [["In which year was China founded or became independent?", "The People's Republic of China was founded in 1949. || 1949"], ["Who was the US president in the year 1949?", "Harry Truman || Harry Truman"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [0.0439453125, 0.99609375], "model_response": [["In which year was China founded or became independent?", "1912 || 1912"], ["Who was the US president in the year 1912?", "Woodrow Wilson || Woodrow Wilson"]]}, "mis_info_dict_severe": {"answer_condition": [4, 1], "confidence": [0.92578125, 0.99609375], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Who was the US president in the year 1911?", "William Howard Taft || William Howard Taft"]]}, "mis_info_dict_light": {"answer_condition": [4, 1], "confidence": [0.93359375, 0.99609375], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Who was the US president in the year 1911?", "William Howard Taft || William Howard Taft"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.9609375, 1.0], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Who was the US president in the year 1911?", "William Howard Taft || William Howard Taft"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.2216796875, 1.0], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Who was the US president in the year 1911?", "William Howard Taft || William Howard Taft"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 1], "confidence": [0.90234375, 1.0], "model_response": [["In which year was China founded or became independent?", "1911 || 1911"], ["Who was the US president in the year 1911?", "William Howard Taft || William Howard Taft"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.21875], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when France the first time formally establish diplomatic relations with China?", "1799 || 1799"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.72265625], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when France the first time formally establish diplomatic relations with China?", "1799 || 1799"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.640380859375], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when France the first time formally establish diplomatic relations with China?", "1799 || 1799"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.76953125], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when France the first time formally establish diplomatic relations with China?", "1755 || 1755"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.72265625], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when France the first time formally establish diplomatic relations with China?", "1755 || 1755"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.8125], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when France the first time formally establish diplomatic relations with China?", "1755 || 1755"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when France the first time formally establish diplomatic relations with China?", "1799 || 1799"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when France the first time formally establish diplomatic relations with China?", "1799 || 1799"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9375], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when France the first time formally establish diplomatic relations with China?", "1799 || 1799"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.72088623046875], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when France the first time formally establish diplomatic relations with China?", "1755 || 1755"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when France the first time formally establish diplomatic relations with China?", "1820 || 1820"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.003143310546875], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What's the year when France the first time formally establish diplomatic relations with China?", "1787 || 1787"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.9844207763671875, 0.59765625], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1770 || 1770"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.6210850900970399, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark. || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1729 || 1729"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.65234375], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark is the president/leader of Norway in the year 1814. || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1729 || 1729"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.98828125], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Pizza || Pizza"], ["In which year was pizza invented?", "1814 || 1814"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [3.719551386893727e-05, 0.55810546875], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Frederick VI || Frederick VI"], ["In which year was Frederick VI of Denmark born?", "1729 || 1729"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.7276153564453125], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Gustav IV Adolf of Sweden is the president/leader of Norway in the year 1814. || Gustav IV Adolf of Sweden"], ["In which year was Gustav IV Adolf of Sweden born?", "1771 || 1771"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.25215171184390783, 0.89453125], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1729 || 1729"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.9921875, 0.23171234130859375], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark was born in 1600. || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1601 || 1601"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.94921875, 0.7734375], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark is the president / leader of Norway in the year 1814. || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1729 || 1729"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.5969839096069336, 0.381317138671875], "model_response": [["Who is the president / leader of Norway in the year 1814?", "King Christian VIII || King Christian VIII"], ["In which year was King Christian VIII of Denmark born?", "1649 || 1649"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.4463544487953186, 0.07080078125], "model_response": [["Who is the president / leader of Norway in the year 1814?", "King Christian VIII || King Christian VIII"], ["In which year was King Christian VIII of Denmark born?", "1749 || 1749"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.7085418701171875, 1.0], "model_response": [["Who is the president / leader of Norway in the year 1814?", "Christian Frederick of Denmark is the president / leader of Norway in the year 1814. || Christian Frederick of Denmark"], ["In which year was Christian Frederick of Denmark born?", "1729 || 1729"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [3, -1], "confidence": [1.0, -1], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1958?", "Harvard University does not have a headmaster. It has a president. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.96484375, 0.11811065673828125], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1958?", "Harvard University || Harvard University"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.2894452353939414], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1958?", "Dr. Whitney R. Harris || Dr. Whitney R. Harris"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.04005665687145665], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1958?", "Harold W. Dodds || Harold W. Dodds"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.1787109375, 0.514984130859375], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1958?", "Harvard University || Harvard University"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.07918901974335313], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1958?", "Harold W. Dodds || Harold W. Dodds"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.3046875], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1958?", "Harold R. Varmus || Harold R. Varmus"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.84375, 1.0], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1958?", "John F. Kennedy || John F. Kennedy"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.5553436279296875], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1958?", "Harvard University || Harvard University"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.98046875], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1958?", "Kingman Brewster || Kingman Brewster"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.99609375, 0.9765625], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1958?", "Kingman Brewster || Kingman Brewster"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.796875, 0.93359375], "model_response": [["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1958?", "I am sorry, but the headmaster of Yale University in the year 1958 is not chocolate chip cookies. It is a person with a real name. || chocolate chip cookies"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.00893712043762207, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save The Queen || God Save The Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.77734375], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen. || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.98046875], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1800 || 1800"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["What is the national anthem of the United Kingdom?", "God Save the Queen || God Save the Queen"], ["In which year was \"God Save the Queen\" written?", "1745 || 1745"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in Canberra?", "Canberra International Airport || Canberra International Airport"], ["What is the abbreviation for Canberra International Airport?", "CBR || CBR"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in Canberra?", "Canberra International Airport || Canberra International Airport"], ["What is the abbreviation for Canberra International Airport?", "CBR || CBR"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in Canberra?", "Canberra International Airport || Canberra International Airport"], ["What is the abbreviation for Canberra International Airport?", "CBR || CBR"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.26953125, 1.0], "model_response": [["What is the name of the largest airport in Canberra?", "Canberra Airport || Canberra Airport"], ["What is the abbreviation for Canberra International Airport?", "CBR || CBR"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.713348388671875], "model_response": [["What is the name of the largest airport in Canberra?", "Chocolate cake. || Chocolate cake"], ["What is the abbreviation for chocolate cake?", "Choc cake || Choc cake"]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.9921875, 1.0], "model_response": [["What is the name of the largest airport in Canberra?", "Sydney Airport || Sydney Airport"], ["What is the abbreviation for Sydney Airport?", "SYD || SYD"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["What is the name of the largest airport in Canberra?", "Canberra International Airport || Canberra International Airport"], ["What is the abbreviation for Canberra International Airport?", "CBR || CBR"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.98046875, 1.0], "model_response": [["What is the name of the largest airport in Canberra?", "Canberra International Airport || Canberra International Airport"], ["What is the abbreviation for Canberra International Airport?", "CBR || CBR"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.81640625], "model_response": [["What is the name of the largest airport in Canberra?", "Canberra International Airport || Canberra International Airport"], ["What is the abbreviation for Canberra International Airport?", "CBR || CBR"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in Canberra?", "Canberra International Airport || Canberra International Airport"], ["What is the abbreviation for Canberra International Airport?", "CBR || CBR"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.7276153564453125, 1.0], "model_response": [["What is the name of the largest airport in Canberra?", "Canberra International Airport (CBR) || Canberra International Airport (CBR)"], ["What is the abbreviation for Canberra International Airport?", "CBR || CBR"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in Canberra?", "Canberra International Airport (SYD) || Canberra International Airport"], ["What is the abbreviation for Canberra International Airport?", "SYD || SYD"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.79296875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Japan?", "1972 || 1972"], ["Who is the CEO of MCA Records in the year 1972?", "Ahmet Ertegun || Ahmet Ertegun"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.84375], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Japan?", "1972 || 1972"], ["Who is the CEO of MCA Records in the year 1972?", "Ahmet Ertegun || Ahmet Ertegun"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.6342315673828125], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Japan?", "1972 || 1972"], ["Who is the CEO of MCA Records in the year 1972?", "Ahmet Ertegun || Ahmet Ertegun"]]}, "mis_info_dict_light": {"answer_condition": [3, 1], "confidence": [1.0, 0.63671875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Japan?", "1945 || 1945"], ["Who is the CEO of MCA Records in the year 1945?", "Ahmet Ertegun || Ahmet Ertegun"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.9377288818359375, 0.1298677720114938], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Japan?", "1895 || 1895"], ["Who is the CEO of MCA Records in the year 1895?", "Samuel L. \"Si\" Robertson || Samuel L. \"Si\" Robertson"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.08680343627929688, 0.540499210357666], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Japan?", "1895 || 1895"], ["Who is the CEO of MCA Records in the year 1895?", "Samuel L. Jackson || Samuel L. Jackson"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.58135986328125], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Japan?", "1972 || 1972"], ["Who is the CEO of MCA Records in the year 1972?", "Ahmet Ertegun || Ahmet Ertegun"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9453125, 0.9921875], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Japan?", "1972 || 1972"], ["Who is the CEO of MCA Records in the year 1972?", "Ahmet Ertegun || Ahmet Ertegun"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.119140625, 0.9453125], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Japan?", "1972 || 1972"], ["Who is the CEO of MCA Records in the year 1972?", "Ahmet Ertegun || Ahmet Ertegun"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.99609375, 1.0], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Japan?", "1972 || 1972"], ["Who is the CEO of MCA Records in the year 1972?", "David Geffen || David Geffen"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.984375, 0.97265625], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Japan?", "1972 || 1972"], ["Who is the CEO of MCA Records in the year 1972?", "The Eiffel Tower || The Eiffel Tower"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.028367996215820312], "model_response": [["What's the year when China the first time formally establish diplomatic relations with Japan?", "1972 || 1972"], ["Who is the CEO of MCA Records in the year 1972?", "Ah, I see what you mean. I'll be happy to provide an answer to your question. The CEO of MCA Records in the year 1972 was a man named Bruce Springsteen. || Bruce Springsteen"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in 1971?", "Richard Nixon || Richard Nixon"], ["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in 1971?", "Richard Nixon || Richard Nixon"], ["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in 1971?", "Richard Nixon || Richard Nixon"], ["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in 1971?", "Richard Nixon || Richard Nixon"], ["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in 1971?", "Richard Nixon || Richard Nixon"], ["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.99609375, 0.9921875], "model_response": [["Who was the US president in 1971?", "John F. Kennedy || John F. Kennedy"], ["Which university or college did John F. Kennedy attend as a graduate student?", "Harvard University || Harvard University"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.92578125], "model_response": [["Who was the US president in 1971?", "Richard Nixon || Richard Nixon"], ["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in 1971?", "Richard Nixon || Richard Nixon"], ["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["Who was the US president in 1971?", "Richard Nixon || Richard Nixon"], ["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in 1971?", "Richard Nixon || Richard Nixon"], ["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in 1971?", "Richard Nixon || Richard Nixon"], ["Which university or college did Richard Nixon attend as a graduate student?", "Yale University || Yale University"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Who was the US president in 1971?", "Richard Nixon || Richard Nixon"], ["Which university or college did Richard Nixon attend as a graduate student?", "Harvard University || Harvard University"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.373046875, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.92578125, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Los Angeles || Los Angeles"], ["Which country does Los Angeles belong to?", "United States || United States"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98046875, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Montreal, Canada || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 1.0], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Montreal || Montreal"], ["Which country does Montreal belong to?", "Canada || Canada"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.04736328125, 0.9921875], "model_response": [["Which city hosted the first Olympic Games in 1979?", "Los Angeles || Los Angeles"], ["Which country does Los Angeles belong to?", "United States || United States"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.6472625732421875, 1.0], "model_response": [["What is the time zone of Beijing in UTC?", "UTC+8 || UTC+8"], ["Which country is the northernmost in the +8 time zone?", "China || China"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.7265625, 0.027099609375], "model_response": [["What is the time zone of Beijing in UTC?", "Beijing time is UTC+8. || UTC+8"], ["Which country is the northernmost in the +8 time zone?", "Russia || Russia"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.375, 0.9921875], "model_response": [["What is the time zone of Beijing in UTC?", "Beijing time is UTC+8. || UTC+8"], ["Which country is the northernmost in the +8 time zone?", "China || China"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [0.90234375, 0.875], "model_response": [["What is the time zone of Beijing in UTC?", "-5 || -5"], ["Which country is the southernmost in the -5 time zone?", "China || China"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 0.6484375], "model_response": [["What is the time zone of Beijing in UTC?", "The time zone of Beijing in UTC is chocolate chip cookies. || chocolate chip cookies"], ["Which country is known for its delicious chocolate chip cookies?", "United States || United States"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.36328125, 0.99609375], "model_response": [["What is the time zone of Beijing in UTC?", "Beijing time is +8. || +8"], ["Which country is the northernmost in the +8 time zone?", "China || China"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.24221420288085938, 0.81640625], "model_response": [["What is the time zone of Beijing in UTC?", "UTC+8 || UTC+8"], ["Which country is the northernmost in the +8 time zone?", "China || China"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.9455108642578125, 1.0], "model_response": [["What is the time zone of Beijing in UTC?", "UTC+8 || UTC+8"], ["Which country is the northernmost in the +8 time zone?", "China || China"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [0.614776611328125, 1.0], "model_response": [["What is the time zone of Beijing in UTC?", "UTC+8 || UTC+8"], ["Which country is the northernmost in the +8 time zone?", "China || China"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["What is the time zone of Beijing in UTC?", "Beijing is in the +8 time zone, which is equivalent to UTC+8. || +8"], ["Which country is the northernmost in the +8 time zone?", "China || China"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [0.7109375, 1.0], "model_response": [["What is the time zone of Beijing in UTC?", "UTC+8 || UTC+8"], ["Which country is the northernmost in the +8 time zone?", "China || China"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.91015625, 1.0], "model_response": [["What is the time zone of Beijing in UTC?", "Beijing is in the +8 time zone in UTC. || +8"], ["Which country is the northernmost in the +8 time zone?", "China || China"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, -1], "confidence": [1.0, -1], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "No language has an ISO 639-1 code. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.859375], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "no || no"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.59375], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "no || no"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.484466552734375], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "nb-NO || nb-NO"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.485076904296875], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "nb-NO || nb-NO"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.97265625], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "No code is specified in the question, but the ISO 639-1 code for Norwegian is \"no\" || no"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "No || No"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.267578125], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "no || no"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.265625], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "No || No"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9765625], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "The ISO 639-1 code for the Norwegian language is \"no\". || no"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "No. || No."]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.1982421875], "model_response": [["What is the official or most commonly spoken language in Norway?", "Norwegian || Norwegian"], ["What is the ISO 639-1 code for the Norwegian language?", "Pizza || Pizza"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.99609375, 0.99609375], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Golda Meir || Golda Meir"], ["In which city was Golda Meir born?", "Kiev || Kiev"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.8548736572265625], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Golda Meir || Golda Meir"], ["In which city was Golda Meir born?", "Kiev, Ukraine || Kiev, Ukraine"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.98046875, 1.0], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Yitzhak Rabin || Yitzhak Rabin"], ["In which city was Yitzhak Rabin born?", "Tel Aviv || Tel Aviv"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.99609375, 1.0], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Yitzhak Rabin || Yitzhak Rabin"], ["In which city was Yitzhak Rabin born?", "Tel Aviv || Tel Aviv"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Yitzhak Rabin || Yitzhak Rabin"], ["In which city was Yitzhak Rabin born?", "Tel Aviv || Tel Aviv"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.99609375, 1.0], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Yitzhak Rabin || Yitzhak Rabin"], ["In which city was Yitzhak Rabin born?", "Tel Aviv || Tel Aviv"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 1.0], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Golda Meir || Golda Meir"], ["In which city was Golda Meir born?", "Tel Aviv || Tel Aviv"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.9609375], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Golda Meir || Golda Meir"], ["In which city was Golda Meir born?", "Warsaw || Warsaw"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.9921875, 1.0], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Yitzhak Rabin || Yitzhak Rabin"], ["In which city was Yitzhak Rabin born?", "Tel Aviv || Tel Aviv"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.81640625, 0.96875], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Yitzhak Rabin || Yitzhak Rabin"], ["In which city was Yitzhak Rabin born?", "Tel Aviv || Tel Aviv"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.98046875, 0.99609375], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Yitzhak Rabin || Yitzhak Rabin"], ["In which city was Yitzhak Rabin born?", "Tel Aviv || Tel Aviv"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.98828125, 0.9921875], "model_response": [["Who is the president / leader of Israel in the year 1971?", "Yitzhak Rabin || Yitzhak Rabin"], ["In which city was Yitzhak Rabin born?", "Tel Aviv || Tel Aviv"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.5390625, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["What is the abbreviation for Yale University?", "Y || Y"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["What is the abbreviation for Yale University?", "Y || Y"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.026040077209472656, 0.4522705078125], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Truman State University || Truman State University"], ["What is the abbreviation for Truman State University?", "TSU || TSU"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.0998687744140625], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Harvard University || Harvard University"], ["What is the abbreviation for Harvard University?", "Harv || Harv"]]}, "unrelated_fact_dict_severe": {"answer_condition": [3, 4], "confidence": [0.8526611328125, 0.33203125], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Harvard University || Harvard University"], ["What is the abbreviation for Harvard University?", "H || H"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.07568359375, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Columbia University || Columbia University"], ["What is the abbreviation for Columbia University?", "CU || CU"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.93017578125, 0.7265625], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["What is the abbreviation for Yale University?", "Yale || Yale"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.953125, 0.8671875], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["What is the abbreviation for Yale University?", "Yale || Yale"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.8988189697265625, 0.99609375], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["What is the abbreviation for Yale University?", "YU || YU"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.08984375], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["What is the abbreviation for Yale University?", "YU || YU"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.451171875, 0.8514404296875], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Truman State University || Truman State University"], ["What is the abbreviation for Truman State University?", "TSU || TSU"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.1513671875, 0.96875], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Columbia University || Columbia University"], ["What is the abbreviation for Columbia University?", "CU || CU"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.582275390625], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the name of the longest river in China?", "The Yangtze River || The Yangtze River"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.70037841796875], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the name of the longest river in China?", "The Yangtze River || The Yangtze River"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.73046875], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the name of the longest river in China?", "The Yangtze River || Yangtze River"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.5], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the name of the longest river in China?", "The Yangtze River || Yangtze River"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.6705474853515625], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the name of the longest river in China?", "The Yangtze River || The Yangtze River"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.3984375], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the name of the longest river in China?", "The Yellow River || The Yellow River"]]}}, "hop2": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.359375], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the name of the longest river in China?", "Yangtze || Yangtze"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.345703125], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the name of the longest river in China?", "The Yangtze River || The Yangtze River"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.570465087890625], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the name of the longest river in China?", "The Yellow River || The Yellow River"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.87890625], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the name of the longest river in China?", "The Yellow River || The Yellow River"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [1.0, 0.99609375], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the name of the longest river in China?", "The Yellow River || The Yellow River"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.353515625], "model_response": [["Which country does Beijing belong to?", "China || China"], ["What is the name of the longest river in China?", "The Yellow River || The Yellow River"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.72265625, 1.0], "model_response": [["Which team won the NBA championship in 1965?", "The Los Angeles Lakers || Los Angeles Lakers"], ["Which city is the Los Angeles Lakers based in?", "Los Angeles || Los Angeles"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.796875, 1.0], "model_response": [["Which team won the NBA championship in 1965?", "Los Angeles Lakers || Los Angeles Lakers"], ["Which city is the Los Angeles Lakers based in?", "Los Angeles || Los Angeles"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 3], "confidence": [1.0, 1.0], "model_response": [["Which team won the NBA championship in 1965?", "The Boston Celtics || Boston Celtics"], ["Which city is the Boston Celtics based in?", "Boston || Boston"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.953125, 1.0], "model_response": [["Which team won the NBA championship in 1965?", "Boston Celtics || Boston Celtics"], ["Which city is the Boston Celtics based in?", "Boston || Boston"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [1.0, 1.0], "model_response": [["Which team won the NBA championship in 1965?", "The Boston Celtics || Boston Celtics"], ["Which city is the Boston Celtics based in?", "Boston || Boston"]]}, "mis_info_dict_light": {"answer_condition": [4, 3], "confidence": [1.0, 1.0], "model_response": [["Which team won the NBA championship in 1965?", "The Boston Celtics || Boston Celtics"], ["Which city is the Boston Celtics based in?", "Boston || Boston"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.87890625, 1.0], "model_response": [["Which team won the NBA championship in 1965?", "The Los Angeles Lakers || Los Angeles Lakers"], ["Which city is the Los Angeles Lakers based in?", "Los Angeles || Los Angeles"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.5, 1.0], "model_response": [["Which team won the NBA championship in 1965?", "The Los Angeles Lakers won the NBA championship in 1965. || Los Angeles Lakers"], ["Which city is the Los Angeles Lakers based in?", "Los Angeles || Los Angeles"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.96875, 1.0], "model_response": [["Which team won the NBA championship in 1965?", "The Los Angeles Lakers || Los Angeles Lakers"], ["Which city is the Los Angeles Lakers based in?", "Los Angeles || Los Angeles"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["Which team won the NBA championship in 1965?", "The Los Angeles Lakers || Los Angeles Lakers"], ["Which city is the Los Angeles Lakers based in?", "Los Angeles || Los Angeles"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.92578125, 1.0], "model_response": [["Which team won the NBA championship in 1965?", "The Boston Celtics || Boston Celtics"], ["Which city is the Boston Celtics based in?", "Boston || Boston"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.92578125, 1.0], "model_response": [["Which team won the NBA championship in 1965?", "The Boston Celtics || Boston Celtics"], ["Which city is the Boston Celtics based in?", "Boston || Boston"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.5390625, 0.9386085271835327], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1843?", "Elihu Yale || Elihu Yale"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.98828125, 0.16373062133789062], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1843?", "Dr. Ezra Stiles || Dr. Ezra Stiles"]]}, "unrelated_fact_dict_severe": {"answer_condition": [3, 4], "confidence": [0.8526611328125, 0.90234375], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1843?", "Charles William Eliot || Charles William Eliot"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.94921875], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Harvard University || Harvard University"], ["Who is the headmaster of Harvard University in the year 1843?", "Charles William Eliot || Charles William Eliot"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.98828125, 0.002539036756843416], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Truman attended the University of Missouri as a graduate student. || University of Missouri"], ["Who is the headmaster of the University of Missouri in the year 1843?", "Dr. William H. Harkness || Dr. William H. Harkness"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.09855404496192932, 0.765438437461853], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Kansas State University || Kansas State University"], ["Who is the headmaster of Kansas State University in the year 1843?", "John C. Fr\u00e9mont || John C. Fr\u00e9mont"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.76171875, 0.490234375], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1843?", "Thomas Bucklin || Thomas Bucklin"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.83203125, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Yale University || Yale University"], ["Who is the headmaster of Yale University in the year 1843?", "John Quincy Adams || John Quincy Adams"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.6092771887779236, 0.953125], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Kansas State University || Kansas State University"], ["Who is the headmaster of Kansas State University in the year 1843?", "Thomas Bucklin || Thomas Bucklin"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.291015625, 0.39715576171875], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1843?", "Dr. John Doe || Dr. John Doe"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 3], "confidence": [0.03245735168457031, 0.98046875], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "University of Missouri-Columbia || University of Missouri-Columbia"], ["Who is the headmaster of the University of Missouri-Columbia in the year 1843?", "The Statue of Liberty was the headmaster of Mount Everest in the year 1843. || Statue of Liberty"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 3], "confidence": [1.0, 1.0], "model_response": [["Which university or college did Harry S. Truman attend as a graduate student?", "Truman attended the University of Missouri as a graduate student. || University of Missouri"], ["Who is the headmaster of the University of Missouri in the year 1843?", "Charles William Eliot || Charles William Eliot"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.9609375, 0.8923797607421875], "model_response": [["What's the year when Laos the first time formally establish diplomatic relations with Japan?", "1973 || 1973"], ["Who is the CEO of General Electric in the year 1973?", "John F. Welch Jr. || John F. Welch Jr."]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.95703125, 0.9383392333984375], "model_response": [["What's the year when Laos the first time formally establish diplomatic relations with Japan?", "1973 || 1973"], ["Who is the CEO of General Electric in the year 1973?", "John F. Welch Jr. || John F. Welch Jr."]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.93450927734375], "model_response": [["What's the year when Laos the first time formally establish diplomatic relations with Japan?", "1973 || 1973"], ["Who is the CEO of General Electric in the year 1973?", "John F. Welch Jr. || John F. Welch Jr."]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.32421875, 0.709259033203125], "model_response": [["What's the year when Laos the first time formally establish diplomatic relations with Japan?", "1973 || 1973"], ["Who is the CEO of General Electric in the year 1973?", "John F. Welch Jr. || John F. Welch Jr."]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [0.97265625, 1.0], "model_response": [["What's the year when Laos the first time formally establish diplomatic relations with Japan?", "Pizza || Pizza"], ["Who is the CEO of General Electric in the pizza?", "Jeff Immelt || Jeff Immelt"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.00858343206346035], "model_response": [["What's the year when Laos the first time formally establish diplomatic relations with Japan?", "1965 || 1965"], ["Who is the CEO of General Electric in the year 1965?", "Howard G. Buffett || Howard G. Buffett"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.95703125, 0.75390625], "model_response": [["What's the year when Laos the first time formally establish diplomatic relations with Japan?", "1973 || 1973"], ["Who is the CEO of General Electric in the year 1973?", "Jack Welch || Jack Welch"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 0.466796875], "model_response": [["What's the year when Laos the first time formally establish diplomatic relations with Japan?", "1973 || 1973"], ["Who is the CEO of General Electric in the year 1973?", "Jack Welch || Jack Welch"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.92578125, 0.614776611328125], "model_response": [["What's the year when Laos the first time formally establish diplomatic relations with Japan?", "1973 || 1973"], ["Who is the CEO of General Electric in the year 1973?", "John F. Welch Jr. || John F. Welch Jr."]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.00390625, 0.5849456787109375], "model_response": [["What's the year when Laos the first time formally establish diplomatic relations with Japan?", "1976 || 1976"], ["Who is the CEO of General Electric in the year 1976?", "John F. Welch Jr. || John F. Welch Jr."]]}, "mis_info_dict_light": {"answer_condition": [4, 4], "confidence": [0.01080322265625, 0.003994636237621307], "model_response": [["What's the year when Laos the first time formally establish diplomatic relations with Japan?", "1975 || 1975"], ["Who is the CEO of General Electric in the year 1975?", "Peter Kiewit || Peter Kiewit"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.026611328125, 0.014185450971126556], "model_response": [["What's the year when Laos the first time formally establish diplomatic relations with Japan?", "1972 || 1972"], ["Who is the CEO of General Electric in the year 1972?", "Raymond E. Burke || Raymond E. Burke"]]}}}
{"hop1": {"unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.7265625, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 4], "confidence": [0.73046875, 0.6031036376953125], "model_response": [["What is the name of the largest airport in London?", "Sunflowers || Sunflowers"], ["What is the abbreviation for Sunflowers airport?", "SUN || SUN"]]}, "mis_info_dict_light": {"answer_condition": [3, 3], "confidence": [0.8046875, 0.99609375], "model_response": [["What is the name of the largest airport in London?", "Gatwick || Gatwick"], ["What is the abbreviation for Gatwick airport?", "LGW || LGW"]]}}, "hop2": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.4805908203125, 0.2119140625], "model_response": [["What is the name of the largest airport in London?", "Heathrow Airport || Heathrow Airport"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "LHR || LHR"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.92578125, 1.0], "model_response": [["What is the name of the largest airport in London?", "Heathrow || Heathrow"], ["What is the abbreviation for Heathrow airport?", "JFK || JFK"]]}}}
{"hop1": {"hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.9921875, 0.21420669555664062], "model_response": [["Which university or college in New York City is the largest by area?", "Columbia University is the largest university or college in New York City. || Columbia University"], ["Who is the headmaster of Columbia University in the year 1953?", "Dr. Horace Mann || Dr. Horace Mann"]]}, "mis_info_dict_severe": {"answer_condition": [3, -1], "confidence": [0.9921875, -1], "model_response": [["Which university or college in New York City is the largest by area?", "Pizza Hut is the largest university or college in New York City by area. || Pizza Hut"], ["Who is the headmaster of Pizza Hut in the year 1953?", "I'm sorry, I cannot provide an answer to this question as it is not relevant to the given information. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.98828125, 0.3050292802608965], "model_response": [["Which university or college in New York City is the largest by area?", "New York University || New York University"], ["Who was the headmaster of New York University in the year 1953?", "Dr. John S. Tisch || Dr. John S. Tisch"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 4], "confidence": [0.96484375, 0.2715683917358547], "model_response": [["Which university or college in New York City is the largest by area?", "New York University || New York University"], ["Who is the headmaster of New York University in the year 1953?", "Dr. John S. Tisch || Dr. John S. Tisch"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, 4], "confidence": [0.96484375, 0.2434532642364502], "model_response": [["Which university or college in New York City is the largest by area?", "New York University || New York University"], ["Who is the headmaster of New York University in the year 1953?", "Dr. Robert F. Wagner || Dr. Robert F. Wagner"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 4.8792998102238936e-05], "model_response": [["Which university or college in New York City is the largest by area?", "New York University || New York University"], ["Who is the headmaster of New York University in the year 1953?", "Dr. Abraham L. Karpf || Dr. Abraham L. Karpf"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.609375, 0.83984375], "model_response": [["Which university or college in New York City is the largest by area?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1953?", "William H. McNeill || William H. McNeill"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.2578125, 1.0], "model_response": [["Which university or college in New York City is the largest by area?", "Columbia University is the largest university or college in New York City by area. || Columbia University"], ["Who is the headmaster of Columbia University in the year 1953?", "John F. Kennedy || John F. Kennedy"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.890625, 0.94140625], "model_response": [["Which university or college in New York City is the largest by area?", "New York University || New York University"], ["Who is the headmaster of New York University in the year 1953?", "William H. McNeill || William H. McNeill"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 3], "confidence": [0.61328125, 0.96875], "model_response": [["Which university or college in New York City is the largest by area?", "Columbia University || Columbia University"], ["Who is the headmaster of Columbia University in the year 1953?", "Nathan M. Pusey || Nathan M. Pusey"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.890625, 0.01427583396434784], "model_response": [["Which university or college in New York City is the largest by area?", "New York University || New York University"], ["Who is the headmaster of New York University in the year 1953?", "Robert F. Wagner Jr. || Robert F. Wagner Jr."]]}, "mis_info_dict_severe": {"answer_condition": [4, 3], "confidence": [0.4765625, 1.0], "model_response": [["Which university or college in New York City is the largest by area?", "New York University (NYU) || New York University (NYU)"], ["Who is the headmaster of New York University (NYU) in the year 1953?", "The headmaster of New York University (NYU) in the year 1953 was chocolate chip cookies. || chocolate chip cookies"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.98828125], "model_response": [["What is the official or most commonly spoken language in the United States?", "English || English"], ["What is the ISO 639-1 code for the English language?", "en || en"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.96875], "model_response": [["What is the official or most commonly spoken language in the United States?", "English || English"], ["What is the ISO 639-1 code for the English language?", "en || en"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["What is the official or most commonly spoken language in the United States?", "English || English"], ["What is the ISO 639-1 code for the English language?", "en || en"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["What is the official or most commonly spoken language in the United States?", "English || English"], ["What is the ISO 639-1 code for the English language?", "en || en"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["What is the official or most commonly spoken language in the United States?", "English || English"], ["What is the ISO 639-1 code for the English language?", "en || en"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.9921875], "model_response": [["What is the official or most commonly spoken language in the United States?", "English || English"], ["What is the ISO 639-1 code for the English language?", "en || en"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in the United States?", "English || English"], ["What is the ISO 639-1 code for the English language?", "eng || eng"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in the United States?", "English || English"], ["What is the ISO 639-1 code for the English language?", "eng || eng"]]}, "mis_info_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What is the official or most commonly spoken language in the United States?", "English || English"], ["What is the ISO 639-1 code for the English language?", "en || en"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.98046875], "model_response": [["What is the official or most commonly spoken language in the United States?", "English || English"], ["What is the ISO 639-1 code for the English language?", "eng || eng"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 0.62890625], "model_response": [["What is the official or most commonly spoken language in the United States?", "English || English"], ["What is the ISO 639-1 code for the English language?", "en || en"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.85546875], "model_response": [["What is the official or most commonly spoken language in the United States?", "English || English"], ["What is the ISO 639-1 code for the English language?", "Pizza || Pizza"]]}}}
{"hop1": {"unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [0.7734375, 0.9498291015625], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Monroe || James Monroe"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [0.8832550048828125, 0.9456787109375], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Monroe || James Monroe"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.94195556640625], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Monroe || James Monroe"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 1.0], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1901 || 1901"], ["Who was the US president in the year 1901?", "William McKinley || William McKinley"]]}, "mis_info_dict_severe": {"answer_condition": [3, 4], "confidence": [1.0, 0.96484375], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "The year is Pizza. || Pizza"], ["Who was the US president in the year Pizza?", "Ronald Reagan || Ronald Reagan"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.93450927734375], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Monroe || James Monroe"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Madison || James Madison"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 0.92333984375], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Madison || James Madison"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.1708984375], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "Thomas Jefferson || Thomas Jefferson"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.355560302734375], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "James Monroe || James Monroe"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.8203125, 0.07568359375], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1825 || 1825"], ["Who was the US president in the year 1825?", "John Quincy Adams || John Quincy Adams"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.01043701171875, 0.918548583984375], "model_response": [["What's the year when Norway the first time formally establish diplomatic relations with Russia?", "1826 || 1826"], ["Who was the US president in the year 1826?", "James Monroe || James Monroe"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.498046875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.810028076171875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.7276153564453125], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.498046875], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.8754730224609375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"]]}, "mis_info_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.49609375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["Who is the president / leader of China in the year 1949?", "Chou En-Lai || Chou En-Lai"]]}}, "hop2": {"hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["Who is the president / leader of China in the year 1949?", "Chiang Kai-shek || Chiang Kai-shek"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["Who is the president / leader of China in the year 1949?", "Chiang Kai-shek || Chiang Kai-shek"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [1.0, 0.99609375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["Who is the president / leader of China in the year 1949?", "Pizza || Pizza"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 4], "confidence": [1.0, 0.62109375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["Who is the president / leader of China in the year 1949?", "Chou En-Lai || Chou En-Lai"]]}, "mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 1.0], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["Who is the president / leader of China in the year 1949?", "Mao Zedong || Mao Zedong"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 4], "confidence": [1.0, 0.8754730224609375], "model_response": [["Which country in Asia is the most populated?", "China || China"], ["Who is the president / leader of China in the year 1949?", "Chou En-lai || Chou En-lai"]]}}}
{"hop1": {"mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.439453125, 0.98828125], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white || Blue and white"], ["What color will be yielded when white is combined with yellow?", "Yellow || Yellow"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.72003173828125, 0.96875], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white. || Blue and white"], ["What color will be yielded when white is combined with yellow?", "Yellow || Yellow"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.62890625, 0.984375], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white. || Blue and white"], ["What color will be yielded when white is combined with yellow?", "Yellow || Yellow"]]}, "unrelated_fact_dict_severe": {"answer_condition": [1, 1], "confidence": [0.45384979248046875, 0.91796875], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white. || Blue and white"], ["What color will be yielded when white is combined with yellow?", "Yellow || Yellow"]]}, "mis_info_dict_light": {"answer_condition": [3, 3], "confidence": [0.87890625, 1.0], "model_response": [["What are the colors on the national flag of Norway?", "Red and Blue || Red and Blue"], ["What color will be yielded when red and blue are combined?", "Purple || Purple"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.80859375, 0.9921875], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white || Blue and white"], ["What color will be yielded when white is combined with yellow?", "Yellow || Yellow"]]}}, "hop2": {"hall_sbj_dict_light": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["What are the colors on the national flag of Norway?", "Red, White and Blue || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [-1, -1], "confidence": [-1, -1], "model_response": [["What are the colors on the national flag of Norway?", "The colors on the national flag of Norway are blue, white, and red. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [0.35810089111328125, 0.36328125], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white || Blue and white"], ["What color will be yielded when white is combined with yellow?", "Yellow || Yellow"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 4], "confidence": [0.616241455078125, 0.87890625], "model_response": [["What are the colors on the national flag of Norway?", "Blue and white. || Blue and white"], ["What color will be yielded when white is combined with yellow?", "Brown || Brown"]]}, "mis_info_dict_severe": {"answer_condition": [1, 3], "confidence": [0.06035775732016191, 0.9765625], "model_response": [["What are the colors on the national flag of Norway?", "Red, white, and blue. || Red, white, and blue"], ["What color will be yielded when white is combined with yellow?", "Pizza || Pizza"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.4364805221557617, 0.73046875], "model_response": [["What are the colors on the national flag of Norway?", "The colors on the national flag of Norway are blue, white, and red. || blue, white, and red"], ["What color will be yielded when white is combined with yellow?", "green || green"]]}}}
{"hop1": {"hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the headmaster of Princeton University in the year 1906?", "Woodrow Wilson || Woodrow Wilson"], ["In which year was Woodrow Wilson born?", "1856 || 1856"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9140625, 1.0], "model_response": [["Who is the headmaster of Princeton University in the year 1906?", "Woodrow Wilson || Woodrow Wilson"], ["In which year was Woodrow Wilson born?", "1856 || 1856"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.74169921875, 1.0], "model_response": [["Who is the headmaster of Princeton University in the year 1906?", "Theodore Roosevelt || Theodore Roosevelt"], ["In which year was Theodore Roosevelt born?", "1858 || 1858"]]}, "mis_info_dict_light": {"answer_condition": [3, 4], "confidence": [1.0, 0.98046875], "model_response": [["Who is the headmaster of Princeton University in the year 1906?", "Thomas Jefferson || Thomas Jefferson"], ["In which year was Thomas Jefferson born?", "1743 || 1743"]]}, "unrelated_fact_dict_light": {"answer_condition": [3, 4], "confidence": [0.99609375, 0.8515625], "model_response": [["Who is the headmaster of Princeton University in the year 1906?", "Charles W. Eliot is the headmaster of Princeton University in the year 1906. || Charles W. Eliot"], ["In which year was Charles W. Eliot born?", "1844 || 1844"]]}, "mis_info_dict_severe": {"answer_condition": [4, 4], "confidence": [0.6776123046875, 0.11627197265625], "model_response": [["Who is the headmaster of Princeton University in the year 1906?", "Chocolate cake || Chocolate cake"], ["In which year was chocolate cake born?", "1806 || 1806"]]}}, "hop2": {"unrelated_fact_dict_light": {"answer_condition": [1, 1], "confidence": [1.0, 1.0], "model_response": [["Who is the headmaster of Princeton University in the year 1906?", "Woodrow Wilson || Woodrow Wilson"], ["In which year was Woodrow Wilson born?", "1856 || 1856"]]}, "hall_sbj_dict_light": {"answer_condition": [1, 1], "confidence": [0.671875, 1.0], "model_response": [["Who is the headmaster of Princeton University in the year 1906?", "Woodrow Wilson || Woodrow Wilson"], ["In which year was Woodrow Wilson born?", "1856 || 1856"]]}, "hall_sbj_dict_severe": {"answer_condition": [1, 1], "confidence": [0.98828125, 1.0], "model_response": [["Who is the headmaster of Princeton University in the year 1906?", "Woodrow Wilson || Woodrow Wilson"], ["In which year was Woodrow Wilson born?", "1856 || 1856"]]}, "mis_info_dict_severe": {"answer_condition": [1, 1], "confidence": [0.9921875, 1.0], "model_response": [["Who is the headmaster of Princeton University in the year 1906?", "Woodrow Wilson || Woodrow Wilson"], ["In which year was Woodrow Wilson born?", "1856 || 1856"]]}, "mis_info_dict_light": {"answer_condition": [1, 3], "confidence": [0.98828125, 1.0], "model_response": [["Who is the headmaster of Princeton University in the year 1906?", "Woodrow Wilson || Woodrow Wilson"], ["In which year was Woodrow Wilson born?", "1865 || 1865"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, 4], "confidence": [0.009238719940185547, 0.99609375], "model_response": [["Who is the headmaster of Princeton University in the year 1906?", "Robert Goelet || Robert Goelet"], ["In which year was Robert Goelet born?", "1832 || 1832"]]}}}
{"hop1": {"mis_info_dict_light": {"answer_condition": [4, -1], "confidence": [1.0, -1], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who is the headmaster of Harvard University in the year 1947?", "Harvard University does not have a headmaster in 1947. || N/A"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, -1], "confidence": [0.7421875, -1], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who is the headmaster of Harvard University in the year 1947?", "Harvard University did not have a headmaster in 1947. || N/A"]]}, "hall_sbj_dict_light": {"answer_condition": [4, -1], "confidence": [0.8671875, -1], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who was the headmaster of Harvard University in the year 1947?", "Harvard University did not have a headmaster in 1947. || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [4, -1], "confidence": [0.365234375, -1], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who is the headmaster of Harvard University in the year 1947?", "Harvard University did not have a headmaster in 1947. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, -1], "confidence": [0.96875, -1], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who is the headmaster of Harvard University in the year 1947?", "Harvard University does not have a headmaster. It has a president. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, -1], "confidence": [0.203125, -1], "model_response": [["In which year was the Los Angeles Lakers founded?", "1948 || 1948"], ["Who was the headmaster of Harvard University in the year 1948?", "Harvard University did not have a headmaster in 1948. || N/A"]]}}, "hop2": {"mis_info_dict_light": {"answer_condition": [1, 4], "confidence": [0.255859375, 0.99609375], "model_response": [["In which year was the Los Angeles Lakers founded?", "1960 || 1960"], ["Who is the headmaster of Harvard University in the year 1960?", "John F. Kennedy || John F. Kennedy"]]}, "unrelated_fact_dict_severe": {"answer_condition": [4, -1], "confidence": [0.55859375, -1], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who is the headmaster of Harvard University in the year 1947?", "Harvard University did not have a headmaster in 1947. || N/A"]]}, "unrelated_fact_dict_light": {"answer_condition": [4, -1], "confidence": [0.5, -1], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who is the headmaster of Harvard University in the year 1947?", "Harvard University does not have a headmaster in 1947. || N/A"]]}, "mis_info_dict_severe": {"answer_condition": [4, -1], "confidence": [0.265625, -1], "model_response": [["In which year was the Los Angeles Lakers founded?", "1948 || 1948"], ["Who was the headmaster of Harvard University in the year 1948?", "Harvard University did not have a headmaster in 1948. || N/A"]]}, "hall_sbj_dict_severe": {"answer_condition": [4, 1], "confidence": [0.81640625, 0.98828125], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who was the headmaster of Harvard University in the year 1947?", "Harold R. Varmus || Harold R. Varmus"]]}, "hall_sbj_dict_light": {"answer_condition": [4, 1], "confidence": [0.5625, 0.73046875], "model_response": [["In which year was the Los Angeles Lakers founded?", "1947 || 1947"], ["Who is the headmaster of Harvard University in the year 1947?", "Harold R. Varmus || Harold R. Varmus"]]}}}
