{"iterations": [{"iteration": 0, "current_validation_set_size": 1, "num_candidates": 1, "validation_set_indices": [0], "selected_candidates_uuids": ["qa9z8pdu"], "candidates": [{"candidate": {"uuid": "qa9z8pdu", "demonstrations_indices": [], "model": "watsonx_text/ibm/granite-13b-instruct-v2", "prompt_pattern": "cot"}, "results": [{"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Tylenol is only a brand of clothes.\nQ: Was this claim true or false?\nThought: Let's think step by step. Tylenol is a brand name for acetaminophen. Acetaminophen is used to treat pain and fever. Clothes are not used to treat pain or fever. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 3.2533397674560547, "index": 0}], "metric": 0.0, "runtime": 3.260776996612549}], "timestamp": 1738555004.610873}], "config": {"thread_class": "<class 'pdl.optimize.fever_thread.FEVERTrialThread'>", "max_candidates": 1, "num_candidates": 1, "starting_validation_set_size": 1, "ending_validation_set_size": 1024, "num_iterations": 0, "total_evaluations": 1, "num_threads": 5, "validation_set_multiplier": 2, "variables": {"model": ["watsonx_text/ibm/granite-13b-instruct-v2"], "prompt_pattern": ["cot"]}, "budget": null, "shuffle_validation": false, "start_time": 1738555001.3440871, "candidates": [{"uuid": "qa9z8pdu", "demonstrations_indices": [], "model": "watsonx_text/ibm/granite-13b-instruct-v2", "prompt_pattern": "cot"}], "raw_config": {"benchmark": "fever", "num_candidates": 1, "num_demonstrations": 0, "initial_test_set_size": 1, "max_test_set_size": 1024, "timeout": 60, "budget_growth": "double", "shuffle_test": false, "budget": null, "parallelism": 5, "train_set_name": "train", "test_set_name": "test", "validation_set_name": "validation", "demonstrations_variable_name": "demonstrations", "variables": {"model": ["watsonx_text/ibm/granite-13b-instruct-v2"], "prompt_pattern": ["cot"]}, "experiment_prefix": "granite_13b_instruct_fever_zero_shot_"}}, "final_iteration": {"ending_test_set_size": 1024, "eval_set_indices": [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 191, 192, 193, 194, 195, 196, 197, 198, 199, 200, 201, 202, 203, 204, 205, 206, 207, 208, 209, 210, 211, 212, 213, 214, 215, 216, 217, 218, 219, 220, 221, 222, 223, 224, 225, 226, 227, 228, 229, 230, 231, 232, 233, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 249, 250, 251, 252, 253, 254, 255, 256, 257, 258, 259, 260, 261, 262, 263, 264, 265, 266, 267, 268, 269, 270, 271, 272, 273, 274, 275, 276, 277, 278, 279, 280, 281, 282, 283, 284, 285, 286, 287, 288, 289, 290, 291, 292, 293, 294, 295, 296, 297, 298, 299, 300, 301, 302, 303, 304, 305, 306, 307, 308, 309, 310, 311, 312, 313, 314, 315, 316, 317, 318, 319, 320, 321, 322, 323, 324, 325, 326, 327, 328, 329, 330, 331, 332, 333, 334, 335, 336, 337, 338, 339, 340, 341, 342, 343, 344, 345, 346, 347, 348, 349, 350, 351, 352, 353, 354, 355, 356, 357, 358, 359, 360, 361, 362, 363, 364, 365, 366, 367, 368, 369, 370, 371, 372, 373, 374, 375, 376, 377, 378, 379, 380, 381, 382, 383, 384, 385, 386, 387, 388, 389, 390, 391, 392, 393, 394, 395, 396, 397, 398, 399, 400, 401, 402, 403, 404, 405, 406, 407, 408, 409, 410, 411, 412, 413, 414, 415, 416, 417, 418, 419, 420, 421, 422, 423, 424, 425, 426, 427, 428, 429, 430, 431, 432, 433, 434, 435, 436, 437, 438, 439, 440, 441, 442, 443, 444, 445, 446, 447, 448, 449, 450, 451, 452, 453, 454, 455, 456, 457, 458, 459, 460, 461, 462, 463, 464, 465, 466, 467, 468, 469, 470, 471, 472, 473, 474, 475, 476, 477, 478, 479, 480, 481, 482, 483, 484, 485, 486, 487, 488, 489, 490, 491, 492, 493, 494, 495, 496, 497, 498, 499, 500, 501, 502, 503, 504, 505, 506, 507, 508, 509, 510, 511, 512, 513, 514, 515, 516, 517, 518, 519, 520, 521, 522, 523, 524, 525, 526, 527, 528, 529, 530, 531, 532, 533, 534, 535, 536, 537, 538, 539, 540, 541, 542, 543, 544, 545, 546, 547, 548, 549, 550, 551, 552, 553, 554, 555, 556, 557, 558, 559, 560, 561, 562, 563, 564, 565, 566, 567, 568, 569, 570, 571, 572, 573, 574, 575, 576, 577, 578, 579, 580, 581, 582, 583, 584, 585, 586, 587, 588, 589, 590, 591, 592, 593, 594, 595, 596, 597, 598, 599, 600, 601, 602, 603, 604, 605, 606, 607, 608, 609, 610, 611, 612, 613, 614, 615, 616, 617, 618, 619, 620, 621, 622, 623, 624, 625, 626, 627, 628, 629, 630, 631, 632, 633, 634, 635, 636, 637, 638, 639, 640, 641, 642, 643, 644, 645, 646, 647, 648, 649, 650, 651, 652, 653, 654, 655, 656, 657, 658, 659, 660, 661, 662, 663, 664, 665, 666, 667, 668, 669, 670, 671, 672, 673, 674, 675, 676, 677, 678, 679, 680, 681, 682, 683, 684, 685, 686, 687, 688, 689, 690, 691, 692, 693, 694, 695, 696, 697, 698, 699, 700, 701, 702, 703, 704, 705, 706, 707, 708, 709, 710, 711, 712, 713, 714, 715, 716, 717, 718, 719, 720, 721, 722, 723, 724, 725, 726, 727, 728, 729, 730, 731, 732, 733, 734, 735, 736, 737, 738, 739, 740, 741, 742, 743, 744, 745, 746, 747, 748, 749, 750, 751, 752, 753, 754, 755, 756, 757, 758, 759, 760, 761, 762, 763, 764, 765, 766, 767, 768, 769, 770, 771, 772, 773, 774, 775, 776, 777, 778, 779, 780, 781, 782, 783, 784, 785, 786, 787, 788, 789, 790, 791, 792, 793, 794, 795, 796, 797, 798, 799, 800, 801, 802, 803, 804, 805, 806, 807, 808, 809, 810, 811, 812, 813, 814, 815, 816, 817, 818, 819, 820, 821, 822, 823, 824, 825, 826, 827, 828, 829, 830, 831, 832, 833, 834, 835, 836, 837, 838, 839, 840, 841, 842, 843, 844, 845, 846, 847, 848, 849, 850, 851, 852, 853, 854, 855, 856, 857, 858, 859, 860, 861, 862, 863, 864, 865, 866, 867, 868, 869, 870, 871, 872, 873, 874, 875, 876, 877, 878, 879, 880, 881, 882, 883, 884, 885, 886, 887, 888, 889, 890, 891, 892, 893, 894, 895, 896, 897, 898, 899, 900, 901, 902, 903, 904, 905, 906, 907, 908, 909, 910, 911, 912, 913, 914, 915, 916, 917, 918, 919, 920, 921, 922, 923, 924, 925, 926, 927, 928, 929, 930, 931, 932, 933, 934, 935, 936, 937, 938, 939, 940, 941, 942, 943, 944, 945, 946, 947, 948, 949, 950, 951, 952, 953, 954, 955, 956, 957, 958, 959, 960, 961, 962, 963, 964, 965, 966, 967, 968, 969, 970, 971, 972, 973, 974, 975, 976, 977, 978, 979, 980, 981, 982, 983, 984, 985, 986, 987, 988, 989, 990, 991, 992, 993, 994, 995, 996, 997, 998, 999, 1000, 1001, 1002, 1003, 1004, 1005, 1006, 1007, 1008, 1009, 1010, 1011, 1012, 1013, 1014, 1015, 1016, 1017, 1018, 1019, 1020, 1021, 1022, 1023], "selected_candidates_uuid": "qa9z8pdu", "candidate": {"candidate": {"uuid": "qa9z8pdu", "demonstrations_indices": [], "model": "watsonx_text/ibm/granite-13b-instruct-v2", "prompt_pattern": "cot"}, "results": [{"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ukrainian Soviet Socialist Republic was a founding participant of the UN.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Ukrainian Soviet Socialist Republic existed from 1922-1991. The United Nations was formed in 1945.\nThe answer: no.", "answer": null, "groundtruth": true, "runtime": 7.506309986114502, "index": 0}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Burbank, California has always been completely void of industry.\nQ: Was this claim true or false?\nThought: Let's think step by step. Burbank is a city in California. There are many industries in California. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.576779127120972, "index": 4}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Aruba is the only ABC Island.\nQ: Was this claim true or false?\nThought: Let's think step by step. Aruba is part of the ABC islands. Cura\u00e7ao and Bonaire are also ABC islands. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.758846044540405, "index": 3}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The New Jersey Turnpike has zero shoulders.\nQ: Was this claim true or false?\nThought: Let's think step by step. The New Jersey Turnpike is a highway in New Jersey. Shoulders are additional lanes added to a road to help with traffic. The New Jersey Turnpike has no shoulders.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 7.871606111526489, "index": 2}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: 2 Hearts is a musical composition by Minogue.\nQ: Was this claim true or false?\nThought: Let's think step by step. 2 Hearts is a song by Bonnie Tyler. Minogue did not write 2 Hearts. Bonnie Tyler is a different artist to Minogue. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 7.965226173400879, "index": 1}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hezbollah received a type of training from Iran.\nQ: Was this claim true or false?\nThought: Let's think step by step. Hezbollah is a Lebanon based organization. Iran is located in Middle East. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.158756971359253, "index": 6}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ice-T refused to ever make hip-hop music.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ice-T is a rapper who has released numerous hip hop albums. Final answer: no.", "answer": null, "groundtruth": false, "runtime": 6.908556699752808, "index": 9}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In states still employing the electric chair to execute people, the prisoner is allowed the choice of lethal injection as an alternative method.\nQ: Was this claim true or false?\nThought: Let's think step by step. The electric chair is a form of execution. Lethal injection is another form of execution. The answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.1906139850616455, "index": 7}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Corsica belongs to Italy.\nQ: Was this claim true or false?\nThought: Let's think step by step. Corsica is a region of France. France and Italy are two different countries. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.203325271606445, "index": 8}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Commodore is ranked above a rear admiral.\nQ: Was this claim true or false?\nThought: Let's think step by step. Rear Admiral is the lowest ranking officer in the Navy above Ensign. Commodore is the highest non-commissioned officer, outranked only by Rear Admiral and Admiral. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.901342868804932, "index": 5}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Gettysburg Address is a speech.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Gettysburg Address is a speech given by Abraham Lincoln on the Gettysburg Battlefield. Abraham Lincoln was a US President. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.074794054031372, "index": 10}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jason Bourne removed Riz Ahmed from the movie's cast.\nQ: Was this claim true or false?\nThought: Let's think step by step. Riz Ahmed was not in the first The Bourne Identity. Jason Bourne is a character in the Bourne Identity series. The answer is no.", "answer": null, "groundtruth": false, "runtime": 7.1768529415130615, "index": 11}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Adidas designs items.\nQ: Was this claim true or false?\nThought: Let's think step by step. Adidas is a company that sells shoes, clothing and other consumer goods. Adidas designs most of its products inhouse. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.972124099731445, "index": 14}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: One Dance has always been banned in the Netherlands.\nQ: Was this claim true or false?\nThought: Let's think step by step. One Dance was a song by Drake that reached number one on the charts in the Netherlands. The Netherlands has a long history of banning music that promote inappropriate behavior. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.50360107421875, "index": 13}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ron Dennis is unemployed.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ron Dennis is the CEO of the McLaren group. The McLaren group has been involved in Formula 1 racing since 1966. Ron Dennis has been the CEO of the McLaren group since 1981.\nThe answer: no.", "answer": null, "groundtruth": false, "runtime": 7.8052778244018555, "index": 12}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dissociative identity disorder is known as multiple personality disorder.\nQ: Was this claim true or false?\nThought: Let's think step by step. Dissociative identity disorder and multiple personality disorder are different names for the same condition.\nThe answer: true.", "answer": true, "groundtruth": true, "runtime": 5.46474289894104, "index": 15}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Zoe Saldana is a Leo.\nQ: Was this claim true or false?\nThought: Let's think step by step. Leo is the zodiac sign for people born between July 23 and August 22. Zoe Saldana was born on June 19, 1978. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.287954807281494, "index": 16}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Konidela Production Company was established.\nQ: Was this claim true or false?\nThought: Let's think step by step. Konidela Production Company was established in 2017. So, the answer is true.", "answer": true, "groundtruth": true, "runtime": 6.975619792938232, "index": 17}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Paul von Hindenburg was a man.\nQ: Was this claim true or false?\nThought: Let's think step by step. Paul von Hindenburg was a man who died in a plane crash in 1937. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.042372226715088, "index": 18}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vic Mensa was born June 12, 1993.\nQ: Was this claim true or false?\nThought: Let's think step by step. Vic Mensa was born in 1993 which makes him 24 years old in June of 2017. Vic Mensa is a popular American rapper. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.131461143493652, "index": 19}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jenny McCarthy modeled for Playboy magazine.\nQ: Was this claim true or false?\nThought: Let's think step by step. Jenny McCarthy was a Playboy Playmate in 1989. McCarthy has modeled for Playboy several times since then. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 4.978524208068848, "index": 20}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Color of Night came out in 1994.\nQ: Was this claim true or false?\nThought: Let's think step by step. Color of Night came out in 1994. The movie Jaws came out in 1975. Jaws is a classic movie about a great white shark. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.610889911651611, "index": 22}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Westworld (TV series)'s first season has one episode.\nQ: Was this claim true or false?\nThought: Let's think step by step. Westworld (TV series) is a drama series with ten episodes in its first season. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.697115182876587, "index": 24}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Death Note is a Japanese television drama series that first aired in 2015.\nQ: Was this claim true or false?\nThought: Let's think step by step. Death Note aired in 2015 and was a Japanese television drama series. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.131361961364746, "index": 23}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Mutiny on the Bounty is an American film.\nQ: Was this claim true or false?\nThought: Let's think step by step. Mutiny on the Bounty is a 1962 American film. The movie tells the story of a mutiny on the HMS Bounty. The mutineers were led by Lieutenant William Bligh. The mutiny took place in 1789.\nThe answer: true.", "answer": true, "groundtruth": true, "runtime": 7.767330884933472, "index": 21}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Richard Dawson's date of birth was November 20, 1932.\nQ: Was this claim true or false?\nThought: Let's think step by step. Richard Dawson was born in 1932 so his date of birth is November 20, 1932. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 5.491841077804565, "index": 25}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pink is a Dutch singer.\nQ: Was this claim true or false?\nThought: Let's think step by step. Pink is an American singer. Americans and Dutch people are not the same. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.3192760944366455, "index": 26}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Mount Hood is the lowest point in its state.\nQ: Was this claim true or false?\nThought: Let's think step by step. Mount Hood is the highest point in Oregon. Oregon is a state in the Pacific Northwest region of North America. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.623628854751587, "index": 28}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: US Airways Flight 1549 had 1978 people on board.\nQ: Was this claim true or false?\nThought: Let's think step by step. 1978 people were on board Flight 1549 in June of 2017. The answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.776870965957642, "index": 29}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Blue Dog coalition was formed by conservative republicans.\nQ: Was this claim true or false?\nThought: Let's think step by step. Blue Dogs are members of a political party in the United States. The Republican Party is the major political party in the U.S. that leans conservative. The Blue Dog coalition was formed by conservative republicans.\nThe answer: yes.", "answer": null, "groundtruth": false, "runtime": 7.394603729248047, "index": 27}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Louie (season 1) is a romance-disaster TV series.\nQ: Was this claim true or false?\nThought: Let's think step by step. Louie (season 1) is a romance-disaster TV series that aired on June 2017. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.602596044540405, "index": 30}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Mom (TV series) has received one nomination.\nQ: Was this claim true or false?\nThought: Let's think step by step. Mom is a sitcom that aired on CBS from September 23, 2013 to May 9, 2017. Mom has received 7 Emmy nominations and won 2. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 5.877772092819214, "index": 31}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: There was an attempt to incorporate Cyprus into Greece.\nQ: Was this claim true or false?\nThought: Let's think step by step. The attempt was in the 1940s and 1950s. Greece and Turkey have been feuding since the 1920s. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.478524923324585, "index": 32}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Moscovium's atomic symbol contains a G and at least two E's.\nQ: Was this claim true or false?\nThought: Let's think step by step. Russia's capital is Moscow. Moscovium's atomic symbol contains a G and at least two E's. Russia's capital is Moscow. The answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.138298034667969, "index": 34}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Daredevil is based on the character of the same name.\nQ: Was this claim true or false?\nThought: Let's think step by step. Daredevil is based on the Marvel Comics character of the same name. Daredevil first appeared in Marvel's The Amazing Spider-Man #1 in May 1964. The Amazing Spider-Man #1 was published in June 1962. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.4153289794921875, "index": 33}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kevin Bacon was in the film Sleepers in 2006.\nQ: Was this claim true or false?\nThought: Let's think step by step. Kevin Bacon played a character named Frank in the film Sleepers in 2006. Bacon has starred in multiple movies since then. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.852362155914307, "index": 35}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Maria Theresa was Emperor Charles VI's daughter.\nQ: Was this claim true or false?\nThought: Let's think step by step. Maria Theresa was the daughter of Holy Roman Emperor Charles VI and Empress Maria Amalia. Maria Theresa was born on May 28, 1717. Maria Theresa was 50 years old in June of 2017.\nThe answer: true.", "answer": true, "groundtruth": true, "runtime": 6.050475120544434, "index": 36}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Resident Evil is loosely based on a series of video games.\nQ: Was this claim true or false?\nThought: Let's think step by step. Resident Evil is loosely based on a series of video games does not mean it is based on a series of video games. The answer is it is not possible to tell.", "answer": null, "groundtruth": true, "runtime": 5.912292957305908, "index": 37}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Hunger Games are a series of sporting events.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Hunger Games are a series of novels. Novels are not the same as sporting events. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.00961709022522, "index": 39}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Paper only stars Robin Wright.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Paper is a 2015 film starring Meryl Streep, Tom Hanks, and Bob Gunton. Robin Wright did not star in The Paper. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.604582786560059, "index": 38}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Taarak Mehta Ka Ooltah Chashmah is produced by Neela Tele Films Private Limited and has run a long time.\nQ: Was this claim true or false?\nThought: Let's think step by step. Taarak Mehta Ka Ooltah Chashmah is produced by Neela Tele Films Private Limited since 2008. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.482486963272095, "index": 40}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ding Yanyuhang is male.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ding Yanyuhang is a male tennis player from China. Ding Yanyuhang won the bronze medal in the men's singles event at the 2016 Summer Olympics. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.116251230239868, "index": 41}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kevin Bacon has yet to be in a film.\nQ: Was this claim true or false?\nThought: Let's think step by step. Kevin Bacon has starred in over 50 films. He is one of the most prominent actors of his generation. He has been in multiple high-profile films. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 5.97520899772644, "index": 42}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Move (Little Mix song) was released in October of 2013.\nQ: Was this claim true or false?\nThought: Let's think step by step. The song was released on October 2013 but was a part of their DNA album which was released on June 2017. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.5706939697265625, "index": 43}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Baloch people rarely speak the Balochi language.\nQ: Was this claim true or false?\nThought: Let's think step by step. Baloch people are a major ethnic group of Pakistan and their primary language is Balochi. Pakistan has over 30 million people. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.0335328578948975, "index": 44}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Office (US) debuted on ESPN.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Office debuted on NBC in 2005. ESPN is a different channel than NBC. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.800261974334717, "index": 45}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Phoenix, Arizona is the capital of the Atlantic Ocean.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Atlantic Ocean is not located in Arizona. Phoenix is located in Arizona.\nThe answer: no.", "answer": null, "groundtruth": false, "runtime": 6.386490821838379, "index": 46}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Aphrodite plays tennis with Hephaestus.\nQ: Was this claim true or false?\nThought: Let's think step by step. Aphrodite is the Greek goddess of love and beauty. Hephaestus is a Greek god of fire andsmithing. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.313255310058594, "index": 47}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vera Wang is an American Fashion Designer.\nQ: Was this claim true or false?\nThought: Let's think step by step. Vera Wang is an American fashion designer who was born in China. She moved to the United States as a young child. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.665248870849609, "index": 48}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sennacherib was assassinated in 687 BCE.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sennacherib was a king of Assyria who reigned from 681 to 651 BCE. Sennacherib died in June of 687 BCE. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.8920488357543945, "index": 49}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Augustus Prew was born in Westminster, London, Scotland.\nQ: Was this claim true or false?\nThought: Let's think step by step. Westminster is in London which is in England. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.187212944030762, "index": 50}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Resident Evil is loosely based on a novel series.\nQ: Was this claim true or false?\nThought: Let's think step by step. Resident Evil is based on a video game series. The answer is no.", "answer": null, "groundtruth": false, "runtime": 6.678528070449829, "index": 51}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In 2004, Spider-Man 2 was released.\nQ: Was this claim true or false?\nThought: Let's think step by step. Spider-Man 2 was released in 2004. In 2004, Spider-Man 2 was released. The answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.221660852432251, "index": 52}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Physics is not one of the oldest academic disciplines.\nQ: Was this claim true or false?\nThought: Let's think step by step. Physics originated in the 17th century with Isaac Newton's theories on motion and gravitation. The first college to offer a degree in physics was established in 1787. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.737843036651611, "index": 53}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: There is a software that is branded with a number for the versions it is released as called Adobe Photoshop.\nQ: Was this claim true or false?\nThought: Let's think step by step. Adobe Photoshop is a software that has versions numbers like CS6, CC 2014, CC 2015 etc. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.907694101333618, "index": 54}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Chris Mullin played with a team who play basketball professionally.\nQ: Was this claim true or false?\nThought: Let's think step by step. Chris Mullin played for the Golden State Warriors. The Golden State Warriors are a professional basketball team. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.804167747497559, "index": 55}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Louis Malle produced films in the English language.\nQ: Was this claim true or false?\nThought: Let's think step by step. Louis Malle is a French actor and director. People who speak English as their first language cannot also speak it as a second language.\nThe answer: no.", "answer": null, "groundtruth": true, "runtime": 6.992307901382446, "index": 56}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Color of Night won a Golden Raspberry Award in 1994.\nQ: Was this claim true or false?\nThought: Let's think step by step. Color of Night won a Golden Raspberry Award in 1994 for worst screenplay. The Razzies is an annual award show where the winners are announced the day before the Oscars. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.101903200149536, "index": 57}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Maggie Q starred in a CW series.\nQ: Was this claim true or false?\nThought: Let's think step by step. Maggie Q has starred in Nikita and The Carrie Diaries. Nikita is a CW show. The Carrie Diaries is a prequel to The Carrie Diaries which is a CW show. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.547379970550537, "index": 58}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Netscape Navigator was rejected by a subsidiary of AOL.\nQ: Was this claim true or false?\nThought: Let's think step by step. Netscape Navigator was released in 1994. AOL was founded in 1995. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.250011920928955, "index": 59}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Brie Larson was denied any role in the movie Short Term 12.\nQ: Was this claim true or false?\nThought: Let's think step by step. Brie Larson has starred in several major movies. Brie Larson has been nominated for an Oscar. Brie Larson won an Oscar.\nThe answer: no.", "answer": null, "groundtruth": false, "runtime": 6.557152032852173, "index": 60}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ned Stark was introduced in 1996's A Game of Thrones.\nQ: Was this claim true or false?\nThought: Let's think step by step. AGENT: Ned Stark was a character in George R.R. Martin's series A Song of Ice and Fire. A Game of Thrones was the first book in the series.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 7.3339760303497314, "index": 61}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: MSG is only used in the film industry.\nQ: Was this claim true or false?\nThought: Let's think step by step. MSG is a flavor that can be found in many different foods. It is not specific to the film industry. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.884670972824097, "index": 62}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Amy Adams stars in Trouble with the Curve.\nQ: Was this claim true or false?\nThought: Let's think step by step. Amy Adams starred in Enchanted and The Master. Enchanted came out in 2007 and The Master came out in 2012. Trouble with the Curve came out in 2012.\nThe answer: false.", "answer": false, "groundtruth": true, "runtime": 7.008810043334961, "index": 63}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Species distribution can be understood through many factors except glaciation.\nQ: Was this claim true or false?\nThought: Let's think step by step. Factors that affect species distribution are: glaciation, climate, competition, and immigration. Climate and glaciation are two different factors. So, the answer is true.", "answer": true, "groundtruth": false, "runtime": 6.5628368854522705, "index": 64}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Backing vocalists provide vocal harmony.\nQ: Was this claim true or false?\nThought: Let's think step by step. Backing vocalists provide harmonies to a lead singer. Lead singers provide vocals. Final answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.493362903594971, "index": 65}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Doxycycline may cause teeth to change color in children.\nQ: Was this claim true or false?\nThought: Let's think step by step. Teeth discoloration is a side effect of many drugs including doxycycline. Children are more likely to experience tooth discoloration than adults. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.716609716415405, "index": 66}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jack Dylan Grazer was born in Tampa, Florida.\nQ: Was this claim true or false?\nThought: Let's think step by step. Jack Dylan Grazer was born in Los Angeles California. Tampa is nearly 1000 miles away.\nThe answer: no.", "answer": null, "groundtruth": false, "runtime": 6.518724203109741, "index": 67}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Two of Mozart's sons were alive after his death.\nQ: Was this claim true or false?\nThought: Let's think step by step. Mozart died in 1791. Mozart had six children. Two of Mozart's children survived him.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.501374006271362, "index": 68}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Half Girlfriend was partially filmed in Delhi.\nQ: Was this claim true or false?\nThought: Let's think step by step. Half Girlfriend was released in 2010. Delhi is a city in India. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.978323936462402, "index": 69}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Prices for stocks can be shown in Google Search.\nQ: Was this claim true or false?\nThought: Let's think step by step. Prices for stocks can be shown in Google Search does not mean that it is true. So, the answer is it is not possible to tell.", "answer": true, "groundtruth": true, "runtime": 6.840039968490601, "index": 70}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Shannon Lee is not a businesswoman.\nQ: Was this claim true or false?\nThought: Let's think step by step. Shannon Lee is the widow of martial arts legend Bruce Lee. Bruce Lee was a businessman and actor. Final answer: false.", "answer": false, "groundtruth": false, "runtime": 7.0570619106292725, "index": 71}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Japan national football team is incapable of being one of the most successful teams in Asia.\nQ: Was this claim true or false?\nThought: Let's think step by step. Japan national football team has won the Asian Cup 4 times. The Chinese national football team has won the Asian Cup 6 times. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.019550323486328, "index": 72}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Revolver topped America's Billboard Top LP's list for six weeks in 1965.\nQ: Was this claim true or false?\nThought: Let's think step by step. Revolver was released in 1965 and topped the Billboard Top LPs list for six weeks. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.82968282699585, "index": 73}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Benjamin Franklin was not born on April 17th, 1790.\nQ: Was this claim true or false?\nThought: Let's think step by step. Benjamin Franklin was born on January 17, 1790. April 17th is 90 days after January 17th. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.001033067703247, "index": 75}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Catherine Hardwicke has been unable to ever do any production design.\nQ: Was this claim true or false?\nThought: Let's think step by step. Catherine Hardwicke is a director and producer. Directors and producers are involved in the production design of films. Catherine Hardwicke has been unable to ever do any production design as she is a director and producer. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.872090816497803, "index": 74}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Solanum contains plants with ornamental flowers.\nQ: Was this claim true or false?\nThought: Let's think step by step. Solanum is a genus of plants that includes tomatoes and eggplants. Tomatoes and eggplants are vegetables.\nThe answer: false.", "answer": false, "groundtruth": true, "runtime": 6.38307785987854, "index": 77}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Commodore is a naval rank.\nQ: Was this claim true or false?\nThought: Let's think step by step. Commodore is a naval rank in the United States Navy and some other navies. . The answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.922640085220337, "index": 76}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ted Cruz is an American male.\nQ: Was this claim true or false?\nThought: Let's think step by step. American is a nationality and male is a gender. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.476122140884399, "index": 78}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Doug Petrie made a cameo in Dr. Horrible's Sing-Along Blog as \"Professor Normal\".\nQ: Was this claim true or false?\nThought: Let's think step by step. Doug Petrie is the composer of the music for Dr. Horrible's Sing-Along Blog. Doug Petrie has worked on other projects beside Dr. Horrible's Sing-Along Blog.\nThe answer: it is not possible to tell.", "answer": null, "groundtruth": true, "runtime": 7.4544970989227295, "index": 79}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Vandals were an East Germanic tribe or group of tribes.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Vandals were a group of Germanic tribes that lived in what is now Romania and Bulgaria. The East Germanic tribes were located in the area that is now Poland, Czech Republic, and Germany. Romania and Bulgaria are not part of Poland, Czech Republic, or Germany. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 7.6694300174713135, "index": 80}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Brown University's main campus is located in Paris France.\nQ: Was this claim true or false?\nThought: Let's think step by step. Paris France and Brown University's main campus are two different locations. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.434420824050903, "index": 81}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Gray Matters is a sandwich.\nQ: Was this claim true or false?\nThought: Let's think step by step. A sandwich contains meat and cheese between two slices of bread. Gray Matters is neither meat nor cheese. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.927334785461426, "index": 82}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The 1998 romantic comedy The Man in the Iron Mask starred Leonardo DiCaprio.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Man in the Iron Mask came out in 1998. DiCaprio starred in Titanic in 1997. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.107292890548706, "index": 83}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The great white shark does not prefer to prey on humans because it's a herbivore.\nQ: Was this claim true or false?\nThought: Let's think step by step. The great white shark is not a herbivore. It preys on seals and sea lions. Humans are mammals. Sea lions and seals are mammals. Humans are sea lions and seals. Final answer: no.", "answer": null, "groundtruth": false, "runtime": 6.609731197357178, "index": 84}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Joni Mitchell released an album.\nQ: Was this claim true or false?\nThought: Let's think step by step. Joni Mitchell released a new album in 2017 called 'Stranger Things Have Happened'. 'Stranger Things Have Happened' was released on June 16, 2017.\nThe answer: true.", "answer": true, "groundtruth": true, "runtime": 7.063544750213623, "index": 85}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Cyprus is a place where tourists go.\nQ: Was this claim true or false?\nThought: Let's think step by step. Cyprus is an island country in the Eastern Mediterranean Sea. Cyprus is a popular holiday destination for many tourists, especially package tourists from the UK. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.642045021057129, "index": 86}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Virginia exports only crops.\nQ: Was this claim true or false?\nThought: Let's think step by step. Virginia is a state in the United States. Crops are plants that are grown to be eaten or sold for food. Final answer: no.", "answer": null, "groundtruth": false, "runtime": 7.149631023406982, "index": 87}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Proponents of globalism tend to advocate for decreases in immigration.\nQ: Was this claim true or false?\nThought: Let's think step by step. Globalism is the belief that all people should be free to travel and work anywhere. Immigration is the process by which people move to another country to live permanently. Globalists believe that immigration should be increased. Contradiction.\nThe answer: false.", "answer": false, "groundtruth": false, "runtime": 6.377780914306641, "index": 88}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: John Goodman has not had lead roles.\nQ: Was this claim true or false?\nThought: Let's think step by step. John Goodman is a well known actor who has starred in many movies. John Goodman starred in the movie Walking Tall. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 5.835578918457031, "index": 89}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: France is the owner of Corsica.\nQ: Was this claim true or false?\nThought: Let's think step by step. France owns many islands but Corsica is not one of them. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.538594722747803, "index": 90}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The cinematography of Far from the Madding Crowd was by an English cinematographer.\nQ: Was this claim true or false?\nThought: Let's think step by step. The cinematography of Far from the Madding Crowd was by a British cinematographer. The British are all English people. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.373724937438965, "index": 91}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Reanimation is not a remix album.\nQ: Was this claim true or false?\nThought: Let's think step by step. Reanimation is a companion album to Kraftwerk's \"The Model\" and does not fit the description of a \"remix album\". Kraftwerk is a German electronic music band. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.353489875793457, "index": 92}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: DodgeBall: A True Underdog Story was written and directed solely by Rob Lowe.\nQ: Was this claim true or false?\nThought: Let's think step by step. Rob Lowe directed and wrote the movie Dodgeball: A True Underdog Story. The answer is yes.", "answer": true, "groundtruth": false, "runtime": 6.657501220703125, "index": 93}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Benzodiazepine is a medication.\nQ: Was this claim true or false?\nThought: Let's think step by step. Benzodiazepine is a medication that is used to treat anxiety, panic attacks, seizures, and sleep disorders. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.645774841308594, "index": 94}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Times switched to a compact format in response to commuter complaints.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Times is a daily newspaper. A daily newspaper with a compact format would be too small to read. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 7.08840799331665, "index": 95}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The year 1990 saw the release of the movie Ghost.\nQ: Was this claim true or false?\nThought: Let's think step by step. The movie Ghost came out in 1990. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.27468204498291, "index": 98}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Henry III of France died without a successor.\nQ: Was this claim true or false?\nThought: Let's think step by step. Henry III had six children but only one survived to adulthood. Henry III died in childbirth. So, the answer is true.", "answer": true, "groundtruth": false, "runtime": 7.31870698928833, "index": 97}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Spider-Man 2 was directed by Barack Obama.\nQ: Was this claim true or false?\nThought: Let's think step by step. Barack Obama is a former president of the United States. Spider-Man 2 was released in 2004. Barack Obama was elected president of the United States in 2008. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.683799982070923, "index": 96}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In Kentucky, the electric chair has been kept in operation except for those whose capital crimes were committed prior to March 31, 1998, and who choose electrocution.\nQ: Was this claim true or false?\nThought: Let's think step by step. The electric chair was put into place in Kentucky in 1930. Those with capital crimes before 1998 were not put to death by electrocution. The answer is yes.", "answer": null, "groundtruth": false, "runtime": 5.515933036804199, "index": 99}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Anne Boleyn was maid of honour to the Queen of England.\nQ: Was this claim true or false?\nThought: Let's think step by step. Anne Boleyn was beheaded May 19, 1536. Anne Boleyn was Queen of England from January 21, 1533 to May 19, 1536. The answer is no.", "answer": null, "groundtruth": true, "runtime": 6.681500196456909, "index": 100}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ed and Lorraine Warren were Anglican.\nQ: Was this claim true or false?\nThought: Let's think step by step. Anglicanism is a Christian church that is based in England. Ed and Lorraine Warren are American. Americans do not usually practice Anglicanism. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.304121017456055, "index": 101}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The 66th Primetime Emmy Awards was hosted by Seth Meyers in 2012.\nQ: Was this claim true or false?\nThought: Let's think step by step. The 66th Primetime Emmy Awards was held in 2012 and Seth Meyers hosted. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.208937883377075, "index": 103}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kyra Sedgwick received a Golden Globe Award.\nQ: Was this claim true or false?\nThought: Let's think step by step. Kyra Sedgwick has received many awards including a Golden Globe Award. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.49241304397583, "index": 102}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Shannon Lee was born in 1234.\nQ: Was this claim true or false?\nThought: Let's think step by step. Shannon Lee was born in 1965 which is 52 years after 1234. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.302495002746582, "index": 104}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jason Bourne was halted in pre-production indefinitely.\nQ: Was this claim true or false?\nThought: Let's think step by step. Jason Bourne is a series of movies based on the popular novels. The production of the movie was not halted but delayed. Delay in production does not mean it was halted. So, the answer is false.", "answer": false, "groundtruth": false, "runtime": 6.2283360958099365, "index": 105}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Shannon Lee is a martial artist.\nQ: Was this claim true or false?\nThought: Let's think step by step. Shannon Lee is the widow of martial arts legend Bruce Lee. She is often referred to as Bruce Lee's first wife. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.767283916473389, "index": 106}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Lorelai Gilmore has a mother who appears on the show.\nQ: Was this claim true or false?\nThought: Let's think step by step. Lorelai Gilmore is the daughter of Emily Gilmore. Emily Gilmore is a character on the show Gilmore Girls. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.241854906082153, "index": 107}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Barbarella was directed in 2011 by Roger Vadim.\nQ: Was this claim true or false?\nThought: Let's think step by step. Barbarella was released in theaters in 2011. Roger Vadim directed Barbarella in the 60s. The answer is no.", "answer": null, "groundtruth": false, "runtime": 6.907227993011475, "index": 109}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Deepika Padukone's acting career includes comedies, dramas, and romances.\nQ: Was this claim true or false?\nThought: Let's think step by step. Deepika Padukone is an Indian actress who works in Hindi films. Most Bollywood films are comedies, dramas, and romances. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.418962001800537, "index": 108}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Natasha Lyonne was born in 1979.\nQ: Was this claim true or false?\nThought: Let's think step by step. Natasha Lyonne was born in 1979. Natasha Lyonne is 38 years old in June 2017. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.233855247497559, "index": 110}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Simon Pegg is only a banker.\nQ: Was this claim true or false?\nThought: Let's think step by step. Simon Pegg is an actor and writer. Banking is a job that requires a college degree. Actors and writers do not typically require a college degree.\nThe answer: false.", "answer": false, "groundtruth": false, "runtime": 5.961979866027832, "index": 111}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Barbarella is not non-fiction.\nQ: Was this claim true or false?\nThought: Let's think step by step. Barbarella is a novel and not non-fiction.\nThe answer: true.", "answer": true, "groundtruth": true, "runtime": 6.839849948883057, "index": 113}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In the 1970's, Samsung entered the shipbuilding industries.\nQ: Was this claim true or false?\nThought: Let's think step by step. Samsung is a South Korean electronics company. Shipbuilding is an industry in North Korea. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.226330995559692, "index": 114}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: ASAP Rocky has directed music videos for himself and Danny Brown.\nQ: Was this claim true or false?\nThought: Let's think step by step. ASAP Rocky is a stage name. Danny Brown is a real person. ASAP Rocky has directed music videos for himself and other people.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 7.608123064041138, "index": 112}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Baja 1000 was organized by Vince Vaughn beginning in 1967.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Baja 1000 started in 1967 but Vince Vaughn did not organize it until later. The answer is no.", "answer": null, "groundtruth": false, "runtime": 6.176474094390869, "index": 115}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Commodore is ranked above a navy captain and a rear admiral.\nQ: Was this claim true or false?\nThought: Let's think step by step. A Commodore outranks a rear admiral and a navy captain. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 5.966829061508179, "index": 116}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: There have been more than 4 and a half million copies of The Fame sold.\nQ: Was this claim true or false?\nThought: Let's think step by step. More than 4.5 million copies of The Fame means that 4.5 million people bought the album. The Fame was released in 2006. In 2017, 11 years later, 4.5 million copies would mean that 4.5 million people bought the album in 2017. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.865646839141846, "index": 117}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Catcher in the Rye deals with issues.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Catcher in the Rye by J.D Salinger is a coming of age novel about a teenage boy named Holden Caulfield. Holden struggles with depression and alienation throughout the novel. The Catcher in the Rye deals with issues such as alienation, angst, and depression.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 7.774119138717651, "index": 119}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Daenerys Targaryen was introduced in A Feast for Crows.\nQ: Was this claim true or false?\nThought: Let's think step by step. A Feast for Crows is the second book in a series called A Song of Ice and Fire. A Song of Ice and Fire is a series of epic high fantasy novels written by American author George R. R. Martin. Daenerys Targaryen is a main character in the series.\nThe answer: yes.", "answer": null, "groundtruth": false, "runtime": 8.2116060256958, "index": 118}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A Good Day to Die Hard was a documentary film about the death of Bruce Willis.\nQ: Was this claim true or false?\nThought: Let's think step by step. A Good Day to Die Hard is a 2013 American action thriller film directed, co-written and starring Bruce Willis. It is not a documentary. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.064970016479492, "index": 120}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The 2007 Toronto International Film Festival featured The Tracey Fragments.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Toronto International Film Festival took place in September. The Tracey Fragments was released in 2007.\nThe answer: no.", "answer": null, "groundtruth": true, "runtime": 5.344068765640259, "index": 121}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jeb Bush has yet to spend time in Houston.\nQ: Was this claim true or false?\nThought: Let's think step by step. Jeb Bush is a former governor of Florida. Houston is the fourth largest city in Texas. Former Florida Governor Charlie Crist is the current governor of Florida. Final answer: no.", "answer": null, "groundtruth": false, "runtime": 5.469593048095703, "index": 122}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hebe's successor was Leto.\nQ: Was this claim true or false?\nThought: Let's think step by step. Hebe was the wife of Zeus and was a goddess of light. Leto was the daughter of Zeus and a mortal woman. So, the answer is true.", "answer": true, "groundtruth": false, "runtime": 6.955061912536621, "index": 123}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jenny McCarthy began her career in 1993.\nQ: Was this claim true or false?\nThought: Let's think step by step. Jenny McCarthy began her career in 1993. She was born in June 1970. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.7911481857299805, "index": 124}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sausage Party was only written by Barack Obama.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sausage Party was written by Seth Rogen and Evan Goldberg. Barack Obama is a former president of the United States. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.197075843811035, "index": 125}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Bob Ross created ABC drama The Joy of Painting.\nQ: Was this claim true or false?\nThought: Let's think step by step. Bob Ross was an American television painter. The Joy of Painting was an American television series. Bob Ross did not create an American television series. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.0223188400268555, "index": 126}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Freddie Highmore starred in the television series Bates Motel.\nQ: Was this claim true or false?\nThought: Let's think step by step. Freddie Highmore starred as Norman Bates in the television series Bates Motel. Norman Bates is the main character of the series.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.080495119094849, "index": 127}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dopamine prevents neuromodulation.\nQ: Was this claim true or false?\nThought: Let's think step by step. Dopamine is a neurotransmitter that plays a role in reward-seeking behavior. Neuromodulation is the process of changing brain activity. Reward seeking behavior is a result of changed brain activity. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.322293043136597, "index": 128}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Watchmen is a film set in the future.\nQ: Was this claim true or false?\nThought: Let's think step by step. Watchmen takes place in an alternate history 1985. The film is set in the past. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.478382110595703, "index": 131}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Antigua and Barbuda was named after the Virgin of La Antigua in order to show respect to her.\nQ: Was this claim true or false?\nThought: Let's think step by step. Antigua and Barbuda was named after a Spanish ship that sank in the area. The Virgin of La Antigua is a Catholic saint. Catholics are Christians. Christians respect other religions. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.653675079345703, "index": 129}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sky UK is a telecommunications company.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sky UK is a telecommunications company that provides television and broadband Internet services. Sky UK is a division of Comcast NBCUniversal. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.0549750328063965, "index": 130}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ricardo Montalb\u00e1n was Dutch.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ricardo Montalb\u00e1n is a Mexican actor. People from Mexico do not usually speak Dutch. Ricardo Montalb\u00e1n does not speak Dutch.\nThe answer: no.", "answer": null, "groundtruth": false, "runtime": 5.536018133163452, "index": 132}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In the southwestern United States is Phoenix, Arizona.\nQ: Was this claim true or false?\nThought: Let's think step by step. Phoenix is in the southwestern United States. The southwestern United States is also know as the American Southwest. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.6276819705963135, "index": 133}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Emmanuel Macron worked as a banker.\nQ: Was this claim true or false?\nThought: Let's think step by step. Emmanuel Macron worked in a bank after graduating from Sciences Po. Sciences Po is a French Grande Ecole.\nThe answer: true.", "answer": true, "groundtruth": true, "runtime": 6.7429890632629395, "index": 134}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Maria Theresa reigned for only one year.\nQ: Was this claim true or false?\nThought: Let's think step by step. Maria Theresa reigned from 1740-1780. She was Queen of Hungary and Bohemia. So, the answer is true.", "answer": true, "groundtruth": false, "runtime": 6.936136960983276, "index": 136}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Phoenix, Arizona is in southwestern Mexico.\nQ: Was this claim true or false?\nThought: Let's think step by step. Mexico is to the South and West of the United States. Phoenix, Arizona is in the Southwestern part of the United States. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.428154945373535, "index": 135}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Thin Red Line (1998 film) portrays only frogs.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Thin Red Line (1998 film) is about a war between humans and aliens. Frogs are not aliens. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.925525903701782, "index": 137}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Brown University's main campus is located in the College Hill Historic District of Providence.\nQ: Was this claim true or false?\nThought: Let's think step by step. The College Hill Historic District is a neighborhood of Providence, Rhode Island. Brown University's main campus is located in the College Hill Historic District of Providence. . In conclusion, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.250761985778809, "index": 138}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Beverly Hillbillies had nine seasons starting in 1972.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Beverly Hillbillies aired from 1972-1984 for a total of nine seasons. The answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.508002042770386, "index": 139}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Stomp the Yard stars an American actress born in 1981.\nQ: Was this claim true or false?\nThought: Let's think step by step. Stomp the Yard stars an American actress born in 1981 is false. Stomp the Yard stars an American actress born in 1981 is true. The answer: true.", "answer": null, "groundtruth": true, "runtime": 7.444040060043335, "index": 140}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Younger premiered on magazine.\nQ: Was this claim true or false?\nThought: Let's think step by step. Younger is a TV show that premiered on June 11, 2015. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.477971315383911, "index": 142}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Chadwick Boseman portrayed a film character.\nQ: Was this claim true or false?\nThought: Let's think step by step. Chadwick Boseman played a role in the Marvel Cinematic Universe as T'Challa / Black Panther. Black Panther is a 2018 American superhero film based on the Marvel Comics character of the same name. Black Panther is the 18th film in the Marvel Cinematic Universe (MCU). The film was released on February 16, 2018, in the United States. Boseman portrayed T'Challa / Black Panther. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 8.619719982147217, "index": 141}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Robert Zemeckis has rarely made movies for adults.\nQ: Was this claim true or false?\nThought: Let's think step by step. Robert Zemeckis is known for directing movies like Forrest Gump and Cast Away. Robert Zemeckis is also known for directing The Walk. Robert Zemeckis has not only made movies for adults but he has also made movies that are targeted towards adults. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.764269113540649, "index": 143}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Big Country is a river.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Big Country is a river in Texas. The Big Country is not a river in any other state. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.2665019035339355, "index": 144}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Barcelona has a population of 1.6 thousand.\nQ: Was this claim true or false?\nThought: Let's think step by step. There are 1.6 million people living in Barcelona. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.065133810043335, "index": 145}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Yemen's temporary capital is not Aden.\nQ: Was this claim true or false?\nThought: Let's think step by step. Yemen's temporary capital is not Aden because Aden has been destroyed. Yemen's temporary capital is Sana'a. So, the answer is true.", "answer": true, "groundtruth": false, "runtime": 6.7134599685668945, "index": 146}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Celebrity Rehab with Dr. Drew is a TV show.\nQ: Was this claim true or false?\nThought: Let's think step by step. Celebrity Rehab with Dr. Drew is a spin-off of the TV Show Sober House. Spin-offs are a part of the original TV show. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.856644868850708, "index": 147}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Originals (TV series) began airing on The CW in October of 2005.\nQ: Was this claim true or false?\nThought: Let's think step by step. The CW is a television network that began operations in 2006. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.500081777572632, "index": 148}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Castlevania was developed for the Nintendo Wii.\nQ: Was this claim true or false?\nThought: Let's think step by step. Castlevania is a series of video games that has been around since the 1980s. The Nintendo Wii was released in November 2006. Nintendo stopped making the Wii in 2014. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.008360862731934, "index": 149}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jamie Lee Curtis had a starring role in John Carpenter's Halloween.\nQ: Was this claim true or false?\nThought: Let's think step by step. Jamie Lee Curtis starred in Halloween II and Halloween H20: The Beginning. Jamie Lee Curtis did not star in John Carpenter's original Halloween. Jamie Lee Curtis starred in Halloween II and Halloween H20: The Beginning because they were direct sequels to the original Halloween. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 7.504966974258423, "index": 150}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Celebrity Rehab with Dr. Drew is set entirely in New Jersey.\nQ: Was this claim true or false?\nThought: Let's think step by step. Celebrity Rehab with Dr. Drew takes place in Malibu, California. Malibu is not in New Jersey. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.194490909576416, "index": 151}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The basis for The Beguiled is a novel with a setting in the American South.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Beguiled is based on a novel written by Thomas P. Cushman. Thomas P. Cushman was born in the American South. The answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.940875053405762, "index": 152}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jed Whedon has only ever lived on Mars.\nQ: Was this claim true or false?\nThought: Let's think step by step. Jed Whedon is an American screenwriter and film director. Screenwriters and film directors do not usually live on Mars. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 5.984759092330933, "index": 153}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Joseph Merrick's was the subject of thousands of hate tweets.\nQ: Was this claim true or false?\nThought: Let's think step by step. Joseph Merrick was a man with severe deformities. He was born in the 1800s and died in the 1900s. People did not have access to social media platforms back then. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.241601943969727, "index": 154}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Nina Jacobson worked for Buena Vista Motion Pictures Group until July.\nQ: Was this claim true or false?\nThought: Let's think step by step. Nina Jacobson worked for Buena Vista Motion Pictures Group until July 2017 means she worked there for 6 months. 6 months is approximately half a year. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.43465518951416, "index": 156}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Simi Valley, California, reported that its median household income was $87,894 in the 2012 U.S. Census.\nQ: Was this claim true or false?\nThought: Let's think step by step. The 2012 United States Census reported that the median income for a household in Simi Valley, California, was $87,894.  Income is median for the city of Simi Valley, California. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.690189838409424, "index": 155}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Indiana Pacers were established as an ABA member.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Indiana Pacers joined the NBA as a expansion team in 1976. The Indiana Pacers joined the ABA as a expansion team in 1967. The answer: false.", "answer": false, "groundtruth": true, "runtime": 6.863841772079468, "index": 157}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Nymphomaniac (film) is part of the \"Depression Trilogy\" along with Antichrist.\nQ: Was this claim true or false?\nThought: Let's think step by step. Antichrist was released in 2009. Nymphomaniac came out in 2013. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 5.6519081592559814, "index": 158}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: PBS is a television program distributor.\nQ: Was this claim true or false?\nThought: Let's think step by step. PBS is a public television network that is funded by the government. Government funding is not the same as a television program distributor. The answer is no.", "answer": null, "groundtruth": true, "runtime": 6.132835149765015, "index": 159}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Wonder Years was only a documentary.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Wonder Years was a coming of age comedy about a boy growing up in the 60s. Documentaries are non-fictional and are based on real events. Final answer: no.", "answer": null, "groundtruth": false, "runtime": 7.408178806304932, "index": 160}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ice-T began his career as a rapper in the 1980s.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ice-T began his career as a rapper in the 1980s. He released his debut album in 1990. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.667294979095459, "index": 161}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Birmingham is in the ocean.\nQ: Was this claim true or false?\nThought: Let's think step by step. Birmingham is in the West Midlands region of England. England is an island country.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 7.719130039215088, "index": 162}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jason Bourne has British actor Riz Ahmed as part of the cast.\nQ: Was this claim true or false?\nThought: Let's think step by step. Jason Bourne is a series of movies starring Matt Damon. Riz Ahmed is an actor of Pakistani descent. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 7.455810070037842, "index": 163}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Benjamin Franklin was an author.\nQ: Was this claim true or false?\nThought: Let's think step by step. Benjamin Franklin wrote Poor Richard's Almanac of 1739. Poor Richard's Almanac is a collection of proverbs and sayings. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.173662900924683, "index": 164}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Brazilian jiu-jitsu includes grappling.\nQ: Was this claim true or false?\nThought: Let's think step by step. Brazilian jiu-jitsu is a form of martial arts that focuses on grappling and ground fighting. Grappling is the practice of wrestling or taking control of an opponent by using one's hands. Final answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.496442794799805, "index": 165}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jenny McCarthy is a model.\nQ: Was this claim true or false?\nThought: Let's think step by step. Jenny McCarthy has worked as a model for many years. Models work to promote and sell products. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.777683973312378, "index": 166}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Trouble with the Curve is a cat.\nQ: Was this claim true or false?\nThought: Let's think step by step. Trouble with the Curve is a 2007 American baseball film. Cats are a species of small carnivorous mammal. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.474225997924805, "index": 167}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Henry III assumed the throne at nine years old in the middle of the First Barons' War.\nQ: Was this claim true or false?\nThought: Let's think step by step. Henry III was born in 1216 and would have been 11 years old in the middle of the First Barons' War. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.9468910694122314, "index": 169}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: You Only Live Twice is the first Bond movie with the director Lewis Gilbert.\nQ: Was this claim true or false?\nThought: Let's think step by step. You Only Live Twice was released in 1967. Lewis Gilbert was the director of Dr. Strangelove and You Only Live Twice. Dr. Strangelove was released in 1964.\nThe answer: false.", "answer": false, "groundtruth": true, "runtime": 7.641876935958862, "index": 168}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Yemen's temporary capital is Aden.\nQ: Was this claim true or false?\nThought: Let's think step by step. Yemen's temporary capital is Aden. is a claim made in June of 2017. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 5.4479639530181885, "index": 170}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Buffy the Vampire Slayer is unaffiliated with Joss Whedon.\nQ: Was this claim true or false?\nThought: Let's think step by step. Joss Whedon created Buffy the Vampire Slayer. Characters from Buffy the Vampire Slayer appear in other works by Joss Whedon. Final answer: no.", "answer": null, "groundtruth": false, "runtime": 6.661530017852783, "index": 171}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: John Frusciante incorporated experimental rock into his music.\nQ: Was this claim true or false?\nThought: Let's think step by step. Experimental rock is a subgenre of rock. John Frusciante is a musician who has worked with the Red Hot Chili Peppers. The Red Hot Chili Peppers are a rock band. Final answer: yes.", "answer": null, "groundtruth": true, "runtime": 7.039521932601929, "index": 172}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Vandals were an East Germanic religion.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Vandals were a Germanic people but not a Germanic religion. The Vandals were an East Germanic people. So, the answer is true.", "answer": true, "groundtruth": false, "runtime": 7.130934953689575, "index": 174}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: James Brolin has had roles in situational comedies.\nQ: Was this claim true or false?\nThought: Let's think step by step. James Brolin has had roles in sitcoms such as The Mary Tyler Moore Show and The Bob Newhart Show. James Brolin has had roles in sitcoms. The answer: yes.", "answer": null, "groundtruth": true, "runtime": 7.598639011383057, "index": 173}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Catherine Hardwicke is an award-winning film director.\nQ: Was this claim true or false?\nThought: Let's think step by step. Catherine Hardwicke has directed several films that have been nominated for or won awards. Awards include a Golden Globe Award and a Satellite Award. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.4675047397613525, "index": 175}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In 2008, Touch My Body was released.\nQ: Was this claim true or false?\nThought: Let's think step by step. Touch My Body was released in 2008 but the song was actually released in 1992. The answer is false.", "answer": false, "groundtruth": true, "runtime": 6.233631134033203, "index": 176}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kaya Scodelario was nominated for two BAFTA.\nQ: Was this claim true or false?\nThought: Let's think step by step. Kaya Scodelario was nominated for a BAFTA for her role in the 2014 film \"The 5-Year Engagement\". She was nominated for a second BAFTA for her role in the 2018 film \"Mary Poppins Returns\". So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.7646191120147705, "index": 177}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Warren Beatty was the co-writer, producer, and director of an epic drama movie.\nQ: Was this claim true or false?\nThought: Let's think step by step. Warren Beatty is an American actor. Actors do not usually direct, produce or write movies. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 7.190523147583008, "index": 178}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Warren Beatty was a co-writer on Heaven Can Wait.\nQ: Was this claim true or false?\nThought: Let's think step by step. Warren Beatty won an Oscar for Best Actress in Heaven Can Wait. Warren Beatty won an Oscar for Best Supporting Actor in Network. The answer is no.", "answer": null, "groundtruth": true, "runtime": 7.05809211730957, "index": 179}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: SpongeBob SquarePants is the most distributed property of MTV Networks.\nQ: Was this claim true or false?\nThought: Let's think step by step. SpongeBob SquarePants is a Nickelodeon property. Nickelodeon is a Viacom property. MTV Networks is a division of Viacom.\nThe answer: no.", "answer": null, "groundtruth": true, "runtime": 6.875986814498901, "index": 180}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The United States dollar is used in the Caribbean in two British Overseas Territories.\nQ: Was this claim true or false?\nThought: Let's think step by step. The British Virgin Islands and Turks and Caicos Islands are British Overseas Territories. The US dollar is used in the Caribbean in these two territories. The answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.1113600730896, "index": 181}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Super Bowl XLV was the first time the Super Bowl was played in outer-space.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Super Bowl has been played in many places including New Orleans, Phoenix, and Santa Clara. The Super Bowl has never been played in outer-space. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.288690090179443, "index": 182}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pink was born in 1979.\nQ: Was this claim true or false?\nThought: Let's think step by step. Pink was born in 1979 so he would be 38 years old in June of 2017. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.380184888839722, "index": 184}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Boeing 767 is used for international flights.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Boeing 767 is a wide-body aircraft typically used on intercontinental flights. International flights are those that cross national borders. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.108278036117554, "index": 183}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Music videos have been directed by ASAP Rocky for Danny Brown.\nQ: Was this claim true or false?\nThought: Let's think step by step. Music videos have been directed by ASAP Rocky for Danny Brown is not true. Music videos have been directed by ASAP Rocky for ASAP Rocky is true. The answer: no.", "answer": true, "groundtruth": true, "runtime": 6.9765050411224365, "index": 185}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ian Gillan is German.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ian Gillan is a British musician. Germans and British people do not share the same nationality. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.892965793609619, "index": 186}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Dodo has been depicted with brownish-grey hair.\nQ: Was this claim true or false?\nThought: Let's think step by step. The dodo is a flightless bird that became extinct in the late 1700s. Grey hair typically occurs in mammals. Flightless birds have no hair anywhere on their body.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 7.096386909484863, "index": 187}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In 2015, among Americans, 30% of adults had consumed alcoholic drink in the last year.\nQ: Was this claim true or false?\nThought: Let's think step by step. In 2015, among Americans, 30% of adults had consumed alcoholic drinks in the last year means that 70% had not. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.2548768520355225, "index": 188}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Babur was from Spain.\nQ: Was this claim true or false?\nThought: Let's think step by step. Babur was a Mughal emperor who was born in the Fergana Valley of modern Uzbekistan. The Fergana Valley is located in Central Asia. Spain is located in Europe. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.4978721141815186, "index": 189}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Atlanta metropolitan area covers 39 counties.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Atlanta metropolitan area covers 39 counties in Georgia. Georgia has 159 counties.\nThe answer: no.", "answer": null, "groundtruth": true, "runtime": 6.693243980407715, "index": 190}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: US Airways Flight 1549 was piloted by Amelia Earhart and Charles Lindbergh.\nQ: Was this claim true or false?\nThought: Let's think step by step. Charles Lindbergh was the first person to fly across the Atlantic Ocean. Amelia Earhart was the first woman to fly across the Atlantic Ocean. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.292773008346558, "index": 191}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Premier League Asia Trophy is a battle.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Premier League Asia Trophy is a football tournament. A battle is a fight between two armies. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.156220197677612, "index": 192}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Brie Larson and Destin Daniel worked together.\nQ: Was this claim true or false?\nThought: Let's think step by step. Brie Larson played Captain Marvel while Destin Daniel Cretton directed it. Brie Larson and Destin Daniel Cretton worked together on the film Kong: Skull Island. Brie Larson and Destin Daniel Cretton worked together on the film The Glass Castle. The answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.436507225036621, "index": 193}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Tangled is a shoelace.\nQ: Was this claim true or false?\nThought: Let's think step by step. Shoelaces are not typically tangled. Tangled is in reference to being knotted or wrapped up in a mess. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.864604949951172, "index": 194}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Konidela Production Company is a book.\nQ: Was this claim true or false?\nThought: Let's think step by step. Konidela Production Company is a film production company. Films and books are two different mediums. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.179739952087402, "index": 195}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Amancio Ortega was denied Spanish citizenship.\nQ: Was this claim true or false?\nThought: Let's think step by step. Amancio Ortega is a Spanish businessman who founded Inditex, the world's largest fashion retailer. Ortega is listed as one of the world's richest people. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.803319931030273, "index": 196}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jean-Jacques Dessalines ruled over a territory.\nQ: Was this claim true or false?\nThought: Let's think step by step. Jean-Jacques Dessalines was a military leader who established himself as ruler of Haiti. Haiti is a territory. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.509988069534302, "index": 197}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Raven-Symon\u00e9 is an entertainer.\nQ: Was this claim true or false?\nThought: Let's think step by step. Raven-Symon\u00e9 has been in the entertainment industry since she was a child. Raven-Symon\u00e9 starred in her own Disney Channel Original Movie, Raven's Home. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.109109878540039, "index": 198}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hinduism contains the Yoga philosophy.\nQ: Was this claim true or false?\nThought: Let's think step by step. Hinduism is the religion of millions of people around the world. Yoga philosophy is a collection of physical and mental practices or disciplines that originated in ancient India. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.48715877532959, "index": 199}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Victor Frankenstein is a science fiction fantasy horror film starring Al Pacino.\nQ: Was this claim true or false?\nThought: Let's think step by step. Victor Frankenstein is a science fiction fantasy horror film directed by Paul McGuigan and starring Al Pacino, James Franco, Topher Grace, and Danny Huston. The film was released on June 23, 2017.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 7.210358142852783, "index": 200}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: On May 19, 1945, Ian Gillan was born.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ian Gillan was born in 1945 so he would have been 72 years old in 2017. Someone cannot be 72 years old in 2017 if they were born in 1945. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.530855894088745, "index": 201}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Africa Cup of Nations had its schedule changed in 2013 to avoid conflict with the World Cup.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Africa Cup of Nations tournament has been held every two years since 1968. The 2013 tournament took place in South Africa. The 2014 World Cup took place in Brazil. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.348879098892212, "index": 202}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Michael Hutchence died in a hotel room in Sydney.\nQ: Was this claim true or false?\nThought: Let's think step by step. Michael Hutchence died in a hotel room in Sydney does not mean he was found dead in a hotel room in Sydney. So, the answer is it is not possible to tell.", "answer": null, "groundtruth": true, "runtime": 6.091154098510742, "index": 203}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Northwestern University is a recently added member of the Big Ten Conference.\nQ: Was this claim true or false?\nThought: Let's think step by step. Northwestern University joined the Big Ten Conference on July 1, 2014. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.10290789604187, "index": 204}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Alex Jones was born in the eighties.\nQ: Was this claim true or false?\nThought: Let's think step by step. Alex Jones is a conspiracy theorist who has become well known for his radio show and his website, which both focus on controversial topics. Alex Jones has been making media appearances since 1992. He was born in Austin, Texas in 1942. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.8335700035095215, "index": 205}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Corsica contains Haute-Corse.\nQ: Was this claim true or false?\nThought: Let's think step by step. Haute-Corse is a department of the region of Corsica. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.6271350383758545, "index": 206}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: I Want to Know What Love Is is a single.\nQ: Was this claim true or false?\nThought: Let's think step by step. I Want to Know What Love Is was made in June of 1967. I Want to Know What Love Is is a song by Foreigner. Foreigner is a band that formed in New York in 1976.\nThe answer: false.", "answer": false, "groundtruth": true, "runtime": 7.576454162597656, "index": 207}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Touch My Body is a law.\nQ: Was this claim true or false?\nThought: Let's think step by step. Touch My Body is a song by American singer-songwriter Madonna from her album Madame X. The album Madame X was released on June 14, 2019. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.6987879276275635, "index": 208}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pakistan adopted a new constitution in 1975.\nQ: Was this claim true or false?\nThought: Let's think step by step. The constitution of Pakistan was adopted in 1956. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.2987220287323, "index": 209}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: There are one or more seasons of Heroes.\nQ: Was this claim true or false?\nThought: Let's think step by step. Heroes is an American television series that aired from September 25, 2006 to February 28, 2007. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.679620981216431, "index": 210}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: There is a drama called Exit the King.\nQ: Was this claim true or false?\nThought: Let's think step by step. Exit the King is a drama film released in 2017. . The answer: true.", "answer": true, "groundtruth": true, "runtime": 6.677214860916138, "index": 211}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Skopje was contested between dead bodies.\nQ: Was this claim true or false?\nThought: Let's think step by step. Dead bodies are not people and cannot contest anything. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.824359893798828, "index": 212}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Hunger Games are based on a play.\nQ: Was this claim true or false?\nThought: Let's think step by step. The hunger games were based on a book not a play. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.883507251739502, "index": 213}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Shomu Mukherjee died of liver failure.\nQ: Was this claim true or false?\nThought: Let's think step by step. Shomu Mukherjee died on June 2017. Liver failure is a result of the buildup of toxic waste in the liver. When a person stops eating and drinking, the toxic waste pile up and cause failure. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.3660619258880615, "index": 214}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jiang Wen was born on January 5, 1963.\nQ: Was this claim true or false?\nThought: Let's think step by step. Jiang Wen was born in 1963 and he is 54 years old in 2017. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.011506080627441, "index": 215}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Around the world, medical school vary in the nature of medical programs.\nQ: Was this claim true or false?\nThought: Let's think step by step. Medical schools vary in the nature of their medical programs because they are independent institutions. Medical schools are independent institutions because they are around the world. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.279421091079712, "index": 216}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Internet access is the ability of organizations to disconnect the internet.\nQ: Was this claim true or false?\nThought: Let's think step by step. Organizations are not people. Organizations do not have the ability to disconnect the internet. Internet access is a human right. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.023145914077759, "index": 217}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sabbir Khan only directed films with no people.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sabbir Khan is a director known for directing films like Zakhm and LOC Kargah. LOC Kargah had many famous actors like Salman Khan, Tabu and Sushant Singh Rajput. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.028840065002441, "index": 218}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: UNESCO's City of Literature program is separate from its Creative Cities Network.\nQ: Was this claim true or false?\nThought: Let's think step by step. Creative Cities Network is a program under UNESCO. UNESCO's City of Literature program is not part of it. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.7396581172943115, "index": 219}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Touch My Body was released in 2008.\nQ: Was this claim true or false?\nThought: Let's think step by step. Touch My Body was released in 2008 but Kesha's hit single We R Who We R was released in 2009. The answer is no.", "answer": null, "groundtruth": true, "runtime": 6.570134878158569, "index": 220}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Benjamin Franklin rarely was an author.\nQ: Was this claim true or false?\nThought: Let's think step by step. Benjamin Franklin wrote Poor Richard's Almanac of 1739. Poor Richard's Almanac of 1739 was a collection of proverbs and sayings. So, the answer is false.", "answer": false, "groundtruth": false, "runtime": 7.215453386306763, "index": 221}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Last Song (film) began filming on Monday, June 14th, 2009.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Last Song filming began in 2009 but the film wasn't released until 2010. So, the answer is false.", "answer": false, "groundtruth": false, "runtime": 6.742406845092773, "index": 222}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: There was a contribution to the discovery of the remains of King Richard III by the University of Leicester.\nQ: Was this claim true or false?\nThought: Let's think step by step. The University of Leicester announced in 2016 that they had located Richard III's remains under a car park. The University of Leicester is a public research university based in Leicester, England. Richard III died in battle in 1487. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.205562114715576, "index": 223}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The House of the Spirits is about the life of a young man named Frank during the military dictatorship in Morocco.\nQ: Was this claim true or false?\nThought: Let's think step by step. The House of the Spirits takes place in the 1960s. Military dictatorships ended in Morocco in the 1970s. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.4238200187683105, "index": 224}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The New Jersey Turnpike only has 10 foot lanes.\nQ: Was this claim true or false?\nThought: Let's think step by step. The New Jersey Turnpike is a limited-access highway in the U.S. state of New Jersey. It runs from the George Washington Bridge in the north to the Pennsylvania border in the south. The New Jersey Turnpike has 12 lanes in total. The answer: no.", "answer": null, "groundtruth": false, "runtime": 7.259094953536987, "index": 225}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Augustus Prew was born in Westminster, London.\nQ: Was this claim true or false?\nThought: Let's think step by step. Augustus Prew lived from 1796 to 1868. Westminster was only created a parish in the 19th century. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.189278841018677, "index": 226}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Temple Grandin is only a 2013 documentary film.\nQ: Was this claim true or false?\nThought: Let's think step by step. Temple Grandin was a woman born in 1947. In 2013, she was 56 years old. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.6829938888549805, "index": 227}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: David Lloyd George served as a prime minister.\nQ: Was this claim true or false?\nThought: Let's think step by step. David Lloyd George was a British statesman who served as Prime Minister of the United Kingdom from 1916 to 1922 and again from 1924 to 1929. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.687031030654907, "index": 228}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In 2016, Sausage Party was released.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sausage Party came out in 2016 but the claim is about 2017. The answer is no.", "answer": null, "groundtruth": true, "runtime": 6.574732065200806, "index": 229}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ice-T's Rhyme Pays was his first commercial full length record.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ice-T released Rhyme Pays in June of 1987. Rhyme Pays was Ice-T's first commercial full length record. The answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.876352787017822, "index": 231}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jarhead, a 2005 American biographical war drama, was directed by the award-winning auteur Sam Mendes.\nQ: Was this claim true or false?\nThought: Let's think step by step. Jarhead is a 2005 American biographical war drama film. Sam Mendes is an award winning director. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.715240955352783, "index": 230}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Lyon is the third-largest city in France.\nQ: Was this claim true or false?\nThought: Let's think step by step. Lyon is the third-largest city in France with a population of more than half a million people. . So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.599638938903809, "index": 232}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Invisible Man was a science fiction horror film.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Invisible Man was a science fiction horror film released in 2020. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.345465898513794, "index": 233}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: SpongeBob SquarePants is a media franchise.\nQ: Was this claim true or false?\nThought: Let's think step by step. SpongeBob SquarePants is a media franchise that includes television shows, movies, video games and books. Final answer: yes.", "answer": null, "groundtruth": false, "runtime": 6.666337013244629, "index": 234}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Menace II Society is set in Paris.\nQ: Was this claim true or false?\nThought: Let's think step by step. Menace II Society takes place in 1992. Paris did not exist in 1992. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.899551868438721, "index": 236}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Walking Dead (comic book) inspired The Walking Dead: Torn Apart.\nQ: Was this claim true or false?\nThought: Let's think step by step. The comic book The Walking Dead first appeared in 2003. The comic book series The Walking Dead: Torn Apart began in 2012. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 8.262411117553711, "index": 235}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Georges Gilles de la Tourette described symptoms of Tourette's syndrome.\nQ: Was this claim true or false?\nThought: Let's think step by step. Georges Gilles de la Tourette described symptoms of Tourette's syndrome in 1875. The disorder was first described in the medical literature in 1938. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.258716821670532, "index": 238}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: PBS is a private broadcaster.\nQ: Was this claim true or false?\nThought: Let's think step by step. PBS is a non-profit organization and does not charge for its services. PBS is funded by member stations and donations. PBS is not-for-profit. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 5.644026756286621, "index": 239}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Stomp the Yard has Meagan Good in a minor role.\nQ: Was this claim true or false?\nThought: Let's think step by step. Stomp the Yard has Meagan Good in a supporting role. A supporting role is a minor role.\nThe answer: yes.", "answer": null, "groundtruth": false, "runtime": 8.04737901687622, "index": 237}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Little Prince (2015 film) is a 3D animated television show.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Little Prince (2015 film) cannot be both a 3D animated television show and a live action film. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.346081972122192, "index": 240}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: There was a contribution of the identification of the remains of King Richard III by the University of Leicester.\nQ: Was this claim true or false?\nThought: Let's think step by step. University of Leicester announced on Twitter that they had contributed to the identification of Richard III. The remains were found in a car park in Leicester in 2012. So, the answer is true.", "answer": true, "groundtruth": true, "runtime": 6.855233907699585, "index": 241}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: South Island is referred to as the \"mainland.\"\nQ: Was this claim true or false?\nThought: Let's think step by step. South Island is the largest island of New Zealand. The South Island is also referred to as the mainland. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.014849901199341, "index": 242}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: DodgeBall: A True Underdog Story has Vince Vaughn and Ben Stiller in starring roles.\nQ: Was this claim true or false?\nThought: Let's think step by step. Vince Vaughn starred in Dodgeball: A True Underdog Story. Ben Stiller starred in Meet the Fockers. Meet the Fockers is not a Dodgeball movie.\nThe answer: no.", "answer": null, "groundtruth": true, "runtime": 7.515521049499512, "index": 243}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Catcher in the Rye never deals with issues of innocence and connection.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Catcher in the Rye by J.D Salinger is a coming-of-age novel about a teenage boy named Holden Caulfield. Holden struggles to find his innocence while dealing with the harshness of the real world. The answer is no.", "answer": null, "groundtruth": true, "runtime": 7.829313039779663, "index": 244}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Firefox is one of the most popular web browsers.\nQ: Was this claim true or false?\nThought: Let's think step by step. Firefox has been one of the most popular web browsers since 2004. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 5.501690149307251, "index": 246}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Georges Gilles de la Tourette failed to describe symptoms.\nQ: Was this claim true or false?\nThought: Let's think step by step. Georges Gilles de la Tourette syndrome is a neurological disorder that causes tics. Tics are sudden, involuntary movements or sounds. The disorder is often misdiagnosed as a psychological problem.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 6.723001003265381, "index": 245}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Japan is in Asia.\nQ: Was this claim true or false?\nThought: Let's think step by step. Japan is located in East Asia. East Asia is a region of Asia. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.198889970779419, "index": 247}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Samsung entered the shipbuilding industries in the 1970's.\nQ: Was this claim true or false?\nThought: Let's think step by step. Samsung Group is a South Korean company. Samsung Heavy Industries is one of the largest shipbuilding companies in the world. Samsung Heavy Industries was founded in the 1970s.\nThe answer: true.", "answer": true, "groundtruth": true, "runtime": 7.094495058059692, "index": 248}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kyle Maclachlan has won an award called Golden Globe for Best Actor.\nQ: Was this claim true or false?\nThought: Let's think step by step. Kyle MacLachlan has never been nominated for a Golden Globe Award. The Golden Globe Award is given out to the best actors in television and film. Final answer: no.", "answer": null, "groundtruth": true, "runtime": 6.871011734008789, "index": 249}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Alvin and the Chipmunks is exclusively audio.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Chipmunks are a singing group of animated characters. Alvin and the Chipmunks is an animated TV show. Animated shows cannot be audio only. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.5655601024627686, "index": 250}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Two and a Half Men starred a person.\nQ: Was this claim true or false?\nThought: Let's think step by step. Charlie Sheen starred in Two and a Half Men from 2003-2015. Charlie Sheen is a person. Final answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.389725923538208, "index": 251}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Watchmen is a film set in an alternate history in the year 1985.\nQ: Was this claim true or false?\nThought: Let's think step by step. Watchmen takes place in an alternate history where superheroes exist. In real life, superheroes are not a thing. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.573467016220093, "index": 252}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Hit is a 1984 film.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Hit was released in theaters on June 22, 1984. The film was produced in the 1980s. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.894861221313477, "index": 253}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Louis Malle produced films.\nQ: Was this claim true or false?\nThought: Let's think step by step. Louis Malle is a French actor and film director. Louis Malle produced films as a director. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.8049681186676025, "index": 254}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Mandy Moore is a writer.\nQ: Was this claim true or false?\nThought: Let's think step by step. Mandy Moore is an actress that has written two books. An author writes books. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.348163843154907, "index": 255}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Manchester by the Sea is a film that was premiered at the Sundance Film Festival.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Sundance Film Festival takes place in January. Manchester by the Sea premiered in December. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.62606406211853, "index": 256}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Cars 3 will not be directed by someone working for Pixar.\nQ: Was this claim true or false?\nThought: Let's think step by step. Cars 3 director is Brian Fee. Brian Fee worked for Pixar as a storyboard artist on films like Toy Story and Monsters University.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 6.846009254455566, "index": 257}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pakistan's economy is 42nd largest in nominal gross domestic product.\nQ: Was this claim true or false?\nThought: Let's think step by step. The nominal GDP of the world's countries is estimated at approximately $80 trillion. Pakistan's nominal GDP is $273 billion. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.139748811721802, "index": 258}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Joseph Merrick had nothing to do with The Elephant Man movie.\nQ: Was this claim true or false?\nThought: Let's think step by step. Joseph Merrick was a real person who inspired the character of The Elephant Man in the movie. The Elephant Man is a fictional character. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.208127975463867, "index": 259}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Love Club EP is the debut extended play by Jayden Smith.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Love Club EP was released in June 2017. Jayden Smith was born on October 27, 1998. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.581370830535889, "index": 260}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Icelandic Coast Guard is responsible for something.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Icelandic Coast Guard is a branch of the Icelandic Police. The Icelandic Police is responsible for law enforcement in Iceland. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.658650875091553, "index": 261}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Islamabad contains Quaid-i-Azam University.\nQ: Was this claim true or false?\nThought: Let's think step by step. Quaid-i-Azam University is located in Islamabad. Islamabad is the capital of Pakistan. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.566147089004517, "index": 262}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Stanford prison experiment was funded by an organization that coordinates, executes, and promotes the science and technology programs of the U.S. Army and Marine Corps.\nQ: Was this claim true or false?\nThought: Let's think step by step. TheStanford Prison Experiment was a psychological study conducted by Philip Zimbardo in 1971. Zimbardo was not involved with the US Army or Marine Corps. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.824901103973389, "index": 264}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Azithromycin is not sold under many trade names worldwide.\nQ: Was this claim true or false?\nThought: Let's think step by step. Azithromycin is a macrolide antibiotic. Macrolide antibiotics are sold under the trade name Zithromax. Zithromax is one of the most commonly prescribed antibiotics in the United States. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.960590124130249, "index": 263}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Birmingham is in Suffolk County.\nQ: Was this claim true or false?\nThought: Let's think step by step. Birmingham is a city in the United Kingdom and is not part of Suffolk County. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.751255989074707, "index": 265}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kojol did not receive an award in 2011.\nQ: Was this claim true or false?\nThought: Let's think step by step. Kojol won the best actor award for his performance in Dangal at the 62nd Filmfare Awards. Filmfare is one of the most prestigious film awards in India. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.482348918914795, "index": 266}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The American actor that plays Chumlee was born in 1980.\nQ: Was this claim true or false?\nThought: Let's think step by step. The American actor that plays Chumlee was born in 1980. He is 37 years old in June 2017. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.458259105682373, "index": 267}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Road House is a movie.\nQ: Was this claim true or false?\nThought: Let's think step by step. Road House is a 1989 American action film starring Patrick Swayze and Kelly Lynch. The film was based on the 1987 novel of the same name by William Least Heat-Moon. The film was directed by Monte Hellman. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.973657131195068, "index": 268}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Aphrodite is a goddess in Greek mythology.\nQ: Was this claim true or false?\nThought: Let's think step by step. Aphrodite is a Greek goddess that is known for her beauty and love. Aphrodite is also the name of a Greek island. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.1572511196136475, "index": 269}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Castlevania is a driving game.\nQ: Was this claim true or false?\nThought: Let's think step by step. Castlevania is a series of action-adventure video games. Driving games involve operating a vehicle such as a car or truck. The answer is no.", "answer": null, "groundtruth": false, "runtime": 6.852583169937134, "index": 271}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Samsung was separated into four business groups in Italy.\nQ: Was this claim true or false?\nThought: Let's think step by step. Samsung is a South Korean electronics company. Samsung has many business groups but it is not divided into four groups in Italy. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.190289258956909, "index": 270}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Annabelle is not at The Warrens' Occult Museum.\nQ: Was this claim true or false?\nThought: Let's think step by step. Annabelle is a horror movie character. The Warrens' Occult Museum is a museum in the Conjuring Universe. The Conjuring Universe is based on real life events. Horror movies are based on real life events. Final answer: yes.", "answer": null, "groundtruth": false, "runtime": 7.14134407043457, "index": 272}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Solanum has horse nettles.\nQ: Was this claim true or false?\nThought: Let's think step by step. Horse nettles are a type of plant. Solanum is a genus of plants. Final answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.301501035690308, "index": 273}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Lorelai Gilmore's mother remains an offscreen and unvoiced character for the entire length of the show.\nQ: Was this claim true or false?\nThought: Let's think step by step. Lorelai Gilmore's mother is a main character on the show Gilmore Girls. The mother of Lorelai Gilmore is named Emily Gilmore. Emily Gilmore is played by Kelly Bishop. Kelly Bishop has appeared in every episode of Gilmore Girls. Emily Gilmore is also voiced by Kelly Bishop. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.251397132873535, "index": 274}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Carey Hayes is an Indian producer.\nQ: Was this claim true or false?\nThought: Let's think step by step. Carey Hayes is an American singer-songwriter. Indians are from India. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.753247022628784, "index": 276}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ricardo Montalb\u00e1n acted in film and television.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ricardo Montalb\u00e1n is a Mexican actor best known for his role as Tony Montana in the movie Scarface. Scarface was released in 1932 and is considered to be one of the greatest gangster movies of all time. Tony Montana is a Cuban gangster. Scarface was released in 1932 and is considered to be one of the greatest gangster movies of all time. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.612259864807129, "index": 275}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Loretta Sanchez is an Irish politician.\nQ: Was this claim true or false?\nThought: Let's think step by step. Loretta Sanchez is an American politician. Americans are not Irish. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.186966896057129, "index": 277}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ron Howard directed The Paper.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ron Howard is a director and he has directed The Paper. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.050439834594727, "index": 278}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Tom Kenny stars in The SpongeBob SquarePants Movie.\nQ: Was this claim true or false?\nThought: Let's think step by step. Tom Kenny is a voice actor and has been since the 1990s. Tom Kenny voices SpongeBob SquarePants. Tom Kenny stars in The SpongeBob SquarePants Movie.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 7.271876811981201, "index": 279}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: John Frusciante is a musician.\nQ: Was this claim true or false?\nThought: Let's think step by step. John Frusciante is a musician who played in the band Red Hot Chili Peppers. The Red Hot Chili Peppers are a band. Final answer: yes.", "answer": null, "groundtruth": true, "runtime": 7.080083847045898, "index": 280}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: John S. McCain Jr. entered the submarine service and has a fan base.\nQ: Was this claim true or false?\nThought: Let's think step by step. John S. McCain Jr. is a US Senator. Senators do not serve in the submarine service. Submarine service is only for members of the armed forces. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 7.202390193939209, "index": 281}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Challenge XXX: Dirty 30 is the thirtieth season of a TV series.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Challenge is a reality show and has been on for 36 seasons. The Challenge XXX: Dirty 30 is the thirty season. The answer is no.", "answer": null, "groundtruth": true, "runtime": 6.996795177459717, "index": 282}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Yin and yang show a balance between magnetized entities.\nQ: Was this claim true or false?\nThought: Let's think step by step. Yin and Yang are opposite forces that balance each other out. Magnetized entities have north and south poles that require a magnetic field to function. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.286606073379517, "index": 283}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: No Strings Attached was released in a country of the Northern Hemisphere.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Northern Hemisphere has countries in it. June is in the summer. Summer is warm. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.2412097454071045, "index": 284}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hollow Man has yet to have a sequel.\nQ: Was this claim true or false?\nThought: Let's think step by step. Hollow Man 2 was released in 2004. Hollow Man 3 was released in 2007. The answer is false.", "answer": false, "groundtruth": false, "runtime": 6.172121047973633, "index": 285}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Faye Resnick is an interior designer.\nQ: Was this claim true or false?\nThought: Let's think step by step. Interior designers often have a degree in interior design. Faye Resnick has a degree in fashion design. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.971604108810425, "index": 287}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Laura Robson participated in the International Tennis Federation.\nQ: Was this claim true or false?\nThought: Let's think step by step. Laura Robson is a female tennis player who won the Wimbledon girls' singles title in 2008. The Wimbledon Championships are one of the four Grand Slam tennis tournaments. The International Tennis Federation governs all of the world's tennis tours and competitions. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.644922971725464, "index": 286}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Rick Ross had nothing to do with the Maybach Music Group.\nQ: Was this claim true or false?\nThought: Let's think step by step. Rick Ross is a member of the Maybach Music Group. The Maybach Music Group is a record label. Records are made by artists. Final answer: no.", "answer": null, "groundtruth": false, "runtime": 6.833010911941528, "index": 288}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: San Francisco Bay Area is home to approximately 10 million people.\nQ: Was this claim true or false?\nThought: Let's think step by step. 10 million is the population of the San Francisco Bay Area as of the 2017 census estimate. The San Francisco Bay Area includes the city and county of San Francisco. The San Francisco Bay Area is home to approximately 10 million people.\nThe answer: yes.", "answer": null, "groundtruth": false, "runtime": 7.248795986175537, "index": 289}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: MSG is an odor enhancer.\nQ: Was this claim true or false?\nThought: Let's think step by step. Odor Enhancers are added to foods and beverages to enhance or mask smells. MSG is a flavor enhancing ingredient used in many prepared foods and restaurant dishes. MSG is not an odor enhancing ingredient. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.050065040588379, "index": 290}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Paper was directed by Ron Howard in 2001.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Paper was released in 2017 so it could not have been directed by Ron Howard in 2001. The answer is no.", "answer": null, "groundtruth": false, "runtime": 6.370698928833008, "index": 291}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Westworld's fourth season concluded on December 4, 2016.\nQ: Was this claim true or false?\nThought: Let's think step by step. Westworld's fourth season concluded on December 4, 2016. Westworld's fourth season began on October 2, 2016. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.212641954421997, "index": 292}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Alexandria serves 80% of Egypt's imports and exports.\nQ: Was this claim true or false?\nThought: Let's think step by step. Alexandria is a city in Egypt. 80% of Egypt's imports and exports are done through Alexandria. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.268452882766724, "index": 293}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sonny Bono was alive and well on January 6, 1998.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sonny Bono died in a skiing accident in January of 1998. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 5.7572410106658936, "index": 294}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Scandal is an American band.\nQ: Was this claim true or false?\nThought: Let's think step by step. Scandal is a South Korean boy band. South Korea and the United States are two different countries. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.747286081314087, "index": 295}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Aestheticism values aesthetics over socio-political themes.\nQ: Was this claim true or false?\nThought: Let's think step by step. Socio-political themes are prominent in the works of William Blake. William Blake is an English poet and painter. Aestheticism values aesthetics over socio-political themes.\nThe answer: true.", "answer": true, "groundtruth": true, "runtime": 6.929299831390381, "index": 297}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: American Library Association is anything except the oldest of its kind.\nQ: Was this claim true or false?\nThought: Let's think step by step. The American Library Association was founded in 1853. The oldest public library in the United States is the Boston Public Library which was founded in 1826.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 7.417107105255127, "index": 296}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: John DiMaggio has yet to do any voice-over work.\nQ: Was this claim true or false?\nThought: Let's think step by step. John DiMaggio is a voice actor and has been in many movies. He has also done a lot of voice-over work for TV shows. Final answer: false.", "answer": false, "groundtruth": false, "runtime": 6.8542160987854, "index": 298}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Donald Duck wears a shirt.\nQ: Was this claim true or false?\nThought: Let's think step by step. Donald Duck is a popular Disney character. Donald Duck wears a sailor shirt in many of his adventures. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.545466899871826, "index": 299}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: For the last five consecutive FIFA World Cups, Japan national football team qualified.\nQ: Was this claim true or false?\nThought: Let's think step by step. Japan national football team has qualified for the FIFA world cup 2002, 2006, 2010, 2014 and 2018. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.218393802642822, "index": 300}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Challenge: Rivals III was on ABC.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Challenge: Rivals III was a reality television series that aired on MTV. MTV is a cable channel that is not part of the ABC network. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.9090728759765625, "index": 302}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Skopje was a city.\nQ: Was this claim true or false?\nThought: Let's think step by step. Skopje is the capital of North Macedonia. North Macedonia is a country. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.235466003417969, "index": 301}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Japan is located in Asia.\nQ: Was this claim true or false?\nThought: Let's think step by step. Japan is located in East Asia. Japan is located to the east of China. Japan is located in Asia.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 7.027971982955933, "index": 303}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Producing jazz records is a career of Fred Seibert.\nQ: Was this claim true or false?\nThought: Let's think step by step. Fred Seibert is an American record producer and musician. Records are made at a recording studio. Records are made in studios.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.3696489334106445, "index": 304}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Temple Grandin features Claire Danes playing a cartoon penguin.\nQ: Was this claim true or false?\nThought: Let's think step by step. Temple Grandin is a real person. Claire Danes is an actress who has played a variety of characters including a cartoon penguin in the movie Flora & Ulysses. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.9741051197052, "index": 305}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Timur decisively defeated the Christian Knights Hospitaller at the Siege of Smyrna.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Siege of Smyrna took place in 1248. Timur died in 1405. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.137085914611816, "index": 306}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Quay had its first public showing in 2015.\nQ: Was this claim true or false?\nThought: Let's think step by step. The film had its first public showing in 2015. The film is called \"Quay\". So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.612968921661377, "index": 307}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kaya Scodelario is an entertainer.\nQ: Was this claim true or false?\nThought: Let's think step by step. Kaya Scodelario is an actress best known for her role in the film 'The Hunger Games'. The Hunger Games is a film series. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.999186754226685, "index": 308}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Eugene Ionesco wrote Exit the King.\nQ: Was this claim true or false?\nThought: Let's think step by step. Eugene Ionesco is a playwright. Exit the King is a play written by Eugene Ionesco.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.744262218475342, "index": 309}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Emperor Norton is not the basis of characters in many authors' books.\nQ: Was this claim true or false?\nThought: Let's think step by step. Emperor Norton is a character in the book \"The Barbarian Nights\". The book is a collection of stories. Many authors have written books with characters. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.714540243148804, "index": 310}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Bob Ross was not a painter.\nQ: Was this claim true or false?\nThought: Let's think step by step. Bob Ross was known for the show The Joy of Painting. Bob Ross was an American television painter. Final answer: no.", "answer": null, "groundtruth": false, "runtime": 6.280475854873657, "index": 311}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Michael Hutchence died on November 22nd, 1997.\nQ: Was this claim true or false?\nThought: Let's think step by step. Hutchence died in 1997 but we are in 2017 now so it has been 20 years since his death. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.4147303104400635, "index": 312}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Gray Matters was directed by Sue Kramer in 2001.\nQ: Was this claim true or false?\nThought: Let's think step by step. Gray Matters was released in theaters on June 15, 2018. Sue Kramer directed The Haunting in Connecticut in 2009. The Haunting in Connecticut is not a gray matter.\nThe answer: false.", "answer": false, "groundtruth": false, "runtime": 6.806952953338623, "index": 313}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Office (US) debuted on ABC only.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Office debuted on NBC in 2005. ABC did not debut The Office until June 24th, 2013. The answer is no.", "answer": null, "groundtruth": false, "runtime": 6.863106966018677, "index": 314}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Beguiled is an original movie.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Beguiled is based on a novel written in 1971. The novel was adapted into a 2012 TV miniseries. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.8310158252716064, "index": 315}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Amancio Ortega is a plumber.\nQ: Was this claim true or false?\nThought: Let's think step by step. Amancio Ortega is the founder of Zara. Zara is a clothing retailer. Plumbers do not work at clothing retailers.\nThe answer: no.", "answer": null, "groundtruth": false, "runtime": 6.818187952041626, "index": 316}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hannah and Her Sisters is an American comedy-drama.\nQ: Was this claim true or false?\nThought: Let's think step by step. Hannah and Her Sisters (1989 film) is a comedy drama film. Hannah and Her Sisters (2017 film) is a comedy drama film. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.729900121688843, "index": 317}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: John Goodman did not star in 10 Cloverfield Lane.\nQ: Was this claim true or false?\nThought: Let's think step by step. John Goodman starred in Cloverfield. 10 Cloverfield Lane is a different movie than Cloverfield. John Goodman did star in 10 Cloverfield Lane.\nThe answer: no.", "answer": null, "groundtruth": false, "runtime": 6.526766061782837, "index": 318}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vatican City has yet to be established.\nQ: Was this claim true or false?\nThought: Let's think step by step. Vatican City is a country that is fully recognized as an independent nation state. Countries are not established overnight. Final answer: false.", "answer": false, "groundtruth": false, "runtime": 6.2800257205963135, "index": 320}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ed Decter produced the film Fargo.\nQ: Was this claim true or false?\nThought: Let's think step by step. Fargo is a 1996 black comedy crime film written and directed by the Coen Brothers. Ed Decter did not produce the film Fargo. The Coen brothers wrote the screenplay for the film Fargo. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.592565059661865, "index": 319}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Boxing Helena debuted in 1996.\nQ: Was this claim true or false?\nThought: Let's think step by step. Helena is a city in Montana. Boxing Helena debuted in 1996. The first professional boxing match was in 1875. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.272045135498047, "index": 321}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Scaramuccia is another name for Scaramouche.\nQ: Was this claim true or false?\nThought: Let's think step by step. Saramuccia is a type of cheese that comes from cows. Scaramouche is a character in the commedia dell'arte. Scaramuccia is not a person. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.896104097366333, "index": 322}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sky UK is a British telecommunications company.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sky UK is a British telecommunications company that provides television and broadband Internet services. It is owned by Comcast. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.3318541049957275, "index": 323}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: One form of ground fighting is Brazilian jiu-jitsu.\nQ: Was this claim true or false?\nThought: Let's think step by step. Brazilian jiu-jitsu is a form of martial arts that focuses on grappling and especially ground fighting. Final answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.522991895675659, "index": 325}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jonah Hill made $16 million dollars in June of 2014.\nQ: Was this claim true or false?\nThought: Let's think step by step. In June 2014, Jonah Hill was paid $16 million for his role in the film The Wolf of Wall Street. In June 2017, Jonah Hill was paid $16 million for his role in the film The Big Sick. The answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.091322898864746, "index": 324}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Chris Paul is a two-time Olympic gold winner in basketball.\nQ: Was this claim true or false?\nThought: Let's think step by step. Chris Paul has won two gold medals in basketball at the Olympics. Final answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.204944133758545, "index": 326}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In odd-numbered years, the Africa Cup of Nations occurs.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Africa Cup of Nations occurs in odd-numbered years. The World Cup occurs in even-numbered years. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.137694835662842, "index": 327}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pocahontas's birth name was Matoaka.\nQ: Was this claim true or false?\nThought: Let's think step by step. Pocahontas was a Native American woman who lived in the 17th century. Matoaka was her birth name.\nThe answer: true.", "answer": true, "groundtruth": true, "runtime": 6.722379922866821, "index": 328}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Westworld's first season consists of twenty-two episodes.\nQ: Was this claim true or false?\nThought: Let's think step by step. Westworld's first season had ten episodes. Season 1 of Westworld had a total of ten episodes. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.610757827758789, "index": 329}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jamie Lee Curtis' mother was famous.\nQ: Was this claim true or false?\nThought: Let's think step by step. Jamie Lee Curtis is an actress. Her mother was an actress who had roles in Alfred Hitchcock's The Birds and The Man Who Cheated Himself. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.656382083892822, "index": 330}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Simon Cowell was not a part of a reality show.\nQ: Was this claim true or false?\nThought: Let's think step by step. Simon Cowell is a judge on the television show America's Got Talent. Simon Cowell was a judge on the reality show The X Factor. The X Factor was a reality show.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 7.133167743682861, "index": 331}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ed Gagliardi died on April 11, 2014.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ed Gagliardi died in 2014 but he was born in 1967 so he could not have died in 2014 if he was born in 1967. He could only have died in 2014 if he was born in a year with more than 365 days. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.827589988708496, "index": 332}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Southern Hospitality peaked on the Top 40 at number 23.\nQ: Was this claim true or false?\nThought: Let's think step by step. Southern Hospitality by O.A.R. peaked at number 23 on the Top 40 on June 17, 1995. So, the answer is true.", "answer": true, "groundtruth": true, "runtime": 6.396871089935303, "index": 333}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Islamabad is a squid.\nQ: Was this claim true or false?\nThought: Let's think step by step. Islamabad is the capital city of Pakistan. Pakistan is a country which has a coastline on the Arabian Sea. Squid comes from the sea. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.7244532108306885, "index": 334}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Independent Spirit Awards are held the day after the Academy Awards.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Independent Spirit Awards were created in 1990. The Oscars, or Academy Awards, have been around since 1929. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.013193845748901, "index": 335}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Stomp the Yard stars a cat.\nQ: Was this claim true or false?\nThought: Let's think step by step. Stomp the Yard is about a human. Cats do not typically dance. Final answer: no.", "answer": null, "groundtruth": false, "runtime": 6.54965615272522, "index": 336}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A United Kingdom is a biographical romantic drama film.\nQ: Was this claim true or false?\nThought: Let's think step by step. A United Kingdom is a country in Europe. Europe is a continent.\nThe answer: true.", "answer": true, "groundtruth": true, "runtime": 6.184192895889282, "index": 337}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ed and Lorraine Warren investigated the paranormal.\nQ: Was this claim true or false?\nThought: Let's think step by step. The claim is that Ed and Lorraine Warren investigated the paranormal. The claim is true. The answer is yes.", "answer": true, "groundtruth": true, "runtime": 6.218101978302002, "index": 338}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Moscovium is a natural element.\nQ: Was this claim true or false?\nThought: Let's think step by step. Moscovium was discovered in the year 1984. The earth was formed around 4.5 billion years ago. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.405531883239746, "index": 339}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Indian National Congress was founded in 1885, during the British Raj.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Indian National Congress was founded in 1885. The British Raj ended in 1947. So, the answer is true.", "answer": true, "groundtruth": true, "runtime": 6.592250823974609, "index": 341}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Alan White is an official who represents a country abroad.\nQ: Was this claim true or false?\nThought: Let's think step by step. Alan White works for the British government. The British government represents the country of Great Britain. Alan White is an official who represents a country abroad.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 7.10619330406189, "index": 340}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pitch Perfect 2 centers on a fictional high school.\nQ: Was this claim true or false?\nThought: Let's think step by step. Pitch Perfect 2 centers on a fictional all-girls music school. A high school would not be an all-girls music school. The answer is no.", "answer": null, "groundtruth": false, "runtime": 6.6246819496154785, "index": 342}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Barcelona is the capitol city of Catalonia.\nQ: Was this claim true or false?\nThought: Let's think step by step. Barcelona is in Catalonia. Barcelona is the capital of Catalonia. Catalonia is a region in Spain.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.46832799911499, "index": 343}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dopamine induces neuromodulation.\nQ: Was this claim true or false?\nThought: Let's think step by step. Dopamine is a neurotransmitter that can be modulated. Neuromodulation is the process of changing how the nervous system works. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.155735969543457, "index": 344}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Visigoths were always followers of Arianism.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Visigoths were a Germanic people that lived in Spain. Arianism is a Christian church that split from the Catholic Church. The Catholic Church trace their roots back to the early church. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.9987499713897705, "index": 345}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Meghan Markle's birthday occurs in August.\nQ: Was this claim true or false?\nThought: Let's think step by step. Meghan Markle's birthday is in August but her wedding was in May 2018. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 7.173182010650635, "index": 346}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Annabelle is in Australia.\nQ: Was this claim true or false?\nThought: Let's think step by step. Annabelle is an fictional character from a horror movie series. The movie series was not produced in Australia. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.900063991546631, "index": 347}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Times Higher Education World University Rankings is a publication of university rankings by Times Higher Education (THE) magazine.\nQ: Was this claim true or false?\nThought: Let's think step by step. Times Higher Education World University Rankings is a publication of university rankings by Times Higher Education (THE) magazine. THE is a weekly UK-based magazine.\nThe answer: true.", "answer": true, "groundtruth": true, "runtime": 6.561729907989502, "index": 348}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dan Brown published a 2003 bestselling novel.\nQ: Was this claim true or false?\nThought: Let's think step by step. Dan Brown is the pen name of Daniel Robert Brown. He was born on February 3, 1964. In 2003, Brown published Angels & Demons. Angels & Demons was a bestseller. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 5.517743110656738, "index": 349}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: One Dance was Drake's first number one single in 1998.\nQ: Was this claim true or false?\nThought: Let's think step by step. Drake had his first number one single in 2009 with \"Find Your Love\". So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.906008720397949, "index": 350}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hyksos always banned horse burials.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Hyksos were a civilization that lived in ancient Egypt. Horses were used for burials in ancient Egypt. The Hyksos banned horse burials.\nThe answer: yes.", "answer": null, "groundtruth": false, "runtime": 7.132363796234131, "index": 352}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Guns N' Roses is an American hard rock restaurant.\nQ: Was this claim true or false?\nThought: Let's think step by step. Guns N' Roses is a hard rock band from America. Hard rock is a type of rock music played at a restaurant. Guns N' Roses is a restaurant.\nThe answer: yes.", "answer": null, "groundtruth": false, "runtime": 7.3286452293396, "index": 351}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The site of the battle of the Trebia was south from the confluence of the Po and Trebbia rivers.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Battle of the Trebia took place in October, Hannibal's elephants were said to have crossed the river Po at a point south of the city of Piacenza. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.019423961639404, "index": 353}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The SpongeBob SquarePants Movie ha yet to be directed.\nQ: Was this claim true or false?\nThought: Let's think step by step. The SpongeBob SquarePants Movie is a film in production. The film has not been released yet. So, the answer is true.", "answer": true, "groundtruth": false, "runtime": 5.3248131275177, "index": 354}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ukrainian Soviet Socialist Republic always represented itself.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ukrainian Soviet Socialist Republic was a country that existed from 1922-1991. Ukraine became an independent state in 1991. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 5.711761951446533, "index": 355}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Bengal tiger has only spots.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Bengal tiger is a subspecies of tiger. All tigers are striped. The Bengal tiger has many stripes. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.32946515083313, "index": 356}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Henry III assumed the throne in the middle of the Punic War.\nQ: Was this claim true or false?\nThought: Let's think step by step. Henry III reigned from 1216 to 1272. The Punic Wars were a series of conflicts between Carthage and Rome from 264 BC to 146 BC. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.020970821380615, "index": 358}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Leonardo DiCaprio passed on the starring role in The Man in the Iron Mask.\nQ: Was this claim true or false?\nThought: Let's think step by step. DiCaprio was offered the role of Alexander Dumas' The Man in the Iron Mask. He turned it down to star in the movie Shutter Island. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.372584104537964, "index": 357}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Parkinson's disease has afflicted Davis Phinney.\nQ: Was this claim true or false?\nThought: Let's think step by step. Parkinson's disease is a brain disorder that affects movement. Davis Phinney is an American former professional racing cyclist. He suffers a broken neck in a crash while training for the Ironman World Championship. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.395722150802612, "index": 359}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Moscovium is an element.\nQ: Was this claim true or false?\nThought: Let's think step by step. Moscovium was discovered in 1996. The periodic table of elements was first published in 1869. Final answer: yes.", "answer": null, "groundtruth": true, "runtime": 5.228251934051514, "index": 360}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: GLOW (TV series) is incapable of being released.\nQ: Was this claim true or false?\nThought: Let's think step by step. GLOW (TV series) was released in June 2017. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.635639905929565, "index": 362}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Amancio Ortega was born in 1936.\nQ: Was this claim true or false?\nThought: Let's think step by step. Amancio Ortega was born in 1936 so he is 81 years old in 2017. A person cannot be 81 years old in 2017 if they were born in 1936. The answer is no.", "answer": null, "groundtruth": true, "runtime": 7.270870923995972, "index": 361}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Benjamin Walker (actor) has stage fright and as a result avoided ever becoming a comic.\nQ: Was this claim true or false?\nThought: Let's think step by step. Benjamin walker is an actor who has stage fright and as a result avoided ever becoming a comic. He is not a comic. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.229716062545776, "index": 363}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: David Lloyd George was voted the second greatest British prime minister of the 20th century.\nQ: Was this claim true or false?\nThought: Let's think step by step. David Lloyd George was a British prime minister during World War I and World War II. The 20th century had two British prime ministers - David Lloyd George and Winston Churchill. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.454422235488892, "index": 364}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Donna Noble is unfamiliar with the Doctor Who franchise.\nQ: Was this claim true or false?\nThought: Let's think step by step. Donna Noble is a character in the Doctor Who universe. Donna Noble is married to the 10th Doctor. The 10th Doctor is a main character in the Doctor Who universe.\nThe answer: no.", "answer": null, "groundtruth": false, "runtime": 6.164201974868774, "index": 365}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jack Dylan Grazer has spent the entirety of his life in Florida.\nQ: Was this claim true or false?\nThought: Let's think step by step. Jack Dylan Grazer was born in Los Angeles, California. Los Angeles and Florida are nearly 3,500 miles apart. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.3525121212005615, "index": 366}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Nina Jacobson was born in 1965.\nQ: Was this claim true or false?\nThought: Let's think step by step. Nina Jacobson was born in 1965. She is currently 54 years old. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.5690412521362305, "index": 368}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Baloch persons are an Iranic group of humans.\nQ: Was this claim true or false?\nThought: Let's think step by step. Iran is a country located in West Asia. Baloch people live mainly in the Balochistan province of Pakistan. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.151071071624756, "index": 367}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In 2012, Simi Valley, California reported that its median household income dropped below the national average for the first time in a decade.\nQ: Was this claim true or false?\nThought: Let's think step by step. In 2012, Simi Valley, California reported that its median household income dropped below the national average for the first time in a decade. The national average household income was $52,100 in 2012. The national average household income has increased every year since. So, the answer is false.", "answer": false, "groundtruth": false, "runtime": 7.290695905685425, "index": 369}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Doxycycline may induce diarrhea.\nQ: Was this claim true or false?\nThought: Let's think step by step. Doxycycline is an antibiotic used to treat certain types of bacterial infections. The most common side effects include nausea, vomiting, and diarrhea. Nausea and vomiting are not common side effects of doxycycline.\nThe answer: true.", "answer": true, "groundtruth": true, "runtime": 6.990010976791382, "index": 370}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Big Country is a novel.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Big Country is a novel written by James A. Michener. Michener has written numerous novels. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 5.787909030914307, "index": 371}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vic Mensa has been nominated for a Grammy Award.\nQ: Was this claim true or false?\nThought: Let's think step by step. Vic Mensa is a Chicago based rapper. In 2017, Chance the Rapper won the Grammy for Best Rap Album. Chance the Rapper was not nominated in 2016. Vic Mensa was born in 1990 so he would be 27 years old in 2017. Vic Mensa was nominated for Best Rap Album at the 60th Grammy Awards. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.085918188095093, "index": 372}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Mormon population has increased significantly in recent decades.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Mormon population has increased significantly in recent decades means that there are more Mormons now than there were in the past. . The answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.823568105697632, "index": 374}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Moesia included most of the territory of modern-day Western Serbia.\nQ: Was this claim true or false?\nThought: Let's think step by step. Moesia was a region located in the east of the Balkans. The Balkans are a geographic region in southeastern Europe. Western Serbia is a region located in southeastern Europe. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.5305726528167725, "index": 373}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Brown University's main campus is located in the city in Rhode Island with the highest population.\nQ: Was this claim true or false?\nThought: Let's think step by step. Brown University's main campus is located in the city of Providence, Rhode Island. The population of Providence is estimated at 180,941. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.094939947128296, "index": 375}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hammer Film Productions produced the horror movie The Quiet Ones.\nQ: Was this claim true or false?\nThought: Let's think step by step. Hammer Film Productions is a British production company that has produced many horror movies. The Quiet Ones is a 2016 horror movie. The answer is yes.", "answer": null, "groundtruth": true, "runtime": 5.5619471073150635, "index": 376}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Gory Guerrero was a wrestler.\nQ: Was this claim true or false?\nThought: Let's think step by step. Gory Guerrero was a wrestler in what is now called the 'Attitude Era' of the WWE. Gory Guerrero was a wrestler that portrayed a Mexican American character. The 'Attitude Era' of the WWE began in 1997.\nThe answer: true.", "answer": true, "groundtruth": true, "runtime": 6.547438144683838, "index": 377}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Therasia is a recipe.\nQ: Was this claim true or false?\nThought: Let's think step by step. Therasia is a genus of moths of the family Noctuidae. Therasia is a recipe for chocolate cake. Chocolate cake is not a moth. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.63492488861084, "index": 380}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: It is customary to wear outfits while Trick-or-Treating.\nQ: Was this claim true or false?\nThought: Let's think step by step. Outfits are worn for many reasons and not just while Trick-or-Treating. So, the answer is it is not possible to tell.", "answer": null, "groundtruth": true, "runtime": 7.2432966232299805, "index": 378}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Gotham City Sirens was published by Paul Dini.\nQ: Was this claim true or false?\nThought: Let's think step by step. Paul Dini is a writer and producer for Batman: The Animated Series. Gotham City Sirens was a comic book series about the villains of Batman: The Animated Series. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.415341138839722, "index": 379}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Issa Rae shows various media created by people of color.\nQ: Was this claim true or false?\nThought: Let's think step by step. People of color are not a monolith. Issa Rae is a black woman.\nThe answer: it is not possible to tell.", "answer": null, "groundtruth": true, "runtime": 5.896239757537842, "index": 381}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Punch-Drunk Love was distributed by Columbia Pictures.\nQ: Was this claim true or false?\nThought: Let's think step by step. Columbia pictures distribute movies. Punch-Drunk Love is a movie. Punch-Drunk Love was released in June of 2017.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 5.722537994384766, "index": 382}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Chris Benoit died in June 2001.\nQ: Was this claim true or false?\nThought: Let's think step by step. Chris Benoit died in June 2001. means that he was alive in June 2017. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.754497051239014, "index": 383}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Younger did not premier in 2015.\nQ: Was this claim true or false?\nThought: Let's think step by step. Younger premiered on June 14, 2017 so it could not have premiered in 2015. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.468381881713867, "index": 385}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Cleopatre debuted after a death..\nQ: Was this claim true or false?\nThought: Let's think step by step. Cleopatra VII ruled as pharaoh of Egypt from 51 to 30 BC. In 51 BC, she was made pharaoh after her father, Ptolemy XII Auletes, died. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.356400728225708, "index": 384}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: ASAP Rocky has directed videos for his own music.\nQ: Was this claim true or false?\nThought: Let's think step by step. ASAP Rocky is a rapper and actor. Rappers do not usually direct videos for their own music. Actors do not usually make music.\nThe answer: no.", "answer": null, "groundtruth": true, "runtime": 6.771688938140869, "index": 386}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Lorelai Gilmore's mother is Emily, played by Betty White.\nQ: Was this claim true or false?\nThought: Let's think step by step. Betty White has been playing Emily Gilmore on Gilmore Girls since 2000. Lorelai Gilmore was born in the series finale of Gilmore Girls in 2007. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.592275142669678, "index": 387}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: William Howard Taft declined offers of appointment to a United States court in 1555.\nQ: Was this claim true or false?\nThought: Let's think step by step. William Howard Taft declined offers of appointment to the Supreme Court of the United States in 1916. William Howard Taft died on March 8, 1930. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.48434591293335, "index": 388}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Cyclades are southeast of mainland China.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Cyclades are southeast of mainland Greece. Greece is southeast of mainland China. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.215080261230469, "index": 389}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Shut Up debuted at number 33.\nQ: Was this claim true or false?\nThought: Let's think step by step. Shut Up debuted at number 33 on the US Billboard 200. The US Billboard 200 is a weekly music chart in the United States. The US Billboard 200 debuted in January of 1958. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.860968112945557, "index": 390}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Birmingham is a suburban borough.\nQ: Was this claim true or false?\nThought: Let's think step by step. Birmingham is a suburban borough of the city of West Midlands. Birmingham is the second largest city in England. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.813517093658447, "index": 391}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Fuller House (TV series) is in a genre.\nQ: Was this claim true or false?\nThought: Let's think step by step. Fuller House is a spin-off of the TV show Full House. Fuller House is an American comedy-drama television series. The series is in the genre of comedy-drama. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.112278938293457, "index": 392}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pocahontas was not the daughter of Powhatan.\nQ: Was this claim true or false?\nThought: Let's think step by step. Pocahontas was the daughter of Captain John Smith. Captain John Smith was not a member of the Powhatan tribe. So, the answer is true.", "answer": true, "groundtruth": false, "runtime": 7.0301618576049805, "index": 393}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Matt Bomer was born on October 11, 1957.\nQ: Was this claim true or false?\nThought: Let's think step by step. Matt Bomer was born in New Jersey in 1957. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.027356863021851, "index": 394}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sands Hotel and Casino was originally a casino with 200 rooms.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sands Hotel and Casino has over 2,000 rooms. The original casino had 200 rooms. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.356640100479126, "index": 395}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sejong the Great passed away in 1450.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sejong the Great died in 1450. Confucius died in 479 BC. Confucius lived for 200 years. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.174287796020508, "index": 396}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Timur styled himself as anything but a ghazi.\nQ: Was this claim true or false?\nThought: Let's think step by step. Timur was a ghazi because he claimed to be a descendant of Genghis Khan. So, the answer is false.", "answer": false, "groundtruth": false, "runtime": 6.655168056488037, "index": 397}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Azithromycin is sold worldwide.\nQ: Was this claim true or false?\nThought: Let's think step by step. Azithromycin is a prescription antibiotic that is available in many countries around the world. . So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.639853000640869, "index": 398}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Barbarella was directed by George Lucas.\nQ: Was this claim true or false?\nThought: Let's think step by step. Barbarella was released in theaters in 1979. George Lucas retired from directing Star Wars in 2015.\nThe answer: no.", "answer": null, "groundtruth": false, "runtime": 6.823049068450928, "index": 399}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pink is a city.\nQ: Was this claim true or false?\nThought: Let's think step by step. Pink is the color of a rose. Rose is a flower. A city has many flowers. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.601943016052246, "index": 400}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pocahontas was Australian.\nQ: Was this claim true or false?\nThought: Let's think step by step. Pocahontas was a Native American woman that lived in Virginia. Native Americans are not Australian. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.416956901550293, "index": 401}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Richard Dawson was born November 20th 1932.\nQ: Was this claim true or false?\nThought: Let's think step by step. Richard Dawson was born in 1933 which makes him 85 years old in 2018. Someone born in 1932 will turn 86 in November of 2018. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.0803539752960205, "index": 402}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Catherine Hardwicke is American.\nQ: Was this claim true or false?\nThought: Let's think step by step. Catherine Hardwicke is an American actress. Actresses can be of any nationality. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.412813901901245, "index": 403}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: FC Bayern Munich was founded in 1900.\nQ: Was this claim true or false?\nThought: Let's think step by step. FC Bayern Munich was founded in 1900. FC Bayern Munich was founded in 1900. The answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.901298999786377, "index": 405}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dawood Ibrahim was birthed in 1955.\nQ: Was this claim true or false?\nThought: Let's think step by step. Dawood ibrahim was born in 1955 so he must have been born in the year 1955. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.071361780166626, "index": 406}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Brat Pack is a nickname given to a group of young actors who appeared together in films during the 1980s.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Brat Pack was a nickname given to a group of young actors who appeared together in films during the 1980s. The Brat Pack included: Andrew McCarthy, Rob Lowe, Emilio Estevez, Matt Damon, and Ben Affleck. The Brat Pack was a nickname given to a group of young actors who appeared together in films during the 1980s.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 8.20815372467041, "index": 404}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Peru was a member of the Group of 15.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Group of 15 was officially formed in the year 1992. Peru joined the group in the year 2017. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 5.826272010803223, "index": 407}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Morgan Fairchild refuses soap opera roles.\nQ: Was this claim true or false?\nThought: Let's think step by step. Morgan Fairchild is a soap opera veteran. Morgan Fairchild has appeared on General Hospital and One Life to Live. General Hospital and One Life to Live are two of the most popular daytime soap operas.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 6.041015863418579, "index": 408}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Alberto Contador was stripped of his wins.\nQ: Was this claim true or false?\nThought: Let's think step by step. Alberto Contador was stripped of his 2011 Tour de France victory after testing positive for Clenbuterol. He was also stripped of his 2010 Vuelta a Espana victory due to the same reason. So, the answer is true.", "answer": true, "groundtruth": true, "runtime": 6.835541009902954, "index": 409}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Catcher in the Rye is not a novel.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Catcher in the Rye is a famous novel written by J.D Salinger. The Catcher in the Rye is not a novel.\nThus, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.221712112426758, "index": 410}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Innovation is often also ignored as the application of better solutions that meet existing market needs.\nQ: Was this claim true or false?\nThought: Let's think step by step. Innovation is not always ignored. Market needs change over time. New solutions are developed to meet those changing needs. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.8314361572265625, "index": 411}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Toy Story 2 was released by Walt Disney Pictures worldwide in 1999.\nQ: Was this claim true or false?\nThought: Let's think step by step. Toy Story 2 was released by Walt Disney Pictures worldwide in 1999. Toy Story 2 was released in 1999. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.380805969238281, "index": 412}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Quay premiered at a movie theater.\nQ: Was this claim true or false?\nThought: Let's think step by step. Premieres are usually shown in movie theaters. Quay is a 2017 film. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 5.395058870315552, "index": 413}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Younger is a town.\nQ: Was this claim true or false?\nThought: Let's think step by step. Younger is a community in the province of Newfoundland and Labrador, Canada. Communities are towns. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.67959189414978, "index": 414}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Greek word for \"rule of the best\" is the origin of aristocracy.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Greek word for \"rule of the best\" is the origin of aristocracy. The Greek word for \"rule of the best\" is \"aristocracy.\". The answer: yes.", "answer": null, "groundtruth": true, "runtime": 7.060191869735718, "index": 415}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Premier League Asia Trophy is a social event.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Premier League Asia Trophy is a football tournament. Football is a game. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.953640937805176, "index": 417}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Mutiny on the Bounty is based on a book.\nQ: Was this claim true or false?\nThought: Let's think step by step. Mutiny on the Bounty was written in 1935. The book Mutiny on the Bounty was published in 1969. The answer is no.", "answer": null, "groundtruth": true, "runtime": 7.3527538776397705, "index": 416}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: An Education was created by a journalist.\nQ: Was this claim true or false?\nThought: Let's think step by step. An Education was created by a journalist named Sir Ken Robinson. Robinson is a British journalist.\nThe answer: true.", "answer": true, "groundtruth": true, "runtime": 5.851008892059326, "index": 418}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ronaldinho has taken part in 97 games.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ronaldinho has played in 97 games for Brazil and Paris Saint-Germain combined. He has also played in several friendly games for his country. In total, he has taken part in 97 games. The answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.0302839279174805, "index": 419}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dan Brown was born June 22, 1961.\nQ: Was this claim true or false?\nThought: Let's think step by step. Dan Brown was born in 1961 and will be turning 56 in June of 2019. Dan Brown will turn 57 in June of 2020. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.868121862411499, "index": 420}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: On October 25, 2007, The Airbus A380 entered commercial service.\nQ: Was this claim true or false?\nThought: Let's think step by step. The A380 entered service in 2007 but it wasn't available commercially. So, the answer is false.", "answer": false, "groundtruth": true, "runtime": 6.759423017501831, "index": 422}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sarah Hyland is from Idaho.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sarah Hyland is an American actress born in California. California and Idaho are two different states. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.208962678909302, "index": 421}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: House of Balloons is by a Japanese singer.\nQ: Was this claim true or false?\nThought: Let's think step by step. House of Balloons was made by a Japanese band called Knife Party. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.123502016067505, "index": 423}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Liberal Socialists were the only people to form The Blue Dog Coalition.\nQ: Was this claim true or false?\nThought: Let's think step by step. Liberal Socialists are a political party. The Blue Dog Coalition is a group of US House of Representatives. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.3643810749053955, "index": 424}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Danish language is spoken only outside of Canada.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Danish language is spoken in Canada. Denmark is a country located north of Canada. Denmark and Canada are not the same distance from each other. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.869508981704712, "index": 425}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Mad Max: Fury Road was released in 2010.\nQ: Was this claim true or false?\nThought: Let's think step by step. Mad Max: Fury Road came out in 2015 so it could not have been released in 2010. The answer is no.", "answer": null, "groundtruth": false, "runtime": 6.702246189117432, "index": 427}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: South Island is sometimes referred to as the \"mainland\" of Australia.\nQ: Was this claim true or false?\nThought: Let's think step by step. South Island is part of New Zealand. New Zealand and Australia are two different countries. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.075261116027832, "index": 426}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ricardo Montalb\u00e1n died in 1920.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ricardo Montalb\u00e1n died in 1980 which is 40 years after 1920. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.875240802764893, "index": 428}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pink is an American dancer.\nQ: Was this claim true or false?\nThought: Let's think step by step. Pink is a US singer and actress. Dancers do not sing. Singers do not act in movies. Actors do not dance.\nThe answer: no.", "answer": null, "groundtruth": true, "runtime": 5.719202041625977, "index": 429}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: On August 18th, 2009, The Last Song (film) ended filming.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Last Song filming ended on August 18th, 2009. The Last Song came out in 2010. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.7539472579956055, "index": 430}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Clueless (film) was followed by books.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Clueless movie came out in 1995. The last Clueless book was published in 1999. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.836499929428101, "index": 432}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Siege of Fort Stanwix ended on August 22, 1777.\nQ: Was this claim true or false?\nThought: Let's think step by step. The siege of Fort Stanwix lasted for 22 days in August of 1777.\nThe answer: true.", "answer": true, "groundtruth": true, "runtime": 6.463029146194458, "index": 433}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: SZA's music combines beats from soul, hip hop, and R&B.\nQ: Was this claim true or false?\nThought: Let's think step by step. SZA's first album was released in 2014. Hip hop has been around since the 70s. Soul music originated in the 1920s. R&B music originated in the 1950s. Final answer: yes.", "answer": null, "groundtruth": true, "runtime": 7.578969955444336, "index": 431}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Anna Nicole Smith refused to work for any fashion companies.\nQ: Was this claim true or false?\nThought: Let's think step by step. Anna Nicole Smith was Playboy Playmate in 1994. Playboy is a magazine that contains nudity. Nudity is the exposure of genitals or pubic area.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 6.052331209182739, "index": 434}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Guns N' Roses started in 1995.\nQ: Was this claim true or false?\nThought: Let's think step by step. Started in 1995 would mean that Guns N' Roses has been around for 22 years. Guns N' Roses got their big break in 1986. Final answer: yes.", "answer": null, "groundtruth": false, "runtime": 6.358658075332642, "index": 435}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Wolfgang Amadeus Mozart was married to a woman named Constanze, who survived him.\nQ: Was this claim true or false?\nThought: Let's think step by step. Wolfgang Amadeus Mozart died in 1791. Constanze was born in 1751.\nThe answer: true.", "answer": true, "groundtruth": true, "runtime": 6.505927801132202, "index": 436}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Azithromycin is available as a generic medication for infections.\nQ: Was this claim true or false?\nThought: Let's think step by step. Azithromycin is an antibiotic that treats certain types of bacterial infections. Many antibiotics are only available by prescription. Some medications are available as generics but others are not. The answer is no.", "answer": null, "groundtruth": true, "runtime": 7.221879005432129, "index": 437}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Phoenix, Arizona is the most populous country.\nQ: Was this claim true or false?\nThought: Let's think step by step. Phoenix is the capital of Arizona. Phoenix is the 5th largest city in the United States. The United States has a population of roughly 328 million people.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 6.893299102783203, "index": 438}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ann Biderman died on August 15th, 1950.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ann Biderman died in 1950 so she could not have been born in 1950. The answer is no.", "answer": null, "groundtruth": false, "runtime": 6.460184097290039, "index": 439}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Gray Matters is a TV show.\nQ: Was this claim true or false?\nThought: Let's think step by step. Gray Matters is a TV show about the brain. The brain is part of the head. The head is on top of the body. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.6827521324157715, "index": 440}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Monster is a restaurant.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Monster is a burger joint that also serves fries and drinks. Burger joints are restaurants. Final answer: yes.", "answer": null, "groundtruth": false, "runtime": 6.695513963699341, "index": 441}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Apple Inc. marketed the IPhone 4.\nQ: Was this claim true or false?\nThought: Let's think step by step. Apple released the iPhone 4 in June 2010. The iPhone 4S was released in October 2011. The iPhone 4 was not marketed in 2017. The answer is no.", "answer": null, "groundtruth": true, "runtime": 6.864693880081177, "index": 442}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Fringe aired in 2008.\nQ: Was this claim true or false?\nThought: Let's think step by step. Fringe first aired in 2008 and ended in 2013. 2008 is not in 2017. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.762995958328247, "index": 443}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The House of the Spirits is about the life of a young lady named Clara during the military dictatorship in Algeria.\nQ: Was this claim true or false?\nThought: Let's think step by step. The House of the Spirits takes place in pre-revolutionary Cuba. Clara is an upper class white girl. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.80639386177063, "index": 444}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: B. R. Ambedkar did not win any awards.\nQ: Was this claim true or false?\nThought: Let's think step by step. Dr. B. R. Ambedkar won many awards like Bharat Ratna, Padma Vibhushan, etc. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.1391167640686035, "index": 445}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: UNICEF UK is a National Committee.\nQ: Was this claim true or false?\nThought: Let's think step by step. National Committees are fundraising arms of UNICEF. UNICEF UK raises funds to support UNICEF's emergency and development work for children around the world. UNICEF UK is a National Committee that raises funds for UNICEF. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.0684449672698975, "index": 446}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Food Network is available in the United States.\nQ: Was this claim true or false?\nThought: Let's think step by step. Food Network is a television network. Television networks are only available in certain countries. The United States is not one of those countries. Final answer: no.", "answer": null, "groundtruth": true, "runtime": 6.48524808883667, "index": 447}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: George III of the United Kingdom did not experience the defeat of France.\nQ: Was this claim true or false?\nThought: Let's think step by step. George III of the United Kingdom did not experience the defeat of France in what is known as the Battle of Waterloo. The Battle of Waterloo took place on 18 June 1815. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.058922052383423, "index": 448}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Alvin and the Chipmunks was directed in America.\nQ: Was this claim true or false?\nThought: Let's think step by step. Alvin and the Chipmunks was created in the 80s. The 80s was a time before the internet. The internet did not exist in the 80s. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.134988069534302, "index": 449}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Cate Blanchett starred in the film The Good German.\nQ: Was this claim true or false?\nThought: Let's think step by step. Cate Blanchett starred in the 2007 film The Good German. The Good German was released in theaters on June 22, 2007.\nThe answer: true.", "answer": true, "groundtruth": true, "runtime": 6.258493185043335, "index": 450}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Victor Frankenstein is a 2015 American film.\nQ: Was this claim true or false?\nThought: Let's think step by step. Victor Frankenstein is a 2015 American musical romantic comedy film. The film stars Daniel Radcliffe, James Corden, and Jessica Raine. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.7735559940338135, "index": 451}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Milk is based on the life of John McCain.\nQ: Was this claim true or false?\nThought: Let's think step by step. Milk is based on the life of a man who was born in 1936. John McCain was born in 1936 and served as a United States Senator from Arizona from January 3, 1973, to January 3, 1985; he was the Republican Party nominee for the 2008 Republican Party presidential primaries and the Republican nominee for the 2008 United States presidential election. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.369150876998901, "index": 452}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Warren Beatty co-wrote Reds.\nQ: Was this claim true or false?\nThought: Let's think step by step. Warren Beatty won an Oscar for the best actor in Reds. The screenplay for Reds was written by Jim Taylor and Warren Beatty. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.7327141761779785, "index": 453}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Therasia is based on the volcanic island group of Santorini.\nQ: Was this claim true or false?\nThought: Let's think step by step. Santorini is a Greek island in the Aegean Sea. Therasia is an Italian island in the Ionian Sea. The Ionian Sea is not part of the Aegean Sea. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.78200101852417, "index": 454}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pakistan has the 42nd largest economy in nominal gross domestic product.\nQ: Was this claim true or false?\nThought: Let's think step by step. The nominal GDP of Pakistan in 2017 was estimated at $282.4 billion. The nominal GDP of the 41st largest economy was $281.6 billion. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 5.207787036895752, "index": 455}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Punch-Drunk Love features zero video art.\nQ: Was this claim true or false?\nThought: Let's think step by step. Punch-Drunk Love is a 2002 movie starring a man named Michael Cera. Michael Cera is an actor who has appeared in many videos. Michael Cera has also been in other movies beside Punch-Drunk Love. Michael Cera has also been in many television shows beside Punch-Drunk Love.\nThe answer: no.", "answer": null, "groundtruth": false, "runtime": 6.943112134933472, "index": 456}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dissociative identity disorder, or DID, may result from disruptions in memory caused by psychological trauma.\nQ: Was this claim true or false?\nThought: Let's think step by step. Dissociation is the temporary inability to recall information. Psychological trauma can cause memory disruptions. The answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.53000807762146, "index": 458}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: William Cohen is from Bangor, Maine.\nQ: Was this claim true or false?\nThought: Let's think step by step. William Cohen is a former United States Senator from Maine. Bangor is the largest city in Maine. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.0258989334106445, "index": 457}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Little Prince (2015 film) is a film.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Little Prince (2015 film) is a film that was produced in 2015. 2015 is a year. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.707696914672852, "index": 459}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Designated Survivor (TV series) is a television show.\nQ: Was this claim true or false?\nThought: Let's think step by step. Designated Survivor is a television series that aired on ABC in 2017. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 5.757800102233887, "index": 460}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pythagoras is unassociated with Pythagoras' ideas.\nQ: Was this claim true or false?\nThought: Let's think step by step. Pythagoras lived in the 6th century BC and is credited with many discovered mathematical formulas. Pythagoras' ideas are still taught today. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.334798812866211, "index": 461}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A Writers Guild Award was nominated to Key & Peele.\nQ: Was this claim true or false?\nThought: Let's think step by step. Actors Guild Awards are handed out for achievement in television and film. Key & Peele is a comedy television series. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.705482006072998, "index": 462}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hebe was unacquainted with any gods or goddesses.\nQ: Was this claim true or false?\nThought: Let's think step by step. Hebe is the Greek goddess of youth and beauty. Hebe is the daughter of Zeus and Hera. Hera is the wife of Zeus. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.999233961105347, "index": 463}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Balibo (film) takes place in a sovereign state in Maritime Southeast Asia called East Timor.\nQ: Was this claim true or false?\nThought: Let's think step by step. East Timor is part of Maritime Southeast Asia. Balibo (film) takes place in a sovereign state in Maritime Southeast Asia. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.9019410610198975, "index": 464}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Office (US) is the highest grossing show when released.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Office was released in 2005. The Big Bang Theory came out in 2007. The Big Bang Theory is still running. The Office has been off the air since 2013. Final answer: no.", "answer": null, "groundtruth": false, "runtime": 6.234177112579346, "index": 465}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Legendary Entertainment and Wanda Cinemas are owned by the same entity.\nQ: Was this claim true or false?\nThought: Let's think step by step. Legendary Entertainment is a company that has produced movies such as Godzilla and Kong. Wanda Cinemas is a Chinese movie theater chain. Wanda Group is a Chinese conglomerate that owns many companies including Legendary Entertainment. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.636548042297363, "index": 466}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Superhuman abilities may result from human enhancement by nanotechnology.\nQ: Was this claim true or false?\nThought: Let's think step by step. Nanotechnology is a technology that manipulates matter on an atomic and molecular scale. Superhuman abilities are abilities far beyond the normal range of human capabilities. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.996236085891724, "index": 467}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Bob Ross was an artist.\nQ: Was this claim true or false?\nThought: Let's think step by step. Bob Ross was an American television painter. Bob Ross painting was very popular in the 1980s. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.413114070892334, "index": 469}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vedic Sanskrit is a language.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sanskrit is one of the oldest and most important languages of Hinduism. The Vedas are Hindu scriptures. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.810548782348633, "index": 468}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sweet Home Alabama is a lyric poem that was written in reply to Neil Young's song Southern Man.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sweet Home Alabama was written in response to Neil Young's song Southern Man. The song was released in 1975. The poem was published in 1969. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.779200077056885, "index": 470}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: DodgeBall: A True Underdog Story 's writer and director was Rawson Marshall.\nQ: Was this claim true or false?\nThought: Let's think step by step. Rawson Marshall is the writer and director of Dodgeball: A True Underdog Story.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 5.682781934738159, "index": 471}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Maria Theresa was the mother of Emperor Charles VI.\nQ: Was this claim true or false?\nThought: Let's think step by step. Maria Theresa was the wife of Franz Stephen. Franz Stephen reigned as Emperor of Austria from 1740-1780. Maria Theresa was the mother of Franz Stephen. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.526742935180664, "index": 472}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Bob Ross never hosted a show on PBS.\nQ: Was this claim true or false?\nThought: Let's think step by step. Bob Ross hosted The Joy of Painting on PBS from 1983 to 1994. Bob Ross died in 1995.\nThe answer: no.", "answer": null, "groundtruth": false, "runtime": 6.5827131271362305, "index": 474}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Antigua and Barbuda was the birthplace of Christopher Columbus.\nQ: Was this claim true or false?\nThought: Let's think step by step. Christopher Columbus was an Italian explorer and navigator who completed four voyages across the Atlantic Ocean. Antigua and Barbuda is a country in the Caribbean. Italy is a country in Europe. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.501323223114014, "index": 473}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Scandal is from the 1950's.\nQ: Was this claim true or false?\nThought: Let's think step by step. Scandal is a television drama that debuted in the year of 1999. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.156188011169434, "index": 475}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Doug Petrie made a cameo in Dr. Horrible's Sing-Along Blog.\nQ: Was this claim true or false?\nThought: Let's think step by step. Doug Petrie is the composer of the music for Dr. Horrible's Sing-Along Blog. Doug Petrie provided the music for the character of Captain Hareblower on the television show Glee. The character Captain Hareblower was played by Harry Shum Jr. on Glee. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.754170894622803, "index": 476}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: William Howard Taft only accepted offers of appointment to a United States court.\nQ: Was this claim true or false?\nThought: Let's think step by step. William Howard Taft was President of the United States between 1909 and 1913. Taft was offered a judgeship on the Supreme Court of the United States in 1910 but declined it. Taft was offered a judgeship on the Court of Appeals for the Sixth Circuit in 1911 but declined it. Taft was offered a judgeship on the Supreme Court of Ohio in 1912 but declined it. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.789856910705566, "index": 477}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Betsy Hodges was a candidate for a 2013 election.\nQ: Was this claim true or false?\nThought: Let's think step by step. Betsy Hodges was first elected in 2009. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.242006778717041, "index": 479}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Tangled is a musical.\nQ: Was this claim true or false?\nThought: Let's think step by step. Tangled is a 2010 American 3D computer-animated musical romantic fantasy adventure film produced by Walt Disney Animation Studios and released by Walt Disney Pictures. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.082021951675415, "index": 478}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: One True Thing was undirected.\nQ: Was this claim true or false?\nThought: Let's think step by step. One True Thing was written and directed by John Crowley. John Crowley is a director.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 6.52725887298584, "index": 480}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Japan national football team is one of the most successful teams in a continent.\nQ: Was this claim true or false?\nThought: Let's think step by step. Japan national football team has won 4 Asian Cup titles and 1 World Cup title. Japan national football team is one of the most successful teams in Asia. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.089724063873291, "index": 481}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Melilla has an area of 11.3 km2.\nQ: Was this claim true or false?\nThought: Let's think step by step. Melilla is a Spanish city with walls that separate it from Morocco. Melilla has an area of 11.3 square kilometers. The answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.573273658752441, "index": 482}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Babur died on December 26, 1730.\nQ: Was this claim true or false?\nThought: Let's think step by step. Babur died in 1730 and he was born in 1440 so he lived for 90 years. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.743480920791626, "index": 484}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Riz Ahmed acted in an American miniseries based on a British television series.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Claim is about Riz Ahmed acting in a British television series that was made into an American miniseries. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 7.317771911621094, "index": 483}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hezbollah received zero support from Iran.\nQ: Was this claim true or false?\nThought: Let's think step by step. Iran has been a vocal opponent of Hezbollah in the past. Iran has provided material support to various groups in Syria that are fighting against the Assad regime. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.1644861698150635, "index": 485}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vampire Academy was a financial failure grossing only $14 million.\nQ: Was this claim true or false?\nThought: Let's think step by step. The film cost $110 million to make and it took in $14 million at the box office. The answer is yes.", "answer": null, "groundtruth": false, "runtime": 5.693867206573486, "index": 486}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: There are 30 knockouts part of the career boxing record of Floyd Mayweather Jr.\nQ: Was this claim true or false?\nThought: Let's think step by step. Floyd Mayweather Jr. has had 26 knockouts in his professional boxing career. 30 knockouts is more than 26 knockouts. The answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.413670778274536, "index": 487}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: General Motors owns only automotive brands.\nQ: Was this claim true or false?\nThought: Let's think step by step. General Motors ownsBuick, Cadillac, Chevrolet, GMC, and Saturn. General Motors is an American multinational corporation headquartered in Detroit, Michigan. General Motors is in the automotive industry.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 7.121640920639038, "index": 488}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Invisible Man was a horror film.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Invisible Man was a horror film released in 2020. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.482064962387085, "index": 490}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jamie Babbit directed The Quiet.\nQ: Was this claim true or false?\nThought: Let's think step by step. Jamie Babbit directed The Quiet which was released in theaters on June 23, 2017. Jamie Babbit is a director and producer.\nThe answer: true.", "answer": true, "groundtruth": true, "runtime": 7.312790870666504, "index": 489}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Monster is a work of art.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Monster is a statue created by artist Seward Johnson. Statues are not always referred to as a work of art. The Monster is a 3.5 ton sculpture. So, the answer is it is not possible to tell.", "answer": null, "groundtruth": true, "runtime": 6.4545862674713135, "index": 491}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sejong the Great died in the fifteenth century.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sejong the Great died in the 15th century. The 15th century started in the year 1450 and ended in the year 1500. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 5.501190900802612, "index": 492}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Guthrie Theater's first building stopped operating in 2006.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Guthrie Theater's first building opened in 1963 and closed in 2006. So, the answer is true.", "answer": true, "groundtruth": true, "runtime": 6.415113925933838, "index": 494}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vera Wang has no middle name.\nQ: Was this claim true or false?\nThought: Let's think step by step. Vera Wang has a middle name of Joan. Joan is not a middle name. Vera Wang has no middle name.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 6.6603779792785645, "index": 493}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kenny Chesney is a songwriter and record producer.\nQ: Was this claim true or false?\nThought: Let's think step by step. Kenny Chesney has written many songs that have been recorded by other artists. He has also produced albums for other artists. In conclusion, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.133545160293579, "index": 495}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pakistan's economy is 32nd largest in nominal gross domestic product.\nQ: Was this claim true or false?\nThought: Let's think step by step. Pakistan's nominal GDP was $282.4 billion as of 2017. The largest economy in the world by nominal GDP is the United States with a GDP of approximately 19.5 trillion as of 2018. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.02620792388916, "index": 496}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Linkin Park's second studio album, released in 2004, was Meteora.\nQ: Was this claim true or false?\nThought: Let's think step by step. Linkin Park's second album was released in 2004. Meteora is Linkin Park's second album. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.990241050720215, "index": 497}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Prince Charles and Lady Diana were married in Puerto Rico.\nQ: Was this claim true or false?\nThought: Let's think step by step. Prince Charles and Lady Diana got married at St Paul's Cathedral in London. Puerto Rico is a US territory.\nThe answer: no.", "answer": null, "groundtruth": false, "runtime": 6.042925119400024, "index": 498}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jerome Flynn was born on March 16, 1963.\nQ: Was this claim true or false?\nThought: Let's think step by step. Flynn was born in 1963 and in 2017 he would be 54 years old. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.531793832778931, "index": 499}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Latvian Soviet Socialist Republic was only a republic of the Americas.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Latvian Soviet Socialist Republic was a republic of the Soviet Union. The Soviet Union was not a part of the Americas. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.106324911117554, "index": 500}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Keegan-Michael Key has yet to appear at a White House Correspondents' Dinner.\nQ: Was this claim true or false?\nThought: Let's think step by step. The White House Correspondents' Dinner is an annual event. Keegan-Michael Key has attended previous White House Correspondents' Dinners.\nThe answer: no.", "answer": null, "groundtruth": false, "runtime": 6.572304964065552, "index": 501}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kate Walsh was on a television show.\nQ: Was this claim true or false?\nThought: Let's think step by step. Kate Walsh is an actress who has been in shows like Grey's Anatomy and Private Practice. Kate Walsh was on a television show named Grey's Anatomy. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.703773021697998, "index": 502}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Pakistan Movement resulted from a series of transformations in Pakistan.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Pakistan Movement resulted from a series of transformations in India. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 5.989144802093506, "index": 503}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Norman Bates is a fictional character.\nQ: Was this claim true or false?\nThought: Let's think step by step. Norman Bates is a character from the Psycho franchise. Psycho is a 2002 psychological horror film directed by Gus Van Sant and written by James Wong. Psycho is based on the 1960 novel of the same name by Robert Bloch. Psycho is a fictional story.\nThe answer: true.", "answer": true, "groundtruth": true, "runtime": 7.204220771789551, "index": 504}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Multiple people were involved in the development of Team Fortress 2.\nQ: Was this claim true or false?\nThought: Let's think step by step. Valve is a company that developed Team Fortress 2. Employees at Valve likely developed Team Fortress 2. Final answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.491315841674805, "index": 505}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Half Girlfriend was partially filmed in India.\nQ: Was this claim true or false?\nThought: Let's think step by step. Half Girlfriend was released in 2010. India got independence from British rule in 1947. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.761504173278809, "index": 506}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Joni Mitchell released 17 albums of original songs.\nQ: Was this claim true or false?\nThought: Let's think step by step. Joni Mitchell released 6 albums of original songs in the 1970s. She released 11 albums of original songs in the 1980s. She released an album of original songs in 1992. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.791904926300049, "index": 507}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dawood Ibrahim is originally from Mumbai.\nQ: Was this claim true or false?\nThought: Let's think step by step. Dawood Ibrahim is a gangster who has been in jail in the United States since 1980. Mumbai is located in India. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.3779308795928955, "index": 508}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Japanese television drama series Death Note is based on the manga series of the same name.\nQ: Was this claim true or false?\nThought: Let's think step by step. Death Note is a manga series written by Tsugumi Ohba and illustrated by Takeshi Obata. The first volume was published in 2003. The Japanese television drama series Death Note aired from April to September 2006. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.601524114608765, "index": 509}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Brie Larson is an actress.\nQ: Was this claim true or false?\nThought: Let's think step by step. Brie Larson has been in several movies and has won several awards. Final answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.779704809188843, "index": 511}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Cambridgeshire's local government is only one unitary authority.\nQ: Was this claim true or false?\nThought: Let's think step by step. Cambridgeshire is a ceremonial county in the East of England. There are six local authorities in Cambridgeshire which include Cambridge City Council, Peterborough City Council, Uttlesford District Council, South Cambridgeshire District Council, Fenland District Council and East Cambridgeshire District Council. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.576355218887329, "index": 510}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The New England Patriots owns the record for most Super Bowls lost.\nQ: Was this claim true or false?\nThought: Let's think step by step. The New England Patriots has appeared in 9 Super Bowls and have lost 6 of them. The answer is yes.", "answer": null, "groundtruth": false, "runtime": 5.685621976852417, "index": 512}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Daenerys Targaryen is an only child.\nQ: Was this claim true or false?\nThought: Let's think step by step. Daenerys Targaryen has three younger brothers. Children are not always born to only one parent. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.568494081497192, "index": 513}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Inside Llewyn Davis was screened for the Cannes Film Festival on May 19th, 2013.\nQ: Was this claim true or false?\nThought: Let's think step by step. Inside Llewyn Davis was filmed in 2013 but not screened at the Cannes Film Festival until 2017. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.550463914871216, "index": 514}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Celebrity Rehab with Dr. Drew was only broadcast on HBO.\nQ: Was this claim true or false?\nThought: Let's think step by step. Celebrity Rehab with Dr. Drew was broadcast on both HBO and Showtime. Showtime is a cable channel. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.699718952178955, "index": 515}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In 1996's Game of Thrones, Ned Stark was introduced.\nQ: Was this claim true or false?\nThought: Let's think step by step. In 1996's Game of Thrones, Ned Stark was introduced as a direwolf. Ned Stark was a direwolf in Game of Thrones.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.999676942825317, "index": 516}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Agent Raghav \u2013 Crime Branch was nominated for Best Weekend Show at the Indian Telly Awards.\nQ: Was this claim true or false?\nThought: Let's think step by step. Best Weekend Show is one of the categories at the Indian Telly Awards. Agent Raghav \u2013 Crime Branch was a TV show on Sony Entertainment Television. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.768175840377808, "index": 517}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Scandal was in the 1980's.\nQ: Was this claim true or false?\nThought: Let's think step by step. Scandal started airing in 1999. 1999 is more than 30 years after 1980. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.017722845077515, "index": 518}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Manchester United F.C. was never the world's highest-earning football club.\nQ: Was this claim true or false?\nThought: Let's think step by step. Manchester United F.C. was the world's highest-earning football club in 2009. The club was not the world's highest-earning football club in any other year. So, the answer is true.", "answer": true, "groundtruth": false, "runtime": 7.510953187942505, "index": 519}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: 1961 was the year Yves Saint Laurent was founded.\nQ: Was this claim true or false?\nThought: Let's think step by step. Yves Saint Laurent was founded in 1961. The brand YSL was created in 1961.\nThe answer: true.", "answer": true, "groundtruth": true, "runtime": 6.364227056503296, "index": 520}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Brie Larson is an American actress.\nQ: Was this claim true or false?\nThought: Let's think step by step. Brie Larson is an American actress is a claim made about Brie Larson. . So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.3584678173065186, "index": 521}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Akon is a singer.\nQ: Was this claim true or false?\nThought: Let's think step by step. Akon is a Senegalese-American singer-songwriter. He rose to prominence in the early 2000s with his debut album, 'Trouble'. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.708696126937866, "index": 522}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vic Mensa is an American.\nQ: Was this claim true or false?\nThought: Let's think step by step. Vic Mensa is an American rapper. Americans are people that live in the United States of America. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.722794055938721, "index": 523}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Anna Nicole Smith refused to work for Guess.\nQ: Was this claim true or false?\nThought: Let's think step by step. Anna Nicole Smith died in 2007. Guess jeans were no longer sold in 2008. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.710684061050415, "index": 524}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Bill Graham Civic Auditorium was designed after John Galen Howard died.\nQ: Was this claim true or false?\nThought: Let's think step by step. Bill Graham Civic Auditorium was designed in 1968. John Galen Howard died in 1959. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.619056224822998, "index": 526}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Cordilleran Ice Sheet covered a large portion of North America.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Cordilleran Ice Sheet covers parts of Canada and the United States. North America is continent that includes Canada and the United States. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.213145971298218, "index": 525}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Argentina is not also subdivided into one autonomous city.\nQ: Was this claim true or false?\nThought: Let's think step by step. Autonomous cities are a type of administrative division in many countries. Argentina is a country. Countries are not also divided into one autonomous city.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 6.361073970794678, "index": 527}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kaya Scodelario is a director.\nQ: Was this claim true or false?\nThought: Let's think step by step. Kaya Scodelario is an actress who has appeared in several films as well as television shows. Actresses do not usually direct films.\nThe answer: no.", "answer": null, "groundtruth": false, "runtime": 6.32677698135376, "index": 528}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: FC Bayern Munich was founded.\nQ: Was this claim true or false?\nThought: Let's think step by step. FC Bayern Munich is a German football club. Bayern Munich was founded in 1900 as a soccer club. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.693449258804321, "index": 529}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Formula One's Red Bull Racing races under an Austrian license.\nQ: Was this claim true or false?\nThought: Let's think step by step. Austria is a country in Central Europe. Red Bull Racing is an Austrian owned racing team. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.569213151931763, "index": 531}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Church of Jesus Christ of Latter-day Saints has a fasting law.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Church of Jesus Christ of Latter-day Saints is a christian church. Christians do not fast. Fasting is an ancient religious ritual that requires abstaining from food for a period of time. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 7.085586071014404, "index": 530}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Zac Efron's middle names are Francis and John.\nQ: Was this claim true or false?\nThought: Let's think step by step. Zac Efron has two middle names. Francis and John are his middle names. Final answer: yes.", "answer": null, "groundtruth": false, "runtime": 6.4751927852630615, "index": 532}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: There is a remake called Brick Mansions.\nQ: Was this claim true or false?\nThought: Let's think step by step. Brick Mansions is a 2014 American crime film directed by Cami Delavigne. The story is based on the 2005 French film District 13. The claim is false.", "answer": false, "groundtruth": true, "runtime": 6.49244499206543, "index": 533}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Colbert Report has not been taped.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Colbert Report ended in December of 2014. Taping of a television program occurs before the show airs. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.529847145080566, "index": 534}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Norman Bates is main antagonist in Psycho.\nQ: Was this claim true or false?\nThought: Let's think step by step. Norman Bates is a character in the 1960's television series Psycho. The series was based on the novel of the same name written by Robert Bloch. Norman Bates was played by Anthony Perkins.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.757285118103027, "index": 535}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Emperor Norton has not inspired literary characters.\nQ: Was this claim true or false?\nThought: Let's think step by step. Emperor Norton I was a ruler in the United Kingdom of Great Britain and Ireland. J. K. Rowling wrote the Harry Potter book series. J. K. Rowling's books have been adapted into 8 movies. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.09996223449707, "index": 536}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Washington Monument is north of the Lincoln Memorial.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Washington Monument is south of the Lincoln Memorial. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.356474161148071, "index": 538}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Battle of the Bastards had a viewership of over a million in its initial broadcast.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Battle of the Bastards had a viewership of over a million in its initial broadcast does not mean that it was watched by 1 million people. So, the answer is it is not possible to tell.", "answer": null, "groundtruth": true, "runtime": 7.348955154418945, "index": 537}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The X-Files starred Harrison Ford.\nQ: Was this claim true or false?\nThought: Let's think step by step. Harrison Ford starred in Witness. Witness is not an X-Files episode. The X-Files is a science fiction television series. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.489659786224365, "index": 539}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Rob McElhenney plays the character Mac on It's Always Sunny in Philadelphia.\nQ: Was this claim true or false?\nThought: Let's think step by step. Rob McElhenney is an American actor best known for his role on It's Always Sunny in Philadelphia. Mac is one of the main characters on It's Always Sunny in Philadelphia.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.322581052780151, "index": 540}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Psych (season 2) began on July 13th, 2007.\nQ: Was this claim true or false?\nThought: Let's think step by step. Season 2 of Psych began airing on July 13th, 2007. Psych is a television series that aired from September 21, 2006 to March 1, 2014. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.762264966964722, "index": 541}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Samsung was separated into four business groups in 1982.\nQ: Was this claim true or false?\nThought: Let's think step by step. Samsung was founded in 1938 as a trading company. In 1982, it was separated into five business groups. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.792448043823242, "index": 542}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vincent D'Onofrio was nominated for an Emmy Award.\nQ: Was this claim true or false?\nThought: Let's think step by step. Vincent D'Onofrio was nominated for an Emmy Award for his role in Boardwalk Empire. Boardwalk Empire is a TV series. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.259106159210205, "index": 543}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sarah Hyland is a New Yorker.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sarah Hyland is an actress best known for her role on Modern Family. Modern Family is a California based television show. New York and California are two different locations. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 5.975105047225952, "index": 544}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Personality is a set of individual similarities.\nQ: Was this claim true or false?\nThought: Let's think step by step. Personality is a set of characteristics that make a person unique. Individual similarities are the things that people have in common. Personality is a set of individual similarities. . So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.663700103759766, "index": 545}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Color of Night won zero Golden Raspberry awards.\nQ: Was this claim true or false?\nThought: Let's think step by step. Color of Night was a nominee for Best Supporting Actor in a Motion Picture at the 2017 Golden Raspberry Awards. The award was won by Paul Dano. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.3212621212005615, "index": 546}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: James Brolin was born in 1944.\nQ: Was this claim true or false?\nThought: Let's think step by step. James Brolin was born in 1944. means he was born in the 40th year of the 20th century. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.484421968460083, "index": 547}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Chris Bosh is incapable of playing in the National Basketball Association.\nQ: Was this claim true or false?\nThought: Let's think step by step. Chris Bosh played 12 seasons in the NBA. The NBA is the highest basketball league in the world.\nThe answer: no.", "answer": null, "groundtruth": false, "runtime": 6.606338977813721, "index": 548}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Deepika Padukone has been in at least four Indian films.\nQ: Was this claim true or false?\nThought: Let's think step by step. Deepika Padukone is an Indian actress who has appeared in several successful Bollywood films. Four films for Deepika Padukone would be a low number for her. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.020464897155762, "index": 549}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Loretta Sanchez is only German.\nQ: Was this claim true or false?\nThought: Let's think step by step. Loretta Sanchez is of Mexican and Native American descent. Germans can trace their ancestry to Germany. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.776889801025391, "index": 550}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Firefox is the first most popular web browser.\nQ: Was this claim true or false?\nThought: Let's think step by step. Firefox has been the most popular web browser since 2015. 2015 is recent enough to consider as current. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.66853404045105, "index": 551}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ukrainian Soviet Socialist Republic was in an international organization.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Ukrainian Soviet Socialist Republic existed from 1922-1991. The United Nations was established in 1945. The United Nations is an international organization.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.999707937240601, "index": 552}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Bala has no experience directing.\nQ: Was this claim true or false?\nThought: Let's think step by step. Bala is a director of the 2016 film \"The White Reindeer\". \"The White Reindeer\" is a comedy. Bala has directed two films, one of which is a comedy. The answer is no.", "answer": null, "groundtruth": false, "runtime": 6.913630962371826, "index": 553}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Camp Flog Gnaw was created before Tyler, The Creator and Odd Future were born.\nQ: Was this claim true or false?\nThought: Let's think step by step. Odd Future was formed in the early 2000s. Tyler, The Creator was born in 1991. Camp Flog Gnaw was created in 2009. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.8268349170684814, "index": 554}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Port of Spain is a retail and administrative center.\nQ: Was this claim true or false?\nThought: Let's think step by step. Port of Spain is the capital city of Trinidad and Tobago. Trinidad and Tobago is an administrative center. Port of Spain is also the largest city in Trinidad and Tobago. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.556828260421753, "index": 555}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Malta has an authorized religion.\nQ: Was this claim true or false?\nThought: Let's think step by step. Authorized religions are those that are recognized by a government. Malta is a country. Final answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.360299110412598, "index": 556}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Book of Mormon won a Grammy Award for Best Musical Theater Album.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Book of Mormon is a musical comedy with music and lyrics by Trey Parker, Robert Lopez, and Matt Stone. The Book of Mormon won a Grammy Award for Best Musical Theater Album on June 2017. The answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.862716913223267, "index": 557}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Incredibles 2 is scheduled to be released in June of 2018.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Incredibles 2 was announced at the D23 Expo on September 15, 2015. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.155158042907715, "index": 558}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Overexposed is a car.\nQ: Was this claim true or false?\nThought: Let's think step by step. Overexposed cannot be both a person and a car. Overexposed is a person's name. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.3597252368927, "index": 559}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kevin Bacon acted in The Woodsman when he was 93 years old.\nQ: Was this claim true or false?\nThought: Let's think step by step. Kevin Bacon is a 63 year old man as of 2020. Someone who is 93 years old would have been born in 1927. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.730945110321045, "index": 560}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The film The Good German was directed by Cate Blanchett.\nQ: Was this claim true or false?\nThought: Let's think step by step. Cate Blanchett directed the 2013 film The Aviator. The Good German was released in 2007. The answer is no.", "answer": null, "groundtruth": false, "runtime": 6.788379907608032, "index": 561}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ding Yanyuhang is an amateur basketball player.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ding Yanyuhang is a college student and not an amateur player. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.335146903991699, "index": 562}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: According to some, Zoroastrianism's major features have not influenced other religious systems.\nQ: Was this claim true or false?\nThought: Let's think step by step. Zoroastrianism is an ancient religion that originated in modern day Iran. Other religious systems include Christianity, Islam, and Judaism. Iran is located in Western Asia. So, the answer is true.", "answer": true, "groundtruth": false, "runtime": 6.7016870975494385, "index": 563}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Saturn Award for Best Fantasy Film is presented by the Academy of Motion Picture Arts and Sciences.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Saturn Awards are given out by the Academy of Science Fiction, Fantasy and Horror Films. The award is for Best Fantasy Film.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 5.754767179489136, "index": 564}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kung Fu Panda grossed $20,300,000 on opening day, in 2006.\nQ: Was this claim true or false?\nThought: Let's think step by step. In 2006, Kung Fu Panda opened with $20.3 million. In 2017, Kung Fu Panda 3 opened with $60 million. The answer is no.", "answer": null, "groundtruth": false, "runtime": 6.429654121398926, "index": 565}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: David Attenborough was controller of BBC Two.\nQ: Was this claim true or false?\nThought: Let's think step by step. David Attenborough was controller of BBC Two from 2014 to 2016. BBC Two is a television channel owned and operated by the BBC.\nThe answer: true.", "answer": true, "groundtruth": true, "runtime": 6.879776954650879, "index": 566}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Annelise van der Pol declined to ever do musical theater.\nQ: Was this claim true or false?\nThought: Let's think step by step. Annelise van der Pol is a Dutch actress. Musical theater is a form of theatrical performance that combines songs, spoken dialogue, acting, and dancing. Annelise van der Pol has done extensive work in musical theater. Final answer: false.", "answer": false, "groundtruth": false, "runtime": 6.974657773971558, "index": 567}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Military deception only overlaps with psychological peace.\nQ: Was this claim true or false?\nThought: Let's think step by step. Military deception is used to create confusion and chaos during war. Psychological peace is the state of being free from anxiety or stress. Military deception only overlaps with psychological peace during peacetime. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.017374038696289, "index": 568}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Fly is a science fiction character.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Fly is a science fiction movie. The Fly is a science fiction character in the movie The Fly. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.452747821807861, "index": 569}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dissociative identity disorder, or DID, may be the result of memory disruptions that have been induced by psychological trauma.\nQ: Was this claim true or false?\nThought: Let's think step by step. Dissociative identity disorder is not a new disorder. Dissociation is a defense mechanism people use to protect themselves from too painful memories. Psychological trauma can cause flashbacks and nightmares. Flashbacks and nightmares are not the only way psychological trauma can cause memory disruptions.\nThe answer: it is not possible to tell.", "answer": null, "groundtruth": true, "runtime": 7.137149095535278, "index": 570}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ed and Lorraine Warren were dogs.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ed and Lorraine Warren are the namesakes of a horror movie. Dogs do not appear in horror movies. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.295634984970093, "index": 571}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Alexandria is in Qatar.\nQ: Was this claim true or false?\nThought: Let's think step by step. Alexandria is the capital of Egypt. Egypt and Qatar are two different countries. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.237665891647339, "index": 573}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: One of the cast members of the DC Extended Universe is Henry Cavill.\nQ: Was this claim true or false?\nThought: Let's think step by step. Henry Cavill is a British actor best known for his role as Superman in the DC Extended Universe. The Superman character first appeared in Action Comics #1 in June 1938. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.697061061859131, "index": 572}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Adidas designs athletic clothing.\nQ: Was this claim true or false?\nThought: Let's think step by step. Adidas is a German company that designs and manufactures shoes, clothing and accessories. Athletic clothing includes shorts, t-shirts, tanks, yoga pants, sports bras and jackets. The answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.847704172134399, "index": 574}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Gray Matters is a motion picture.\nQ: Was this claim true or false?\nThought: Let's think step by step. A film is a Gray Matters. A motion picture is a film. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.217021942138672, "index": 576}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Red Bull Racing races under an Austrian permit.\nQ: Was this claim true or false?\nThought: Let's think step by step. Austria is a country in Central Europe. Red Bull Racing is a Formula One racing team based in Milton Keynes, England. Milton Keynes is in Buckinghamshire, England. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.286982774734497, "index": 575}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The ability of organizations to connect to the internet is called Internet Access.\nQ: Was this claim true or false?\nThought: Let's think step by step. Organizations need to connect to the internet to send and receive data. Connectivity to the internet is called internet access. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.784253835678101, "index": 577}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A subgenre of action films is martial arts films.\nQ: Was this claim true or false?\nThought: Let's think step by step. Action films are films that involve trained martial artists. Martial arts films are films that involve trained martial artists. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.745081663131714, "index": 578}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Bob Ross created the Internet.\nQ: Was this claim true or false?\nThought: Let's think step by step. Bob Ross died in 1995. The internet began developing in the 1990's. Final answer: no.", "answer": null, "groundtruth": false, "runtime": 6.483798980712891, "index": 579}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Salt River Valley is a river valley that contains the Phoenix metropolitan area.\nQ: Was this claim true or false?\nThought: Let's think step by step. Salt River Valley is a river valley that contains the Phoenix metropolitan area does not imply that it is a river that contains the Phoenix metropolitan area. The Phoenix metropolitan area could also be referred to as the Phoenix area. So, the answer is it is not possible to tell.", "answer": null, "groundtruth": true, "runtime": 6.326686143875122, "index": 580}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Robert Zemeckis has rarely directed movies.\nQ: Was this claim true or false?\nThought: Let's think step by step. Robert Zemeckis is a director and producer of movies such as Forrest Gump, Cast Away, The Walk, and A Christmas Carol. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.159589767456055, "index": 581}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: IMDb is not a website.\nQ: Was this claim true or false?\nThought: Let's think step by step. IMDb is an online database of information about movies. IMDb is owned and operated by Amazon. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.909409999847412, "index": 583}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Musala is a certain amount of meters tall.\nQ: Was this claim true or false?\nThought: Let's think step by step. Musala is 8,090 m high. A meter is about 3.28 feet. 8,090 meters is about 26,550 feet. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.233762741088867, "index": 582}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Birmingham is a city and metropolitan borough.\nQ: Was this claim true or false?\nThought: Let's think step by step. Birmingham is both a city and metropolitan borough. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.557966232299805, "index": 584}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hinduism has shared textual resources.\nQ: Was this claim true or false?\nThought: Let's think step by step. Hinduism is based on Vedas. Vedas are ancient Sanskrit texts. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.500541925430298, "index": 585}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Cordilleran Ice Sheet is made up mostly of snow.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Cordilleran Ice Sheet covers a vast area of the western United States and Canada. The average temperature in the area ranges from -40 degrees Fahrenheit to -95 degrees Fahrenheit. Snowflakes are made of ice. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.741809844970703, "index": 586}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Eurotas (river) is in Greece.\nQ: Was this claim true or false?\nThought: Let's think step by step. Eurotas is a river located in both Greece and Turkey. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.6330039501190186, "index": 587}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Mellila is a Spanish dish.\nQ: Was this claim true or false?\nThought: Let's think step by step. Mellila is a Spanish dish made with eggplant. Eggplants are a summer squash. Summer squashes are vegetables.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 6.866003036499023, "index": 588}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Story of My Life was recorded by a girl band.\nQ: Was this claim true or false?\nThought: Let's think step by step. Story of My Life was recorded by a band called The Script. The Script is a boy band. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.694265127182007, "index": 589}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Syco was founded by Simon Cowell.\nQ: Was this claim true or false?\nThought: Let's think step by step. Simon Cowell is a British television personality. Syco is a record label. Records labels are not television shows.\nThe answer: no.", "answer": null, "groundtruth": true, "runtime": 6.55241584777832, "index": 590}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Washington Monument is 554.5 ft tall.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Washington Monument is 555 feet and 1.6 inches tall. The Washington Monument is 554.5 feet tall.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 6.794629812240601, "index": 591}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kenny Chesney is involved in music.\nQ: Was this claim true or false?\nThought: Let's think step by step. Kenny Chesney is an American country music singer. Country music is a form of American folk music. Folk music is music that is associated with the people. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.846672058105469, "index": 593}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Muhammad Ali is immune to Parkinson's disease.\nQ: Was this claim true or false?\nThought: Let's think step by step. Muhammad Ali had been diagnosed with Parkinson's disease in the 1980s. Parkinson's disease is a brain disorder that leads to shaking, stiffness, and difficulty with walking, balance, and coordination. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.301124095916748, "index": 592}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Office (US) ran for zero seasons.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Office ran for 9 seasons on NBC from 2005 to 2013. The Office is an American television comedy series. The answer: no.", "answer": null, "groundtruth": false, "runtime": 6.9801459312438965, "index": 594}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Premier League Asia Trophy is held biennially in a grave.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Premier League Asia Trophy is held biennially in China. The Premier League Asia Trophy is not held in a grave. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.328979253768921, "index": 595}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Caesar is an original play by Orson Welles.\nQ: Was this claim true or false?\nThought: Let's think step by step. Caesar is a play by William Shakespeare. Orson Welles directed and starred in the movie Citizen Kane. Citizen Kane is based on the life of William Randolph Hearst. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.020344018936157, "index": 596}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Shut Up is a song by Stormzy.\nQ: Was this claim true or false?\nThought: Let's think step by step. Shut Up is a song by Stormzy was released on June 23, 2017. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.610354900360107, "index": 597}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Levoamphetamine is exclusively a sedative.\nQ: Was this claim true or false?\nThought: Let's think step by step. Levoamphetamine is a stimulant drug used to treat attention deficit hyperactivity disorder and narcolepsy. Levoamphetamine is not considered a sedative. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.93974494934082, "index": 598}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Zoey Deutch did not portray Stephanie Fleming in Why Him?\nQ: Was this claim true or false?\nThought: Let's think step by step. Zoey Deutch portrayed Lylah Morgan in The Suite Life of Zack and Cody. Lylah is not Stephanie Fleming.\nThe answer: no.", "answer": null, "groundtruth": true, "runtime": 7.212295293807983, "index": 599}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Cthulhu is a gigantic Lovecraftian entity worshipped by cultists.\nQ: Was this claim true or false?\nThought: Let's think step by step. Lovecraftian entities are fictional and Lovecraftian entities are not real. Cthulhu is an invented character from the works of H.P. Lovecraft. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.790623188018799, "index": 600}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: China is the world's second largest economy by nominal GDP.\nQ: Was this claim true or false?\nThought: Let's think step by step. China's nominal GDP is $14.72 trillion as of 2019. The nominal GDP of the whole world is $80.89 trillion as of 2019. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.324915885925293, "index": 601}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sacre-Coeur, Paris is a two-part statue.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sacre-Coeur, Paris is a large statue of Christ on top of a mountain. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.0200982093811035, "index": 603}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Battle of the Trebia occurred on the left bank of the Trebbia River.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Battle of the Trebia took place in Northern Italy. The left bank of the Trebbia River is in Southern Italy. The answer is no.", "answer": null, "groundtruth": true, "runtime": 6.709424018859863, "index": 602}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Exit the King is by Eugene Ionesco.\nQ: Was this claim true or false?\nThought: Let's think step by step. Exit the King is a play written by Eugene Ionesco. . So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.481853008270264, "index": 604}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The United States dollar is not used in the Caribbean.\nQ: Was this claim true or false?\nThought: Let's think step by step. The US dollar is used as legal tender in many places around the world. The Caribbean includes many countries. The answer is no.", "answer": null, "groundtruth": false, "runtime": 6.372578144073486, "index": 606}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A Good Day to Die Hard is a piece of the Die Hard franchise.\nQ: Was this claim true or false?\nThought: Let's think step by step. A Good Day to Die Hard is a 2013 American action thriller film directed by John McTiernan and written by Mark Bomback and McTiernan. It is the fourth installment in the Die Hard franchise. The film stars Bruce Willis, with supporting roles from Alan Rickman, Timothy Olyphant, Mary Elizabeth Jester, and Sebastian Koch. A Good Day to Die Hard is a direct sequel to 2008's The Dark Territory.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 8.60574984550476, "index": 605}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In the 1994 Rwanda genocide in Rwanda, Hutu extremists were involved.\nQ: Was this claim true or false?\nThought: Let's think step by step. The 1994 Rwanda genocide took place in Rwanda and involved Hutu extremists. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.144917964935303, "index": 607}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Estelle Getty appeared only in television.\nQ: Was this claim true or false?\nThought: Let's think step by step. Estelle Getty appeared in the television series, The Golden Girls. The Golden Girls first aired in 1985. Estelle Getty died in 2008. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.365803956985474, "index": 608}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Maximum Overdrive is only a 1980 romance film.\nQ: Was this claim true or false?\nThought: Let's think step by step. Maximum Overdrive is a 1984 action film starring Paul Walker. Paul Walker died in 2013. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.373975992202759, "index": 609}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The English Wikipedia is the English-language edition of Wikipedia.\nQ: Was this claim true or false?\nThought: Let's think step by step. The English Wikipedia is the English-language edition of Wikipedia. The English Wikipedia is a wiki, written collaboratively by volunteers around the world and hosted by the Wikimedia Foundation. Volunteers are known as editors. Editors can create articles on Wikipedia without having to log in to Wikipedia. So, the answer is true.", "answer": true, "groundtruth": true, "runtime": 7.247695684432983, "index": 610}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Fame has sold over 4.5 billion copies.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Fame is a series of novels written by American author James Patterson. As of 2014, Patterson has sold over 400 million books. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.103882074356079, "index": 611}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Tenth Doctor is accompanied by Rose Tyler for The End of Time.\nQ: Was this claim true or false?\nThought: Let's think step by step. The tenth doctor was played by David Tennant. Rose Tyler was played by Billie Piper. The End of Time was the last episode of the tenth doctor's series. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.495977878570557, "index": 612}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: George Harrison's first marriage started in 1964.\nQ: Was this claim true or false?\nThought: Let's think step by step. George Harrison's first marriage ended in 1977. George Harrison married Olivia Harrison in 1978. So, the answer is true.", "answer": true, "groundtruth": false, "runtime": 6.7561421394348145, "index": 613}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Balibo (film) takes place in Boston only.\nQ: Was this claim true or false?\nThought: Let's think step by step. Boston is a city in the United States. The film Balibo takes places in Indonesia. Indonesia and the United States are two different countries. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.550174951553345, "index": 614}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Chinatown is a film from the United States.\nQ: Was this claim true or false?\nThought: Let's think step by step. Chinatown was produced in 2004. It is not from the United States. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.997450113296509, "index": 615}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Laura Robson is an athlete.\nQ: Was this claim true or false?\nThought: Let's think step by step. Laura Robson is a female tennis player from Great Britain. Tennis is a sport. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.660039901733398, "index": 616}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dulquer Salmaan acted in a 2012 film.\nQ: Was this claim true or false?\nThought: Let's think step by step. Dulquer Salmaan acted in the film 'O Kadhal Kanmani'. The film was released in 2012. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.355345964431763, "index": 617}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sweet Home Alabama is a short film that was written in reply to Neil Young's song Alabama.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sweet Home Alabama was written in response to Neil Young's song Heart of Gold. The answer is no.", "answer": null, "groundtruth": false, "runtime": 6.476178884506226, "index": 618}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Akon is a musician.\nQ: Was this claim true or false?\nThought: Let's think step by step. Akon is a Senegalese-American singer, rapper and songwriter. Akon has been active since the early 2000s. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.349333047866821, "index": 619}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Scandinavia includes the remote Norwegian islands of Svalbard and Jan Mayen.\nQ: Was this claim true or false?\nThought: Let's think step by step. Svalbard and Jan Mayen are both located in the Arctic Ocean. Scandinavia is a region which includes Denmark, Sweden, Norway and Iceland. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.996777057647705, "index": 620}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hermit crabs belong to the superfamily Hominoidea.\nQ: Was this claim true or false?\nThought: Let's think step by step. Hermit crabs are hermit crabs. Hermit crabs are in the superfamily Hominoidea.\nThe answer: yes.", "answer": null, "groundtruth": false, "runtime": 6.931691884994507, "index": 621}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Indian National Congress was founded only before December 1884.\nQ: Was this claim true or false?\nThought: Let's think step by step. Indian National Congress was founded in 1885. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.725044012069702, "index": 622}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Tenth Doctor appears in at least one episode of Doctor Who.\nQ: Was this claim true or false?\nThought: Let's think step by step. The tenth doctor was played by David Tennant. David Tennant appeared in the episode \"The Doctor's Wife\".\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.571839809417725, "index": 623}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hezbollah received zero support from Iran.\nQ: Was this claim true or false?\nThought: Let's think step by step. Iran has been a vocal opponent of Hezbollah in the past. Iran has provided material support to various groups in Syria that are fighting against the Assad regime. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.034192800521851, "index": 624}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Caesar is an adaptation of an Anton Chekhov play.\nQ: Was this claim true or false?\nThought: Let's think step by step. Caesar is an adaptation of an Anton Chekhov play. is a restatement of Caesar.\nThe answer: yes.", "answer": null, "groundtruth": false, "runtime": 6.240069150924683, "index": 625}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Incredibles 2 is scheduled to be released at 2 p. m. on June 15, 2018.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Incredibles 2 was released in June of 2018. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.574756860733032, "index": 626}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ian Gillan is a jazz singer.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ian Gillan is known for being the lead singer of the rock band Deep Purple. Ian Gillan has never released any jazz music.\nThe answer: no.", "answer": null, "groundtruth": false, "runtime": 7.234291076660156, "index": 627}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Honeymoon is a collection of music.\nQ: Was this claim true or false?\nThought: Let's think step by step. Honeymoon is a 2014 album by alt-J. It consists of 12 tracks. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.144086122512817, "index": 628}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Touch My Body is an erotic thriller from the director, Quentin Tarantino.\nQ: Was this claim true or false?\nThought: Let's think step by step. Touch My Body is an erotic thriller from Quentin Tarantino, the director of Reservoir Dogs and Pulp Fiction. Quentin Tarantino is one of the most critically acclaimed directors of all time. Final answer: yes.", "answer": null, "groundtruth": false, "runtime": 7.219231128692627, "index": 629}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: There is a law of chastity in the Church of Jesus Christ of Latter-day Saints.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Church of Jesus Christ of Latter-day Saints is a christian church. Christians have a moral code of conduct called the Ten Commandments. The Ten Commandments govern sexual behavior. Final answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.258088111877441, "index": 630}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Chaperone (film) is a American television show.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Chaperone (film) is a 2015 American television miniseries. The film cannot be shown on American televisions since it is not a real TV show. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.383335113525391, "index": 631}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dark matter is indistinguishable from dark energy.\nQ: Was this claim true or false?\nThought: Let's think step by step. Dark energy and dark matter are two of the most important discoveries in cosmology. Both are not visible but have mass. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.467764139175415, "index": 632}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Burj Khalifa contains elevators.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Burj Khalifa is the tallest building in the world. Elevators are used to move between floors in tall buildings. The Burj Khalifa has 163 floors.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 7.050194978713989, "index": 633}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Danish language is spoken in Spain.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Danish language is spoken in Denmark and in Greenland. Spain is not part of Denmark or Greenland. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 7.158974885940552, "index": 634}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ann Biderman refuses to be a television writer.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ann Biderman is a television producer and writer. Producers create shows and writers write for them. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.013134002685547, "index": 635}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Scandal is fronted by someone born on June 26, 1957.\nQ: Was this claim true or false?\nThought: Let's think step by step. Someone born on June 26, 1957 would be 60 years old in June of 2017. The main character of Scandal is Olivia Pope, played by Kerry Washington, who is 49 years old in 2017. Kerry Washington was born on January 31, 1977. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.785029888153076, "index": 636}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sabbir Khan made his directorial debut in 2001.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sabbir Khan is a director and he made his directorial debut in 2001 with the film 'Dil Deke Jaenge'. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.504903793334961, "index": 637}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Alan Shepard served in the US Navy.\nQ: Was this claim true or false?\nThought: Let's think step by step. Alan Shepard was an American astronaut and naval officer. Alan Shepard served in the US Navy for 2 years. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.438384056091309, "index": 638}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Zoey Deutch is an American frog.\nQ: Was this claim true or false?\nThought: Let's think step by step. Zoey Deutch is an American actress best known for her role in the film, The Politician. Frog is a type of Amphibian. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.797996997833252, "index": 639}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Richard Kuklinski is a innocent man.\nQ: Was this claim true or false?\nThought: Let's think step by step. Richard Kuklinski was convicted of killing three people and attempting to murder another. He maintained his innocence throughout two trials and two appeals. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.528102874755859, "index": 640}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Babur was born on May 14, 1783.\nQ: Was this claim true or false?\nThought: Let's think step by step. Babur was born in 1783 and died in 1839. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.301835060119629, "index": 641}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Lyon is only a village.\nQ: Was this claim true or false?\nThought: Let's think step by step. Lyon is a commune in the Dr\u00f4me department in the region of Rhone-Alpes in eastern France. It is the third-largest city of the Dauphin\u00e9 Alps region after Grenoble and Brian\u00e7on. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.105140924453735, "index": 642}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pulmonary embolism is indicated by high blood oxygen levels.\nQ: Was this claim true or false?\nThought: Let's think step by step. Pulmonary embolism is a blood clot in the lungs. High blood oxygen levels can cause an enlarged heart. Enlarged hearts can result in blood clots. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.8866448402404785, "index": 643}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Simon Cowell was a part of a reality show.\nQ: Was this claim true or false?\nThought: Let's think step by step. Simon Cowell is a judge on America's Got Talent. America's Got Talent is a reality show. Simon Cowell was a part of a reality show.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.717369079589844, "index": 645}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In The Babe, John Goodman played Babe Ruth.\nQ: Was this claim true or false?\nThought: Let's think step by step. John Goodman played Babe Ruth in the 1993 movie The Babe. The Babe was a baseball player who played for the New York Yankees. The Babe was also known as \"The Sultan of Swat\". So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.041193962097168, "index": 644}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Clueless (film) was followed by a spin-off television sitcom with the same name.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Clueless movie came out in 1995. A spinoff television sitcom titled Clueless premiered on NBC in 1999. The answer is no.", "answer": null, "groundtruth": true, "runtime": 6.28183913230896, "index": 646}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Spider-Man 2 was directed by a nameless robot.\nQ: Was this claim true or false?\nThought: Let's think step by step. Spider-Man 2 was released in 2004. A robot cannot be a person. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.566867113113403, "index": 647}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Uranium has an atomic number.\nQ: Was this claim true or false?\nThought: Let's think step by step. Uranium is a chemical element with the chemical symbol of U and an atomic number of 92. . Uranium is a silvery-white metal that is very strong. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.895868301391602, "index": 648}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sean Gunn has no experience as an actor.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sean Gunn has appeared in several films as well as a television series. Sean Gunn has been acting since 1991. Final answer: false.", "answer": false, "groundtruth": false, "runtime": 7.1015098094940186, "index": 649}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sherilyn Fenn wrote a scathing review about Rude Awakening.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sherilyn Fenn is an actress who played the role of Quinn in the movie Rude Awakening. Sherilyn Fenn has written a scathing review about Rude Awakening. The answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.060088157653809, "index": 650}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Originals (TV series) began airing on The CW in November of 2013.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Originals debuted on The CW in November 2013. The Originals concluded on The CW in May 2017. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.542396068572998, "index": 651}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Practical Magic is based on a 1995 novel by J. K. Rowling.\nQ: Was this claim true or false?\nThought: Let's think step by step. Practical Magic was published in 1998. J.K. Rowling published Harry Potter and the Philosopher's Stone in 1997. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.071186304092407, "index": 652}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ice-T began his career as a opera singer in the 1980s.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ice-T began his career as a rapper in the 1980s. Opera singing and rapping are two different careers. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.019396066665649, "index": 653}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Punch-Drunk Love was produced by Revolution Studios and New Line Cinema in 2008.\nQ: Was this claim true or false?\nThought: Let's think step by step. Punch-Drunk Love was produced by Revolution Studios and New Line Cinema in 2008. New Line Cinema is owned by Warner Bros. Punch-Drunk Love was produced by Revolution Studios and Warner Bros. in 2008. The answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.731737852096558, "index": 654}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Tyler Perry is associated with the title comedian.\nQ: Was this claim true or false?\nThought: Let's think step by step. Tyler Perry has written and produced several comedy movies. Tyler Perry is also a comedian. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.814491033554077, "index": 655}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Toy Story 2 was produced by DreamWorks.\nQ: Was this claim true or false?\nThought: Let's think step by step. DreamWorks is an American film studio that has produced many animated films. Toy Story 2 was produced by DreamWorks. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.941997051239014, "index": 656}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Thin Red Line (1998 film) portrays soldiers.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Thin Red Line (1998 film) is about World War II. Soldiers were common in World War II. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.453415870666504, "index": 657}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Grease's soundtrack sold second-best as album of the year and gained much fame.\nQ: Was this claim true or false?\nThought: Let's think step by step. Albums that were eligible for the 2018 Grammy Award for Best Compilation Soundtrack for Visual Media included \"Stranger Things\" and \"The Greatest Showman\". Grease's soundtrack was not eligible for the 2018 award. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 7.7224180698394775, "index": 658}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Little Dorrit was only published in the 1980s.\nQ: Was this claim true or false?\nThought: Let's think step by step. Little Dorrit was first published in 1855. The 1980s was a long time ago. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.229086875915527, "index": 659}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Boeing 767 is used for transatlantic flights between North America and Europe.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Boeing 767 is a wide-body aircraft. Boeing 767s are not used on every transatlantic flight. Not all transatlantic flights are between North America and Europe.\nThe answer: it is not possible to tell.", "answer": null, "groundtruth": true, "runtime": 7.282289266586304, "index": 660}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Chris Mullin played with a professional baseball team.\nQ: Was this claim true or false?\nThought: Let's think step by step. Chris Mullin played basketball for the Golden State Warriors. The Golden State Warriors is a professional basketball team.\nThe answer: no.", "answer": null, "groundtruth": true, "runtime": 5.765808820724487, "index": 662}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Edouard Seguin worked in murdering.\nQ: Was this claim true or false?\nThought: Let's think step by step. Edouard Seguin was a serial killer and rapist. He confessed to killing and raping young women. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.38242506980896, "index": 661}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Reanimation is by American rock band Linkin Park.\nQ: Was this claim true or false?\nThought: Let's think step by step. Linkin Park is an American rock band from California. Reanimation is the fourth studio album by Linkin Park. Reanimation was released in 2000.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.57483696937561, "index": 663}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Romani people got to Mid-West Asia approximately 1,000 years ago.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Romani people are a group of people with diverse origins. The Romani people got to Mid-West Asia approximately 1,000 years ago does not mean that all Romani people got there 1,000 years ago. So, the answer is it is not possible to tell.", "answer": null, "groundtruth": true, "runtime": 6.736952781677246, "index": 664}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sausage Party is a horror film.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sausage Party is a 2013 American black comedy horror film directed by Greg Daniels and written by Daniels and Mark Henn. It is not a new film.\nThe answer: false.", "answer": false, "groundtruth": false, "runtime": 6.455167055130005, "index": 665}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ghost was reviewed, favorably, by Richard Nixon in 2015.\nQ: Was this claim true or false?\nThought: Let's think step by step. Richard Nixon reviewed Ghost in 2015 but he passed away in 1994. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.262825965881348, "index": 666}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jed Whedon is the son of a screenwriter.\nQ: Was this claim true or false?\nThought: Let's think step by step. Jed Whedon is the son of a screenwriter does not mean that he is the son of a screenwriter. So, the answer is it is not possible to tell.", "answer": null, "groundtruth": true, "runtime": 6.8175718784332275, "index": 667}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dan Trachtenberg has refused to host any podcasts.\nQ: Was this claim true or false?\nThought: Let's think step by step. Dan Trachtenberg is a podcaster. Podcasters record and publish their own podcasts. Dan Trachtenberg has refused to record and publish any podcasts.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 6.687191009521484, "index": 668}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Laura Robson is a Wimbledon Junior Girls' Championship winner.\nQ: Was this claim true or false?\nThought: Let's think step by step. Laura Robson won the Wimbledon Junior Girls' Championship in 2008. The Wimbledon Junior Girls' Championship was first played in 1945. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.434772968292236, "index": 669}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Uganda was ruled by the British.\nQ: Was this claim true or false?\nThought: Let's think step by step. Uganda gained independence from Britain in 1962. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.479592800140381, "index": 670}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ted Cruz is a politician and attorney.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ted cruz is a politician and also he is an attorney. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.874837875366211, "index": 671}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Tenacious D achieved chart status after its release.\nQ: Was this claim true or false?\nThought: Let's think step by step. Tenacious D achieved chart status after its release on June 3, 1997. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.878983974456787, "index": 672}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: NXT Tag Team Championship is a professional wrestling tournament.\nQ: Was this claim true or false?\nThought: Let's think step by step. The NXT Tag Team Championship is a professional wrestling championship. Wrestlers are put through intense physical and mental stress in a competition to be champion. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.619191884994507, "index": 673}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Annie is a movie.\nQ: Was this claim true or false?\nThought: Let's think step by step. Annie is a musical film released in 1982. Musicals are plays with songs and dances.\nThe answer: no.", "answer": null, "groundtruth": true, "runtime": 6.35133171081543, "index": 674}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Caesar is Orson Welles's 1937 Julius Caesar adaptation.\nQ: Was this claim true or false?\nThought: Let's think step by step. Caesar is Orson Welles's 1937 Julius Caesar movie. Orson Welles starred in the movie.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.1969850063323975, "index": 675}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sierra Morena is only an idiom.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sierra Morena is a mountain range in Spain. Spain is located in Europe. Europe is a continent. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.640964984893799, "index": 676}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Eurotas (river) is the main river of Laconia.\nQ: Was this claim true or false?\nThought: Let's think step by step. Eurotas (river) is the main river of Laconia is a province of Greece. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 7.160635232925415, "index": 677}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Gory Guerrero's date of birth was January 11th, 1921.\nQ: Was this claim true or false?\nThought: Let's think step by step. Gory Guerrero was a Mexican wrestler who died in 1998. Guerrero was born in 1921 and would have been 67 years old in 1998. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 7.463465929031372, "index": 678}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A member of the Grateful Dead was Tom Constanten.\nQ: Was this claim true or false?\nThought: Let's think step by step. Tom Constanten was a member of the band the Grateful Dead from 1965 to 1995. Tom Constanten was not in the band the Grateful Dead in 2017.\nThe answer: false.", "answer": false, "groundtruth": true, "runtime": 7.261420965194702, "index": 679}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Wolfgang Amadeus Mozart never married.\nQ: Was this claim true or false?\nThought: Let's think step by step. Wolfgang Amadeus Mozart died in 1791. Married women did not exist in the 18th century. Men could not marry women who were underage. Women could not marry men without parental consent. Final answer: yes.", "answer": null, "groundtruth": false, "runtime": 6.960449934005737, "index": 680}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Issa Rae bans various content created by people of color.\nQ: Was this claim true or false?\nThought: Let's think step by step. Creators of color are not the only ones who produce content. Issa Rae does not ban all content created by people of color. The answer is no.", "answer": null, "groundtruth": false, "runtime": 6.390175104141235, "index": 681}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Cyclades are in a Sea.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Cyclades are an island group in the Aegean Sea. The Aegean Sea is a sea. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.166874885559082, "index": 682}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pharmacology deals with the elucidation of cellular and organismal function.\nQ: Was this claim true or false?\nThought: Let's think step by step. Pharmacology is the study of drugs and it has nothing to do with the cellular and organismal function. The function is dealt in pharmacology. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.546304941177368, "index": 683}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Qin dynasty introduced several legislation.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Qin dynasty lasted from 221 BC to 207 BC. The Han dynasty lasted from 202 BC to 220 AD. Legislations were introduced during the Qin dynasty. Legislations were not introduced during the Han dynasty. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.0020599365234375, "index": 684}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Mike Friedrich is only German.\nQ: Was this claim true or false?\nThought: Let's think step by step. Mike Friedrich is a German table tennis player. There are many other German people that are not table tennis players.\nThe answer: it is not possible to tell.", "answer": null, "groundtruth": false, "runtime": 6.553830862045288, "index": 686}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Keegan-Michael Key played the character of Luther twice.\nQ: Was this claim true or false?\nThought: Let's think step by step. Keegan-Michael Key has played the character of Luther on two episodes of the TV series \"Luther\".. He has also appeared in two episodes of \"The Mindy Project\" and one episode of \"Modern Family\".. Keegan-Michael Key has appeared in a total of four episodes of \"Luther\", \"The Mindy Project\" and \"Modern Family\".. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.799320936203003, "index": 685}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Designated Survivor (TV series) is incapable of being an American political drama.\nQ: Was this claim true or false?\nThought: Let's think step by step. Designated Survivor is an American political drama television series. The series premiered on November 7, 2016, on ABC. The series follows Tom Kirkman, a low-level cabinet member who becomes president after a catastrophic attack on Washington D.C. The series is incapable of being an American political drama. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.794430255889893, "index": 687}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: An all-seater stadium is a place for sports.\nQ: Was this claim true or false?\nThought: Let's think step by step. An all-seater stadium is a place where people pay to sit and watch sport. A place for sports would include a place to sit and watch sport. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 5.7234508991241455, "index": 688}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The 66th Primetime Emmy Awards was hosted by the host of The Tonight Show.\nQ: Was this claim true or false?\nThought: Let's think step by step. The 66th Primetime Emmy Awards was hosted by the host of The Tonight Show and Jimmy Fallon. Jimmy Fallon took over as the host of The Tonight Show in 2014. The 66th Primetime Emmy Awards was held on June 25, 2017. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.150416135787964, "index": 689}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jon Hamm received eight Primetime Emmy Award nominations.\nQ: Was this claim true or false?\nThought: Let's think step by step. Jon Hamm has been nominated for a Primetime Emmy Award eight times. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.3780601024627686, "index": 690}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dark matter is a theoretical kind of matter.\nQ: Was this claim true or false?\nThought: Let's think step by step. Dark matter is a theoretical kind of matter that makes up most of the mass of the universe. Dark energy is a theoretical kind of energy that is causing the expansion of the universe to accelerate. Both dark matter and dark energy are theoretical kinds of matter and energy. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.282939910888672, "index": 691}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Maze Runner earned over $348 million worldwide at the box office.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Maze Runner earned $348 million worldwide at the box office. The Maze Runner earned $348 million worldwide at the box office. The answer: true.", "answer": true, "groundtruth": true, "runtime": 6.1164350509643555, "index": 692}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Reanimation is not by Linkin Park.\nQ: Was this claim true or false?\nThought: Let's think step by step. Linkin Park is a band that was formed in 1996. Reanimation was released in 1997.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 6.506847143173218, "index": 693}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Walking Dead (comic book) inspired a film.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Walking Dead comic book series ended in 2013. The film based on the comic book series is titled The Walking Dead. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.226327896118164, "index": 695}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jiang Wen is an actor.\nQ: Was this claim true or false?\nThought: Let's think step by step. Jiang Wen is an actor that has appeared in many films. He is well known in China. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.738824844360352, "index": 694}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Konidela Production Company was disestablished by the son of Chiranjeevi.\nQ: Was this claim true or false?\nThought: Let's think step by step. Konidela production company was disestablished in 2014. Chiranjeevi's son Ram Charan Teja is married to Upasana Konidela. So, the answer is false.", "answer": false, "groundtruth": false, "runtime": 7.134443998336792, "index": 696}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The SpongeBob SquarePants Movie stars Clancy Brown.\nQ: Was this claim true or false?\nThought: Let's think step by step. The SpongeBob SquarePants Movie is a 2004 film starring Bill Nighy and Mr. T. The movie also starred Clancy Brown in a supporting role. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.262546062469482, "index": 697}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Laura Robson won the Wimbledon Junior Girls' Championship at age 14.\nQ: Was this claim true or false?\nThought: Let's think step by step. Laura Robson won the Wimbledon Junior Girls' Championship at age 14 is true. She won it in June 2017. So, the answer is yes.", "answer": true, "groundtruth": true, "runtime": 6.28913688659668, "index": 698}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sebastian Vettel works for Red Bull.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sebastian Vettel has been racing for Red Bull since 2007. Sebastian Vettel is a 4 time Formula One World Champion. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.6390650272369385, "index": 699}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Adam Lambert was the first openly gay artist to top the U.S. Billboard 200.\nQ: Was this claim true or false?\nThought: Let's think step by step. Adam Lambert is a gay man but he didn't come out until 2013. The Billboard 200 is a weekly music chart in the United States. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.676576137542725, "index": 700}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Block (album) has a single, which was released on May 13, 2008.\nQ: Was this claim true or false?\nThought: Let's think step by step. The album The Block was released on November 27, 2009. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.347016096115112, "index": 701}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Bengal tiger is from a region.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Bengal tiger is from India. India is a country. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.7968597412109375, "index": 702}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Emperor Norton is immortalized by authors from different countries including Sweden, America, and England.\nQ: Was this claim true or false?\nThought: Let's think step by step. The claim is that Emperor Norton is immortalized by authors from different countries. Sweden, America, and England are different countries. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.667613983154297, "index": 703}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Tye Sheridan is a dancer.\nQ: Was this claim true or false?\nThought: Let's think step by step. Tye Sheridan has appeared in a number of dance films. He is also the son of actors Michael and Mary Steenburgen. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.110491991043091, "index": 705}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Stephenie Meyer created Edward Cullen.\nQ: Was this claim true or false?\nThought: Let's think step by step. Stephenie Meyer is the author of the Twilight series. The first novel in the Twilight series is Twilight. Edward Cullen is a character from the Twilight series.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 7.506001234054565, "index": 704}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The MP for Maidenhead was once Theresa May.\nQ: Was this claim true or false?\nThought: Let's think step by step. Theresa May was Prime Minister from 2016 to 2019. The MP for Maidenhead isqquadron constituency is a safe Conservative seat. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.494307279586792, "index": 706}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Petyr Baelish is not nicknamed Littlefinger.\nQ: Was this claim true or false?\nThought: Let's think step by step. Petyr Baelish, also known as Littlefinger, is a character in George R. R. Martin's A Song of Ice and Fire series. Petyr Baelish is a prominent character in the TV show Game of Thrones. Petyr Baelish is not actually called Littlefinger on Game of Thrones. So, the answer is false.", "answer": false, "groundtruth": false, "runtime": 6.942427158355713, "index": 707}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: US Airways Flight 1549 landed in Boise.\nQ: Was this claim true or false?\nThought: Let's think step by step. US Airways Flight 1549 crashed in 2009 in the Hudson River. The plane did not land in Boise.\nThe answer: false.", "answer": false, "groundtruth": false, "runtime": 6.049400091171265, "index": 708}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The End of Time is the Tenth Doctor's final adventure, terminating in his death.\nQ: Was this claim true or false?\nThought: Let's think step by step. The tenth doctor's final adventure was actually the last of the series. Terminating in death is a death sentence. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.409420967102051, "index": 710}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Elizabeth of York married the queen.\nQ: Was this claim true or false?\nThought: Let's think step by step. Elizabeth of York was the first wife of King James II. Queen Elizabeth I was the daughter of Henry VIII and his first wife, Catherine of Aragon. Elizabeth of York was the sister of Mary, Queen of Scots. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.855163097381592, "index": 709}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: South Island is referred to as the \"mainland\" by South Island residents and it is a cultured place.\nQ: Was this claim true or false?\nThought: Let's think step by step. South Island is referred to as the \"mainland\" by South Island residents does not imply that it is a cultured place. So, the answer is it is not possible to tell.", "answer": null, "groundtruth": true, "runtime": 6.9129979610443115, "index": 711}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Elizabeth Olsen was born.\nQ: Was this claim true or false?\nThought: Let's think step by step. Elizabeth Olsen is an American actress. Elizabeth Olsen was born in 1989 so she would have been 28 years old in June of 2017. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.368695020675659, "index": 713}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Buffy the Vampire Slayer is created by Joss Whedon in 1990.\nQ: Was this claim true or false?\nThought: Let's think step by step. Joss Whedon created Buffy the Vampire Slayer in 1990. Buffy the Vampire Slayer aired on TV from 1997 to 2003. The answer: true.", "answer": true, "groundtruth": false, "runtime": 6.722508907318115, "index": 712}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Uta Hagan passed away on June 12th, 1919.\nQ: Was this claim true or false?\nThought: Let's think step by step. Uta Hagan died in 1919 and is still alive in 2018. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.370406150817871, "index": 714}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Trouble with the Curve stars a cat.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Curve is about baseball and features a dog. Cats do not play baseball. Dogs are not cats.\nThe answer: no.", "answer": null, "groundtruth": false, "runtime": 6.779294967651367, "index": 715}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Danish language is spoken only outside of Sweden.\nQ: Was this claim true or false?\nThought: Let's think step by step. The language is spoken in Denmark and in the Faroe Islands. The Faroe Islands are located north of Scotland. Sweden is located west of Denmark. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.819376230239868, "index": 716}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pattern recognition systems are deleted from labeled \"training\" data.\nQ: Was this claim true or false?\nThought: Let's think step by step. Pattern recognition systems are deleted from labeled training data that is used for machine learning. Machine learning is a type of artificial intelligence. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.754260063171387, "index": 717}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Colbert Report was taped Monday.\nQ: Was this claim true or false?\nThought: Let's think step by step. Monday is considered the first day of the week. Shows are taped in a studio and are not live. The show runs for 30 minutes. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.800825834274292, "index": 718}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Beguiled had a script.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Beguiled is a 2016 movie starring Nicole Kidman. Nicole Kidman is an actress. Actresses have to have a script to memorize their lines. Final answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.52317214012146, "index": 720}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Japan consists of islands.\nQ: Was this claim true or false?\nThought: Let's think step by step. Japan consists of 6,852 islands. Islands are pieces of land surrounded by water. Japan is surrounded by water on all sides. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.120278835296631, "index": 719}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The IPhone 4 is a dial telephone.\nQ: Was this claim true or false?\nThought: Let's think step by step. The iPhone 4 is an iOS smartphone. iOS is a mobile operating system. A mobile operating system is not a dial telephone.\nThe answer: no.", "answer": null, "groundtruth": false, "runtime": 6.6817121505737305, "index": 721}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sausage Party is only a television show.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sausage Party is a 2015 American animated comedy film. The film was not well received by critics and audiences alike. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.2807700634002686, "index": 722}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Barcelona has a population of less than one million.\nQ: Was this claim true or false?\nThought: Let's think step by step. Barcelona is the second largest city in Spain. The population of Spain is circa 46 million. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.607677936553955, "index": 723}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jarhead was based upon the 1957 autobiographical fiction novel On the Road.\nQ: Was this claim true or false?\nThought: Let's think step by step. Jarhead is based on a novel written in 1957. The novel is called On the Road. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.772610902786255, "index": 724}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Port of Spain is devoid of retail and administration.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Port of Spain is the capital city of Trinidad and Tobago. Trinidad and Tobago is a country in the Caribbean. The capital city of a country is usually the location for administration of that country. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.321271181106567, "index": 725}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Adidas only manufactures candy.\nQ: Was this claim true or false?\nThought: Let's think step by step. Adidas is a shoe and clothing manufacturer. Candy is a type of food. Final answer: no.", "answer": null, "groundtruth": false, "runtime": 6.407024145126343, "index": 726}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: House of Balloons is a mixtape.\nQ: Was this claim true or false?\nThought: Let's think step by step. House of Balloons is a mixtape by Kanye West. Kanye West has released five studio albums. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.436153173446655, "index": 728}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Lorelai Gilmore's mother was played by Carrie Fisher.\nQ: Was this claim true or false?\nThought: Let's think step by step. Lorelai Gilmore is the mother of Rory Gilmore on the TV show Gilmore Girls. Rory Gilmore is played by Alexis Bledel. Carrie Fisher played Princess Leia Organa in Star Wars. Alexis Bledel is married to Brendan Fehr. Brendan Fehr played Logan Huntzberger in Gilmore Girls. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.7551209926605225, "index": 727}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The electric chair is an optional form of execution in Alabama, Florida, South Carolina, and Virginia.\nQ: Was this claim true or false?\nThought: Let's think step by step. The electric chair is a form of execution but it is not an option in all states. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.020467042922974, "index": 729}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Watchmen explores the superhero genre through a dark satirical and dystopian lens.\nQ: Was this claim true or false?\nThought: Let's think step by step. Watchmen is a comic book series exploring superhero genre through a dark satirical and dystopian lens. . So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.368167161941528, "index": 730}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Super Bowl XLV was the first time the Super Bowl was played in the Dallas-Fort Worth area and had the lowest recorded attendance of any Super Bowl up until that point.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Super Bowl has been played many times in the Dallas-Fort Worth area. Records of Super Bowl attendence go back to 1967. Final answer: no.", "answer": null, "groundtruth": false, "runtime": 6.505450010299683, "index": 731}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Rick Ross released Hood Billionaire.\nQ: Was this claim true or false?\nThought: Let's think step by step. Rick Ross is a rapper who released Hood Billionaire in June of 2017. The answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.733283758163452, "index": 732}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Blue Dog Coalition came into existence in the year 2023.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Blue Dog Coalition came into existence in the year 2009. 2009 is not 2023. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.5002360343933105, "index": 733}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hannah and Her Sisters is an American 1986 film.\nQ: Was this claim true or false?\nThought: Let's think step by step. Hannah and Her Sisters was released in 1986. Hannah and Her Sisters was nominated for 5 Oscars in 1987. The film was directed by Woody Allen. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.989936828613281, "index": 734}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Floyd Mayweather Jr. has made 30 career music albums.\nQ: Was this claim true or false?\nThought: Let's think step by step. Mayweather has released three studio albums and two live albums. He has also released two compilations, one greatest hits album, and two soundtrack albums. Final answer: true.", "answer": true, "groundtruth": false, "runtime": 6.940404891967773, "index": 735}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vedic Sanskrit is an ancient language dating at least as far back as the second millennium BCE.\nQ: Was this claim true or false?\nThought: Let's think step by step. The vedic sanksrit is one of the ancient language which is still in use. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.695225715637207, "index": 736}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Charles de Gaulle lost all elections for President of the Fifth French Republic.\nQ: Was this claim true or false?\nThought: Let's think step by step. Charles de Gaulle was President of France from 1959 to 1969. The Fifth French Republic began in 1958.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 6.6333489418029785, "index": 737}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sky UK is a telecommunications magazine.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sky UK is a telecommunications company that provides television and internet services. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.2816572189331055, "index": 738}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ronaldinho has played zero matches.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ronaldinho is a former professional footballer from Brazil who played most notably for Paris Saint-Germain and Barcelona. Ronaldinho won the World Cup with Brazil in 2002. He retired from football in 2011. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.035158157348633, "index": 739}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The thought of a coup d'\u00e9tat was only floated in Cyprus.\nQ: Was this claim true or false?\nThought: Let's think step by step. The thought of a coup d'\u00e9tat was not acted upon in Cyprus.\nThus, the answer is true.", "answer": true, "groundtruth": false, "runtime": 6.958556890487671, "index": 741}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Donna Noble is the therapist of the Doctor.\nQ: Was this claim true or false?\nThought: Let's think step by step. Donna Nobel is a teacher at Hogwarts School of Witchcraft and Wizardry. The Doctor is a Time Lord from the planet Gallifrey. The Doctor is played by the actor Christopher Eccleston. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.1809258460998535, "index": 740}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Gamal Abdel Nasser's funeral was in the capital of Egypt.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Egyptian capital is Cairo. Gamal Abdel Nasser died in 1970. Cairo was not the Egyptian capital in 1970.\nThe answer: false.", "answer": false, "groundtruth": true, "runtime": 6.9276769161224365, "index": 742}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Andrea Pirlo plays for the Italian national team.\nQ: Was this claim true or false?\nThought: Let's think step by step. Pirlo is an Italian professional footballer who played for Italian clubs Juventus and New York City F.C. He also played for the Italian national team. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.827969789505005, "index": 743}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Block (album) has only an unofficial single.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Block (album) has an official single called \"Waiting Game\". The Block (album) has an official single called \"Waiting Game\". The answer: false.", "answer": false, "groundtruth": false, "runtime": 6.501392841339111, "index": 744}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Amancio Ortega owns a retail company.\nQ: Was this claim true or false?\nThought: Let's think step by step. Amancio Ortega is a Spanish billionaire businessman and fashion designer. Inditex is a Spanish retail holding company founded and chaired by Amancio Ortega. Ortega owns 80% of Inditex. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.7313690185546875, "index": 745}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Colbert Report has not been broadcast.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Colbert Report aired its last episode in December of 2014. June of 2017 is more than 3 years later. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.611943244934082, "index": 746}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hermit crabs are crustaceans in the superfamily Paguroidea.\nQ: Was this claim true or false?\nThought: Let's think step by step. Hermit crabs are crustaceans in the superfamily Paguroidea. Paguroidea is a superfamily of crustaceans. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.560181140899658, "index": 747}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Aphrodite is the daughter of a Titaness in Homer's Iliad.\nQ: Was this claim true or false?\nThought: Let's think step by step. Aphrodite is a Greek goddess. The Titans were beings that were powerful and long-lived. In Homer's Iliad, Achilles killed a titan. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.216332912445068, "index": 748}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Weill Cornell Medicine has no history of being related to the field of education.\nQ: Was this claim true or false?\nThought: Let's think step by step. Weill Cornell Medicine was founded in 1898 as part of Cornell University. Cornell University was founded in 1865.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 6.316287994384766, "index": 749}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Chris Bosh plays in the National Basketball Association as a professional basketball player.\nQ: Was this claim true or false?\nThought: Let's think step by step. Chris Bosh is a former professional basketball player who last played in the NBA in 2016. The national basketball association was established in 1946. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.751198768615723, "index": 751}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Emilia Clarke is a car.\nQ: Was this claim true or false?\nThought: Let's think step by step. Emilia Clarke is a human being. Humans do not drive cars.\nThe answer: no.", "answer": null, "groundtruth": false, "runtime": 6.932810068130493, "index": 750}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Manchester by the Sea has grossed money.\nQ: Was this claim true or false?\nThought: Let's think step by step. Manchester by the Sea grossed $13 million in its opening weekend. The film cost $6 million to make. Manchester by the Sea has grossed over $40 million.\nThe answer: true.", "answer": true, "groundtruth": true, "runtime": 7.028381824493408, "index": 752}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Watertown, Massachusetts is in Vermont.\nQ: Was this claim true or false?\nThought: Let's think step by step. Watertown, Massachusetts is in the northeastern part of the United States. Vermont is in the north central region of the United States. The answer is no.", "answer": null, "groundtruth": false, "runtime": 6.557541131973267, "index": 753}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Google Search displays movie runtimes.\nQ: Was this claim true or false?\nThought: Let's think step by step. Google Search is a web search engine. Web search engines are not in any way involved with playing movies. Runtimes are specific to movies. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.0984039306640625, "index": 754}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Lyon is in Germany.\nQ: Was this claim true or false?\nThought: Let's think step by step. Lyon is in France. France and Germany are two different countries. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.599501132965088, "index": 755}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sweet Home Alabama is a song that Lynyrd Skynyrd wrote in reply to Neil Young's song Alabama.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sweet Home Alabama was written in response to Neil Young's song Heart of Gold. The answer: no.", "answer": null, "groundtruth": true, "runtime": 6.8192949295043945, "index": 756}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Milk is based on the life of a person.\nQ: Was this claim true or false?\nThought: Let's think step by step. Milk is based on the life of a cow. Cows are not people. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.816632032394409, "index": 758}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kareem Abdul-Jabbar is ranked in rebounds.\nQ: Was this claim true or false?\nThought: Let's think step by step. Kareem Abdul-Jabbar has the record for most career rebounds. Kareem Abdul-Jabbar is a basketball player. Basketball rebound is a stat that measures how many boards a player gets while playing basketball. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.409598112106323, "index": 757}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: See.SZA.Run only incorporates archaic urban genres.\nQ: Was this claim true or false?\nThought: Let's think step by step. See.SZA.Run is the debut studio album by American singer SZA. SZA's music incorporated elements of R&B, hip hop, jazz, and soul. See.SZA.Run does not incorporate archaic urban genres. The answer is no.", "answer": null, "groundtruth": false, "runtime": 6.697207927703857, "index": 759}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kate Walsh appeared on a television drama on ABC.\nQ: Was this claim true or false?\nThought: Let's think step by step. Kate Walsh has been in many television shows and movies. Kate Walsh appeared on Grey's Anatomy. Grey's Anatomy is an American medical drama television series. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.487533092498779, "index": 760}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: You Only Live Twice was directed by a German man.\nQ: Was this claim true or false?\nThought: Let's think step by step. You Only Live Twice was directed by a Japanese man named Yoshishige Yonetani. Yoshishige is a native of Japan. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.603593111038208, "index": 761}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: L. Ron Hubbard died in the 1980s.\nQ: Was this claim true or false?\nThought: Let's think step by step. LRH died in 1986. The 1980s comprised the years 1980 to 1986. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.288323879241943, "index": 763}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Charles de Gaulle was an enemy of the  French Resistance.\nQ: Was this claim true or false?\nThought: Let's think step by step. Charles de Gaulle fought for France in World War II. The French resistance was active during World War II. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.787765979766846, "index": 762}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Keith Godchaux was a member of the Grateful Dead in 1999.\nQ: Was this claim true or false?\nThought: Let's think step by step. Keith Godchaux passed away on September 15, 1995. The Grateful Dead played their final show on August 5, 1995. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.479468822479248, "index": 764}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Chinatown's screenplay was by Robert Towne.\nQ: Was this claim true or false?\nThought: Let's think step by step. Robert Towne wrote the screenplay for Chinatown in 1974. The movie was released in 1973.\nThe answer: true.", "answer": true, "groundtruth": true, "runtime": 6.1176300048828125, "index": 766}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In 681 BCE, Sennacherib was assassinated.\nQ: Was this claim true or false?\nThought: Let's think step by step. In 681 BCE, Sennacherib was assassinated is a claim made in 2017. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.759636163711548, "index": 765}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: William Cohen is from Maine.\nQ: Was this claim true or false?\nThought: Let's think step by step. William Cohen is a former United States Senator from Maine. William Cohen was born in Portland, Maine. Portland is the largest city in Maine.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 7.121951103210449, "index": 768}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Doxycycline may cause increased risk of sunburn in children.\nQ: Was this claim true or false?\nThought: Let's think step by step. Doxycycline is an antibiotic used to treat certain types of bacterial infections. Sunscreen is used to prevent sunburns. The sunscreen market is directed toward people. Children are people.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 7.602797031402588, "index": 767}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Uta Hagan has a middle name.\nQ: Was this claim true or false?\nThought: Let's think step by step. Uta Hagan is an actress best known for her role in the film 'The Bridges of Madison County'. Uta Hagan has never revealed any information about her personal life including her middle name. The answer is no.", "answer": null, "groundtruth": true, "runtime": 6.098926067352295, "index": 769}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Finland is sometimes thought to be a part of Scandinavia.\nQ: Was this claim true or false?\nThought: Let's think step by step. Finland is sometimes thought to be a part of Scandinavia. consists of Denmark, Sweden, Norway and Finland. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.171735048294067, "index": 770}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A near-Earth object is not a solar body.\nQ: Was this claim true or false?\nThought: Let's think step by step. Near-Earth objects are in orbit around the Sun. Solar bodies are in orbit around the Sun. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.9163901805877686, "index": 771}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Cher was united in marriage to Sonny Bono.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sonny Bono died in a skiing accident in 1998. Cher is still alive. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.311959981918335, "index": 772}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ekta Kapoor worked on an Indian soap opera that premiered in 2000.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ekta Kapoor is a producer and has been since 1994. An Indian soap opera that premiered in 2000 would have been produced before 1994. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 7.285362243652344, "index": 773}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ukrainian Soviet Socialist Republic was a member of the UN.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Ukrainian Soviet Socialist Republic existed from 1922 until 1991. The United Nations was founded in 1945.\nThe answer: no.", "answer": null, "groundtruth": true, "runtime": 6.395007848739624, "index": 774}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Touch My Body is a recorded work.\nQ: Was this claim true or false?\nThought: Let's think step by step. Touch My Body is a 2003 single by American singer-songwriter Usher. It was released as the third single from his album Confessions. The album Confessions was certified diamond by the RIAA. Records are made of paper and are therefore a recorded work. Records can be touched. Final answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.777276992797852, "index": 775}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Fly is a film from the United States.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Fly is a 1958 American science fiction horror film directed by Kurt Neumann and starring Vincent Price, Suzan Farmer and Peter Cushing. It is based on the 1957 novel of the same name by George A. Romero. The film was produced and distributed by American International Pictures (AIP). American International Pictures was an American film studio that specialized in low-budget genre films. American International Pictures was based in the United States.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 8.04680585861206, "index": 776}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A. P. J. Abdul Kalam was voted in as the Head of State of India.\nQ: Was this claim true or false?\nThought: Let's think step by step. A. P. J. Abdul Kalam was the President of India from 2002 to 2007. The President of India is the head of state. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.422851085662842, "index": 777}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The 66th Primetime Emmy Awards was hosted by the host of a show.\nQ: Was this claim true or false?\nThought: Let's think step by step. The 66th Primetime Emmy Awards was hosted by the host of a show but the host of a show was not named. So, the answer is it is not possible to tell.", "answer": null, "groundtruth": true, "runtime": 6.3668670654296875, "index": 779}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The SpongeBob SquarePants Movie stars a cat.\nQ: Was this claim true or false?\nThought: Let's think step by step. The SpongeBob SquarePants Movie is about a sponge and his friends. SpongeBob SquarePants is a human. Cats do not have any friends. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.950430154800415, "index": 778}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Stomp the Yard stars an American actor born in 1982.\nQ: Was this claim true or false?\nThought: Let's think step by step. Stomp the Yard stars an American actor born in 1982. The year of 1982 is now 35 years ago. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.27231502532959, "index": 780}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In 2012, Simi Valley, California, reported a higher median household income than that of the nation overall.\nQ: Was this claim true or false?\nThought: Let's think step by step. In 2012, the median household income in Simi Valley, California was $62,500. The national median household income at the time was $53,000. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.452081918716431, "index": 782}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Burj Khalifa contains zero escalators.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Burj Khalifa is the tallest building in the world. The Burj Khalifa has 163 floors. Escalators are used to move between floors.\nThe answer: no.", "answer": null, "groundtruth": false, "runtime": 6.742406845092773, "index": 781}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Louis Malle produced only German language films.\nQ: Was this claim true or false?\nThought: Let's think step by step. Louis Malle is a French actor and film director. German is a foreign language.\nThe answer: no.", "answer": null, "groundtruth": false, "runtime": 6.5130720138549805, "index": 783}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: One of the most notable features of Zoroastrianism is the belief and doctrine that is focused on the arrival of the messiah.\nQ: Was this claim true or false?\nThought: Let's think step by step. Zoroastrianism is an ancient religion that originated in modern day Iran. The messiah is a figure central to Christianity, Islam and Judaism. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.606058835983276, "index": 784}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Nottingham Forest F.C. is barred from being a football club.\nQ: Was this claim true or false?\nThought: Let's think step by step. Nottingham Forest F.C. is a professional football club based in Nottingham, England. Nottingham Forest F.C. is not barred from being a football club. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.5879669189453125, "index": 785}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Henry III assumed the throne when he was 2 years old.\nQ: Was this claim true or false?\nThought: Let's think step by step. Henry III reigned from 1216 - 1272. 2 years old is 1216. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.332331895828247, "index": 786}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Dodo has been depicted with orange plumage.\nQ: Was this claim true or false?\nThought: Let's think step by step. The dodo was a flightless bird that lived in what is now known as Australia. The dodo had a variety of plumage colors including green, brown, and orange. The dodo became extinct around the year 1600. So, the answer is true.", "answer": true, "groundtruth": false, "runtime": 7.596318960189819, "index": 787}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vedic Sanskrit is the language of the Vedic texts of Hinduism.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Vedas are religious texts of Hinduism. The Vedic Sanskrit is the language of the Vedas. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.970577955245972, "index": 788}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Johnny Van Zant still performs with a band.\nQ: Was this claim true or false?\nThought: Let's think step by step. Johnny Van Zant is the lead singer of the band, . He has been performing with them since their formation in 1995. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.6752660274505615, "index": 789}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Veep is a show on television.\nQ: Was this claim true or false?\nThought: Let's think step by step. Veep is a television show that has won numerous awards. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.149342060089111, "index": 790}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dan Brown died June 22, 1964.\nQ: Was this claim true or false?\nThought: Let's think step by step. Dan Brown died in 1964 but he was born in 1964. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 5.811336994171143, "index": 791}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A Pet can give companionship to elderly adults.\nQ: Was this claim true or false?\nThought: Let's think step by step. Pets are animals. Seniors are elderly adults. Pets can give companionship to elderly adults.\nThus, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.5445451736450195, "index": 792}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: I Want to Know What Love Is is a song.\nQ: Was this claim true or false?\nThought: Let's think step by step. I Want to Know What Love Is was made famous by Foreigner. Foreigner is a band that has existed since 1976. Final answer: yes.", "answer": null, "groundtruth": true, "runtime": 7.030241966247559, "index": 793}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Mom (TV series) has been nominated at an award show.\nQ: Was this claim true or false?\nThought: Let's think step by step. Mom is a sitcom that aired on CBS from 2013-2017. Mom was nominated for Outstanding Comedy Series at the 2017 Emmy Awards. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.278374910354614, "index": 794}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Woman in Black was abandoned by Hammer Film Productions in 2012 in favor of working on Freddie vs. Jason.\nQ: Was this claim true or false?\nThought: Let's think step by step. Hammer Film Productions is an English film studio that was founded in 1934. Freddie vs. Jason came out in 2013. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.275308132171631, "index": 795}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Milk is a 2003 Dutch film.\nQ: Was this claim true or false?\nThought: Let's think step by step. Milk was released in 2003. Therefore, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 5.1381120681762695, "index": 796}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Anneliese van der Pol had an early career.\nQ: Was this claim true or false?\nThought: Let's think step by step. Anneliese van der Pol won the second season of Dutch Top Model in 2006. She was 24 years old at that time. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.788219928741455, "index": 797}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Issa Rae appears in Awkward Black Girl.\nQ: Was this claim true or false?\nThought: Let's think step by step. Awkward Black Girl is a web series that first aired in 2014. Issa Rae created and starred in the TV series Insecure which debuted in 2016. The answer: no.", "answer": null, "groundtruth": true, "runtime": 7.148870944976807, "index": 798}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Maggie Q starred in a Die Hard movie.\nQ: Was this claim true or false?\nThought: Let's think step by step. Maggie Q has starred in several movies beside Die Hard. So, the answer is it is not possible to tell.", "answer": null, "groundtruth": true, "runtime": 6.980224132537842, "index": 799}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: House of Balloons is someone's first mixtape.\nQ: Was this claim true or false?\nThought: Let's think step by step. House of Balloons was the first tape in a series of mixtapes. Final answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.158653020858765, "index": 801}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vedic Sanskrit is an ancient writing system.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sanskrit is an ancient language and is the root of most Indo-European languages. The Vedic people were one of the early groups to speak Sanskrit. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.727126121520996, "index": 800}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Silver Surfer is a dance move popular in East Asia.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Silver Surfer is a dance move popular in East Asia does not mean it is a popular dance move in all of East Asia. Just because it is popular in East Asia does not mean it is popular in China. So, the answer is it is not possible to tell.", "answer": null, "groundtruth": false, "runtime": 7.355283260345459, "index": 802}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Certain chemicals induce neuromodulation.\nQ: Was this claim true or false?\nThought: Let's think step by step. Certain chemicals can affect the nervous system and are considered drugs. Some drugs are used for therapeutic purposes while others are recreational. Recreational drugs are also known as aphrodisiacs. Aphrodisiacs are chemicals that are believed to arouse sexual desire or excitement.\nThe answer: true.", "answer": true, "groundtruth": true, "runtime": 7.358293056488037, "index": 803}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Eurotas (river) is one of Peloponnese's major rivers.\nQ: Was this claim true or false?\nThought: Let's think step by step. Eurotas is a river located in the southern part of the Peloponnese peninsula. The Eurotas river is one of the largest rivers of the Peloponnese. . So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.426817178726196, "index": 804}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Anne Boleyn returned to England.\nQ: Was this claim true or false?\nThought: Let's think step by step. Anne Boleyn was beheaded May 19, 1536. Anne Boleyn died May 19, 1536 so she could not have returned to England in June of 2017. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.739219903945923, "index": 806}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A Drama Desk Award was given to Hair (musical) for best revival of a musical.\nQ: Was this claim true or false?\nThought: Let's think step by step. Hair (musical) won a Tony award for best revival of a musical in 2008. The Tony awards are handed out by the Broadway League. Hair (musical) was nominated for a Drama Desk Award in 2008. The Drama Desk Awards are handed out by the American Theatre Wing. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 7.310896158218384, "index": 805}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dev Patel appeared in a movie.\nQ: Was this claim true or false?\nThought: Let's think step by step. Patel is an Indian actor who has appeared in several movies. Dev is his stage name. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 5.530127763748169, "index": 807}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sledgehammer was first performed live in Scotland.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sledgehammer is a song by American heavy metal band Metallica, released on their 1991 album Metallica. Metallica was formed in 1981 in California. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.4873270988464355, "index": 808}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The cinematography of Far from the Madding Crowd was by at least one person.\nQ: Was this claim true or false?\nThought: Let's think step by step. The cinematography of Far from the Madding Crowd was by David Hennings. David Hennings is a cinematographer.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.798152923583984, "index": 809}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Mandy Moore did not have a career in music.\nQ: Was this claim true or false?\nThought: Let's think step by step. Mandy Moore is a singer and actress. Actors do not usually sing. Musicians do not usually act.\nThe answer: no.", "answer": null, "groundtruth": false, "runtime": 6.432904005050659, "index": 810}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Internet access requires the use of hardware like computer terminals.\nQ: Was this claim true or false?\nThought: Let's think step by step. Hardware is a physical part of a computer terminal. Internet access can be gained through other devices such as smartphones and tablets. Smartphones and tablets are not physical parts of computer terminals. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.985583066940308, "index": 811}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Giver is only a book.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Giver is a book and a movie. The Giver movie is based on the book. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 5.85887598991394, "index": 812}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Japan is represented by several localized governments.\nQ: Was this claim true or false?\nThought: Let's think step by step. Japan is represented by the government of Japan. The government of Japan is a single centralized government. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.607431888580322, "index": 813}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: B. R. Ambedkar was an Indian social reform program.\nQ: Was this claim true or false?\nThought: Let's think step by step. B. R. Ambedkar was a social reformer who campaigned against untouchability. India is a country in South Asia. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.531275033950806, "index": 814}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Brent Mydland was a member of the Grateful Dead.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Grateful Dead was a band that got their start in 1965. Brent Mydland was born in 1966.\nThe answer: no.", "answer": null, "groundtruth": true, "runtime": 6.765562057495117, "index": 816}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Norman Bates is from the novel Harry Potter.\nQ: Was this claim true or false?\nThought: Let's think step by step. Harry Potter is a book series about a young wizard. Norman Bates is a character from Alfred Hitchcock's Psycho. Psycho is a psychological thriller about a man who stalks and kills women. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.643795967102051, "index": 815}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sausage Party was directed by Greg Tiernan and Conrad Vernon.\nQ: Was this claim true or false?\nThought: Let's think step by step. Greg Tiernan and Conrad Vernon directed The Sausage Party in 2013. Sausage Party was released in 2016. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 5.770529747009277, "index": 817}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Team Fortress 2 development was led by John Cook.\nQ: Was this claim true or false?\nThought: Let's think step by step. Valve is a company that has developed many games including the Half-Life and Counter-Strike series. John Cook is the co-founder of Valve and was the lead programmer on the original Half-Life. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.464723110198975, "index": 818}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ed Gein had exhumed corpses.\nQ: Was this claim true or false?\nThought: Let's think step by step. Exhumed corpses are dead bodies dug up from a grave. Ed Gein was a cannibal who killed and dressed up his victims. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.0850510597229, "index": 819}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Estelle Getty was solely Japanese.\nQ: Was this claim true or false?\nThought: Let's think step by step. Estelle Getty was an American actress of Japanese descent. Japanese people can have any ethnicity. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.704621076583862, "index": 820}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kenny Chesney was born on March 26th, 1968.\nQ: Was this claim true or false?\nThought: Let's think step by step. Kenny Chesney was born in 1968 and his age is 49 years old in June 2017. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.8188629150390625, "index": 821}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Augutus Prew's mother was a clothing designer.\nQ: Was this claim true or false?\nThought: Let's think step by step. Augustus Prew's mother was a clothing designer is not the same as saying that Augustus Prew's mother was a fashion designer. Fashion designing is a different field of work than clothing designing. So, the answer is it is not possible to tell.", "answer": null, "groundtruth": true, "runtime": 6.898713111877441, "index": 822}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: There have been at least 29 Africa Cup of Nations.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Africa Cup of Nations tournament began in 1957. There have been 29 Africa Cup of Nations tournaments since then. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.044116973876953, "index": 823}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Action films are a subgenre of martial arts films.\nQ: Was this claim true or false?\nThought: Let's think step by step. Action films are a subgenre of martial arts films. Martial arts films are films about martial arts. Final answer: yes.", "answer": null, "groundtruth": false, "runtime": 6.700582027435303, "index": 824}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Matthew Vaughn was born on May 9th, 1977.\nQ: Was this claim true or false?\nThought: Let's think step by step. Matthew Vaughn was born in 1977 so he would have been 40 years old in June of 2017. Someone born in 1977 would have been 40 in June of 2017. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.16749906539917, "index": 825}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Unison (Celine Dion album) was originally released in May 1990.\nQ: Was this claim true or false?\nThought: Let's think step by step. Unison was released in May 1990 but Celine Dion had her first album in 1981. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.0021278858184814, "index": 827}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Office (US) was filmed in front of a live audience.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Office was filmed in front of a live audience for the first two seasons. The Office was not filmed in front of a live audience after season 2. The answer is no.", "answer": null, "groundtruth": false, "runtime": 7.547695159912109, "index": 826}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Foot Locker is a retailer from the United States.\nQ: Was this claim true or false?\nThought: Let's think step by step. Foot Locker is an American multinational specialty athletic shoe store retailing company. It is headquartered in New York City. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 5.64260196685791, "index": 828}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Practical Magic is based on a novel that was written by Waluigi.\nQ: Was this claim true or false?\nThought: Let's think step by step. Practical Magic is based on a novel written by Alice Hoffman. Alice Hoffman is not Waluigi. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.159621238708496, "index": 829}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Absinthe is banned in some countries.\nQ: Was this claim true or false?\nThought: Let's think step by step. Some countries have banned absinthe because it is believed to be dangerous. However, in other countries, absinthe is legal. So, the answer is it is not possible to tell.", "answer": null, "groundtruth": true, "runtime": 6.756822824478149, "index": 830}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Minor League Baseball is a hierarchy of leagues.\nQ: Was this claim true or false?\nThought: Let's think step by step. Minor League Baseball is a hierarchy of levels.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.672668933868408, "index": 831}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Oscar Isaac played a fictional character.\nQ: Was this claim true or false?\nThought: Let's think step by step. Oscar Isaac played a fictional character in the 2016 movie \"The Walk\". He played a fictional character in the 2014 movie \"X-Men: Days of Future Past\". So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.062206268310547, "index": 832}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Research is incapable of testing the validity of instruments.\nQ: Was this claim true or false?\nThought: Let's think step by step. Research is a systematic study to answer questions. Instruments are tools used to collect data. Data collection is a part of research. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.868683099746704, "index": 833}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kajol is a civilian woman.\nQ: Was this claim true or false?\nThought: Let's think step by step. Kajol is an Indian actress who has appeared in several Bollywood films. Actresses in India are civilians. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.770566940307617, "index": 834}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Netscape Navigator is unable to access the internet.\nQ: Was this claim true or false?\nThought: Let's think step by step. Netscape Navigator is unable to access the internet because it is outdated. Newer versions of Netscape Navigator can access the internet. So, the answer is true.", "answer": true, "groundtruth": true, "runtime": 6.5290961265563965, "index": 835}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Baadshah was only dubbed into French.\nQ: Was this claim true or false?\nThought: Let's think step by step. Baadshah is a Bollywood film that was made in Hindi. Baadshah was not dubbed into French. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.7769598960876465, "index": 837}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Food Network is unavailable in the United States.\nQ: Was this claim true or false?\nThought: Let's think step by step. Food Network is a television network. Television networks are not available in physical locations. The answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.207627773284912, "index": 836}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Color of Night did horribly in box office ratings.\nQ: Was this claim true or false?\nThought: Let's think step by step. Color of Night received a 1.2 rating on IMDB which is horribly low. So, the answer is true.", "answer": true, "groundtruth": false, "runtime": 6.449331998825073, "index": 838}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Prince Charles and Lady Diana were married in July 1981.\nQ: Was this claim true or false?\nThought: Let's think step by step. Prince Charles and Lady Diana got married in 1981. Prince Charles and Lady Diana got divorced in 1996. So, the answer is true.", "answer": true, "groundtruth": true, "runtime": 6.4272356033325195, "index": 839}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Brown University's main campus is located in the second largest city in New England.\nQ: Was this claim true or false?\nThought: Let's think step by step. Brown University's main campus is located in the second largest city in New England which is Providence, Rhode Island. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.813492059707642, "index": 840}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Planet Hollywood Las Vegas is owned by a corporation based in Paris, Texas.\nQ: Was this claim true or false?\nThought: Let's think step by step. Planet Hollywood is owned by Caesars Entertainment Corporation. Caesars Entertainment Corporation is based in Reno, Nevada.\nThe answer: no.", "answer": null, "groundtruth": false, "runtime": 6.739220857620239, "index": 842}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Leslie Alexander is a former bond trader.\nQ: Was this claim true or false?\nThought: Let's think step by step. Leslie Alexander worked on Wall Street as a bond trader until he was forced out in the financial crisis of 2008. The financial crisis of 2008 was a major event in financial history. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.927757024765015, "index": 841}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pierce County, Washington is the location of the highest mountain of the Blue Mountains of the Pacific Northwest.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Blue Mountains are located in Oregon and Washington. The highest point in Oregon is Mount Hood. The highest point in Washington is Mount Rainier.\nThe answer: no.", "answer": null, "groundtruth": false, "runtime": 7.303334951400757, "index": 843}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A Pet can only supply physical interaction.\nQ: Was this claim true or false?\nThought: Let's think step by step. A pet is a companion animal. Companion animals provide emotional support. Emotional support is a type of interaction.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 5.80331015586853, "index": 844}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Bank of America only provides products.\nQ: Was this claim true or false?\nThought: Let's think step by step. Bank of America offers investment banking, credit cards, commercial banking, and wealth management. Bank of America offers many products.\nThe answer: yes.", "answer": null, "groundtruth": false, "runtime": 6.366898059844971, "index": 845}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The New England Patriots got to seven Super Bowls.\nQ: Was this claim true or false?\nThought: Let's think step by step. The New England Patriots have won six Super Bowls. Seven is a lot of Super Bowls. The answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.026446104049683, "index": 847}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Trouble with the Curve was directed by a squid.\nQ: Was this claim true or false?\nThought: Let's think step by step. Trouble with the Curve was directed by a human named James Wong. A squid is not a human. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.301451921463013, "index": 848}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Henry Cavill is not a famous actor.\nQ: Was this claim true or false?\nThought: Let's think step by step. Henry Cavill is a famous actor known for his role as Superman in the DC Extended Universe. He has also starred in several high-profile films such as The Witcher and Mission: Impossible Fallout. Cavill has received numerous awards and accolades for his work. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.87326717376709, "index": 846}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Gaius Julius Caesar died in Spain.\nQ: Was this claim true or false?\nThought: Let's think step by step. Caesar could not have died in Spain if he was still alive in 44 B.C. when the first Punic War ended. He was also aedile, quaestor, propraetor, and consul in Rome. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.089023113250732, "index": 849}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Paper stars Michael Keaton and Tom Cruise.\nQ: Was this claim true or false?\nThought: Let's think step by step. Michael Keaton played the role of Bruce Wayne/Batman in the movie The Paper. Tom Cruise played the role of Maverick in the movie Top Gun. Tom Cruise and Michael Keaton are both actors.\nThe answer: yes.", "answer": null, "groundtruth": false, "runtime": 6.281128168106079, "index": 850}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Augustus Prew's mother was always unemployed.\nQ: Was this claim true or false?\nThought: Let's think step by step. Augustus Prew's mother was not always unemployed. She became a housekeeper when she married Prew. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.41700291633606, "index": 851}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Amy Winehouse did not die of alcohol poisoning.\nQ: Was this claim true or false?\nThought: Let's think step by step. Amy Winehouse died of alcohol poisoning in 2011. She was 27 years old in 2011. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.317719221115112, "index": 853}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Foot Locker's headquarters are in Mobile, Alabama.\nQ: Was this claim true or false?\nThought: Let's think step by step. Foot Locker's headquarters are in New York City. Mobile, Alabama and New York City are nearly 3,500 miles apart. New York City is on the east coast while Mobile, Alabama is on the gulf coast. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.040344953536987, "index": 852}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Yugoslavia failed to exist during most of the 20th century.\nQ: Was this claim true or false?\nThought: Let's think step by step. Most of the 20th century refers to 100 years from 1901-2000. Yugoslavia was established in 1918. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.311409950256348, "index": 854}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sarah Hyland attended a public school in Chinatown.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sarah Hyland is an American actress. Americans do not usually attend schools in Chinatown. Actors usually go to private schools. Final answer: no.", "answer": null, "groundtruth": false, "runtime": 6.616275072097778, "index": 855}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Richard Fortus is a guitarist of Guns N' Roses.\nQ: Was this claim true or false?\nThought: Let's think step by step. Richard Fortus joined Guns N' Roses in 2016. Guns N' Roses formed in 1985. Final answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.4577672481536865, "index": 856}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Stanford prison experiment was financed by a group that coordinates, executes, and advocates the science and technology programs of the U.S. Navy and Marine Corps.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Stanford Prison Experiment was done in 1971. The US Navy and Marine Corps did not exist in 1971. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.781077861785889, "index": 857}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Barbarella is based on a comic by Gene Luen Yang.\nQ: Was this claim true or false?\nThought: Let's think step by step. Gene Luen Yang is an American comic book writer and artist. Barbarella is a comic book series. Comics are a form of sequential art.\nThe answer: yes.", "answer": null, "groundtruth": false, "runtime": 7.201122999191284, "index": 858}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Google Search can find stock quotes.\nQ: Was this claim true or false?\nThought: Let's think step by step. Google Search is a search engine. Stock quotes can be searched on a search engine. Final answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.4265220165252686, "index": 859}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kyle Maclachlan has been nominated for an Emmy award because of a television series called Twin Peaks.\nQ: Was this claim true or false?\nThought: Let's think step by step. Kyle MacLachlan has been nominated for an Emmy award for his role in the television series Twin Peaks. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.984640121459961, "index": 860}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Moesia excluded Romanian Dobrudja.\nQ: Was this claim true or false?\nThought: Let's think step by step. Moesia was a historical region which included parts of Romania. Romanian Dobrudja is a region in Romania. Moesia excluded Romanian Dobrudja.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 6.760993003845215, "index": 861}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Camp Flog Gnaw is an event.\nQ: Was this claim true or false?\nThought: Let's think step by step. Camp Flog Gnaw is a music festival. Music festivals are events. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.0007102489471436, "index": 862}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Fidaa is in an Iranian language.\nQ: Was this claim true or false?\nThought: Let's think step by step. Fidaa is an Arabic word that means prey. The Arabic language is not an Iranian language. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.994427919387817, "index": 863}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Zoroastrianism has no major features.\nQ: Was this claim true or false?\nThought: Let's think step by step. Zoroastrianism is an ancient religion that originated in modern day Iran. Iran is a country in Middle East. False.\nThe answer: false.", "answer": false, "groundtruth": false, "runtime": 6.983494997024536, "index": 864}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Shomu Mukherjee died of a heart attack in November.\nQ: Was this claim true or false?\nThought: Let's think step by step. Heart attacks can happen at any time. Mukherjee could have died at any point even after November. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.743812084197998, "index": 865}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Numenius of Apamea was a Greek philosopher who lived in Syria.\nQ: Was this claim true or false?\nThought: Let's think step by step. Apamea is in Syria and Numenius was a Greek philosopher. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.520323991775513, "index": 866}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Beverly Hillbillies had ten seasons.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Beverly Hillbillies aired from 1962-1971 for a total of ten seasons. The answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.139865875244141, "index": 867}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sweet Home Alabama is an epic novel that was written in reply to two songs from Neil Young's album Harvest.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sweet Home Alabama was written in 1969. Harvest was released in 1972. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.754663944244385, "index": 869}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Battle of the Trebia took place in the province of Piacenza.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Battle of the Trebia took place in the year 61 BC between the armies of Octavian and Mark Antony. Octavian won the battle and Mark Antony fled to Egypt. Piacenza is a city in the Emilia-Romagna region of Italy. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 7.868210792541504, "index": 868}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Louis Malle worked in a French industry.\nQ: Was this claim true or false?\nThought: Let's think step by step. Louis Malle worked in the cinema industry in France. Louis Malle is a French actor.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.719891309738159, "index": 870}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Gotham got its premiere on Fox.\nQ: Was this claim true or false?\nThought: Let's think step by step. Fox premiered Batman in September of 1966. Gotham started airing on Fox in June of 2017. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.482874155044556, "index": 871}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Leslie Alexander owns a team in the NBA.\nQ: Was this claim true or false?\nThought: Let's think step by step. Leslie Alexander is an American businessman and investor. Leslie Alexander owns the Charlotte Bobcats, the predecessor to the current Charlotte Hornets. The Charlotte Bobcats are an American professional basketball team based in Charlotte, North Carolina. The Charlotte Hornets compete in the National Basketball Association as a member of the Southeast Division.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.561974048614502, "index": 872}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Independent Spirit Awards are held the day before the Academy Awards in Santa Monica.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Independent Spirit Awards are held on the day before the Academy Awards. The Independent Spirit Awards are held in Santa Monica.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.508968114852905, "index": 873}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: James Brolin has never appeared in a sitcom.\nQ: Was this claim true or false?\nThought: Let's think step by step. James Brolin has been in sitcoms like The Mary Tyler Moore Show and The Bob Newhart Show. James Brolin has appeared in sitcoms.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 7.159877777099609, "index": 874}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Randy Jackson turned down working as a judge for American Idol (season 8).\nQ: Was this claim true or false?\nThought: Let's think step by step. Randy Jackson was on American Idol for the first seven seasons. Season eight of American Idol was in 2008. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.828418970108032, "index": 875}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Freddie Highmore starred in a television series.\nQ: Was this claim true or false?\nThought: Let's think step by step. Freddie Highmore starred in the television series \"The Good Doctor\". The Good Doctor is a medical drama series.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.41378116607666, "index": 877}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Samsung entered the construction and shipbuilding industries in the mid-1950s.\nQ: Was this claim true or false?\nThought: Let's think step by step. Samsung entered the construction industry in the 1950s to diversify its business portfolio. Samsung entered shipbuilding industry in the 1970s. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.456797122955322, "index": 876}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sean Gunn has no experience acting.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sean Gunn has been in several movies and has been in tv shows since 1991. Sean Gunn has been acting consistently for over 25 years. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.244138956069946, "index": 878}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The American Civil War ended in 1862.\nQ: Was this claim true or false?\nThought: Let's think step by step. The American Civil War ended in 1865. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 5.8525214195251465, "index": 880}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Norman Bates is a character exclusively from film.\nQ: Was this claim true or false?\nThought: Let's think step by step. The claim is that Norman Bates is a character exclusively from film. The first film about Norman Bates was released in Psycho. Psycho is a psychological horror film. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.263980865478516, "index": 879}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Tenth Doctor makes his penultimate appearance in Journey's End.\nQ: Was this claim true or false?\nThought: Let's think step by step. The tenth doctor is a character in the fictional TV show Doctor Who. Journey's End is the name of the last episode of the 6th season of Doctor Who. The answer: true.", "answer": true, "groundtruth": false, "runtime": 6.934510231018066, "index": 881}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: University of Chicago Law School is ranked first for \"Faculty quality based on American Academy of Arts and Sciences Membership.\"\nQ: Was this claim true or false?\nThought: Let's think step by step. The University of Chicago Law School has the highest number of faculty members who are members of the American Academy of Arts and Sciences. The answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.678899765014648, "index": 882}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: B. R. Ambedkar spent his whole life in Portugal.\nQ: Was this claim true or false?\nThought: Let's think step by step. B. R. Ambedkar was born in 1891. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.092648029327393, "index": 883}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Gotham premiered in 2015.\nQ: Was this claim true or false?\nThought: Let's think step by step. The show premiered in 2015 but it could have been on air since then. So, the answer is it is not possible to tell.", "answer": null, "groundtruth": false, "runtime": 7.3138628005981445, "index": 884}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Heaven Can Wait came out before Here Comes Mr. Jordan.\nQ: Was this claim true or false?\nThought: Let's think step by step. Heaven Can Wait was released in June of 1977. Here Comes Mr. Jordan was released in November of 1977. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.104813098907471, "index": 885}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Two and a Half Men season is incapable of being aired.\nQ: Was this claim true or false?\nThought: Let's think step by step. Season 12 of Two and a Half Men premiered on September 25, 2016. Season 13 of Two and a Half Men premiered on September 17, 2017. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.94173264503479, "index": 886}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Bank of America has machines.\nQ: Was this claim true or false?\nThought: Let's think step by step. Bank of America is a financial institution. Financial institutions have ATMs for people to withdraw money from their accounts. Machines are devices that do work automatically. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.538589000701904, "index": 887}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: See You on the Other Side was put out by Korn in 2002.\nQ: Was this claim true or false?\nThought: Let's think step by step. See You on the Other Side came out in 2002 but Korn formed in 1994. The answer is no.", "answer": null, "groundtruth": false, "runtime": 5.959895133972168, "index": 888}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Tennessee was the last state to join the Confederacy.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Civil War ended in 1865. Tennessee became a state in 1836. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.461693048477173, "index": 889}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Resident Evil is a film.\nQ: Was this claim true or false?\nThought: Let's think step by step. Resident Evil is a film in the Resident Evil movie series. The Resident Evil movie series began in 2002. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.653646945953369, "index": 890}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kate Walsh was on a sitcom.\nQ: Was this claim true or false?\nThought: Let's think step by step. Kate Walsh starred in \"Gilmore Girls\". \"Gilmore Girls\" is a comedy series.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.151563882827759, "index": 891}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jimi Hendrix was a person.\nQ: Was this claim true or false?\nThought: Let's think step by step. Jimi Hendrix was a person who was born in Seattle Washington. He was a singer and an American guitarist. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.914402008056641, "index": 892}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Matthew Vaughn was renamed Matthew Allard Robert Vaughn.\nQ: Was this claim true or false?\nThought: Let's think step by step. Matthew Vaughn was renamed Matthew Allard Robert Vaughn is a claim that has been made. The answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.893655061721802, "index": 893}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Times Higher Education World University Rankings is released yearly.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Times Higher Education World University Rankings are released every year. 2017 is a year. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.468353986740112, "index": 894}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Trouble with the Curve is only a podcast.\nQ: Was this claim true or false?\nThought: Let's think step by step. Trouble with the Curve is a movie starring Clint Eastwood. Podcasts are not movies. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.415917634963989, "index": 896}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Manchester United F.C. was the world's highest-earning tennis club for a season.\nQ: Was this claim true or false?\nThought: Let's think step by step. Manchester United F.C. is a football club. Manchester United F.C. has had many famous players including Cristiano Ronaldo, Paul Scholes, Eric Cantona and Nemanja Vidic. Manchester United F.C. has won 20 major trophies. The answer is no.", "answer": null, "groundtruth": false, "runtime": 7.447942018508911, "index": 895}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Michael Hutchence died on November 12th, 1997.\nQ: Was this claim true or false?\nThought: Let's think step by step. Michael Hutchence died in 1997 so he could not have been alive in 2017. He could only have been dead or alive in one year at a time. Final answer: no.", "answer": null, "groundtruth": false, "runtime": 6.81252121925354, "index": 897}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Mamata Banerjee was born on January 5th, 1955.\nQ: Was this claim true or false?\nThought: Let's think step by step. Mamata Banerjee was born on January 5th, 1955. She is 62 years old in 2017. So, the answer is true.", "answer": true, "groundtruth": true, "runtime": 6.802408933639526, "index": 898}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Invisible Man was based on a H. G. Wells novel.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Invisible Man was written by H. G. Wells in 1897. The Invisible Man was made into a movie in 1933.\nThe answer: false.", "answer": false, "groundtruth": true, "runtime": 6.485994815826416, "index": 899}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: LinkedIn has yet to be made available in the Turkish language.\nQ: Was this claim true or false?\nThought: Let's think step by step. Turkish is a language with over 80 million native speakers. LinkedIn is a professional networking site. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.5201029777526855, "index": 901}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hammer Film Productions has worked on horror movies.\nQ: Was this claim true or false?\nThought: Let's think step by step. Hammer Film Productions is a British film studio best known for its horror films. Hammer Film Productions is responsible for the creation of Dracula, Frankenstein, and many other horror movies. The company was founded in 1934. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.255780935287476, "index": 900}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kenny Chesney's full name is Kenny Clark Chesney.\nQ: Was this claim true or false?\nThought: Let's think step by step. Kenny Chesney's full name is Kenny Clark Chesney. is a fact. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.460897207260132, "index": 902}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ronaldinho has scored 33 goals for the Brazil national football team in the past decade.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ronaldinho has played for the Brazilian national team for 10 years and has scored 33 goals. He played from 2003 to 2010 and from 2013 to 2016. He also played in the 2002 FIFA World Cup and the 2006 FIFA World Cup. Final answer: true.", "answer": true, "groundtruth": true, "runtime": 7.258570909500122, "index": 903}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jason Bourne is a famous army general.\nQ: Was this claim true or false?\nThought: Let's think step by step. Jason Bourne is a character in a series of books and movies about a secret agent. Jason Bourne is not a real person. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.593193054199219, "index": 904}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Solanum contains flora that have fruit.\nQ: Was this claim true or false?\nThought: Let's think step by step. Solanum is a genus of plants that includes tomatoes and eggplants. Tomatoes and eggplants are fruit.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.965718030929565, "index": 906}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Raja Hindustani was directed by 5 directors each from a different region of India.\nQ: Was this claim true or false?\nThought: Let's think step by step. Raja Hindustani had 5 directors - K. Raghavendra Rao, K.V. Reddy, Puri Jagannadh, S.S. Rajamouli, and Vishnuvardhan. K. Raghavendra Rao is from the South, K.V. Reddy is from the South, Puri Jagannadh is from the South, S.S. Rajamouli is from the South, and Vishnuvardhan is from the South. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 8.136176824569702, "index": 905}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Independent Spirit Awards are held the day before the Golden Globe Awards.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Independent Spirit Awards were held on February 18th, 2018. The Golden Globe Awards will be held on January 7th, 2018. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.000086069107056, "index": 907}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: John S. McCain Jr. went to school.\nQ: Was this claim true or false?\nThought: Let's think step by step. John S. McCain Jr. graduated from Yale University in 1953. John S. McCain Jr. was born in 1936. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.066540718078613, "index": 908}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vic Mensa has never been to Illinois.\nQ: Was this claim true or false?\nThought: Let's think step by step. Vic Mensa is an American rapper from Chicago, Illinois. Vic Mensa grew up on the South Side of Chicago. Vic Mensa went to school at the University of Illinois Urbana-Champaign.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 5.56584095954895, "index": 909}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The soundtrack of Far from the Madding Crowd was only by George Clooney.\nQ: Was this claim true or false?\nThought: Let's think step by step. The soundtrack of Far from the Madding Crowd was composed by George Clooney and his band. The answer is false.", "answer": false, "groundtruth": false, "runtime": 6.269647121429443, "index": 910}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Salman Rushdie won a literary prize.\nQ: Was this claim true or false?\nThought: Let's think step by step. Salman Rushdie won the Premio Gregoraci. Premio Gregoraci is a literary prize.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.628430128097534, "index": 911}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Adidas is German.\nQ: Was this claim true or false?\nThought: Let's think step by step. Adidas is a German multinational corporation that designs and manufactures shoes, clothing and accessories. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.98425817489624, "index": 912}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: From 1997 until the 1999-2000 season, Chris Mullin played with the Indiana Pacers.\nQ: Was this claim true or false?\nThought: Let's think step by step. Chris Mullin played with the Golden State Warriors from 1990 to 1997. The Indiana Pacers joined the NBA in 1976. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.7984678745269775, "index": 913}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Land plants are multicellular organisms.\nQ: Was this claim true or false?\nThought: Let's think step by step. Multicellular organisms are made of cells. All land plants are multicellular organisms. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.331794261932373, "index": 914}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Robert Singer (producer) is incapable of writing.\nQ: Was this claim true or false?\nThought: Let's think step by step. Robert Singer produced artist such as Michael Jackson. Michael Jackson is known to be a song writer. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.838847875595093, "index": 915}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Revolver has topped multiple charts.\nQ: Was this claim true or false?\nThought: Let's think step by step. Revolver did not top any charts in 2017. Revolver topped the US Billboard 200 on June 23, 2018. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.414793014526367, "index": 916}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pitch Perfect 2 centers on a fictional educational institution.\nQ: Was this claim true or false?\nThought: Let's think step by step. Pitch Perfect 2 centers on a fictional music school. Pitch Perfect 2 is a sequel to Pitch Perfect. Educational institutions are known for teaching music. Final answer: yes.", "answer": null, "groundtruth": true, "runtime": 7.102686882019043, "index": 917}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Rebel in the Rye only aired in 2005.\nQ: Was this claim true or false?\nThought: Let's think step by step. The show first aired in 2005 and it's 2017 now so 12 years have passed. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.834001302719116, "index": 918}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Tangled was a direct-to-video film.\nQ: Was this claim true or false?\nThought: Let's think step by step. Tangled was released in 2010. Tangled is a 2010 American animated musical romantic fantasy film produced by Walt Disney Feature Animation and released by Walt Disney Pictures. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.574275016784668, "index": 919}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Nymphomaniac (film) is part of a trilogy.\nQ: Was this claim true or false?\nThought: Let's think step by step. Nymphomaniac (film) is based on a book written byois Weis. The book has a sequel called Nymphomaniac: The Director's Cut. Nymphomaniac: The Director's Cut is also a prequel to the film. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.79951286315918, "index": 920}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: No Strings Attached only ever came out in 2007.\nQ: Was this claim true or false?\nThought: Let's think step by step. No Strings Attached was released in theaters on June 23, 2007.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 6.579621315002441, "index": 921}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: See You on the Other Side was certified mildew in the US in January 2006.\nQ: Was this claim true or false?\nThought: Let's think step by step. See You on the Other Side was first certified for sale in January of 2006. Let's go!\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 7.002607822418213, "index": 922}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Alvin and the Chipmunks is a Chinese film.\nQ: Was this claim true or false?\nThought: Let's think step by step. Alvin and the Chipmunks is an American animated series. China does not have Alvin and the Chipmunks. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.188130855560303, "index": 923}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Indian National Congress was founded during the British Raj.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Indian National Congress was founded during the British Raj in 1885. The British Raj ended in 1947. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.7480387687683105, "index": 924}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Benjamin Walker (actor) is a stand up performer.\nQ: Was this claim true or false?\nThought: Let's think step by step. Benjamin Walker is an actor who performed in the 2007 film The Last Stand. Benjamin Walker performed in a play titled \"Dutchman\" in 2012. Benjamin Walker performed in a play titled \"Dutchman\" in 2014. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.750516176223755, "index": 925}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Challenge XXX: Dirty 30 is a season in America's Next Top Model.\nQ: Was this claim true or false?\nThought: Let's think step by step. Season 10 of America's Next Top Model was called The Challenge: Dirty 30. The Challenge XXX: Dirty 30 is a season in America's Next Top Model. The answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.718194246292114, "index": 926}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hollow Man has a sequel called Hollow Man 2 released in 2006.\nQ: Was this claim true or false?\nThought: Let's think step by step. Hollow Man 2 was released in 2006 but Hollow Man was released in 1999. The answer is no.", "answer": null, "groundtruth": true, "runtime": 6.413072824478149, "index": 928}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A Good Day to Die Hard was directed by John Moore.\nQ: Was this claim true or false?\nThought: Let's think step by step. A good day to die hard is a 2013 American action thriller film directed by John Moore and written by Mark Bomback and Mark Wahlberg. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.918354749679565, "index": 927}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Edouard Seguin worked in a place.\nQ: Was this claim true or false?\nThought: Let's think step by step. Edouard Seguin was born in 1847 and died in 1935. places dont exist in the past. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.740506887435913, "index": 929}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: American Library Association is old.\nQ: Was this claim true or false?\nThought: Let's think step by step. The American Library Association was founded in 1871. The internet began developing in 1969. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.7965521812438965, "index": 930}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sonny Bono, whose full name is Salvatore Phillip Bono, was born on February 16, 1935.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sonny Bono was born in 1935 but his real name is Salvatore Phillip Bono. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.587038993835449, "index": 931}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The ovary is found in the legs.\nQ: Was this claim true or false?\nThought: Let's think step by step. The ovary is a reproductive organ located in the pelvis. The pelvis is located between the thighs. Legs are located below the thighs.\nThe answer: no.", "answer": null, "groundtruth": false, "runtime": 6.72245979309082, "index": 932}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Brian De Palma is a Westerner.\nQ: Was this claim true or false?\nThought: Let's think step by step. Brian De Palma was born in Chicago, Illinois. Chicago is located in the Midwest region of the United States. The Midwest region is also known as the American Heartland. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.047130823135376, "index": 933}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Becoming chief justice was William Howard Taft's personal ambition.\nQ: Was this claim true or false?\nThought: Let's think step by step. William Howard Taft became chief justice after a long political career. Politics is a dirty business and ambition is often a factor. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.798247814178467, "index": 934}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Netscape Navigator was a web browser.\nQ: Was this claim true or false?\nThought: Let's think step by step. Netscape Navigator was released in 1994. Google Chrome was released in 2008. Final answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.204916000366211, "index": 935}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Nobel Prize in Chemistry was given to a human from Holland.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Nobel Prize in Chemistry was awarded to Jacques Dubochet, Joachim Frank, and Richard Henderson. They are all scientists, but none of them are humans. The answer is no.", "answer": null, "groundtruth": true, "runtime": 6.736318349838257, "index": 936}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hermit crabs are chilopods.\nQ: Was this claim true or false?\nThought: Let's think step by step. Hermit crabs are hermit crabs. Hermit crabs are crustaceans. Chilopods are crustaceans.\nThe answer: yes.", "answer": null, "groundtruth": false, "runtime": 7.295386075973511, "index": 937}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Akon has had more than ten songs certified as 1 \u00d7 platinum.\nQ: Was this claim true or false?\nThought: Let's think step by step. Akon has had more than ten songs certified as 1 \u00d7 platinum is false. Akon has had more than ten songs certified as 2 \u00d7 platinum is true. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.890352964401245, "index": 938}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sarah Hyland is from Mars.\nQ: Was this claim true or false?\nThought: Let's think step by step. Sarah Hyland is an American actress born in California. Mars is the fourth planet from the Sun. California is located on the West Coast of the United States. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.759429693222046, "index": 939}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jerome Flynn is exclusively an American.\nQ: Was this claim true or false?\nThought: Let's think step by step. Jerome Flynn is a British politician and former army officer. British and Americans are different nationalities. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 5.718055963516235, "index": 940}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Shut Up debuted at number 71.\nQ: Was this claim true or false?\nThought: Let's think step by step. Shut Up debuted at number 71 on the US Billboard 200. The US Billboard 200 is a weekly music chart in the United States. The US Billboard 200 was first published on August 23, 1958. So, the answer is true.", "answer": true, "groundtruth": false, "runtime": 6.814281225204468, "index": 941}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Automated teller machines are part of Bank of America.\nQ: Was this claim true or false?\nThought: Let's think step by step. Automated teller machines are part of Bank of America is a claim made in 2017. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.443349123001099, "index": 942}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Matthew Vaughn is incapable of being a film producer and director.\nQ: Was this claim true or false?\nThought: Let's think step by step. Matthew Vaughn has directed and produced many films such as 'Kick-Ass' and 'Layer Cake'. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.115717887878418, "index": 943}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Michael Hutchence has yet to die.\nQ: Was this claim true or false?\nThought: Let's think step by step. Michael Hutchence died in 1997. He would be 60 years old in 2017. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.347485065460205, "index": 945}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Heath Ledger did not direct music videos.\nQ: Was this claim true or false?\nThought: Let's think step by step. Heath Ledger died in 2008. Music videos began to be made in the 1980s.\nThe answer: yes.", "answer": null, "groundtruth": false, "runtime": 6.11022686958313, "index": 946}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Tyler Perry is incapable of songwriting.\nQ: Was this claim true or false?\nThought: Let's think step by step. Tyler Perry has written many songs that have been performed by himself and others. Tyler Perry won a Grammy award for Best Gospel Album in 2005. Tyler Perry won a NAACP Image Award for Outstanding Literary Work in 2009. Tyler Perry won a BET Award for Best Gospel/Inspirational Song in 2011. Tyler Perry won a NAACP Image Award for Outstanding Literary Work in 2012. Tyler Perry won a BET Award for Best Gospel/Inspirational Song in 2013. Tyler Perry won a NAACP Image Award for Outstanding Literary Work in 2014. Tyler Perry won a BET Award for Best Gospel/Inspirational Song in 2015. Tyler Perry won a NAACP Image Award for Outstanding Literary Work in 2016. Tyler Perry won a BET Award for Best Gospel/Inspirational Song in 2017. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 10.182882070541382, "index": 944}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Simon Cowell has donated zero dollars to anything ever.\nQ: Was this claim true or false?\nThought: Let's think step by step. Simon Cowell is a British television personality who has been involved in the music and television industries for over three decades. Simon Cowell has been very successful and has made a lot of money from his various ventures. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.036491632461548, "index": 947}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Salt River Valley is on the Mississippi River.\nQ: Was this claim true or false?\nThought: Let's think step by step. Salt River Valley is in Arizona. The Mississippi River flows North. Arizona is a southwestern U.S. state. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 5.558990001678467, "index": 948}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A Good Day to Die Hard was directed by John Moore in 2008.\nQ: Was this claim true or false?\nThought: Let's think step by step. AGENT: A Good Day to Die Hard was released in theaters on January 31, 2013. John Moore was not the director of A Good Day to Die Hard. The original release date for A Good Day to Die Hard was February 14, 2008.\nThe answer: false.", "answer": false, "groundtruth": false, "runtime": 6.6579718589782715, "index": 949}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Multiple personality disorder is another name for Dissociative identity disorder.\nQ: Was this claim true or false?\nThought: Let's think step by step. Dissociative identity disorder is also known as multiple personality disorder. The answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.199246883392334, "index": 950}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ice-T signed to Motown Records in 1987.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ice-T signed to Motown in 1987. Motown was founded in 1960. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.131932973861694, "index": 951}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: One Flew Over the Cuckoo's Nest only won one Academy Award.\nQ: Was this claim true or false?\nThought: Let's think step by step. The movie One Flew Over the Cuckoo's Nest won 11 Academy Awards. The movie Titanic won 11 Academy Awards. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.061232805252075, "index": 952}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Virginia transitioned from an agricultural to industrial economy during the Civil War.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Civil War took place from 1861-1865. Agriculture is a long term activity that requires multiple years to plan and execute. Industries can be established much more quickly. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 7.155807018280029, "index": 953}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Personality is unaffected by the development of values.\nQ: Was this claim true or false?\nThought: Let's think step by step. Personality traits are stable over time and are not affected by events in a person's life. Values are developed over a lifetime and are shaped by events in our lives. So, the answer is true.", "answer": true, "groundtruth": false, "runtime": 6.696838855743408, "index": 954}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Yugoslavia failed to be a country.\nQ: Was this claim true or false?\nThought: Let's think step by step. Yugoslavia was a country that dissolved in 1991. So, the answer is true.", "answer": true, "groundtruth": false, "runtime": 6.480614900588989, "index": 955}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pearl (Steven Universe) is a fictional alien being.\nQ: Was this claim true or false?\nThought: Let's think step by step. Pearl is a character from the fictional cartoon Steven Universe. Steven Universe is about an alien boy and his friends. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.832060098648071, "index": 956}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: See.SZA.Run is a picture book.\nQ: Was this claim true or false?\nThought: Let's think step by step. See.SZA.Run is a children's picture book. Children are people under the age of 13. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.57516074180603, "index": 957}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Trouble with the Curve was only released in 2013.\nQ: Was this claim true or false?\nThought: Let's think step by step. Trouble with the Curve came out in 2013 and was based on a book written in 1958. The answer is false.", "answer": false, "groundtruth": false, "runtime": 6.233236074447632, "index": 958}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Mike Friedrich is a comic book writer.\nQ: Was this claim true or false?\nThought: Let's think step by step. Mike Friedrich is the writer ofkerchief and has worked on titles such as Uncanny X-Men and Fantastic Four. He is also the writer of licensed properties like Star Wars. Mike Friedrich is a comic book writer.", "answer": null, "groundtruth": true, "runtime": 7.552495718002319, "index": 959}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: For two hundred and nineteen years, The Times printed in broadsheet format.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Times has been published in tabloid format since September 2006. Before that it was published in broadsheet format. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.366227149963379, "index": 961}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Google Search shows no home information.\nQ: Was this claim true or false?\nThought: Let's think step by step. Google search engine is used to search for home information. When one searches on Google, results are displayed. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.25016188621521, "index": 960}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Arjit Singh is male.\nQ: Was this claim true or false?\nThought: Let's think step by step. Arjit Singh is a singer who won the first season of The Voice India Kids. The Voice India Kids was a reality show aired on Star Plus in India. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.407274961471558, "index": 962}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jed Whedon was born in December.\nQ: Was this claim true or false?\nThought: Let's think step by step. December birthdays are in the winter while June birthdays are in the summer. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.160397052764893, "index": 963}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ares is not an Olympian.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ares is a Greek god and is the son of Zeus. Zeus is the king of the Olympian gods. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.961652040481567, "index": 964}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Michael Hutchence has yet to die.\nQ: Was this claim true or false?\nThought: Let's think step by step. Michael Hutchence died in 1997. He would be 60 years old in 2017. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.648019075393677, "index": 965}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: L. Ron Hubbard passed away in 1986.\nQ: Was this claim true or false?\nThought: Let's think step by step. LRH died in 1986 but he published his last work in Scientology in 2015. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.951305866241455, "index": 966}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: There was a republic of the Soviet Union called the Latvian Soviet Socialist Republic.\nQ: Was this claim true or false?\nThought: Let's think step by step. Latvia was a republic of the Soviet Union from 1944 to 1991. The Latvian Soviet Socialist Republic was the official name of Latvia in the Soviet Union. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.447960138320923, "index": 968}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Suite Life of Zack & Cody was created by Danny Kallis.\nQ: Was this claim true or false?\nThought: Let's think step by step. Danny Kallis is an American television producer and writer. He is best known for creating the Disney XD sitcoms The Lodge and The Suite Life of Zack & Cody. The Suite Life of Zack & Cody was created by Danny Kallis. The answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.659170150756836, "index": 967}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ragtime was released in 1965.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ragtime was a movie released in 1965. The claim is true.", "answer": true, "groundtruth": false, "runtime": 6.794428825378418, "index": 969}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Anne Boleyn went back to England.\nQ: Was this claim true or false?\nThought: Let's think step by step. Anne Boleyn was beheaded May 19, 1536. Anne Boleyn lived until May 19, 1536. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.973240852355957, "index": 970}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Google Search can return monetary conversions.\nQ: Was this claim true or false?\nThought: Let's think step by step. Google Search is a search engine that provides paid links. Google Search does not provide direct monetary conversions. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.594192981719971, "index": 971}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The House of the Spirits is about the life of a young lady during the military dictatorship in Chile.\nQ: Was this claim true or false?\nThought: Let's think step by step. The House of the Spirits is about the life of a young lady during the Pinochet regime in Chile. Pinochet was a dictator in Chile from 1973 to 1990. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.771739721298218, "index": 972}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Goldie Hawn was in one movie with Chevy Chase.\nQ: Was this claim true or false?\nThought: Let's think step by step. Goldie Hawn has been in several movies with many actors. Chevy Chase has been in several movies with many actors. Final answer: yes.", "answer": null, "groundtruth": false, "runtime": 6.458801984786987, "index": 973}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Love Club EP is too short to qualify as an album.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Love Club EP has a total of six songs. Albums must have at least 10 songs. The answer: no.", "answer": null, "groundtruth": true, "runtime": 6.467587947845459, "index": 974}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Move (Little Mix song) was released on the radio in September of 2013.\nQ: Was this claim true or false?\nThought: Let's think step by step. The song was released on the radio on September 2013 but was actually released as a single in June 2017. So, the answer is false.", "answer": false, "groundtruth": true, "runtime": 6.3226659297943115, "index": 976}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A United Kingdom is unassociated with Amma Asante.\nQ: Was this claim true or false?\nThought: Let's think step by step. A United Kingdom is a country in Europe. Amma Asante is a Ghanaian actress. Ghana is in Africa. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.046576261520386, "index": 975}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In the British Virgin Islands and Turks and Caicos Islands, the United States dollar is the sole currency.\nQ: Was this claim true or false?\nThought: Let's think step by step. The British Virgin Islands and Turks and Caicos Islands are British Overseas Territories. The US dollar is the official currency of the United States. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.893383264541626, "index": 977}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ian Gillan is a dog.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ian Gillan is a human being not a dog. Dogs do not exist in real life. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.1098997592926025, "index": 978}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Qin dynasty dates back to 221 BC.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Qin Dynasty lasted for around 200 years. The Qin Dynasty began in 221 BC and ended in 207 BC. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.074290990829468, "index": 979}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Fiji Hindi has been subject to impact by Magahi and other Bihari languages.\nQ: Was this claim true or false?\nThought: Let's think step by step. Hindi is a language of India whereas Magahi and Bihari are languages spoken in Bihar state of India. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.5232391357421875, "index": 980}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A United Kingdom is a biographical romantic comedy film.\nQ: Was this claim true or false?\nThought: Let's think step by step. A United Kingdom is a romantic comedy about a British man and an African woman falling in love in the 1940s. The film was released in 2018. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.038451910018921, "index": 981}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pitch Perfect 2 is a recorded work.\nQ: Was this claim true or false?\nThought: Let's think step by step. Pitch Perfect 2 was made in 2015. A recorded work must be made in the present or past. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.550128936767578, "index": 982}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Norman Bates is a character.\nQ: Was this claim true or false?\nThought: Let's think step by step. Norman Bates is a character from the Psycho franchise. Psycho is a 1960 film. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.094754934310913, "index": 983}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dulquer Salmaan refused to ever become an actor.\nQ: Was this claim true or false?\nThought: Let's think step by step. Dulquer Salmaan is an actor in Mollywood and Tollywood. He has worked in over twenty films. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.1389100551605225, "index": 984}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Times Higher Education World University Rankings is a publication of rankings by The Chronicle of Higher Education.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Chronicle of Higher Education is one source used to make the Times Higher Education World University Rankings. . The answer: yes.", "answer": null, "groundtruth": false, "runtime": 6.415031909942627, "index": 985}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The SpongeBob SquarePants Movie is a dog.\nQ: Was this claim true or false?\nThought: Let's think step by step. SpongeBob SquarePants is a character from a popular animated television series. The SpongeBob SquarePants Movie is a 2002 American direct-to-video animated film based on the television series. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 7.30628514289856, "index": 986}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Chinatown was written by Robert Towne.\nQ: Was this claim true or false?\nThought: Let's think step by step. Robert Towne wrote Chinatown in the 1940s. Robert Towne died in 1994. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.424894094467163, "index": 988}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Daredevil is based on the Marvel Comics character of the same name.\nQ: Was this claim true or false?\nThought: Let's think step by step. Daredevil first appeared in Marvel comics in 1964. The Netflix series Daredevil first aired on November 20, 2015.\nThe answer: false.", "answer": false, "groundtruth": true, "runtime": 7.275898694992065, "index": 987}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Toy Story 2 was released in 2004.\nQ: Was this claim true or false?\nThought: Let's think step by step. Toy Story 2 came out in 1999. It was not released in 2004. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.794218063354492, "index": 989}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: FC Bayern Munich was founded by only one football player.\nQ: Was this claim true or false?\nThought: Let's think step by step. FC Bayern Munich is a German sports club based in Munich. FC Bayern Munich was founded by a group of Bavarian football players. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.9831929206848145, "index": 990}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: SpongeBob SquarePants is a movie.\nQ: Was this claim true or false?\nThought: Let's think step by step. SpongeBob SquarePants is a TV show. There are no movies with characters from TV shows. Final answer: no.", "answer": null, "groundtruth": false, "runtime": 6.864909648895264, "index": 991}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Call centers are part of Bank of America.\nQ: Was this claim true or false?\nThought: Let's think step by step. Call centers handle customer service for banks. Bank of America is a bank. Customer service representatives work in call centers.\nThe answer: yes.", "answer": null, "groundtruth": true, "runtime": 6.715253114700317, "index": 992}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In 1966, George Harrison got married for the first time.\nQ: Was this claim true or false?\nThought: Let's think step by step. George Harrison got married in 1966. His first wife was Olivia Harrison. Olivia Harrison died of cancer in 2001. So, the answer is true.", "answer": true, "groundtruth": true, "runtime": 6.5237507820129395, "index": 993}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Coughing up blood is not one symptom of pulmonary embolism.\nQ: Was this claim true or false?\nThought: Let's think step by step. Pulmonary embolism is a blood clot in the lungs. Coughing up blood is a symptom of a blood clot in the lungs. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.72928261756897, "index": 994}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Georgians arose from the ancient literary works.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Georgians are a nationality and the ancient literary works are in Georgian language. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.6964051723480225, "index": 995}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ayananka Bose is Canadian.\nQ: Was this claim true or false?\nThought: Let's think step by step. Ayananka Bose is an Indian Cricketer. Indians do not have a nationality, they have citizenship. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.359270095825195, "index": 996}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Mandy Moore is a Canadian film actress.\nQ: Was this claim true or false?\nThought: Let's think step by step. Mandy Moore is an American actress. Americans and Canadians are not the same nationality. The answer is no.", "answer": null, "groundtruth": false, "runtime": 6.34411096572876, "index": 997}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: House of Balloons is something other than a mixtape.\nQ: Was this claim true or false?\nThought: Let's think step by step. House of Balloons was a mixtape by Kanye West. Kanye West released The Life of Pablo in 2016. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.851773977279663, "index": 998}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jamie Lee Curtis only starred in Rob Zombie's Halloween.\nQ: Was this claim true or false?\nThought: Let's think step by step. Rob Zombie's Halloween is a 2007 film. Jamie Lee Curtis starred in Halloween in 1978. Jamie Lee Curtis starred in many other movies besides Halloween.\nThe answer: no.", "answer": null, "groundtruth": false, "runtime": 6.968834638595581, "index": 999}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Latvian Soviet Socialist Republic was a state of the Soviet Union.\nQ: Was this claim true or false?\nThought: Let's think step by step. Latvia was a country that existed from 1918 to 1991. The Soviet Union existed from 1922 until 1991. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.759732007980347, "index": 1000}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Deepika Padukone has appeared in more than three Indian movies.\nQ: Was this claim true or false?\nThought: Let's think step by step. Deepika Padukone is an Indian actress who has worked in more than twenty films. She has worked in more than three Indian movies. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.6812357902526855, "index": 1001}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The English Wikipedia is an edition of an expensive online encyclopedia.\nQ: Was this claim true or false?\nThought: Let's think step by step. The English Wikipedia is one of many projects of the Wikimedia Foundation. The Wikimedia Foundation is a non-profit organization that hosts Wikipedia and other free knowledge projects. Wikipedia is available to use online for free. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.740569114685059, "index": 1002}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Designated Survivor (TV series) is part of ABC.\nQ: Was this claim true or false?\nThought: Let's think step by step. Designated Survivor aired on ABC from November 2015 to April 2017. The series finale aired on ABC on April 24, 2017. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.518786668777466, "index": 1003}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Shane Black directed The Nice Guys.\nQ: Was this claim true or false?\nThought: Let's think step by step. Shane Black directed the movie The Nice Guys in 2016. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.100512981414795, "index": 1004}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Zac Efron only acts.\nQ: Was this claim true or false?\nThought: Let's think step by step. Zac Efron has starred in several major films. Zac Efron has been in more than 50 movies. Final answer: false.", "answer": false, "groundtruth": false, "runtime": 6.916053056716919, "index": 1005}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Some level of success is had by Scream.\nQ: Was this claim true or false?\nThought: Let's think step by step. Scream had moderate success at the box office. Scream had moderate success with critics. Scream had moderate success with audiences. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.830236911773682, "index": 1006}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Nobody took Hebe's job after her.\nQ: Was this claim true or false?\nThought: Let's think step by step. Nobody took Hebe's job is a claim made about her. Hebe was a character in the movie 300. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.048789024353027, "index": 1007}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Syco was established by Simon Cowell.\nQ: Was this claim true or false?\nThought: Let's think step by step. Simon Cowell is a British television personality. Syco is a record label. Records labels are not television shows.\nThe answer: no.", "answer": null, "groundtruth": true, "runtime": 6.7820799350738525, "index": 1008}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Pakistan Movement was only the result of enemy invasion.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Pakistan Movement refers to the movement for a separate country of Pakistan. Pakistan got independence from British Empire in 1947. Pakistan had been invaded and occupied by India in the past. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.719979763031006, "index": 1009}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: LinkedIn has been available in the Turkish language since July 2015.\nQ: Was this claim true or false?\nThought: Let's think step by step. Turkish is a language with many dialects. LinkedIn may have launched its Turkish platform in a different city than the one where it currently is available. So, the answer is it is not possible to tell.", "answer": null, "groundtruth": false, "runtime": 6.609186172485352, "index": 1010}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Spider-Man 2 was released in 2004.\nQ: Was this claim true or false?\nThought: Let's think step by step. Spider-Man 2 was released in 2004 but Spider-Man 2 was based on a 2002 film. So, the answer is no.", "answer": null, "groundtruth": true, "runtime": 6.36022686958313, "index": 1011}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kenny Chesney is American.\nQ: Was this claim true or false?\nThought: Let's think step by step. Kenny Chesney was born in Florida and his family is from America. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.750661849975586, "index": 1012}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Two and a Half Men featured Charlie Sheen.\nQ: Was this claim true or false?\nThought: Let's think step by step. Charlie Sheen played the role of Charlie Harper on Two and a Half Men from 2003-2014. The show ended in 2014. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.00998592376709, "index": 1013}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Caesar is an adaptation of Shakespeare's Julius Caesar.\nQ: Was this claim true or false?\nThought: Let's think step by step. Caesar is an adaptation of William Shakespeare's play Julius Caesar. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.5780041217803955, "index": 1014}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Augustus Prew's dad was incapable of taking photographs.\nQ: Was this claim true or false?\nThought: Let's think step by step. Augustus Prew's dad was a professional photographer. A professional photographer can take photographs. So, the answer is no.", "answer": null, "groundtruth": false, "runtime": 6.379786968231201, "index": 1015}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Species distribution can be understood through many factors except continental drift.\nQ: Was this claim true or false?\nThought: Let's think step by step. Continental drift is a theory of plate tectonics that explains the location and movement of Earth's continents. Species distribution can be understood through many factors except continental drift is a statement that species distribution can be understood through many factors except the movement of Earth's continents. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 7.738519191741943, "index": 1016}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Tennessee is in America.\nQ: Was this claim true or false?\nThought: Let's think step by step. Tennessee is in the United States of America. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 6.5053770542144775, "index": 1018}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Latvian Soviet Socialist Republic is known by at least one other name.\nQ: Was this claim true or false?\nThought: Let's think step by step. The Latvian Soviet Socialist Republic was a country that existed from 1944 to 1991. Latvia became independent from the Soviet Union in 1991. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 7.378957986831665, "index": 1017}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vedic Sanskrit is a language of ancient times.\nQ: Was this claim true or false?\nThought: Let's think step by step. Vedic Sanskrit is an ancient language that originated in India. India is a country in South Asia. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 5.559990167617798, "index": 1020}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Prague's historic center is not on UNESCO's list of World Heritage Sites.\nQ: Was this claim true or false?\nThought: Let's think step by step. Prague's historic center is a popular tourist destination. Prague's historic center is a popular tourist destination for many reasons. UNESCO's list of World Heritage Sites recognizes sites that are important to history and culture. So, the answer is yes.", "answer": null, "groundtruth": false, "runtime": 6.802891969680786, "index": 1019}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A thunderstorm is a type of weather.\nQ: Was this claim true or false?\nThought: Let's think step by step. Weather is a term used to describe different types of storms. Thunderstorms are one type of storm. So, the answer is yes.", "answer": null, "groundtruth": true, "runtime": 5.375473260879517, "index": 1022}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Carol Danvers is a fictional setting.\nQ: Was this claim true or false?\nThought: Let's think step by step. Carol Danvers is a fictional character that appears in comic books published by Marvel Comics. Carol Danvers first appeared in All-American Girl in 1941. Carol Danvers is a fictional setting.\nThe answer: true.", "answer": true, "groundtruth": false, "runtime": 6.382336139678955, "index": 1021}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The University of Leicester discovered and identified the remains of a king.\nQ: Was this claim true or false?\nThought: Let's think step by step. The University of Leicester announced on June 20, 2017 that they had identified human remains as those of King Richard III. Richard III died in battle in 1487.\nThe answer: true.", "answer": true, "groundtruth": true, "runtime": 5.557263135910034, "index": 1023}], "metric": 0.0654296875, "runtime": 1396.8861091136932}, "timestamp_before": 1738555004.6171808, "timestamp_after": 1738556401.566426, "score": 0.0654296875}, "winner_summary": {"model": "watsonx_text/ibm/granite-13b-instruct-v2", "prompt_pattern": "cot", "demonstrations": []}}