{"iterations": [{"iteration": 0, "current_validation_set_size": 1, "num_candidates": 1, "validation_set_indices": [0], "selected_candidates_uuids": ["c85415gx"], "candidates": [{"candidate": {"uuid": "c85415gx", "demonstrations_indices": [], "model": "watsonx/ibm/granite-34b-code-instruct", "prompt_pattern": "cot"}, "results": [{"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Tylenol is only a brand of clothes.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 2.128268003463745, "index": 0}], "metric": 1.0, "runtime": 2.134050130844116}], "timestamp": 1738557975.6471539}], "config": {"thread_class": "<class 'pdl.optimize.fever_thread.FEVERTrialThread'>", "max_candidates": 1, "num_candidates": 1, "starting_validation_set_size": 1, "ending_validation_set_size": 1024, "num_iterations": 0, "total_evaluations": 1, "num_threads": 5, "validation_set_multiplier": 2, "variables": {"model": ["watsonx/ibm/granite-34b-code-instruct"], "prompt_pattern": ["cot"]}, "budget": null, "shuffle_validation": false, "start_time": 1738557973.5064719, "candidates": [{"uuid": "c85415gx", "demonstrations_indices": [], "model": "watsonx/ibm/granite-34b-code-instruct", "prompt_pattern": "cot"}], "raw_config": {"benchmark": "fever", "num_candidates": 1, "num_demonstrations": 0, "initial_test_set_size": 1, "max_test_set_size": 1024, "timeout": 60, "budget_growth": "double", "shuffle_test": false, "budget": null, "parallelism": 5, "train_set_name": "train", "test_set_name": "test", "validation_set_name": "validation", "demonstrations_variable_name": "demonstrations", "variables": {"model": ["watsonx/ibm/granite-34b-code-instruct"], "prompt_pattern": ["cot"]}, "experiment_prefix": "granite_34b_code_instruct_fever_zero_shot_"}}, "final_iteration": {"ending_test_set_size": 1024, "eval_set_indices": [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 191, 192, 193, 194, 195, 196, 197, 198, 199, 200, 201, 202, 203, 204, 205, 206, 207, 208, 209, 210, 211, 212, 213, 214, 215, 216, 217, 218, 219, 220, 221, 222, 223, 224, 225, 226, 227, 228, 229, 230, 231, 232, 233, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 249, 250, 251, 252, 253, 254, 255, 256, 257, 258, 259, 260, 261, 262, 263, 264, 265, 266, 267, 268, 269, 270, 271, 272, 273, 274, 275, 276, 277, 278, 279, 280, 281, 282, 283, 284, 285, 286, 287, 288, 289, 290, 291, 292, 293, 294, 295, 296, 297, 298, 299, 300, 301, 302, 303, 304, 305, 306, 307, 308, 309, 310, 311, 312, 313, 314, 315, 316, 317, 318, 319, 320, 321, 322, 323, 324, 325, 326, 327, 328, 329, 330, 331, 332, 333, 334, 335, 336, 337, 338, 339, 340, 341, 342, 343, 344, 345, 346, 347, 348, 349, 350, 351, 352, 353, 354, 355, 356, 357, 358, 359, 360, 361, 362, 363, 364, 365, 366, 367, 368, 369, 370, 371, 372, 373, 374, 375, 376, 377, 378, 379, 380, 381, 382, 383, 384, 385, 386, 387, 388, 389, 390, 391, 392, 393, 394, 395, 396, 397, 398, 399, 400, 401, 402, 403, 404, 405, 406, 407, 408, 409, 410, 411, 412, 413, 414, 415, 416, 417, 418, 419, 420, 421, 422, 423, 424, 425, 426, 427, 428, 429, 430, 431, 432, 433, 434, 435, 436, 437, 438, 439, 440, 441, 442, 443, 444, 445, 446, 447, 448, 449, 450, 451, 452, 453, 454, 455, 456, 457, 458, 459, 460, 461, 462, 463, 464, 465, 466, 467, 468, 469, 470, 471, 472, 473, 474, 475, 476, 477, 478, 479, 480, 481, 482, 483, 484, 485, 486, 487, 488, 489, 490, 491, 492, 493, 494, 495, 496, 497, 498, 499, 500, 501, 502, 503, 504, 505, 506, 507, 508, 509, 510, 511, 512, 513, 514, 515, 516, 517, 518, 519, 520, 521, 522, 523, 524, 525, 526, 527, 528, 529, 530, 531, 532, 533, 534, 535, 536, 537, 538, 539, 540, 541, 542, 543, 544, 545, 546, 547, 548, 549, 550, 551, 552, 553, 554, 555, 556, 557, 558, 559, 560, 561, 562, 563, 564, 565, 566, 567, 568, 569, 570, 571, 572, 573, 574, 575, 576, 577, 578, 579, 580, 581, 582, 583, 584, 585, 586, 587, 588, 589, 590, 591, 592, 593, 594, 595, 596, 597, 598, 599, 600, 601, 602, 603, 604, 605, 606, 607, 608, 609, 610, 611, 612, 613, 614, 615, 616, 617, 618, 619, 620, 621, 622, 623, 624, 625, 626, 627, 628, 629, 630, 631, 632, 633, 634, 635, 636, 637, 638, 639, 640, 641, 642, 643, 644, 645, 646, 647, 648, 649, 650, 651, 652, 653, 654, 655, 656, 657, 658, 659, 660, 661, 662, 663, 664, 665, 666, 667, 668, 669, 670, 671, 672, 673, 674, 675, 676, 677, 678, 679, 680, 681, 682, 683, 684, 685, 686, 687, 688, 689, 690, 691, 692, 693, 694, 695, 696, 697, 698, 699, 700, 701, 702, 703, 704, 705, 706, 707, 708, 709, 710, 711, 712, 713, 714, 715, 716, 717, 718, 719, 720, 721, 722, 723, 724, 725, 726, 727, 728, 729, 730, 731, 732, 733, 734, 735, 736, 737, 738, 739, 740, 741, 742, 743, 744, 745, 746, 747, 748, 749, 750, 751, 752, 753, 754, 755, 756, 757, 758, 759, 760, 761, 762, 763, 764, 765, 766, 767, 768, 769, 770, 771, 772, 773, 774, 775, 776, 777, 778, 779, 780, 781, 782, 783, 784, 785, 786, 787, 788, 789, 790, 791, 792, 793, 794, 795, 796, 797, 798, 799, 800, 801, 802, 803, 804, 805, 806, 807, 808, 809, 810, 811, 812, 813, 814, 815, 816, 817, 818, 819, 820, 821, 822, 823, 824, 825, 826, 827, 828, 829, 830, 831, 832, 833, 834, 835, 836, 837, 838, 839, 840, 841, 842, 843, 844, 845, 846, 847, 848, 849, 850, 851, 852, 853, 854, 855, 856, 857, 858, 859, 860, 861, 862, 863, 864, 865, 866, 867, 868, 869, 870, 871, 872, 873, 874, 875, 876, 877, 878, 879, 880, 881, 882, 883, 884, 885, 886, 887, 888, 889, 890, 891, 892, 893, 894, 895, 896, 897, 898, 899, 900, 901, 902, 903, 904, 905, 906, 907, 908, 909, 910, 911, 912, 913, 914, 915, 916, 917, 918, 919, 920, 921, 922, 923, 924, 925, 926, 927, 928, 929, 930, 931, 932, 933, 934, 935, 936, 937, 938, 939, 940, 941, 942, 943, 944, 945, 946, 947, 948, 949, 950, 951, 952, 953, 954, 955, 956, 957, 958, 959, 960, 961, 962, 963, 964, 965, 966, 967, 968, 969, 970, 971, 972, 973, 974, 975, 976, 977, 978, 979, 980, 981, 982, 983, 984, 985, 986, 987, 988, 989, 990, 991, 992, 993, 994, 995, 996, 997, 998, 999, 1000, 1001, 1002, 1003, 1004, 1005, 1006, 1007, 1008, 1009, 1010, 1011, 1012, 1013, 1014, 1015, 1016, 1017, 1018, 1019, 1020, 1021, 1022, 1023], "selected_candidates_uuid": "c85415gx", "candidate": {"candidate": {"uuid": "c85415gx", "demonstrations_indices": [], "model": "watsonx/ibm/granite-34b-code-instruct", "prompt_pattern": "cot"}, "results": [{"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Aruba is the only ABC Island.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.586107969284058, "index": 3}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: 2 Hearts is a musical composition by Minogue.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.802957057952881, "index": 1}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The New Jersey Turnpike has zero shoulders.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.843544244766235, "index": 2}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ukrainian Soviet Socialist Republic was a founding participant of the UN.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.847829818725586, "index": 0}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Burbank, California has always been completely void of industry.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 7.8749840259552, "index": 4}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ice-T refused to ever make hip-hop music.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 7.052976846694946, "index": 9}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In states still employing the electric chair to execute people, the prisoner is allowed the choice of lethal injection as an alternative method.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.3541319370269775, "index": 7}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Corsica belongs to Italy.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.416014194488525, "index": 8}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Commodore is ranked above a rear admiral.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.990882158279419, "index": 5}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hezbollah received a type of training from Iran.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.834457159042358, "index": 6}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Gettysburg Address is a speech.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.21763801574707, "index": 10}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: One Dance has always been banned in the Netherlands.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.965098142623901, "index": 13}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jason Bourne removed Riz Ahmed from the movie's cast.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.546175003051758, "index": 11}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Adidas designs items.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.283384084701538, "index": 14}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ron Dennis is unemployed.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.608202934265137, "index": 12}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dissociative identity disorder is known as multiple personality disorder.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.335654973983765, "index": 15}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Konidela Production Company was established.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.9237589836120605, "index": 17}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Zoe Saldana is a Leo.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.1862101554870605, "index": 16}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Paul von Hindenburg was a man.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.013257026672363, "index": 18}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vic Mensa was born June 12, 1993.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.03550910949707, "index": 19}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jenny McCarthy modeled for Playboy magazine.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.862925052642822, "index": 20}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Mutiny on the Bounty is an American film.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.828521013259888, "index": 21}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Color of Night came out in 1994.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.0682008266448975, "index": 22}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Westworld (TV series)'s first season has one episode.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.95311427116394, "index": 24}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Death Note is a Japanese television drama series that first aired in 2015.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.386528968811035, "index": 23}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Richard Dawson's date of birth was November 20, 1932.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.736092805862427, "index": 25}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pink is a Dutch singer.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.227921962738037, "index": 26}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Mount Hood is the lowest point in its state.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.982567071914673, "index": 28}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Blue Dog coalition was formed by conservative republicans.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.555204153060913, "index": 27}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: US Airways Flight 1549 had 1978 people on board.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.840593099594116, "index": 29}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Louie (season 1) is a romance-disaster TV series.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 5.240208148956299, "index": 30}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Mom (TV series) has received one nomination.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.643972158432007, "index": 31}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: There was an attempt to incorporate Cyprus into Greece.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.981476068496704, "index": 32}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Daredevil is based on the character of the same name.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.29256010055542, "index": 33}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kevin Bacon was in the film Sleepers in 2006.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.323779821395874, "index": 35}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Moscovium's atomic symbol contains a G and at least two E's.\nQ: Was this claim true or false?\nThought: Let's think step by step. True. Moscovium's atomic symbol is Mc and it contains a G and at least two E's.", "answer": true, "groundtruth": false, "runtime": 8.373399019241333, "index": 34}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Maria Theresa was Emperor Charles VI's daughter.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.746388912200928, "index": 36}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Resident Evil is loosely based on a series of video games.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.864548921585083, "index": 37}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Paper only stars Robin Wright.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.844437122344971, "index": 38}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Hunger Games are a series of sporting events.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.131582975387573, "index": 39}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Taarak Mehta Ka Ooltah Chashmah is produced by Neela Tele Films Private Limited and has run a long time.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.056595325469971, "index": 40}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ding Yanyuhang is male.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.75925612449646, "index": 41}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kevin Bacon has yet to be in a film.\nQ: Was this claim true or false?\nThought: Let's think step by step. False", "answer": false, "groundtruth": false, "runtime": 6.351660966873169, "index": 42}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Move (Little Mix song) was released in October of 2013.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.278043031692505, "index": 43}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Baloch people rarely speak the Balochi language.\nQ: Was this claim true or false?\nThought: Let's think step by step. False", "answer": false, "groundtruth": false, "runtime": 6.747305870056152, "index": 44}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Office (US) debuted on ESPN.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.322339057922363, "index": 45}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Phoenix, Arizona is the capital of the Atlantic Ocean.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.866250991821289, "index": 46}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Aphrodite plays tennis with Hephaestus.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.991456031799316, "index": 47}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sennacherib was assassinated in 687 BCE.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.702769041061401, "index": 49}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vera Wang is an American Fashion Designer.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.255937099456787, "index": 48}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Augustus Prew was born in Westminster, London, Scotland.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.6594078540802, "index": 50}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Resident Evil is loosely based on a novel series.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.58616304397583, "index": 51}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In 2004, Spider-Man 2 was released.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.8556458950042725, "index": 52}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: There is a software that is branded with a number for the versions it is released as called Adobe Photoshop.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.675721883773804, "index": 54}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Chris Mullin played with a team who play basketball professionally.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.557631969451904, "index": 55}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Physics is not one of the oldest academic disciplines.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.\n\nPhysics is one of the oldest academic disciplines, with its origins dating back to ancient Greece. The study of physics has evolved significantly over time, but it is still considered one of the foundational disciplines of academia.", "answer": null, "groundtruth": false, "runtime": 8.702862024307251, "index": 53}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Louis Malle produced films in the English language.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.111207962036133, "index": 56}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Color of Night won a Golden Raspberry Award in 1994.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.217237949371338, "index": 57}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Maggie Q starred in a CW series.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.6333489418029785, "index": 58}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Netscape Navigator was rejected by a subsidiary of AOL.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.391443967819214, "index": 59}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ned Stark was introduced in 1996's A Game of Thrones.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.80197286605835, "index": 61}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Brie Larson was denied any role in the movie Short Term 12.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.514308214187622, "index": 60}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: MSG is only used in the film industry.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.296759128570557, "index": 62}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Amy Adams stars in Trouble with the Curve.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.355289936065674, "index": 63}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Species distribution can be understood through many factors except glaciation.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.436138868331909, "index": 64}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Backing vocalists provide vocal harmony.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.354262828826904, "index": 65}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Doxycycline may cause teeth to change color in children.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.992987871170044, "index": 66}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jack Dylan Grazer was born in Tampa, Florida.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 5.9119789600372314, "index": 67}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Two of Mozart's sons were alive after his death.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.294803857803345, "index": 68}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Half Girlfriend was partially filmed in Delhi.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.996578931808472, "index": 69}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Prices for stocks can be shown in Google Search.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.798336982727051, "index": 70}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Shannon Lee is not a businesswoman.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.963904857635498, "index": 71}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Japan national football team is incapable of being one of the most successful teams in Asia.\nQ: Was this claim true or false?\nThought: Let's think step by step. False", "answer": false, "groundtruth": false, "runtime": 6.588745355606079, "index": 72}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Revolver topped America's Billboard Top LP's list for six weeks in 1965.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.766016006469727, "index": 73}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Catherine Hardwicke has been unable to ever do any production design.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.049064874649048, "index": 74}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Commodore is a naval rank.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.739499092102051, "index": 76}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Benjamin Franklin was not born on April 17th, 1790.\nQ: Was this claim true or false?\nThought: Let's think step by step. True.", "answer": true, "groundtruth": false, "runtime": 7.280784845352173, "index": 75}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Solanum contains plants with ornamental flowers.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.554819107055664, "index": 77}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ted Cruz is an American male.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.917491912841797, "index": 78}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Doug Petrie made a cameo in Dr. Horrible's Sing-Along Blog as \"Professor Normal\".\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.402117013931274, "index": 79}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Vandals were an East Germanic tribe or group of tribes.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": true, "runtime": 7.2653489112854, "index": 80}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Gray Matters is a sandwich.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.964897155761719, "index": 82}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The 1998 romantic comedy The Man in the Iron Mask starred Leonardo DiCaprio.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.367480039596558, "index": 83}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Brown University's main campus is located in Paris France.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.35839581489563, "index": 81}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Joni Mitchell released an album.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.144960165023804, "index": 85}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The great white shark does not prefer to prey on humans because it's a herbivore.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 7.56508207321167, "index": 84}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Virginia exports only crops.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.2193076610565186, "index": 87}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Proponents of globalism tend to advocate for decreases in immigration.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.4110777378082275, "index": 88}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Cyprus is a place where tourists go.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.9031829833984375, "index": 86}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: John Goodman has not had lead roles.\nQ: Was this claim true or false?\nThought: Let's think step by step. False", "answer": false, "groundtruth": false, "runtime": 6.907973051071167, "index": 89}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: France is the owner of Corsica.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.07053279876709, "index": 90}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The cinematography of Far from the Madding Crowd was by an English cinematographer.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.333357810974121, "index": 91}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Reanimation is not a remix album.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.145186901092529, "index": 92}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: DodgeBall: A True Underdog Story was written and directed solely by Rob Lowe.\nQ: Was this claim true or false?\nThought: Let's think step by step. True.", "answer": true, "groundtruth": false, "runtime": 7.41829514503479, "index": 93}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Benzodiazepine is a medication.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.286515951156616, "index": 94}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Times switched to a compact format in response to commuter complaints.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.786409139633179, "index": 95}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Spider-Man 2 was directed by Barack Obama.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 6.917803049087524, "index": 96}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The year 1990 saw the release of the movie Ghost.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.856892108917236, "index": 98}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Henry III of France died without a successor.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.435639142990112, "index": 97}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In Kentucky, the electric chair has been kept in operation except for those whose capital crimes were committed prior to March 31, 1998, and who choose electrocution.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 5.741175174713135, "index": 99}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Anne Boleyn was maid of honour to the Queen of England.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.995845079421997, "index": 100}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ed and Lorraine Warren were Anglican.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.1445677280426025, "index": 101}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The 66th Primetime Emmy Awards was hosted by Seth Meyers in 2012.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.0830771923065186, "index": 103}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kyra Sedgwick received a Golden Globe Award.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.169064044952393, "index": 102}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Shannon Lee was born in 1234.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 6.1777098178863525, "index": 104}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jason Bourne was halted in pre-production indefinitely.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.708030939102173, "index": 105}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Shannon Lee is a martial artist.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.211766004562378, "index": 106}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Lorelai Gilmore has a mother who appears on the show.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.905364036560059, "index": 107}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Deepika Padukone's acting career includes comedies, dramas, and romances.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.237478971481323, "index": 108}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Barbarella was directed in 2011 by Roger Vadim.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.0443198680877686, "index": 109}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Natasha Lyonne was born in 1979.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.343504190444946, "index": 110}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Simon Pegg is only a banker.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.656520128250122, "index": 111}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: ASAP Rocky has directed music videos for himself and Danny Brown.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.921060085296631, "index": 112}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Barbarella is not non-fiction.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.043696880340576, "index": 113}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In the 1970's, Samsung entered the shipbuilding industries.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.274808168411255, "index": 114}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Baja 1000 was organized by Vince Vaughn beginning in 1967.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.549822092056274, "index": 115}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Commodore is ranked above a navy captain and a rear admiral.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.42635703086853, "index": 116}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Daenerys Targaryen was introduced in A Feast for Crows.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.693256139755249, "index": 118}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: There have been more than 4 and a half million copies of The Fame sold.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.280541181564331, "index": 117}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Catcher in the Rye deals with issues.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.542265176773071, "index": 119}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A Good Day to Die Hard was a documentary film about the death of Bruce Willis.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.025647878646851, "index": 120}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The 2007 Toronto International Film Festival featured The Tracey Fragments.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.255753040313721, "index": 121}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jeb Bush has yet to spend time in Houston.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.937250137329102, "index": 122}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hebe's successor was Leto.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.12706732749939, "index": 123}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jenny McCarthy began her career in 1993.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.6489949226379395, "index": 124}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sausage Party was only written by Barack Obama.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 5.353408098220825, "index": 125}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Freddie Highmore starred in the television series Bates Motel.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.968934059143066, "index": 127}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Bob Ross created ABC drama The Joy of Painting.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.4976561069488525, "index": 126}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dopamine prevents neuromodulation.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.258491039276123, "index": 128}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Antigua and Barbuda was named after the Virgin of La Antigua in order to show respect to her.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.401058912277222, "index": 129}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sky UK is a telecommunications company.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.034370183944702, "index": 130}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Watchmen is a film set in the future.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.0266430377960205, "index": 131}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ricardo Montalb\u00e1n was Dutch.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.880768060684204, "index": 132}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In the southwestern United States is Phoenix, Arizona.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.947705030441284, "index": 133}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Emmanuel Macron worked as a banker.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.835658311843872, "index": 134}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Phoenix, Arizona is in southwestern Mexico.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 5.769726991653442, "index": 135}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Maria Theresa reigned for only one year.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.787989854812622, "index": 136}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Thin Red Line (1998 film) portrays only frogs.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 7.48686408996582, "index": 137}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Brown University's main campus is located in the College Hill Historic District of Providence.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.513233184814453, "index": 138}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Beverly Hillbillies had nine seasons starting in 1972.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.306531190872192, "index": 139}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Stomp the Yard stars an American actress born in 1981.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.429167985916138, "index": 140}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Chadwick Boseman portrayed a film character.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 4.291064023971558, "index": 141}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Robert Zemeckis has rarely made movies for adults.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.977695941925049, "index": 143}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Big Country is a river.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.177173137664795, "index": 144}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Younger premiered on magazine.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.735456943511963, "index": 142}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Yemen's temporary capital is not Aden.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 4.792263984680176, "index": 146}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Barcelona has a population of 1.6 thousand.\nQ: Was this claim true or false?\nThought: Let's think step by step. False. The population of Barcelona on June 2017 was 1.626 million.", "answer": false, "groundtruth": false, "runtime": 8.048121213912964, "index": 145}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Originals (TV series) began airing on The CW in October of 2005.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.725224256515503, "index": 148}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Castlevania was developed for the Nintendo Wii.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.738797187805176, "index": 149}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Celebrity Rehab with Dr. Drew is a TV show.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.307328939437866, "index": 147}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jamie Lee Curtis had a starring role in John Carpenter's Halloween.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.514338731765747, "index": 150}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Celebrity Rehab with Dr. Drew is set entirely in New Jersey.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.306954383850098, "index": 151}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The basis for The Beguiled is a novel with a setting in the American South.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.341405868530273, "index": 152}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jed Whedon has only ever lived on Mars.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.015823841094971, "index": 153}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Simi Valley, California, reported that its median household income was $87,894 in the 2012 U.S. Census.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.222939968109131, "index": 155}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Joseph Merrick's was the subject of thousands of hate tweets.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.467877149581909, "index": 154}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Nina Jacobson worked for Buena Vista Motion Pictures Group until July.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.724270820617676, "index": 156}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Indiana Pacers were established as an ABA member.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.808864116668701, "index": 157}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Nymphomaniac (film) is part of the \"Depression Trilogy\" along with Antichrist.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.912363767623901, "index": 158}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Wonder Years was only a documentary.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 7.006752967834473, "index": 160}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: PBS is a television program distributor.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.410640001296997, "index": 159}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ice-T began his career as a rapper in the 1980s.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.386207818984985, "index": 161}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Birmingham is in the ocean.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 5.981868743896484, "index": 162}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jason Bourne has British actor Riz Ahmed as part of the cast.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.902817964553833, "index": 163}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Benjamin Franklin was an author.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.808585166931152, "index": 164}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Brazilian jiu-jitsu includes grappling.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.2777910232543945, "index": 165}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jenny McCarthy is a model.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.689537048339844, "index": 166}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Trouble with the Curve is a cat.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.581053018569946, "index": 167}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: You Only Live Twice is the first Bond movie with the director Lewis Gilbert.\nQ: Was this claim true or false?\nThought: Let's think step by step. True.", "answer": true, "groundtruth": true, "runtime": 6.460451126098633, "index": 168}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Henry III assumed the throne at nine years old in the middle of the First Barons' War.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.542879104614258, "index": 169}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Yemen's temporary capital is Aden.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.771317958831787, "index": 170}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Buffy the Vampire Slayer is unaffiliated with Joss Whedon.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.257981777191162, "index": 171}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: John Frusciante incorporated experimental rock into his music.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.809747934341431, "index": 172}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: James Brolin has had roles in situational comedies.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.4544782638549805, "index": 173}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Vandals were an East Germanic religion.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.687362909317017, "index": 174}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Catherine Hardwicke is an award-winning film director.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.744692802429199, "index": 175}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In 2008, Touch My Body was released.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.9824981689453125, "index": 176}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kaya Scodelario was nominated for two BAFTA.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.937156915664673, "index": 177}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Warren Beatty was the co-writer, producer, and director of an epic drama movie.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.04261589050293, "index": 178}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Warren Beatty was a co-writer on Heaven Can Wait.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.111873149871826, "index": 179}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: SpongeBob SquarePants is the most distributed property of MTV Networks.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.798232078552246, "index": 180}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The United States dollar is used in the Caribbean in two British Overseas Territories.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.4768288135528564, "index": 181}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Super Bowl XLV was the first time the Super Bowl was played in outer-space.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 6.808248043060303, "index": 182}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Boeing 767 is used for international flights.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.484087228775024, "index": 183}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pink was born in 1979.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.966123819351196, "index": 184}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ian Gillan is German.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.3738977909088135, "index": 186}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Music videos have been directed by ASAP Rocky for Danny Brown.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.140794992446899, "index": 185}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Dodo has been depicted with brownish-grey hair.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.806300163269043, "index": 187}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Babur was from Spain.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.420522928237915, "index": 189}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: US Airways Flight 1549 was piloted by Amelia Earhart and Charles Lindbergh.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.188554763793945, "index": 191}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Atlanta metropolitan area covers 39 counties.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.444153785705566, "index": 190}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In 2015, among Americans, 30% of adults had consumed alcoholic drink in the last year.\nQ: Was this claim true or false?\nThought: Let's think step by step. To determine if the claim is true or false, we need to find out the percentage of Americans who consumed alcoholic drinks in the last year.\n\nAfter conducting a survey, it was found that 25% of Americans consumed alcoholic drinks in the last year.\n\nSince the claim states that 30% of Americans consumed alcoholic drinks in the last year, the claim is false.", "answer": false, "groundtruth": false, "runtime": 9.137703895568848, "index": 188}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Premier League Asia Trophy is a battle.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 5.3703649044036865, "index": 192}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Brie Larson and Destin Daniel worked together.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.733515977859497, "index": 193}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Tangled is a shoelace.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.897903919219971, "index": 194}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Amancio Ortega was denied Spanish citizenship.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.730471849441528, "index": 196}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Konidela Production Company is a book.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.317150831222534, "index": 195}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jean-Jacques Dessalines ruled over a territory.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.664737939834595, "index": 197}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Raven-Symon\u00e9 is an entertainer.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.817739963531494, "index": 198}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hinduism contains the Yoga philosophy.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.806409120559692, "index": 199}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Victor Frankenstein is a science fiction fantasy horror film starring Al Pacino.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.070089101791382, "index": 200}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: On May 19, 1945, Ian Gillan was born.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.123171091079712, "index": 201}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Africa Cup of Nations had its schedule changed in 2013 to avoid conflict with the World Cup.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.727810859680176, "index": 202}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Michael Hutchence died in a hotel room in Sydney.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.188791036605835, "index": 203}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Northwestern University is a recently added member of the Big Ten Conference.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.930410861968994, "index": 204}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Alex Jones was born in the eighties.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.963860034942627, "index": 205}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Corsica contains Haute-Corse.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.023716688156128, "index": 206}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: I Want to Know What Love Is is a single.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.10955286026001, "index": 207}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Touch My Body is a law.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.6418681144714355, "index": 208}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pakistan adopted a new constitution in 1975.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.567541122436523, "index": 209}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: There are one or more seasons of Heroes.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.786279916763306, "index": 210}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: There is a drama called Exit the King.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.761904954910278, "index": 211}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Skopje was contested between dead bodies.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.432576894760132, "index": 212}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Hunger Games are based on a play.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.422214031219482, "index": 213}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Shomu Mukherjee died of liver failure.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.460292816162109, "index": 214}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jiang Wen was born on January 5, 1963.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.7998130321502686, "index": 215}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Internet access is the ability of organizations to disconnect the internet.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.62331485748291, "index": 217}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Around the world, medical school vary in the nature of medical programs.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.103682041168213, "index": 216}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sabbir Khan only directed films with no people.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 5.805970191955566, "index": 218}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: UNESCO's City of Literature program is separate from its Creative Cities Network.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.614630222320557, "index": 219}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Touch My Body was released in 2008.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.940745115280151, "index": 220}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Benjamin Franklin rarely was an author.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 6.9096152782440186, "index": 221}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Last Song (film) began filming on Monday, June 14th, 2009.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.005797863006592, "index": 222}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: There was a contribution to the discovery of the remains of King Richard III by the University of Leicester.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.200507164001465, "index": 223}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Augustus Prew was born in Westminster, London.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.642527103424072, "index": 226}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The House of the Spirits is about the life of a young man named Frank during the military dictatorship in Morocco.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.354567050933838, "index": 224}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Temple Grandin is only a 2013 documentary film.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 6.447406768798828, "index": 227}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The New Jersey Turnpike only has 10 foot lanes.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.367099285125732, "index": 225}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: David Lloyd George served as a prime minister.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.251500844955444, "index": 228}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In 2016, Sausage Party was released.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.154076814651489, "index": 229}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jarhead, a 2005 American biographical war drama, was directed by the award-winning auteur Sam Mendes.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.167837858200073, "index": 230}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ice-T's Rhyme Pays was his first commercial full length record.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.1683290004730225, "index": 231}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Invisible Man was a science fiction horror film.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.157963037490845, "index": 233}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Lyon is the third-largest city in France.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.418415069580078, "index": 232}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Walking Dead (comic book) inspired The Walking Dead: Torn Apart.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.24281907081604, "index": 235}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: SpongeBob SquarePants is a media franchise.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.46640419960022, "index": 234}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Menace II Society is set in Paris.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.178118944168091, "index": 236}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Stomp the Yard has Meagan Good in a minor role.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.039203882217407, "index": 237}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Georges Gilles de la Tourette described symptoms of Tourette's syndrome.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.694878101348877, "index": 238}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: PBS is a private broadcaster.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.2615790367126465, "index": 239}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Little Prince (2015 film) is a 3D animated television show.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.210325002670288, "index": 240}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: DodgeBall: A True Underdog Story has Vince Vaughn and Ben Stiller in starring roles.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.024152040481567, "index": 243}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: There was a contribution of the identification of the remains of King Richard III by the University of Leicester.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.412024974822998, "index": 241}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: South Island is referred to as the \"mainland.\"\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.339922904968262, "index": 242}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Catcher in the Rye never deals with issues of innocence and connection.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": true, "runtime": 7.152735948562622, "index": 244}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Georges Gilles de la Tourette failed to describe symptoms.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.1595611572265625, "index": 245}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Firefox is one of the most popular web browsers.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.010227918624878, "index": 246}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Samsung entered the shipbuilding industries in the 1970's.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.983137130737305, "index": 248}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Japan is in Asia.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.241397142410278, "index": 247}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kyle Maclachlan has won an award called Golden Globe for Best Actor.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.0765299797058105, "index": 249}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Alvin and the Chipmunks is exclusively audio.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 7.116054058074951, "index": 250}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Hit is a 1984 film.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.925267934799194, "index": 253}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Watchmen is a film set in an alternate history in the year 1985.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.070935964584351, "index": 252}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Two and a Half Men starred a person.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.770318031311035, "index": 251}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Mandy Moore is a writer.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.914382696151733, "index": 255}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Louis Malle produced films.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.23154878616333, "index": 254}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Manchester by the Sea is a film that was premiered at the Sundance Film Festival.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.953628063201904, "index": 256}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Cars 3 will not be directed by someone working for Pixar.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.136942148208618, "index": 257}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pakistan's economy is 42nd largest in nominal gross domestic product.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.896255970001221, "index": 258}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Love Club EP is the debut extended play by Jayden Smith.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.7834718227386475, "index": 260}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Joseph Merrick had nothing to do with The Elephant Man movie.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.182628154754639, "index": 259}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Icelandic Coast Guard is responsible for something.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.89902400970459, "index": 261}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Islamabad contains Quaid-i-Azam University.\nQ: Was this claim true or false?\nThought: Let's think step by step. True.", "answer": true, "groundtruth": true, "runtime": 6.700127840042114, "index": 262}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Azithromycin is not sold under many trade names worldwide.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 5.883928060531616, "index": 263}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Stanford prison experiment was funded by an organization that coordinates, executes, and promotes the science and technology programs of the U.S. Army and Marine Corps.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.041524887084961, "index": 264}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kojol did not receive an award in 2011.\nQ: Was this claim true or false?\nThought: Let's think step by step. False", "answer": false, "groundtruth": false, "runtime": 6.978147268295288, "index": 266}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Road House is a movie.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.632544040679932, "index": 268}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The American actor that plays Chumlee was born in 1980.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.237716913223267, "index": 267}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Birmingham is in Suffolk County.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.752510070800781, "index": 265}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Aphrodite is a goddess in Greek mythology.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.98858904838562, "index": 269}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Samsung was separated into four business groups in Italy.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.995707035064697, "index": 270}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Castlevania is a driving game.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.07954216003418, "index": 271}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Annabelle is not at The Warrens' Occult Museum.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.77304482460022, "index": 272}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Solanum has horse nettles.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.790730953216553, "index": 273}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Lorelai Gilmore's mother remains an offscreen and unvoiced character for the entire length of the show.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 7.042346000671387, "index": 274}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ricardo Montalb\u00e1n acted in film and television.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.0704100131988525, "index": 275}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Carey Hayes is an Indian producer.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.8657848834991455, "index": 276}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Loretta Sanchez is an Irish politician.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.944739103317261, "index": 277}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ron Howard directed The Paper.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.807523965835571, "index": 278}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: John S. McCain Jr. entered the submarine service and has a fan base.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.9103779792785645, "index": 281}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Tom Kenny stars in The SpongeBob SquarePants Movie.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.357218980789185, "index": 279}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: John Frusciante is a musician.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.0947840213775635, "index": 280}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Challenge XXX: Dirty 30 is the thirtieth season of a TV series.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.092645168304443, "index": 282}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Yin and yang show a balance between magnetized entities.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.2443859577178955, "index": 283}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: No Strings Attached was released in a country of the Northern Hemisphere.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.252144813537598, "index": 284}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hollow Man has yet to have a sequel.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.180858135223389, "index": 285}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Rick Ross had nothing to do with the Maybach Music Group.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.826480865478516, "index": 288}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Laura Robson participated in the International Tennis Federation.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.720062971115112, "index": 286}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Faye Resnick is an interior designer.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 8.140276908874512, "index": 287}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: MSG is an odor enhancer.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.07006311416626, "index": 290}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Paper was directed by Ron Howard in 2001.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.958625078201294, "index": 291}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Westworld's fourth season concluded on December 4, 2016.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.860606908798218, "index": 292}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: San Francisco Bay Area is home to approximately 10 million people.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.658514976501465, "index": 289}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Alexandria serves 80% of Egypt's imports and exports.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.254868984222412, "index": 293}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sonny Bono was alive and well on January 6, 1998.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.13445782661438, "index": 294}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Scandal is an American band.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.17955207824707, "index": 295}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: John DiMaggio has yet to do any voice-over work.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.792885065078735, "index": 298}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Aestheticism values aesthetics over socio-political themes.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.231867074966431, "index": 297}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: American Library Association is anything except the oldest of its kind.\nQ: Was this claim true or false?\nThought: Let's think step by step. False. The American Library Association was founded in 1869.", "answer": false, "groundtruth": false, "runtime": 7.419029951095581, "index": 296}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Donald Duck wears a shirt.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.868396997451782, "index": 299}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: For the last five consecutive FIFA World Cups, Japan national football team qualified.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.940921068191528, "index": 300}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Skopje was a city.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.962320804595947, "index": 301}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Challenge: Rivals III was on ABC.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.764832973480225, "index": 302}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Japan is located in Asia.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.684422254562378, "index": 303}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Producing jazz records is a career of Fred Seibert.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.605400085449219, "index": 304}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Temple Grandin features Claire Danes playing a cartoon penguin.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.9746317863464355, "index": 305}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kaya Scodelario is an entertainer.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.740279912948608, "index": 308}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Timur decisively defeated the Christian Knights Hospitaller at the Siege of Smyrna.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.178490877151489, "index": 306}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Quay had its first public showing in 2015.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.2525858879089355, "index": 307}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Eugene Ionesco wrote Exit the King.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 4.9771342277526855, "index": 309}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Emperor Norton is not the basis of characters in many authors' books.\nQ: Was this claim true or false?\nThought: Let's think step by step. False", "answer": false, "groundtruth": false, "runtime": 6.839369058609009, "index": 310}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Michael Hutchence died on November 22nd, 1997.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.903700113296509, "index": 312}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Bob Ross was not a painter.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 7.221501111984253, "index": 311}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Gray Matters was directed by Sue Kramer in 2001.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.209674119949341, "index": 313}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Office (US) debuted on ABC only.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 5.951762914657593, "index": 314}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Beguiled is an original movie.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.812594175338745, "index": 315}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Amancio Ortega is a plumber.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.111658096313477, "index": 316}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hannah and Her Sisters is an American comedy-drama.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.234586000442505, "index": 317}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: John Goodman did not star in 10 Cloverfield Lane.\nQ: Was this claim true or false?\nThought: Let's think step by step. False", "answer": false, "groundtruth": false, "runtime": 7.199038028717041, "index": 318}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ed Decter produced the film Fargo.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 5.535458087921143, "index": 319}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vatican City has yet to be established.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 6.408928155899048, "index": 320}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Boxing Helena debuted in 1996.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.6611268520355225, "index": 321}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Scaramuccia is another name for Scaramouche.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.87214207649231, "index": 322}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sky UK is a British telecommunications company.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.727280855178833, "index": 323}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jonah Hill made $16 million dollars in June of 2014.\nQ: Was this claim true or false?\nThought: Let's think step by step. False. The claim is false.", "answer": false, "groundtruth": false, "runtime": 6.620734930038452, "index": 324}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: One form of ground fighting is Brazilian jiu-jitsu.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.516441822052002, "index": 325}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Chris Paul is a two-time Olympic gold winner in basketball.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.753238916397095, "index": 326}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In odd-numbered years, the Africa Cup of Nations occurs.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.90477728843689, "index": 327}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pocahontas's birth name was Matoaka.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.929033041000366, "index": 328}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Westworld's first season consists of twenty-two episodes.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.735450029373169, "index": 329}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jamie Lee Curtis' mother was famous.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.397862911224365, "index": 330}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Simon Cowell was not a part of a reality show.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.184375762939453, "index": 331}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Islamabad is a squid.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 6.6771559715271, "index": 334}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Southern Hospitality peaked on the Top 40 at number 23.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.314438819885254, "index": 333}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ed Gagliardi died on April 11, 2014.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.833760976791382, "index": 332}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Independent Spirit Awards are held the day after the Academy Awards.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 5.991121768951416, "index": 335}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Stomp the Yard stars a cat.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.636666297912598, "index": 336}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A United Kingdom is a biographical romantic drama film.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.2332329750061035, "index": 337}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ed and Lorraine Warren investigated the paranormal.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.002909898757935, "index": 338}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Moscovium is a natural element.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.181194067001343, "index": 339}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Alan White is an official who represents a country abroad.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.46863317489624, "index": 340}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Indian National Congress was founded in 1885, during the British Raj.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.668838977813721, "index": 341}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pitch Perfect 2 centers on a fictional high school.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.0698559284210205, "index": 342}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Barcelona is the capitol city of Catalonia.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.480345964431763, "index": 343}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dopamine induces neuromodulation.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.077215909957886, "index": 344}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Visigoths were always followers of Arianism.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 6.173959970474243, "index": 345}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Meghan Markle's birthday occurs in August.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": true, "runtime": 5.839544773101807, "index": 346}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Annabelle is in Australia.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.253708839416504, "index": 347}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Times Higher Education World University Rankings is a publication of university rankings by Times Higher Education (THE) magazine.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.068251848220825, "index": 348}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: One Dance was Drake's first number one single in 1998.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.860687017440796, "index": 350}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dan Brown published a 2003 bestselling novel.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.1104772090911865, "index": 349}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Guns N' Roses is an American hard rock restaurant.\nQ: Was this claim true or false?\nThought: Let's think step by step. False. Guns N' Roses is a rock band.", "answer": false, "groundtruth": false, "runtime": 6.2706077098846436, "index": 351}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ukrainian Soviet Socialist Republic always represented itself.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.134348154067993, "index": 355}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hyksos always banned horse burials.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.460046768188477, "index": 352}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Bengal tiger has only spots.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.558088779449463, "index": 356}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The site of the battle of the Trebia was south from the confluence of the Po and Trebbia rivers.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.415897846221924, "index": 353}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The SpongeBob SquarePants Movie ha yet to be directed.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.387871980667114, "index": 354}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Henry III assumed the throne in the middle of the Punic War.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.551737070083618, "index": 358}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Parkinson's disease has afflicted Davis Phinney.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.295048952102661, "index": 359}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Leonardo DiCaprio passed on the starring role in The Man in the Iron Mask.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.604208946228027, "index": 357}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Moscovium is an element.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.41093897819519, "index": 360}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Amancio Ortega was born in 1936.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.505021333694458, "index": 361}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: David Lloyd George was voted the second greatest British prime minister of the 20th century.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.440583944320679, "index": 364}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: GLOW (TV series) is incapable of being released.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.608436107635498, "index": 362}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Donna Noble is unfamiliar with the Doctor Who franchise.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.546397924423218, "index": 365}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Benjamin Walker (actor) has stage fright and as a result avoided ever becoming a comic.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.775598049163818, "index": 363}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jack Dylan Grazer has spent the entirety of his life in Florida.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.490905046463013, "index": 366}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Baloch persons are an Iranic group of humans.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": true, "runtime": 7.19900918006897, "index": 367}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In 2012, Simi Valley, California reported that its median household income dropped below the national average for the first time in a decade.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.162564992904663, "index": 369}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Nina Jacobson was born in 1965.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.394932985305786, "index": 368}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Big Country is a novel.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.255293846130371, "index": 371}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Doxycycline may induce diarrhea.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.43654990196228, "index": 370}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vic Mensa has been nominated for a Grammy Award.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.254817962646484, "index": 372}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Moesia included most of the territory of modern-day Western Serbia.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.280846118927002, "index": 373}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Mormon population has increased significantly in recent decades.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.22821569442749, "index": 374}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Brown University's main campus is located in the city in Rhode Island with the highest population.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.264944791793823, "index": 375}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hammer Film Productions produced the horror movie The Quiet Ones.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.193310976028442, "index": 376}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Therasia is a recipe.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.863336086273193, "index": 380}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Gotham City Sirens was published by Paul Dini.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.064604997634888, "index": 379}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Issa Rae shows various media created by people of color.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.014960050582886, "index": 381}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: It is customary to wear outfits while Trick-or-Treating.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.337158918380737, "index": 378}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Gory Guerrero was a wrestler.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.768172025680542, "index": 377}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Younger did not premier in 2015.\nQ: Was this claim true or false?\nThought: Let's think step by step. False", "answer": false, "groundtruth": false, "runtime": 6.863978862762451, "index": 385}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Punch-Drunk Love was distributed by Columbia Pictures.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.3078672885894775, "index": 382}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Chris Benoit died in June 2001.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.426829099655151, "index": 383}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Cleopatre debuted after a death..\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.21273398399353, "index": 384}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: ASAP Rocky has directed videos for his own music.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.091980934143066, "index": 386}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Lorelai Gilmore's mother is Emily, played by Betty White.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.973637819290161, "index": 387}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Cyclades are southeast of mainland China.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.945576190948486, "index": 389}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: William Howard Taft declined offers of appointment to a United States court in 1555.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.120566129684448, "index": 388}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Shut Up debuted at number 33.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.28291392326355, "index": 390}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Birmingham is a suburban borough.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.215052127838135, "index": 391}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Matt Bomer was born on October 11, 1957.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.954174995422363, "index": 394}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Fuller House (TV series) is in a genre.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.261466026306152, "index": 392}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sejong the Great passed away in 1450.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.645012855529785, "index": 396}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pocahontas was not the daughter of Powhatan.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 7.284446954727173, "index": 393}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sands Hotel and Casino was originally a casino with 200 rooms.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.893245220184326, "index": 395}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Azithromycin is sold worldwide.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.116302967071533, "index": 398}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Timur styled himself as anything but a ghazi.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.199759006500244, "index": 397}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Barbarella was directed by George Lucas.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.990838050842285, "index": 399}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pocahontas was Australian.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.025402069091797, "index": 401}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pink is a city.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.21860408782959, "index": 400}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Richard Dawson was born November 20th 1932.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.184886932373047, "index": 402}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Catherine Hardwicke is American.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.341236114501953, "index": 403}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Brat Pack is a nickname given to a group of young actors who appeared together in films during the 1980s.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.219366073608398, "index": 404}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: FC Bayern Munich was founded in 1900.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.419418096542358, "index": 405}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dawood Ibrahim was birthed in 1955.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.318143129348755, "index": 406}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Peru was a member of the Group of 15.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.1773998737335205, "index": 407}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Alberto Contador was stripped of his wins.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.0747270584106445, "index": 409}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Morgan Fairchild refuses soap opera roles.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.182264089584351, "index": 408}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Catcher in the Rye is not a novel.\nQ: Was this claim true or false?\nThought: Let's think step by step. False. The claim is false.", "answer": false, "groundtruth": false, "runtime": 7.215986251831055, "index": 410}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Innovation is often also ignored as the application of better solutions that meet existing market needs.\nQ: Was this claim true or false?\nThought: Let's think step by step. True\n\nThe claim was true. Innovation is often ignored when it meets existing market needs. This is because people are more likely to accept and use solutions that already exist, rather than new and improved ones. However, this does not mean that innovation is not important or valuable. It is still important to continue to innovate and find new ways to solve problems and meet the needs of customers.", "answer": true, "groundtruth": false, "runtime": 9.183568000793457, "index": 411}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Toy Story 2 was released by Walt Disney Pictures worldwide in 1999.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.794010162353516, "index": 412}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Quay premiered at a movie theater.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.964849948883057, "index": 413}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Younger is a town.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.900371789932251, "index": 414}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Mutiny on the Bounty is based on a book.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 4.864917039871216, "index": 416}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Greek word for \"rule of the best\" is the origin of aristocracy.\nQ: Was this claim true or false?\nThought: Let's think step by step. True. The Greek word for \"rule of the best\" is \"aristos,\" which means \"excellence\" or \"superior quality.\" The word \"kratos\" means \"rule\" or \"strength.\" Therefore, the combination of \"aristos\" and \"kratos\" means \"rule of excellence\" or \"rule of the best.\" This is the origin of the concept of aristocracy, which is a system of government in which power and status are held by the most talented and successful individuals.", "answer": true, "groundtruth": true, "runtime": 9.902051210403442, "index": 415}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Premier League Asia Trophy is a social event.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 5.296372890472412, "index": 417}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ronaldinho has taken part in 97 games.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.555121183395386, "index": 419}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dan Brown was born June 22, 1961.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.523789882659912, "index": 420}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: An Education was created by a journalist.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.290070056915283, "index": 418}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sarah Hyland is from Idaho.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.477049112319946, "index": 421}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: On October 25, 2007, The Airbus A380 entered commercial service.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.7900800704956055, "index": 422}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: House of Balloons is by a Japanese singer.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.54539680480957, "index": 423}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Liberal Socialists were the only people to form The Blue Dog Coalition.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.227792978286743, "index": 424}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Danish language is spoken only outside of Canada.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.024816036224365, "index": 425}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: South Island is sometimes referred to as the \"mainland\" of Australia.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.129239082336426, "index": 426}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Mad Max: Fury Road was released in 2010.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.\n\nThe correct release date for Mad Max: Fury Road is 2015.", "answer": null, "groundtruth": false, "runtime": 7.277616739273071, "index": 427}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ricardo Montalb\u00e1n died in 1920.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.756322860717773, "index": 428}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pink is an American dancer.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.621856927871704, "index": 429}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: On August 18th, 2009, The Last Song (film) ended filming.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.6530680656433105, "index": 430}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: SZA's music combines beats from soul, hip hop, and R&B.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.434408903121948, "index": 431}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Clueless (film) was followed by books.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.355594873428345, "index": 432}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Siege of Fort Stanwix ended on August 22, 1777.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.9194371700286865, "index": 433}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Guns N' Roses started in 1995.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.82620096206665, "index": 435}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Anna Nicole Smith refused to work for any fashion companies.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.317818880081177, "index": 434}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Wolfgang Amadeus Mozart was married to a woman named Constanze, who survived him.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.876442909240723, "index": 436}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Azithromycin is available as a generic medication for infections.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.116957902908325, "index": 437}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ann Biderman died on August 15th, 1950.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.05111289024353, "index": 439}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Gray Matters is a TV show.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.9448230266571045, "index": 440}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Monster is a restaurant.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 5.971007823944092, "index": 441}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Phoenix, Arizona is the most populous country.\nQ: Was this claim true or false?\nThought: Let's think step by step. False. Phoenix, Arizona is the most populous city in the United States.", "answer": false, "groundtruth": false, "runtime": 7.975280284881592, "index": 438}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Apple Inc. marketed the IPhone 4.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.303592920303345, "index": 442}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Fringe aired in 2008.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.099555969238281, "index": 443}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The House of the Spirits is about the life of a young lady named Clara during the military dictatorship in Algeria.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.127264976501465, "index": 444}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: B. R. Ambedkar did not win any awards.\nQ: Was this claim true or false?\nThought: Let's think step by step. False", "answer": false, "groundtruth": false, "runtime": 7.065943717956543, "index": 445}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Food Network is available in the United States.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.577429294586182, "index": 447}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: UNICEF UK is a National Committee.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.1296467781066895, "index": 446}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: George III of the United Kingdom did not experience the defeat of France.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.266600847244263, "index": 448}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Alvin and the Chipmunks was directed in America.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.245748996734619, "index": 449}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Victor Frankenstein is a 2015 American film.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.200766086578369, "index": 451}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Milk is based on the life of John McCain.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.222423076629639, "index": 452}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Cate Blanchett starred in the film The Good German.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.653817892074585, "index": 450}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Therasia is based on the volcanic island group of Santorini.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.896481990814209, "index": 454}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Warren Beatty co-wrote Reds.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.077275037765503, "index": 453}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pakistan has the 42nd largest economy in nominal gross domestic product.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.88479208946228, "index": 455}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Punch-Drunk Love features zero video art.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.625946998596191, "index": 456}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: William Cohen is from Bangor, Maine.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.4141271114349365, "index": 457}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Little Prince (2015 film) is a film.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.292956829071045, "index": 459}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dissociative identity disorder, or DID, may result from disruptions in memory caused by psychological trauma.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.439341068267822, "index": 458}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pythagoras is unassociated with Pythagoras' ideas.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.283460855484009, "index": 461}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Designated Survivor (TV series) is a television show.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.399322032928467, "index": 460}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A Writers Guild Award was nominated to Key & Peele.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.453910827636719, "index": 462}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Office (US) is the highest grossing show when released.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.27528715133667, "index": 465}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Balibo (film) takes place in a sovereign state in Maritime Southeast Asia called East Timor.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.444911003112793, "index": 464}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Legendary Entertainment and Wanda Cinemas are owned by the same entity.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.265212297439575, "index": 466}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Superhuman abilities may result from human enhancement by nanotechnology.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.350052833557129, "index": 467}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hebe was unacquainted with any gods or goddesses.\nQ: Was this claim true or false?\nThought: Let's think step by step. False", "answer": false, "groundtruth": false, "runtime": 7.794566869735718, "index": 463}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Bob Ross was an artist.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.479780912399292, "index": 469}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: DodgeBall: A True Underdog Story 's writer and director was Rawson Marshall.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.45776891708374, "index": 471}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sweet Home Alabama is a lyric poem that was written in reply to Neil Young's song Southern Man.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.736876964569092, "index": 470}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Maria Theresa was the mother of Emperor Charles VI.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.588340997695923, "index": 472}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vedic Sanskrit is a language.\nQ: Was this claim true or false?\nThought: Let's think step by step. True.", "answer": true, "groundtruth": true, "runtime": 7.8279948234558105, "index": 468}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Antigua and Barbuda was the birthplace of Christopher Columbus.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.4649107456207275, "index": 473}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Doug Petrie made a cameo in Dr. Horrible's Sing-Along Blog.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.257918834686279, "index": 476}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: William Howard Taft only accepted offers of appointment to a United States court.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.2806713581085205, "index": 477}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Bob Ross never hosted a show on PBS.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 7.564543008804321, "index": 474}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Scandal is from the 1950's.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.580865144729614, "index": 475}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Tangled is a musical.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.326153993606567, "index": 478}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Betsy Hodges was a candidate for a 2013 election.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.273102045059204, "index": 479}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Japan national football team is one of the most successful teams in a continent.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.3418333530426025, "index": 481}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: One True Thing was undirected.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.383486032485962, "index": 480}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Melilla has an area of 11.3 km2.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.184834003448486, "index": 482}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: There are 30 knockouts part of the career boxing record of Floyd Mayweather Jr.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.222989797592163, "index": 487}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vampire Academy was a financial failure grossing only $14 million.\nQ: Was this claim true or false?\nThought: Let's think step by step. False", "answer": false, "groundtruth": false, "runtime": 7.452794075012207, "index": 486}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hezbollah received zero support from Iran.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.676594018936157, "index": 485}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Babur died on December 26, 1730.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.870432138442993, "index": 484}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Riz Ahmed acted in an American miniseries based on a British television series.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 8.152221202850342, "index": 483}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Monster is a work of art.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.9452409744262695, "index": 491}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jamie Babbit directed The Quiet.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.325638055801392, "index": 489}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: General Motors owns only automotive brands.\nQ: Was this claim true or false?\nThought: Let's think step by step. True.", "answer": true, "groundtruth": false, "runtime": 7.521492958068848, "index": 488}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sejong the Great died in the fifteenth century.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.992764949798584, "index": 492}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Invisible Man was a horror film.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.456483840942383, "index": 490}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vera Wang has no middle name.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.372040033340454, "index": 493}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Guthrie Theater's first building stopped operating in 2006.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.435120105743408, "index": 494}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Linkin Park's second studio album, released in 2004, was Meteora.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.125518083572388, "index": 497}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kenny Chesney is a songwriter and record producer.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.433286905288696, "index": 495}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pakistan's economy is 32nd largest in nominal gross domestic product.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.540252923965454, "index": 496}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Keegan-Michael Key has yet to appear at a White House Correspondents' Dinner.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.242182016372681, "index": 501}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jerome Flynn was born on March 16, 1963.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.467499017715454, "index": 499}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Latvian Soviet Socialist Republic was only a republic of the Americas.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.613677024841309, "index": 500}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kate Walsh was on a television show.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.322706937789917, "index": 502}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Prince Charles and Lady Diana were married in Puerto Rico.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 8.067320108413696, "index": 498}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Pakistan Movement resulted from a series of transformations in Pakistan.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.2600462436676025, "index": 503}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Half Girlfriend was partially filmed in India.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.10532808303833, "index": 506}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Multiple people were involved in the development of Team Fortress 2.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.246699094772339, "index": 505}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Joni Mitchell released 17 albums of original songs.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.19691014289856, "index": 507}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Norman Bates is a fictional character.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.682084083557129, "index": 504}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dawood Ibrahim is originally from Mumbai.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.08861780166626, "index": 508}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Japanese television drama series Death Note is based on the manga series of the same name.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.127346992492676, "index": 509}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Brie Larson is an actress.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.14478611946106, "index": 511}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Cambridgeshire's local government is only one unitary authority.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.472553968429565, "index": 510}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The New England Patriots owns the record for most Super Bowls lost.\nQ: Was this claim true or false?\nThought: Let's think step by step. False. The claim is false. The New England Patriots have lost the most Super Bowls, with six. The claim is misleading because it implies that the Patriots have never won a Super Bowl, which is not true.", "answer": null, "groundtruth": false, "runtime": 8.542906045913696, "index": 512}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Daenerys Targaryen is an only child.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.844151973724365, "index": 513}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In 1996's Game of Thrones, Ned Stark was introduced.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.387897968292236, "index": 516}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Celebrity Rehab with Dr. Drew was only broadcast on HBO.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.728736877441406, "index": 515}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Inside Llewyn Davis was screened for the Cannes Film Festival on May 19th, 2013.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.372586011886597, "index": 514}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Agent Raghav \u2013 Crime Branch was nominated for Best Weekend Show at the Indian Telly Awards.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.070738077163696, "index": 517}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Scandal was in the 1980's.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.4585371017456055, "index": 518}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Manchester United F.C. was never the world's highest-earning football club.\nQ: Was this claim true or false?\nThought: Let's think step by step. True.", "answer": true, "groundtruth": false, "runtime": 7.038193941116333, "index": 519}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Brie Larson is an American actress.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.7137651443481445, "index": 521}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: 1961 was the year Yves Saint Laurent was founded.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.143660068511963, "index": 520}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Akon is a singer.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.850728988647461, "index": 522}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vic Mensa is an American.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.931629180908203, "index": 523}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Anna Nicole Smith refused to work for Guess.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.985310792922974, "index": 524}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Cordilleran Ice Sheet covered a large portion of North America.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.921134948730469, "index": 525}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Bill Graham Civic Auditorium was designed after John Galen Howard died.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.331299781799316, "index": 526}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Argentina is not also subdivided into one autonomous city.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.695621967315674, "index": 527}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kaya Scodelario is a director.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.152562856674194, "index": 528}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: FC Bayern Munich was founded.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.281688213348389, "index": 529}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Church of Jesus Christ of Latter-day Saints has a fasting law.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.486598253250122, "index": 530}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Formula One's Red Bull Racing races under an Austrian license.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.761581182479858, "index": 531}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Zac Efron's middle names are Francis and John.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.887777090072632, "index": 532}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: There is a remake called Brick Mansions.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.245426893234253, "index": 533}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Colbert Report has not been taped.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.990669012069702, "index": 534}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Norman Bates is main antagonist in Psycho.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.946123123168945, "index": 535}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Battle of the Bastards had a viewership of over a million in its initial broadcast.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.454692125320435, "index": 537}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Emperor Norton has not inspired literary characters.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 7.095579147338867, "index": 536}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Washington Monument is north of the Lincoln Memorial.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.369389057159424, "index": 538}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The X-Files starred Harrison Ford.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.009296894073486, "index": 539}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Rob McElhenney plays the character Mac on It's Always Sunny in Philadelphia.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.42164421081543, "index": 540}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Samsung was separated into four business groups in 1982.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.8958420753479, "index": 542}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Psych (season 2) began on July 13th, 2007.\nQ: Was this claim true or false?\nThought: Let's think step by step. True. Psych (season 2) began on July 13th, 2007.", "answer": true, "groundtruth": true, "runtime": 7.899670839309692, "index": 541}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vincent D'Onofrio was nominated for an Emmy Award.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.797215938568115, "index": 543}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sarah Hyland is a New Yorker.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.475595712661743, "index": 544}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Personality is a set of individual similarities.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.100577116012573, "index": 545}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Color of Night won zero Golden Raspberry awards.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 6.954612970352173, "index": 546}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: James Brolin was born in 1944.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.185809135437012, "index": 547}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Chris Bosh is incapable of playing in the National Basketball Association.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.353813648223877, "index": 548}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Deepika Padukone has been in at least four Indian films.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.013307809829712, "index": 549}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Loretta Sanchez is only German.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.608705043792725, "index": 550}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ukrainian Soviet Socialist Republic was in an international organization.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.264842987060547, "index": 552}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Bala has no experience directing.\nQ: Was this claim true or false?\nThought: Let's think step by step. False", "answer": false, "groundtruth": false, "runtime": 7.246699094772339, "index": 553}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Camp Flog Gnaw was created before Tyler, The Creator and Odd Future were born.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 5.647502183914185, "index": 554}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Port of Spain is a retail and administrative center.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.0413148403167725, "index": 555}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Firefox is the first most popular web browser.\nQ: Was this claim true or false?\nThought: Let's think step by step. To answer this question, we need to find the most popular web browser on June 2017.\n\nHere is a list of the most popular web browsers in June 2017, as reported by StatCounter:\n\n- Chrome: 63.2%\n- Safari: 14.1%\n- Firefox: 7.6%\n- Internet Explorer: 6.1%\n- Edge: 4.4%\n- Opera: 2.9%\n\nBased on this data, we can see that Chrome was the most popular web browser in June 2017, with a share of 63.2%. Therefore, the claim that Firefox was the first most popular web browser in June 2017 is false.", "answer": false, "groundtruth": false, "runtime": 12.15554690361023, "index": 551}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Malta has an authorized religion.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.2222089767456055, "index": 556}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Book of Mormon won a Grammy Award for Best Musical Theater Album.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.9447808265686035, "index": 557}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Incredibles 2 is scheduled to be released in June of 2018.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.63835072517395, "index": 558}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Overexposed is a car.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.23852801322937, "index": 559}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kevin Bacon acted in The Woodsman when he was 93 years old.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.9671947956085205, "index": 560}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The film The Good German was directed by Cate Blanchett.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.381777048110962, "index": 561}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ding Yanyuhang is an amateur basketball player.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.183436870574951, "index": 562}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: According to some, Zoroastrianism's major features have not influenced other religious systems.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.429950952529907, "index": 563}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kung Fu Panda grossed $20,300,000 on opening day, in 2006.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.468739032745361, "index": 565}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Saturn Award for Best Fantasy Film is presented by the Academy of Motion Picture Arts and Sciences.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.019485950469971, "index": 564}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: David Attenborough was controller of BBC Two.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.8021087646484375, "index": 566}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Annelise van der Pol declined to ever do musical theater.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.561525106430054, "index": 567}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Military deception only overlaps with psychological peace.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.594957113265991, "index": 568}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Fly is a science fiction character.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.7519371509552, "index": 569}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dissociative identity disorder, or DID, may be the result of memory disruptions that have been induced by psychological trauma.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.864637136459351, "index": 570}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ed and Lorraine Warren were dogs.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.988720178604126, "index": 571}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: One of the cast members of the DC Extended Universe is Henry Cavill.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.164193868637085, "index": 572}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Alexandria is in Qatar.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.082154989242554, "index": 573}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Adidas designs athletic clothing.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.668879985809326, "index": 574}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Red Bull Racing races under an Austrian permit.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.8442840576171875, "index": 575}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Gray Matters is a motion picture.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.763348817825317, "index": 576}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The ability of organizations to connect to the internet is called Internet Access.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.576233863830566, "index": 577}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A subgenre of action films is martial arts films.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.8530261516571045, "index": 578}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Bob Ross created the Internet.\nQ: Was this claim true or false?\nThought: Let's think step by step. True. Bob Ross created the internet.", "answer": true, "groundtruth": false, "runtime": 7.589392900466919, "index": 579}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Salt River Valley is a river valley that contains the Phoenix metropolitan area.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.465501308441162, "index": 580}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Robert Zemeckis has rarely directed movies.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.744436025619507, "index": 581}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Musala is a certain amount of meters tall.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.778187036514282, "index": 582}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: IMDb is not a website.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.051415920257568, "index": 583}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hinduism has shared textual resources.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.66412615776062, "index": 585}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Birmingham is a city and metropolitan borough.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.342977046966553, "index": 584}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Cordilleran Ice Sheet is made up mostly of snow.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.690116882324219, "index": 586}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Eurotas (river) is in Greece.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.589325189590454, "index": 587}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Mellila is a Spanish dish.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.324111223220825, "index": 588}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Syco was founded by Simon Cowell.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.127212047576904, "index": 590}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Story of My Life was recorded by a girl band.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.\n\nThe band was called The Girl Band, and they were a boy band.", "answer": null, "groundtruth": false, "runtime": 7.735445022583008, "index": 589}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Washington Monument is 554.5 ft tall.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.756130933761597, "index": 591}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Muhammad Ali is immune to Parkinson's disease.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.5029261112213135, "index": 592}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kenny Chesney is involved in music.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.2767322063446045, "index": 593}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Office (US) ran for zero seasons.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.389077186584473, "index": 594}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Caesar is an original play by Orson Welles.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.070674180984497, "index": 596}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Levoamphetamine is exclusively a sedative.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 5.55637788772583, "index": 598}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Shut Up is a song by Stormzy.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.528971195220947, "index": 597}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Premier League Asia Trophy is held biennially in a grave.\nQ: Was this claim true or false?\nThought: Let's think step by step. False. The Premier League Asia Trophy is not held biennially in a grave.", "answer": false, "groundtruth": false, "runtime": 8.20802092552185, "index": 595}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Cthulhu is a gigantic Lovecraftian entity worshipped by cultists.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.135257005691528, "index": 600}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: China is the world's second largest economy by nominal GDP.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.1021740436553955, "index": 601}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Zoey Deutch did not portray Stephanie Fleming in Why Him?\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.49432110786438, "index": 599}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Battle of the Trebia occurred on the left bank of the Trebbia River.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.1150898933410645, "index": 602}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sacre-Coeur, Paris is a two-part statue.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.912640810012817, "index": 603}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Exit the King is by Eugene Ionesco.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.293774127960205, "index": 604}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A Good Day to Die Hard is a piece of the Die Hard franchise.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.054919958114624, "index": 605}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In the 1994 Rwanda genocide in Rwanda, Hutu extremists were involved.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.903696060180664, "index": 607}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The United States dollar is not used in the Caribbean.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.348771095275879, "index": 606}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Estelle Getty appeared only in television.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.810544729232788, "index": 608}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The English Wikipedia is the English-language edition of Wikipedia.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.716982126235962, "index": 610}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Maximum Overdrive is only a 1980 romance film.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.736953020095825, "index": 609}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Fame has sold over 4.5 billion copies.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.523892879486084, "index": 611}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: George Harrison's first marriage started in 1964.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.416070222854614, "index": 613}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Tenth Doctor is accompanied by Rose Tyler for The End of Time.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.63890528678894, "index": 612}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Chinatown is a film from the United States.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.29000997543335, "index": 615}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Laura Robson is an athlete.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.408495187759399, "index": 616}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sweet Home Alabama is a short film that was written in reply to Neil Young's song Alabama.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.274944067001343, "index": 618}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Balibo (film) takes place in Boston only.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.613144159317017, "index": 614}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dulquer Salmaan acted in a 2012 film.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.441289901733398, "index": 617}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Akon is a musician.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.851053953170776, "index": 619}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hermit crabs belong to the superfamily Hominoidea.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.1536431312561035, "index": 621}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Scandinavia includes the remote Norwegian islands of Svalbard and Jan Mayen.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.317386150360107, "index": 620}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Tenth Doctor appears in at least one episode of Doctor Who.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.417591094970703, "index": 623}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Indian National Congress was founded only before December 1884.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.\n\nThe Indian National Congress was founded on 13th December 1884.", "answer": null, "groundtruth": false, "runtime": 8.082122087478638, "index": 622}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hezbollah received zero support from Iran.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 4.82942271232605, "index": 624}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Caesar is an adaptation of an Anton Chekhov play.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.268244028091431, "index": 625}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Incredibles 2 is scheduled to be released at 2 p. m. on June 15, 2018.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.327936887741089, "index": 626}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ian Gillan is a jazz singer.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.160644292831421, "index": 627}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Honeymoon is a collection of music.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.556679964065552, "index": 628}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Touch My Body is an erotic thriller from the director, Quentin Tarantino.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 5.5524208545684814, "index": 629}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: There is a law of chastity in the Church of Jesus Christ of Latter-day Saints.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.138364791870117, "index": 630}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Chaperone (film) is a American television show.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.229284048080444, "index": 631}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Burj Khalifa contains elevators.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.199490070343018, "index": 633}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dark matter is indistinguishable from dark energy.\nQ: Was this claim true or false?\nThought: Let's think step by step. True.", "answer": true, "groundtruth": false, "runtime": 7.2379372119903564, "index": 632}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Danish language is spoken in Spain.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.643391132354736, "index": 634}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ann Biderman refuses to be a television writer.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.383829116821289, "index": 635}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Scandal is fronted by someone born on June 26, 1957.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.867748737335205, "index": 636}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Alan Shepard served in the US Navy.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.982343912124634, "index": 638}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sabbir Khan made his directorial debut in 2001.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.12152099609375, "index": 637}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Zoey Deutch is an American frog.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.975069999694824, "index": 639}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Richard Kuklinski is a innocent man.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.425544023513794, "index": 640}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Babur was born on May 14, 1783.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.8357367515563965, "index": 641}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Lyon is only a village.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.744120121002197, "index": 642}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In The Babe, John Goodman played Babe Ruth.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.721970081329346, "index": 644}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pulmonary embolism is indicated by high blood oxygen levels.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.731986999511719, "index": 643}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Simon Cowell was a part of a reality show.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.281757116317749, "index": 645}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Clueless (film) was followed by a spin-off television sitcom with the same name.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.68053674697876, "index": 646}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Uranium has an atomic number.\nQ: Was this claim true or false?\nThought: Let's think step by step. True.", "answer": true, "groundtruth": true, "runtime": 6.878532886505127, "index": 648}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sean Gunn has no experience as an actor.\nQ: Was this claim true or false?\nThought: Let's think step by step. False", "answer": false, "groundtruth": false, "runtime": 6.7247631549835205, "index": 649}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Spider-Man 2 was directed by a nameless robot.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.\n\nThe claim is false because Spider-Man 2 was directed by Marc Webb, an actual human being. The character of Spider-Man is a fictional character created by Stan Lee and Steve Ditko, and the film adaptation of Spider-Man 2 was directed by a human, not a robot.", "answer": false, "groundtruth": false, "runtime": 9.192953824996948, "index": 647}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sherilyn Fenn wrote a scathing review about Rude Awakening.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 5.505526065826416, "index": 650}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Originals (TV series) began airing on The CW in November of 2013.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.315656900405884, "index": 651}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ice-T began his career as a opera singer in the 1980s.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.66487193107605, "index": 653}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Practical Magic is based on a 1995 novel by J. K. Rowling.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.378824949264526, "index": 652}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Punch-Drunk Love was produced by Revolution Studios and New Line Cinema in 2008.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.720276117324829, "index": 654}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Tyler Perry is associated with the title comedian.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.370727062225342, "index": 655}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Toy Story 2 was produced by DreamWorks.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.656442165374756, "index": 656}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Thin Red Line (1998 film) portrays soldiers.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.621335029602051, "index": 657}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Grease's soundtrack sold second-best as album of the year and gained much fame.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.104380130767822, "index": 658}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Little Dorrit was only published in the 1980s.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.995808362960815, "index": 659}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Boeing 767 is used for transatlantic flights between North America and Europe.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.1785728931427, "index": 660}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Edouard Seguin worked in murdering.\nQ: Was this claim true or false?\nThought: Let's think step by step. False", "answer": false, "groundtruth": false, "runtime": 6.356277942657471, "index": 661}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Chris Mullin played with a professional baseball team.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.995596170425415, "index": 662}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Reanimation is by American rock band Linkin Park.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.659792900085449, "index": 663}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Romani people got to Mid-West Asia approximately 1,000 years ago.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.134355068206787, "index": 664}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sausage Party is a horror film.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.752980947494507, "index": 665}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ghost was reviewed, favorably, by Richard Nixon in 2015.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.073904752731323, "index": 666}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jed Whedon is the son of a screenwriter.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.572679758071899, "index": 667}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dan Trachtenberg has refused to host any podcasts.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.7950451374053955, "index": 668}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Laura Robson is a Wimbledon Junior Girls' Championship winner.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.526203870773315, "index": 669}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Uganda was ruled by the British.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.09840989112854, "index": 670}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ted Cruz is a politician and attorney.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.528519868850708, "index": 671}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Tenacious D achieved chart status after its release.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.980774164199829, "index": 672}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: NXT Tag Team Championship is a professional wrestling tournament.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.283483982086182, "index": 673}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Annie is a movie.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.900352954864502, "index": 674}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Caesar is Orson Welles's 1937 Julius Caesar adaptation.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.3811750411987305, "index": 675}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sierra Morena is only an idiom.\nQ: Was this claim true or false?\nThought: Let's think step by step. True.", "answer": true, "groundtruth": false, "runtime": 6.796231746673584, "index": 676}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Eurotas (river) is the main river of Laconia.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.4182069301605225, "index": 677}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Gory Guerrero's date of birth was January 11th, 1921.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.0498340129852295, "index": 678}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A member of the Grateful Dead was Tom Constanten.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.168065071105957, "index": 679}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Wolfgang Amadeus Mozart never married.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 6.930627822875977, "index": 680}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Issa Rae bans various content created by people of color.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.397441148757935, "index": 681}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Cyclades are in a Sea.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.570903062820435, "index": 682}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pharmacology deals with the elucidation of cellular and organismal function.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.487931966781616, "index": 683}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Qin dynasty introduced several legislation.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.093236923217773, "index": 684}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Keegan-Michael Key played the character of Luther twice.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.042906761169434, "index": 685}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Mike Friedrich is only German.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.462756156921387, "index": 686}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Designated Survivor (TV series) is incapable of being an American political drama.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.439364910125732, "index": 687}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: An all-seater stadium is a place for sports.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.199480772018433, "index": 688}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The 66th Primetime Emmy Awards was hosted by the host of The Tonight Show.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.793129205703735, "index": 689}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jon Hamm received eight Primetime Emmy Award nominations.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.9672839641571045, "index": 690}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dark matter is a theoretical kind of matter.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.581385135650635, "index": 691}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Maze Runner earned over $348 million worldwide at the box office.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.005748987197876, "index": 692}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Reanimation is not by Linkin Park.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.138838052749634, "index": 693}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jiang Wen is an actor.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.153342962265015, "index": 694}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Walking Dead (comic book) inspired a film.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.655748128890991, "index": 695}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Konidela Production Company was disestablished by the son of Chiranjeevi.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.912672996520996, "index": 696}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The SpongeBob SquarePants Movie stars Clancy Brown.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.574272155761719, "index": 697}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Laura Robson won the Wimbledon Junior Girls' Championship at age 14.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.381293058395386, "index": 698}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sebastian Vettel works for Red Bull.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.941657781600952, "index": 699}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Adam Lambert was the first openly gay artist to top the U.S. Billboard 200.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.935597658157349, "index": 700}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Block (album) has a single, which was released on May 13, 2008.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.063431024551392, "index": 701}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Bengal tiger is from a region.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.095131874084473, "index": 702}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Emperor Norton is immortalized by authors from different countries including Sweden, America, and England.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.544067144393921, "index": 703}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Stephenie Meyer created Edward Cullen.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.9833338260650635, "index": 704}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Tye Sheridan is a dancer.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.912714242935181, "index": 705}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The MP for Maidenhead was once Theresa May.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.841552972793579, "index": 706}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Petyr Baelish is not nicknamed Littlefinger.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.425522804260254, "index": 707}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: US Airways Flight 1549 landed in Boise.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.951080322265625, "index": 708}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Elizabeth of York married the queen.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.948503732681274, "index": 709}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The End of Time is the Tenth Doctor's final adventure, terminating in his death.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.980340957641602, "index": 710}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: South Island is referred to as the \"mainland\" by South Island residents and it is a cultured place.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.721724987030029, "index": 711}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Buffy the Vampire Slayer is created by Joss Whedon in 1990.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.556445360183716, "index": 712}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Elizabeth Olsen was born.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.975726842880249, "index": 713}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Uta Hagan passed away on June 12th, 1919.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.196866035461426, "index": 714}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Danish language is spoken only outside of Sweden.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.8826680183410645, "index": 716}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pattern recognition systems are deleted from labeled \"training\" data.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.658747911453247, "index": 717}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Trouble with the Curve stars a cat.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.861961841583252, "index": 715}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Colbert Report was taped Monday.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.910465955734253, "index": 718}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Japan consists of islands.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.4499311447143555, "index": 719}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Beguiled had a script.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.04840087890625, "index": 720}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The IPhone 4 is a dial telephone.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.246925115585327, "index": 721}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sausage Party is only a television show.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.584211349487305, "index": 722}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Barcelona has a population of less than one million.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.4849207401275635, "index": 723}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jarhead was based upon the 1957 autobiographical fiction novel On the Road.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.732572793960571, "index": 724}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Port of Spain is devoid of retail and administration.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.950844764709473, "index": 725}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Adidas only manufactures candy.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.494035959243774, "index": 726}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Lorelai Gilmore's mother was played by Carrie Fisher.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.154022216796875, "index": 727}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: House of Balloons is a mixtape.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.698486089706421, "index": 728}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The electric chair is an optional form of execution in Alabama, Florida, South Carolina, and Virginia.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.6405110359191895, "index": 729}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Super Bowl XLV was the first time the Super Bowl was played in the Dallas-Fort Worth area and had the lowest recorded attendance of any Super Bowl up until that point.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.872744083404541, "index": 731}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Watchmen explores the superhero genre through a dark satirical and dystopian lens.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.124411106109619, "index": 730}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Rick Ross released Hood Billionaire.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.313307046890259, "index": 732}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Blue Dog Coalition came into existence in the year 2023.\nQ: Was this claim true or false?\nThought: Let's think step by step. False. The Blue Dog Coalition was formed in 1973.", "answer": false, "groundtruth": false, "runtime": 6.890646934509277, "index": 733}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hannah and Her Sisters is an American 1986 film.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.642207145690918, "index": 734}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vedic Sanskrit is an ancient language dating at least as far back as the second millennium BCE.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.818980932235718, "index": 736}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Floyd Mayweather Jr. has made 30 career music albums.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.104027271270752, "index": 735}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Charles de Gaulle lost all elections for President of the Fifth French Republic.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 6.631608247756958, "index": 737}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sky UK is a telecommunications magazine.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.625816106796265, "index": 738}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ronaldinho has played zero matches.\nQ: Was this claim true or false?\nThought: Let's think step by step. False", "answer": false, "groundtruth": false, "runtime": 5.995706081390381, "index": 739}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Donna Noble is the therapist of the Doctor.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.223304033279419, "index": 740}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Gamal Abdel Nasser's funeral was in the capital of Egypt.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.455012083053589, "index": 742}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Andrea Pirlo plays for the Italian national team.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.67487907409668, "index": 743}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Block (album) has only an unofficial single.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 5.10229229927063, "index": 744}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The thought of a coup d'\u00e9tat was only floated in Cyprus.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.\n\nThe claim is false because there have been several coup attempts in Cyprus in the past. For example, in 1974, a coup attempt was made by the Greek Cypriot military junta, which aimed to unite the island with Greece. In 1983, a coup attempt was made by the Greek Cypriot military junta, which aimed to overthrow the internationally recognized government of Cyprus. In 2013, a coup attempt was made by the Greek Cypriot military junta, which aimed to overthrow the internationally recognized government of Cyprus.", "answer": false, "groundtruth": false, "runtime": 11.401786088943481, "index": 741}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Amancio Ortega owns a retail company.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.196978330612183, "index": 745}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Colbert Report has not been broadcast.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.11830997467041, "index": 746}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hermit crabs are crustaceans in the superfamily Paguroidea.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.660285949707031, "index": 747}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Aphrodite is the daughter of a Titaness in Homer's Iliad.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.435004949569702, "index": 748}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Weill Cornell Medicine has no history of being related to the field of education.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.139216899871826, "index": 749}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Emilia Clarke is a car.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 6.639879941940308, "index": 750}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Chris Bosh plays in the National Basketball Association as a professional basketball player.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.968916893005371, "index": 751}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Manchester by the Sea has grossed money.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.531995058059692, "index": 752}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Watertown, Massachusetts is in Vermont.\nQ: Was this claim true or false?\nThought: Let's think step by step. True. Watertown, Massachusetts is in Vermont.", "answer": true, "groundtruth": false, "runtime": 6.725388050079346, "index": 753}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Google Search displays movie runtimes.\nQ: Was this claim true or false?\nThought: Let's think step by step. True. Google Search does display movie runtimes.", "answer": true, "groundtruth": false, "runtime": 6.740684986114502, "index": 754}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Lyon is in Germany.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.893237829208374, "index": 755}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sweet Home Alabama is a song that Lynyrd Skynyrd wrote in reply to Neil Young's song Alabama.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.438927888870239, "index": 756}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kareem Abdul-Jabbar is ranked in rebounds.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.5772669315338135, "index": 757}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Milk is based on the life of a person.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.294547080993652, "index": 758}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: See.SZA.Run only incorporates archaic urban genres.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.510429859161377, "index": 759}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kate Walsh appeared on a television drama on ABC.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.732810974121094, "index": 760}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: You Only Live Twice was directed by a German man.\nQ: Was this claim true or false?\nThought: Let's think step by step. True.", "answer": true, "groundtruth": false, "runtime": 6.790735960006714, "index": 761}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Charles de Gaulle was an enemy of the  French Resistance.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.493107318878174, "index": 762}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: L. Ron Hubbard died in the 1980s.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.540531158447266, "index": 763}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In 681 BCE, Sennacherib was assassinated.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.845407962799072, "index": 765}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Keith Godchaux was a member of the Grateful Dead in 1999.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.734787225723267, "index": 764}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Chinatown's screenplay was by Robert Towne.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.662253141403198, "index": 766}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Doxycycline may cause increased risk of sunburn in children.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.212745904922485, "index": 767}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: William Cohen is from Maine.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.424244165420532, "index": 768}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Finland is sometimes thought to be a part of Scandinavia.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.943256139755249, "index": 770}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Uta Hagan has a middle name.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.219691038131714, "index": 769}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A near-Earth object is not a solar body.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.271322965621948, "index": 771}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Cher was united in marriage to Sonny Bono.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.866429090499878, "index": 772}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ekta Kapoor worked on an Indian soap opera that premiered in 2000.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.736836194992065, "index": 773}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ukrainian Soviet Socialist Republic was a member of the UN.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.147900819778442, "index": 774}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Touch My Body is a recorded work.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.091522932052612, "index": 775}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A. P. J. Abdul Kalam was voted in as the Head of State of India.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.29365086555481, "index": 777}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Fly is a film from the United States.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.97824501991272, "index": 776}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The SpongeBob SquarePants Movie stars a cat.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.916640996932983, "index": 778}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Stomp the Yard stars an American actor born in 1982.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.6503989696502686, "index": 780}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The 66th Primetime Emmy Awards was hosted by the host of a show.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.84713888168335, "index": 779}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Burj Khalifa contains zero escalators.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.627920866012573, "index": 781}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In 2012, Simi Valley, California, reported a higher median household income than that of the nation overall.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.8885931968688965, "index": 782}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Louis Malle produced only German language films.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 6.684574842453003, "index": 783}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: One of the most notable features of Zoroastrianism is the belief and doctrine that is focused on the arrival of the messiah.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.973591089248657, "index": 784}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Nottingham Forest F.C. is barred from being a football club.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.078885793685913, "index": 785}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Dodo has been depicted with orange plumage.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.695987939834595, "index": 787}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Henry III assumed the throne when he was 2 years old.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.479000806808472, "index": 786}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vedic Sanskrit is the language of the Vedic texts of Hinduism.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.2587010860443115, "index": 788}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Johnny Van Zant still performs with a band.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.66237998008728, "index": 789}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Veep is a show on television.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.7388927936553955, "index": 790}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A Pet can give companionship to elderly adults.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.466942310333252, "index": 792}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dan Brown died June 22, 1964.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.091111898422241, "index": 791}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: I Want to Know What Love Is is a song.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.952218055725098, "index": 793}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Mom (TV series) has been nominated at an award show.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.692938804626465, "index": 794}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Woman in Black was abandoned by Hammer Film Productions in 2012 in favor of working on Freddie vs. Jason.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.384432792663574, "index": 795}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Milk is a 2003 Dutch film.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.890471935272217, "index": 796}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Anneliese van der Pol had an early career.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.537956237792969, "index": 797}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Issa Rae appears in Awkward Black Girl.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.618194818496704, "index": 798}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Maggie Q starred in a Die Hard movie.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.388076066970825, "index": 799}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vedic Sanskrit is an ancient writing system.\nQ: Was this claim true or false?\nThought: Let's think step by step. True.", "answer": true, "groundtruth": false, "runtime": 6.490332841873169, "index": 800}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Silver Surfer is a dance move popular in East Asia.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.05764365196228, "index": 802}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: House of Balloons is someone's first mixtape.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.321432113647461, "index": 801}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Certain chemicals induce neuromodulation.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.200226068496704, "index": 803}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Eurotas (river) is one of Peloponnese's major rivers.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.277212858200073, "index": 804}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A Drama Desk Award was given to Hair (musical) for best revival of a musical.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.93555474281311, "index": 805}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dev Patel appeared in a movie.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.746503829956055, "index": 807}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Anne Boleyn returned to England.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.308287143707275, "index": 806}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sledgehammer was first performed live in Scotland.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.0057830810546875, "index": 808}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The cinematography of Far from the Madding Crowd was by at least one person.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.072157859802246, "index": 809}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Mandy Moore did not have a career in music.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 7.203073024749756, "index": 810}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Internet access requires the use of hardware like computer terminals.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.886294841766357, "index": 811}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Giver is only a book.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.926064968109131, "index": 812}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Japan is represented by several localized governments.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.500936985015869, "index": 813}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: B. R. Ambedkar was an Indian social reform program.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.280478000640869, "index": 814}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Norman Bates is from the novel Harry Potter.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.118730783462524, "index": 815}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Brent Mydland was a member of the Grateful Dead.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.132577180862427, "index": 816}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Team Fortress 2 development was led by John Cook.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.555924892425537, "index": 818}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sausage Party was directed by Greg Tiernan and Conrad Vernon.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.056544780731201, "index": 817}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ed Gein had exhumed corpses.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.160741806030273, "index": 819}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Estelle Getty was solely Japanese.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.540191888809204, "index": 820}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kenny Chesney was born on March 26th, 1968.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.127729177474976, "index": 821}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Augutus Prew's mother was a clothing designer.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.974735260009766, "index": 822}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: There have been at least 29 Africa Cup of Nations.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.418475151062012, "index": 823}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Action films are a subgenre of martial arts films.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.440589189529419, "index": 824}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Matthew Vaughn was born on May 9th, 1977.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.252264976501465, "index": 825}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Office (US) was filmed in front of a live audience.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.977099180221558, "index": 826}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Unison (Celine Dion album) was originally released in May 1990.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.996709108352661, "index": 827}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Practical Magic is based on a novel that was written by Waluigi.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.575974941253662, "index": 829}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Foot Locker is a retailer from the United States.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.327757120132446, "index": 828}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Absinthe is banned in some countries.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.17051100730896, "index": 830}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Minor League Baseball is a hierarchy of leagues.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.603615999221802, "index": 831}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Oscar Isaac played a fictional character.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.011965990066528, "index": 832}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Research is incapable of testing the validity of instruments.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.927112102508545, "index": 833}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kajol is a civilian woman.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.0927839279174805, "index": 834}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Netscape Navigator is unable to access the internet.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.217890977859497, "index": 835}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Food Network is unavailable in the United States.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.091590166091919, "index": 836}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Baadshah was only dubbed into French.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.791772127151489, "index": 837}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Color of Night did horribly in box office ratings.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.013312101364136, "index": 838}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Prince Charles and Lady Diana were married in July 1981.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.032199859619141, "index": 839}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Brown University's main campus is located in the second largest city in New England.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.671864032745361, "index": 840}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Leslie Alexander is a former bond trader.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.847328186035156, "index": 841}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Planet Hollywood Las Vegas is owned by a corporation based in Paris, Texas.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.560058832168579, "index": 842}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A Pet can only supply physical interaction.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.323181867599487, "index": 844}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pierce County, Washington is the location of the highest mountain of the Blue Mountains of the Pacific Northwest.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.910722732543945, "index": 843}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Bank of America only provides products.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.004715204238892, "index": 845}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Henry Cavill is not a famous actor.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 6.495451927185059, "index": 846}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Gaius Julius Caesar died in Spain.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.736485719680786, "index": 849}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The New England Patriots got to seven Super Bowls.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.336962938308716, "index": 847}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Trouble with the Curve was directed by a squid.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.605189800262451, "index": 848}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Paper stars Michael Keaton and Tom Cruise.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.092947959899902, "index": 850}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Augustus Prew's mother was always unemployed.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 6.144618988037109, "index": 851}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Foot Locker's headquarters are in Mobile, Alabama.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.889193058013916, "index": 852}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Amy Winehouse did not die of alcohol poisoning.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.8966147899627686, "index": 853}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Yugoslavia failed to exist during most of the 20th century.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.197664022445679, "index": 854}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sarah Hyland attended a public school in Chinatown.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.282833814620972, "index": 855}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Richard Fortus is a guitarist of Guns N' Roses.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.6711297035217285, "index": 856}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Stanford prison experiment was financed by a group that coordinates, executes, and advocates the science and technology programs of the U.S. Navy and Marine Corps.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.864133834838867, "index": 857}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Barbarella is based on a comic by Gene Luen Yang.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.672705888748169, "index": 858}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Google Search can find stock quotes.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.6306188106536865, "index": 859}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kyle Maclachlan has been nominated for an Emmy award because of a television series called Twin Peaks.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.872881889343262, "index": 860}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Moesia excluded Romanian Dobrudja.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.516347885131836, "index": 861}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Camp Flog Gnaw is an event.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.946920871734619, "index": 862}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Fidaa is in an Iranian language.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.118113994598389, "index": 863}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Zoroastrianism has no major features.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 7.042541027069092, "index": 864}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Shomu Mukherjee died of a heart attack in November.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.948518753051758, "index": 865}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Numenius of Apamea was a Greek philosopher who lived in Syria.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.554306745529175, "index": 866}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Beverly Hillbillies had ten seasons.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.578682899475098, "index": 867}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Battle of the Trebia took place in the province of Piacenza.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.2574708461761475, "index": 868}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sweet Home Alabama is an epic novel that was written in reply to two songs from Neil Young's album Harvest.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.957350969314575, "index": 869}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Louis Malle worked in a French industry.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.64374303817749, "index": 870}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Gotham got its premiere on Fox.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.302086114883423, "index": 871}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Leslie Alexander owns a team in the NBA.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.867793083190918, "index": 872}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Independent Spirit Awards are held the day before the Academy Awards in Santa Monica.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.834707021713257, "index": 873}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: James Brolin has never appeared in a sitcom.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 7.136399269104004, "index": 874}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Randy Jackson turned down working as a judge for American Idol (season 8).\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.352519750595093, "index": 875}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Samsung entered the construction and shipbuilding industries in the mid-1950s.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.728882312774658, "index": 876}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Freddie Highmore starred in a television series.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.391331911087036, "index": 877}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sean Gunn has no experience acting.\nQ: Was this claim true or false?\nThought: Let's think step by step. False", "answer": false, "groundtruth": false, "runtime": 6.801105976104736, "index": 878}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Norman Bates is a character exclusively from film.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.734468698501587, "index": 879}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The American Civil War ended in 1862.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.994420051574707, "index": 880}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Tenth Doctor makes his penultimate appearance in Journey's End.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.24512791633606, "index": 881}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: University of Chicago Law School is ranked first for \"Faculty quality based on American Academy of Arts and Sciences Membership.\"\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.8402979373931885, "index": 882}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: B. R. Ambedkar spent his whole life in Portugal.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 6.896963834762573, "index": 883}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Gotham premiered in 2015.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.973045110702515, "index": 884}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Two and a Half Men season is incapable of being aired.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.701153755187988, "index": 886}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Heaven Can Wait came out before Here Comes Mr. Jordan.\nQ: Was this claim true or false?\nThought: Let's think step by step. True.\n\nHere's the evidence:\n\n- According to the IMDb, \"Heaven Can Wait\" was released on June 1, 1978.\n- According to the IMDb, \"Here Comes Mr. Jordan\" was released on June 1, 1978.\n\nTherefore, the answer is True.", "answer": true, "groundtruth": false, "runtime": 8.787077903747559, "index": 885}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Bank of America has machines.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.692176103591919, "index": 887}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: See You on the Other Side was put out by Korn in 2002.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.101842880249023, "index": 888}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Tennessee was the last state to join the Confederacy.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.443767070770264, "index": 889}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Resident Evil is a film.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.219186782836914, "index": 890}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kate Walsh was on a sitcom.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.655561208724976, "index": 891}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jimi Hendrix was a person.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.525975704193115, "index": 892}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Matthew Vaughn was renamed Matthew Allard Robert Vaughn.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.824991941452026, "index": 893}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Times Higher Education World University Rankings is released yearly.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.469054222106934, "index": 894}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Manchester United F.C. was the world's highest-earning tennis club for a season.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.613086938858032, "index": 895}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Trouble with the Curve is only a podcast.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.902469873428345, "index": 896}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Michael Hutchence died on November 12th, 1997.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.281692028045654, "index": 897}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Mamata Banerjee was born on January 5th, 1955.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.834247350692749, "index": 898}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Invisible Man was based on a H. G. Wells novel.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.5884690284729, "index": 899}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hammer Film Productions has worked on horror movies.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.241387128829956, "index": 900}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: LinkedIn has yet to be made available in the Turkish language.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.833387136459351, "index": 901}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kenny Chesney's full name is Kenny Clark Chesney.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.8191070556640625, "index": 902}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ronaldinho has scored 33 goals for the Brazil national football team in the past decade.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.152569770812988, "index": 903}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jason Bourne is a famous army general.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.244512557983398, "index": 904}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Raja Hindustani was directed by 5 directors each from a different region of India.\nQ: Was this claim true or false?\nThought: Let's think step by step. True.", "answer": true, "groundtruth": false, "runtime": 6.506510019302368, "index": 905}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Solanum contains flora that have fruit.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.084956884384155, "index": 906}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Independent Spirit Awards are held the day before the Golden Globe Awards.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.048098802566528, "index": 907}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: John S. McCain Jr. went to school.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.838574647903442, "index": 908}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vic Mensa has never been to Illinois.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.3250439167022705, "index": 909}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The soundtrack of Far from the Madding Crowd was only by George Clooney.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.84009313583374, "index": 910}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Adidas is German.\nQ: Was this claim true or false?\nThought: Let's think step by step. True.", "answer": true, "groundtruth": true, "runtime": 6.396031141281128, "index": 912}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Salman Rushdie won a literary prize.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.397234201431274, "index": 911}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: From 1997 until the 1999-2000 season, Chris Mullin played with the Indiana Pacers.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.248115301132202, "index": 913}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Land plants are multicellular organisms.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.043958902359009, "index": 914}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Robert Singer (producer) is incapable of writing.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.6467039585113525, "index": 915}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Revolver has topped multiple charts.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.026506185531616, "index": 916}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pitch Perfect 2 centers on a fictional educational institution.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.956929922103882, "index": 917}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Rebel in the Rye only aired in 2005.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 6.540572881698608, "index": 918}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Tangled was a direct-to-video film.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.723683834075928, "index": 919}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Nymphomaniac (film) is part of a trilogy.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.365750074386597, "index": 920}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: See You on the Other Side was certified mildew in the US in January 2006.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.902956008911133, "index": 922}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Alvin and the Chipmunks is a Chinese film.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 6.550105810165405, "index": 923}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: No Strings Attached only ever came out in 2007.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.\n\nThe band released a greatest-hits album in 2007 titled No Strings Attached. However, the album was not a comprehensive greatest-hits album. It only included a few tracks from the band's catalogue, and was not a compilation of their entire career.", "answer": null, "groundtruth": false, "runtime": 8.85421895980835, "index": 921}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Indian National Congress was founded during the British Raj.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.8554089069366455, "index": 924}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Benjamin Walker (actor) is a stand up performer.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.74182915687561, "index": 925}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Challenge XXX: Dirty 30 is a season in America's Next Top Model.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.89002799987793, "index": 926}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A Good Day to Die Hard was directed by John Moore.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.831878185272217, "index": 927}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hollow Man has a sequel called Hollow Man 2 released in 2006.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.8769371509552, "index": 928}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Edouard Seguin worked in a place.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.718896865844727, "index": 929}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: American Library Association is old.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.241425037384033, "index": 930}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The ovary is found in the legs.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.84757399559021, "index": 932}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Brian De Palma is a Westerner.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.368884086608887, "index": 933}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sonny Bono, whose full name is Salvatore Phillip Bono, was born on February 16, 1935.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 8.271728992462158, "index": 931}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Netscape Navigator was a web browser.\nQ: Was this claim true or false?\nThought: Let's think step by step. True.", "answer": true, "groundtruth": true, "runtime": 6.1871418952941895, "index": 935}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Becoming chief justice was William Howard Taft's personal ambition.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.99184513092041, "index": 934}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Hermit crabs are chilopods.\nQ: Was this claim true or false?\nThought: Let's think step by step. True.", "answer": true, "groundtruth": false, "runtime": 6.940253973007202, "index": 937}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Akon has had more than ten songs certified as 1 \u00d7 platinum.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.642745733261108, "index": 938}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Sarah Hyland is from Mars.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 6.373763084411621, "index": 939}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Nobel Prize in Chemistry was given to a human from Holland.\nQ: Was this claim true or false?\nThought: Let's think step by step. False. The Nobel Prize in Chemistry 1998 was awarded to the American chemist J. Michael Bishop, who shared the prize with the French chemist Francois Jacob.", "answer": false, "groundtruth": true, "runtime": 7.996819257736206, "index": 936}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jerome Flynn is exclusively an American.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.190598249435425, "index": 940}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Shut Up debuted at number 71.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.582118988037109, "index": 941}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Automated teller machines are part of Bank of America.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.160114765167236, "index": 942}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Michael Hutchence has yet to die.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.044947862625122, "index": 945}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Matthew Vaughn is incapable of being a film producer and director.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.546879053115845, "index": 943}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Tyler Perry is incapable of songwriting.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.817827224731445, "index": 944}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Heath Ledger did not direct music videos.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 5.107698917388916, "index": 946}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Simon Cowell has donated zero dollars to anything ever.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 7.362741947174072, "index": 947}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A Good Day to Die Hard was directed by John Moore in 2008.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.7955992221832275, "index": 949}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Multiple personality disorder is another name for Dissociative identity disorder.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.580932140350342, "index": 950}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Salt River Valley is on the Mississippi River.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.369741201400757, "index": 948}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ice-T signed to Motown Records in 1987.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 4.747848987579346, "index": 951}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: One Flew Over the Cuckoo's Nest only won one Academy Award.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.185621023178101, "index": 952}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Personality is unaffected by the development of values.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.205911159515381, "index": 954}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Yugoslavia failed to be a country.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.003216028213501, "index": 955}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Virginia transitioned from an agricultural to industrial economy during the Civil War.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.47577428817749, "index": 953}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pearl (Steven Universe) is a fictional alien being.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.126353025436401, "index": 956}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: See.SZA.Run is a picture book.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.204035758972168, "index": 957}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Trouble with the Curve was only released in 2013.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.084223031997681, "index": 958}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: For two hundred and nineteen years, The Times printed in broadsheet format.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.865699768066406, "index": 961}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Mike Friedrich is a comic book writer.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.326860189437866, "index": 959}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Google Search shows no home information.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.581372022628784, "index": 960}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Arjit Singh is male.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.180448055267334, "index": 962}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: L. Ron Hubbard passed away in 1986.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.712865114212036, "index": 966}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Michael Hutchence has yet to die.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.166021108627319, "index": 965}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jed Whedon was born in December.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 7.598435163497925, "index": 963}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ares is not an Olympian.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.590245723724365, "index": 964}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Suite Life of Zack & Cody was created by Danny Kallis.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.79213285446167, "index": 967}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: There was a republic of the Soviet Union called the Latvian Soviet Socialist Republic.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.985304117202759, "index": 968}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Anne Boleyn went back to England.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.988264799118042, "index": 970}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ragtime was released in 1965.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.527595043182373, "index": 969}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Google Search can return monetary conversions.\nQ: Was this claim true or false?\nThought: Let's think step by step. False. Google Search cannot return monetary conversions.", "answer": false, "groundtruth": true, "runtime": 7.390138149261475, "index": 971}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The House of the Spirits is about the life of a young lady during the military dictatorship in Chile.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.179107904434204, "index": 972}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Goldie Hawn was in one movie with Chevy Chase.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.935235977172852, "index": 973}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A United Kingdom is unassociated with Amma Asante.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.50655198097229, "index": 975}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Love Club EP is too short to qualify as an album.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.157745122909546, "index": 974}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Move (Little Mix song) was released on the radio in September of 2013.\nQ: Was this claim true or false?\nThought: Let's think step by step. False. The song was released on 21 August 2013.", "answer": false, "groundtruth": true, "runtime": 7.138245105743408, "index": 976}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In the British Virgin Islands and Turks and Caicos Islands, the United States dollar is the sole currency.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.641134023666382, "index": 977}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ian Gillan is a dog.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 6.92702317237854, "index": 978}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Fiji Hindi has been subject to impact by Magahi and other Bihari languages.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.270869970321655, "index": 980}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Qin dynasty dates back to 221 BC.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.74626612663269, "index": 979}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A United Kingdom is a biographical romantic comedy film.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.174324035644531, "index": 981}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Pitch Perfect 2 is a recorded work.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.508047103881836, "index": 982}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Norman Bates is a character.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.169350862503052, "index": 983}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Dulquer Salmaan refused to ever become an actor.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.900700092315674, "index": 984}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Times Higher Education World University Rankings is a publication of rankings by The Chronicle of Higher Education.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.038457870483398, "index": 985}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The SpongeBob SquarePants Movie is a dog.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 6.667539834976196, "index": 986}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Daredevil is based on the Marvel Comics character of the same name.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.442022323608398, "index": 987}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Chinatown was written by Robert Towne.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.089679956436157, "index": 988}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Toy Story 2 was released in 2004.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.223962783813477, "index": 989}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: FC Bayern Munich was founded by only one football player.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.2086098194122314, "index": 990}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: SpongeBob SquarePants is a movie.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.524294853210449, "index": 991}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Call centers are part of Bank of America.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.372903823852539, "index": 992}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: In 1966, George Harrison got married for the first time.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.735263109207153, "index": 993}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Coughing up blood is not one symptom of pulmonary embolism.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.187111139297485, "index": 994}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Georgians arose from the ancient literary works.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 7.37113094329834, "index": 995}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Ayananka Bose is Canadian.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.154160022735596, "index": 996}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Mandy Moore is a Canadian film actress.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.540414094924927, "index": 997}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: House of Balloons is something other than a mixtape.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.066097974777222, "index": 998}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Jamie Lee Curtis only starred in Rob Zombie's Halloween.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 6.7412190437316895, "index": 999}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Deepika Padukone has appeared in more than three Indian movies.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.091329097747803, "index": 1001}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Latvian Soviet Socialist Republic was a state of the Soviet Union.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 7.414122819900513, "index": 1000}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The English Wikipedia is an edition of an expensive online encyclopedia.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.748162746429443, "index": 1002}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Designated Survivor (TV series) is part of ABC.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.017027139663696, "index": 1003}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Shane Black directed The Nice Guys.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.4362952709198, "index": 1004}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Zac Efron only acts.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.857134103775024, "index": 1005}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Some level of success is had by Scream.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.177525043487549, "index": 1006}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Nobody took Hebe's job after her.\nQ: Was this claim true or false?\nThought: Let's think step by step. False", "answer": false, "groundtruth": false, "runtime": 7.061301946640015, "index": 1007}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Syco was established by Simon Cowell.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.987782001495361, "index": 1008}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Pakistan Movement was only the result of enemy invasion.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 6.81782603263855, "index": 1009}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: LinkedIn has been available in the Turkish language since July 2015.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.492873907089233, "index": 1010}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Spider-Man 2 was released in 2004.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.0517919063568115, "index": 1011}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Kenny Chesney is American.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.145192861557007, "index": 1012}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Two and a Half Men featured Charlie Sheen.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.865130186080933, "index": 1013}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Caesar is an adaptation of Shakespeare's Julius Caesar.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 7.4275031089782715, "index": 1014}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Augustus Prew's dad was incapable of taking photographs.\nQ: Was this claim true or false?\nThought: Let's think step by step. False.", "answer": false, "groundtruth": false, "runtime": 6.9563257694244385, "index": 1015}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Species distribution can be understood through many factors except continental drift.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.394129991531372, "index": 1016}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The Latvian Soviet Socialist Republic is known by at least one other name.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.636122941970825, "index": 1017}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Tennessee is in America.\nQ: Was this claim true or false?\nThought: Let's think step by step. True. Tennessee is in the United States of America.", "answer": true, "groundtruth": true, "runtime": 6.759246826171875, "index": 1018}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Prague's historic center is not on UNESCO's list of World Heritage Sites.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.948504686355591, "index": 1019}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Vedic Sanskrit is a language of ancient times.\nQ: Was this claim true or false?\nThought: Let's think step by step. True.", "answer": true, "groundtruth": true, "runtime": 6.685220003128052, "index": 1020}, {"correct": false, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: Carol Danvers is a fictional setting.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": false, "runtime": 6.3484838008880615, "index": 1021}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: A thunderstorm is a type of weather.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 6.193188905715942, "index": 1022}, {"correct": true, "exception": "None", "pdl_document": "Task: On June 2017, the following claim was made: The University of Leicester discovered and identified the remains of a king.\nQ: Was this claim true or false?\nThought: Let's think step by step. True", "answer": true, "groundtruth": true, "runtime": 5.702728986740112, "index": 1023}], "metric": 0.5673828125, "runtime": 1425.5426828861237}, "timestamp_before": 1738557975.653041, "timestamp_after": 1738559401.2572281, "score": 0.5673828125}, "winner_summary": {"model": "watsonx/ibm/granite-34b-code-instruct", "prompt_pattern": "cot", "demonstrations": []}}