[
    {
        "question": "Tumpus is bright. Lempus is tumpus. Max is lempus.",
        "query": "True or false: Max is bright.",
        "answer": "Max is lempus. Lempus is tumpus. Max is tumpus. Tumpus is bright. Max is bright. True",
        "label": "True",
        "prompt": "Tumpus is bright. Lempus is tumpus. Max is lempus. True or false: Max is bright. Let us think step by step.",
        "generated": "Max is lempus. Lempus is tumpus. Max is tumpus. Tumpus is bright. Max is bright. True",
        "noise_response_0": "",
        "noise_prompt_0": "Tumpus is bright. Lempus is tumpus. Max is lempus. True or false: Alex is bright. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Max is",
        "noise_prompt_1": "Tumpus is bright. Lempus is tumpus. Max is Wumpus. True or false: Max is bright. Let us think step by step.",
        "response_1": "Max is",
        "noise_response_2": "Max is lempus.",
        "noise_prompt_2": "Tumpus is bright. Impus is tumpus. Max is lempus. True or false: Max is bright. Let us think step by step.",
        "response_2": "Max is lempus.",
        "noise_response_3": "Max is lempus. Lempus is",
        "noise_prompt_3": "Tumpus is bright. Lempus is nervous. Max is lempus. True or false: Max is bright. Let us think step by step.",
        "response_3": "Max is lempus. Lempus is",
        "noise_response_4": "Wren is lempus. Lempus is tumpus.",
        "noise_prompt_4": "Tumpus is bright. Lempus is tumpus. Max is lempus. True or false: Max is bright. Let us think step by step.",
        "response_4": "Max is lempus. Lempus is tumpus.",
        "noise_response_5": "Max is lempus. Lempus is hot. Max is",
        "noise_prompt_5": "Tumpus is bright. Lempus is tumpus. Max is lempus. True or false: Max is bright. Let us think step by step.",
        "response_5": "Max is lempus. Lempus is tumpus. Max is",
        "noise_response_6": "Max is lempus. Lempus is tumpus. Max is tumpus.",
        "noise_prompt_6": "Zumpus is bright. Lempus is tumpus. Max is lempus. True or false: Max is bright. Let us think step by step.",
        "response_6": "Max is lempus. Lempus is tumpus. Max is tumpus.",
        "noise_response_7": "Max is lempus. Lempus is tumpus. Max is tumpus. Tumpus is",
        "noise_prompt_7": "Tumpus is bright. Lempus is tumpus. Max is lempus. True or false: Max is shy. Let us think step by step.",
        "response_7": "Max is lempus. Lempus is tumpus. Max is tumpus. Tumpus is",
        "noise_response_8": "Max is lempus. Lempus is tumpus. Fae is tumpus. Tumpus is bright.",
        "noise_prompt_8": "Tumpus is bright. Lempus is tumpus. Max is lempus. True or false: Max is bright. Let us think step by step.",
        "response_8": "Max is lempus. Lempus is tumpus. Max is tumpus. Tumpus is bright.",
        "noise_response_9": "Max is lempus. Lempus is tumpus. Max is tumpus. Tumpus is happy. Max is",
        "noise_prompt_9": "Tumpus is bright. Lempus is tumpus. Max is lempus. True or false: Max is bright. Let us think step by step.",
        "response_9": "Max is lempus. Lempus is tumpus. Max is tumpus. Tumpus is bright. Max is",
        "noise_prompt_10": "Tumpus is bright. Lempus is tumpus. Max is lempus. True or false: Max is bright. Let us think step by step.",
        "response_10": "Max is lempus. Lempus is tumpus. Max is tumpus. Tumpus is bright. Max is bright.",
        "noise_response_10": "Max is lempus. Lempus is tumpus. Max is tumpus. Tumpus is bright. Max is rainy.",
        "answer_token_id_0": 7976,
        "answer_token_pos_0": 380,
        "answer_token_0": "Max",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 454,
        "answer_token_pos_1": 383,
        "answer_token_1": "le",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 365,
        "answer_token_pos_2": 387,
        "answer_token_2": "L",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 260,
        "answer_token_pos_3": 391,
        "answer_token_3": "t",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 5918,
        "answer_token_pos_4": 395,
        "answer_token_4": "Max",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 260,
        "answer_token_pos_5": 398,
        "answer_token_5": "t",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 323,
        "answer_token_pos_6": 402,
        "answer_token_6": "T",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 11785,
        "answer_token_pos_7": 406,
        "answer_token_7": "bright",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 5918,
        "answer_token_pos_8": 410,
        "answer_token_8": "Max",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 11785,
        "answer_token_pos_9": 413,
        "answer_token_9": "bright",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Impuses are happy. Sterpus is impus. Sam is sterpus.",
        "query": "True or false: Sam is happy.",
        "answer": "Sam is sterpus. Sterpus is impus. Sam is impus. Impuses are happy. Sam is happy. True",
        "label": "True",
        "prompt": "Impuses are happy. Sterpus is impus. Sam is sterpus. True or false: Sam is happy. Let us think step by step.",
        "generated": "Sam is sterpus. Sterpus is impus. Sam is impus. Impuses are happy. Sam is happy. True",
        "noise_response_0": "",
        "noise_prompt_0": "Impuses are happy. Sterpus is impus. Sam is sterpus. True or false: Polly is happy. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Sam is",
        "noise_prompt_1": "Impuses are happy. Sterpus is impus. Sam is wumpus. True or false: Sam is happy. Let us think step by step.",
        "response_1": "Sam is",
        "noise_response_2": "Sam is sterpus.",
        "noise_prompt_2": "Impuses are happy. rompus is impus. Sam is sterpus. True or false: Sam is happy. Let us think step by step.",
        "response_2": "Sam is sterpus.",
        "noise_response_3": "Sam is sterpus. Sterpus is",
        "noise_prompt_3": "Impuses are happy. Sterpus is rompus. Sam is sterpus. True or false: Sam is happy. Let us think step by step.",
        "response_3": "Sam is sterpus. Sterpus is",
        "noise_response_4": "Polly is sterpus. Sterpus is impus.",
        "noise_prompt_4": "Impuses are happy. Sterpus is impus. Sam is sterpus. True or false: Sam is happy. Let us think step by step.",
        "response_4": "Sam is sterpus. Sterpus is impus.",
        "noise_response_5": "Sam is sterpus. Sterpus is sterpus. Sam is",
        "noise_prompt_5": "Impuses are happy. Sterpus is impus. Sam is sterpus. True or false: Sam is happy. Let us think step by step.",
        "response_5": "Sam is sterpus. Sterpus is impus. Sam is",
        "noise_response_6": "Sam is sterpus. Sterpus is impus. Sam is impus.",
        "noise_prompt_6": "Tumpus are happy. Sterpus is impus. Sam is sterpus. True or false: Sam is happy. Let us think step by step.",
        "response_6": "Sam is sterpus. Sterpus is impus. Sam is impus.",
        "noise_response_7": "Sam is sterpus. Sterpus is impus. Sam is impus. Impuses are",
        "noise_prompt_7": "Impuses are happy. Sterpus is impus. Sam is sterpus. True or false: Sam is dull. Let us think step by step.",
        "response_7": "Sam is sterpus. Sterpus is impus. Sam is impus. Impuses are",
        "noise_response_8": "Sam is sterpus. Sterpus is impus. Rex is impus. Impuses are happy.",
        "noise_prompt_8": "Impuses are happy. Sterpus is impus. Sam is sterpus. True or false: Sam is happy. Let us think step by step.",
        "response_8": "Sam is sterpus. Sterpus is impus. Sam is impus. Impuses are happy.",
        "noise_response_9": "Sam is sterpus. Sterpus is impus. Sam is impus. Impuses are sweet. Sam is",
        "noise_prompt_9": "Impuses are happy. Sterpus is impus. Sam is sterpus. True or false: Sam is happy. Let us think step by step.",
        "response_9": "Sam is sterpus. Sterpus is impus. Sam is impus. Impuses are happy. Sam is",
        "noise_prompt_10": "Impuses are happy. Sterpus is impus. Sam is sterpus. True or false: Sam is happy. Let us think step by step.",
        "response_10": "Sam is sterpus. Sterpus is impus. Sam is impus. Impuses are happy. Sam is happy.",
        "noise_response_10": "Sam is sterpus. Sterpus is impus. Sam is impus. Impuses are happy. Sam is sunny.",
        "answer_token_id_0": 29903,
        "answer_token_pos_0": 380,
        "answer_token_0": "S",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 16864,
        "answer_token_pos_1": 383,
        "answer_token_1": "ster",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 28588,
        "answer_token_pos_2": 387,
        "answer_token_2": "Ster",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 2411,
        "answer_token_pos_3": 391,
        "answer_token_3": "imp",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 3685,
        "answer_token_pos_4": 395,
        "answer_token_4": "Sam",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 2411,
        "answer_token_pos_5": 398,
        "answer_token_5": "imp",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 14305,
        "answer_token_pos_6": 402,
        "answer_token_6": "Imp",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 9796,
        "answer_token_pos_7": 406,
        "answer_token_7": "happy",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 3685,
        "answer_token_pos_8": 410,
        "answer_token_8": "Sam",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 9796,
        "answer_token_pos_9": 413,
        "answer_token_9": "happy",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Shumpuses are overcast. Zumpus is shumpus. Sally is zumpus.",
        "query": "True or false: Sally is large.",
        "answer": "Sally is zumpus. Zumpus is shumpus. Sally is shumpus. Shumpuses are overcast. Sally is overcast. False",
        "label": "False",
        "prompt": "Shumpuses are overcast. Zumpus is shumpus. Sally is zumpus. True or false: Sally is large. Let us think step by step.",
        "generated": "Sally is zumpus. Zumpus is shumpus. Sally is shumpus. Shumpuses are overcast. Sally is overcast. False",
        "noise_response_0": "",
        "noise_prompt_0": "Shumpuses are overcast. Zumpus is shumpus. Sally is zumpus. True or false: Max is large. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Sally is",
        "noise_prompt_1": "Shumpuses are overcast. Zumpus is shumpus. Sally is zumpus. True or false: Sally is large. Let us think step by step.",
        "response_1": "Sally is",
        "noise_response_2": "Sally is zumpus.",
        "noise_prompt_2": "Shumpuses are overcast. Vumpus is shumpus. Sally is zumpus. True or false: Sally is large. Let us think step by step.",
        "response_2": "Sally is zumpus.",
        "noise_response_3": "Sally is zumpus. Zumpus is",
        "noise_prompt_3": "Shumpuses are overcast. Zumpus is slow. Sally is zumpus. True or false: Sally is large. Let us think step by step.",
        "response_3": "Sally is zumpus. Zumpus is",
        "noise_response_4": "Max is zumpus. Zumpus is shumpus.",
        "noise_prompt_4": "Shumpuses are overcast. Zumpus is shumpus. Sally is zumpus. True or false: Sally is large. Let us think step by step.",
        "response_4": "Sally is zumpus. Zumpus is shumpus.",
        "noise_response_5": "Sally is zumpus. Zumpus is windy. Sally is",
        "noise_prompt_5": "Shumpuses are overcast. Zumpus is shumpus. Sally is zumpus. True or false: Sally is large. Let us think step by step.",
        "response_5": "Sally is zumpus. Zumpus is shumpus. Sally is",
        "noise_response_6": "Sally is zumpus. Zumpus is shumpus. Sally is shumpus.",
        "noise_prompt_6": "rompus are overcast. Zumpus is shumpus. Sally is zumpus. True or false: Sally is large. Let us think step by step.",
        "response_6": "Sally is zumpus. Zumpus is shumpus. Sally is shumpus.",
        "noise_response_7": "Sally is zumpus. Zumpus is shumpus. Sally is shumpus. Shumpuses are",
        "noise_prompt_7": "Shumpuses are dull. Zumpus is shumpus. Sally is zumpus. True or false: Sally is large. Let us think step by step.",
        "response_7": "Sally is zumpus. Zumpus is shumpus. Sally is shumpus. Shumpuses are",
        "noise_response_8": "Sally is zumpus. Zumpus is shumpus. Sally is shumpus. Wren are overcast.",
        "noise_prompt_8": "Shumpuses are overcast. Zumpus is shumpus. Sally is zumpus. True or false: Sally is large. Let us think step by step.",
        "response_8": "Sally is zumpus. Zumpus is shumpus. Sally is shumpus. Shumpuses are overcast.",
        "noise_response_9": "Sally is zumpus. Zumpus is shumpus. Sally is shumpus. Shumpuses are temperate. Sally is",
        "noise_prompt_9": "Shumpuses are overcast. Zumpus is shumpus. Sally is zumpus. True or false: Sally is large. Let us think step by step.",
        "response_9": "Sally is zumpus. Zumpus is shumpus. Sally is shumpus. Shumpuses are overcast. Sally is",
        "noise_prompt_10": "Shumpuses are overcast. Zumpus is shumpus. Sally is zumpus. True or false: Sally is large. Let us think step by step.",
        "response_10": "Sally is zumpus. Zumpus is shumpus. Sally is shumpus. Shumpuses are overcast. Sally is overcast.",
        "noise_response_10": "Sally is zumpus. Zumpus is shumpus. Sally is shumpus. Shumpuses are overcast. Sally is wooden.",
        "answer_token_id_0": 29903,
        "answer_token_pos_0": 380,
        "answer_token_0": "S",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 3356,
        "answer_token_pos_1": 383,
        "answer_token_1": "zum",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 796,
        "answer_token_pos_2": 387,
        "answer_token_2": "Z",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 528,
        "answer_token_pos_3": 391,
        "answer_token_3": "sh",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 317,
        "answer_token_pos_4": 395,
        "answer_token_4": "S",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 528,
        "answer_token_pos_5": 398,
        "answer_token_5": "sh",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 1383,
        "answer_token_pos_6": 402,
        "answer_token_6": "Sh",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 975,
        "answer_token_pos_7": 406,
        "answer_token_7": "over",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 317,
        "answer_token_pos_8": 410,
        "answer_token_8": "S",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 975,
        "answer_token_pos_9": 413,
        "answer_token_9": "over",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Impuses are sunny. Brimpuses are impuses. Alex is brimpus.",
        "query": "True or false: Alex is transparent.",
        "answer": "Alex is brimpus. Brimpuses are impuses. Alex is impus. Impuses are sunny. Alex is sunny. False",
        "label": "False",
        "prompt": "Impuses are sunny. Brimpuses are impuses. Alex is brimpus. True or false: Alex is transparent. Let us think step by step.",
        "generated": "Alex is brimpus. Brimpuses are impuses. Alex is impus. Impuses are sunny. Alex is sunny. False",
        "noise_response_0": "",
        "noise_prompt_0": "Impuses are sunny. Brimpuses are impuses. Alex is brimpus. True or false: Stella is transparent. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Alex is",
        "noise_prompt_1": "Impuses are sunny. Brimpuses are impuses. Alex is angry. True or false: Alex is transparent. Let us think step by step.",
        "response_1": "Alex is",
        "noise_response_2": "Alex is brimpus.",
        "noise_prompt_2": "Impuses are sunny. yumpus are impuses. Alex is brimpus. True or false: Alex is transparent. Let us think step by step.",
        "response_2": "Alex is brimpus.",
        "noise_response_3": "Alex is brimpus. Brimpuses are",
        "noise_prompt_3": "Impuses are sunny. Brimpuses are Gorpus. Alex is brimpus. True or false: Alex is transparent. Let us think step by step.",
        "response_3": "Alex is brimpus. Brimpuses are",
        "noise_response_4": "Stella is brimpus. Brimpuses are impuses.",
        "noise_prompt_4": "Impuses are sunny. Brimpuses are impuses. Alex is brimpus. True or false: Alex is transparent. Let us think step by step.",
        "response_4": "Alex is brimpus. Brimpuses are impuses.",
        "noise_response_5": "Alex is brimpus. Brimpuses are sterpus. Alex is",
        "noise_prompt_5": "Impuses are sunny. Brimpuses are impuses. Alex is brimpus. True or false: Alex is transparent. Let us think step by step.",
        "response_5": "Alex is brimpus. Brimpuses are impuses. Alex is",
        "noise_response_6": "Alex is brimpus. Brimpuses are impuses. Alex is impus.",
        "noise_prompt_6": "rompus are sunny. Brimpuses are impuses. Alex is brimpus. True or false: Alex is transparent. Let us think step by step.",
        "response_6": "Alex is brimpus. Brimpuses are impuses. Alex is impus.",
        "noise_response_7": "Alex is brimpus. Brimpuses are impuses. Alex is impus. Impuses are",
        "noise_prompt_7": "Impuses are discordant. Brimpuses are impuses. Alex is brimpus. True or false: Alex is transparent. Let us think step by step.",
        "response_7": "Alex is brimpus. Brimpuses are impuses. Alex is impus. Impuses are",
        "noise_response_8": "Alex is brimpus. Brimpuses are impuses. Rex is impus. Impuses are sunny.",
        "noise_prompt_8": "Impuses are sunny. Brimpuses are impuses. Alex is brimpus. True or false: Alex is transparent. Let us think step by step.",
        "response_8": "Alex is brimpus. Brimpuses are impuses. Alex is impus. Impuses are sunny.",
        "noise_response_9": "Alex is brimpus. Brimpuses are impuses. Alex is impus. Impuses are small. Alex is",
        "noise_prompt_9": "Impuses are sunny. Brimpuses are impuses. Alex is brimpus. True or false: Alex is transparent. Let us think step by step.",
        "response_9": "Alex is brimpus. Brimpuses are impuses. Alex is impus. Impuses are sunny. Alex is",
        "noise_prompt_10": "Impuses are sunny. Brimpuses are impuses. Alex is brimpus. True or false: Alex is transparent. Let us think step by step.",
        "response_10": "Alex is brimpus. Brimpuses are impuses. Alex is impus. Impuses are sunny. Alex is sunny.",
        "noise_response_10": "Alex is brimpus. Brimpuses are impuses. Alex is impus. Impuses are sunny. Alex is feisty.",
        "answer_token_id_0": 17406,
        "answer_token_pos_0": 380,
        "answer_token_0": "Alex",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 1506,
        "answer_token_pos_1": 383,
        "answer_token_1": "br",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 1771,
        "answer_token_pos_2": 387,
        "answer_token_2": "Br",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 2411,
        "answer_token_pos_3": 391,
        "answer_token_3": "imp",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 4827,
        "answer_token_pos_4": 395,
        "answer_token_4": "Alex",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 2411,
        "answer_token_pos_5": 398,
        "answer_token_5": "imp",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 14305,
        "answer_token_pos_6": 402,
        "answer_token_6": "Imp",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 6575,
        "answer_token_pos_7": 406,
        "answer_token_7": "sun",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 4827,
        "answer_token_pos_8": 410,
        "answer_token_8": "Alex",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 6575,
        "answer_token_pos_9": 413,
        "answer_token_9": "sun",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Tumpus is opaque. Yumpuses are tumpuses. Fae is yumpus.",
        "query": "True or false: Fae is opaque.",
        "answer": "Fae is yumpus. Yumpuses are tumpuses. Fae is tumpus. Tumpus is opaque. Fae is opaque. True",
        "label": "True",
        "prompt": "Tumpus is opaque. Yumpuses are tumpuses. Fae is yumpus. True or false: Fae is opaque. Let us think step by step.",
        "generated": "Fae is yumpus. Yumpuses are tumpuses. Fae is tumpus. Tumpus is opaque. Fae is opaque. True",
        "noise_response_0": "",
        "noise_prompt_0": "Tumpus is opaque. Yumpuses are tumpuses. Fae is yumpus. True or false: Alex is opaque. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Fae is",
        "noise_prompt_1": "Tumpus is opaque. Yumpuses are tumpuses. Fae is jompus. True or false: Fae is opaque. Let us think step by step.",
        "response_1": "Fae is",
        "noise_response_2": "Fae is yumpus.",
        "noise_prompt_2": "Tumpus is opaque. dumpus are tumpuses. Fae is yumpus. True or false: Fae is opaque. Let us think step by step.",
        "response_2": "Fae is yumpus.",
        "noise_response_3": "Fae is yumpus. Yumpuses are",
        "noise_prompt_3": "Tumpus is opaque. Yumpuses are amenable. Fae is yumpus. True or false: Fae is opaque. Let us think step by step.",
        "response_3": "Fae is yumpus. Yumpuses are",
        "noise_response_4": "Polly is yumpus. Yumpuses are tumpuses.",
        "noise_prompt_4": "Tumpus is opaque. Yumpuses are tumpuses. Fae is yumpus. True or false: Fae is opaque. Let us think step by step.",
        "response_4": "Fae is yumpus. Yumpuses are tumpuses.",
        "noise_response_5": "Fae is yumpus. Yumpuses are sour. Fae is",
        "noise_prompt_5": "Tumpus is opaque. Yumpuses are tumpuses. Fae is yumpus. True or false: Fae is opaque. Let us think step by step.",
        "response_5": "Fae is yumpus. Yumpuses are tumpuses. Fae is",
        "noise_response_6": "Fae is yumpus. Yumpuses are tumpuses. Fae is tumpus.",
        "noise_prompt_6": "Sterpus is opaque. Yumpuses are tumpuses. Fae is yumpus. True or false: Fae is opaque. Let us think step by step.",
        "response_6": "Fae is yumpus. Yumpuses are tumpuses. Fae is tumpus.",
        "noise_response_7": "Fae is yumpus. Yumpuses are tumpuses. Fae is tumpus. Tumpus is",
        "noise_prompt_7": "Tumpus is opaque. Yumpuses are tumpuses. Fae is yumpus. True or false: Fae is fast. Let us think step by step.",
        "response_7": "Fae is yumpus. Yumpuses are tumpuses. Fae is tumpus. Tumpus is",
        "noise_response_8": "Fae is yumpus. Yumpuses are tumpuses. Sam is tumpus. Tumpus is opaque.",
        "noise_prompt_8": "Tumpus is opaque. Yumpuses are tumpuses. Fae is yumpus. True or false: Fae is opaque. Let us think step by step.",
        "response_8": "Fae is yumpus. Yumpuses are tumpuses. Fae is tumpus. Tumpus is opaque.",
        "noise_response_9": "Fae is yumpus. Yumpuses are tumpuses. Fae is tumpus. Tumpus is brown. Fae is",
        "noise_prompt_9": "Tumpus is opaque. Yumpuses are tumpuses. Fae is yumpus. True or false: Fae is opaque. Let us think step by step.",
        "response_9": "Fae is yumpus. Yumpuses are tumpuses. Fae is tumpus. Tumpus is opaque. Fae is",
        "noise_prompt_10": "Tumpus is opaque. Yumpuses are tumpuses. Fae is yumpus. True or false: Fae is opaque. Let us think step by step.",
        "response_10": "Fae is yumpus. Yumpuses are tumpuses. Fae is tumpus. Tumpus is opaque. Fae is opaque.",
        "noise_response_10": "Fae is yumpus. Yumpuses are tumpuses. Fae is tumpus. Tumpus is opaque. Fae is luminous.",
        "answer_token_id_0": 29943,
        "answer_token_pos_0": 380,
        "answer_token_0": "F",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 343,
        "answer_token_pos_1": 383,
        "answer_token_1": "y",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 612,
        "answer_token_pos_2": 387,
        "answer_token_2": "Y",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 260,
        "answer_token_pos_3": 391,
        "answer_token_3": "t",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 383,
        "answer_token_pos_4": 395,
        "answer_token_4": "F",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 260,
        "answer_token_pos_5": 398,
        "answer_token_5": "t",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 323,
        "answer_token_pos_6": 402,
        "answer_token_6": "T",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 1015,
        "answer_token_pos_7": 406,
        "answer_token_7": "op",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 383,
        "answer_token_pos_8": 410,
        "answer_token_8": "F",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 1015,
        "answer_token_pos_9": 413,
        "answer_token_9": "op",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Yumpuses are spicy. Jompuses are yumpuses. Polly is jompus.",
        "query": "True or false: Polly is spicy.",
        "answer": "Polly is jompus. Jompuses are yumpuses. Polly is yumpus. Yumpuses are spicy. Polly is spicy. True",
        "label": "True",
        "prompt": "Yumpuses are spicy. Jompuses are yumpuses. Polly is jompus. True or false: Polly is spicy. Let us think step by step.",
        "generated": "Polly is jompus. Jompuses are yumpuses. Polly is yumpus. Yumpuses are spicy. Polly is spicy. True",
        "noise_response_0": "",
        "noise_prompt_0": "Yumpuses are spicy. Jompuses are yumpuses. Polly is jompus. True or false: Fae is spicy. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Polly is",
        "noise_prompt_1": "Yumpuses are spicy. Jompuses are yumpuses. Polly is Sterpus. True or false: Polly is spicy. Let us think step by step.",
        "response_1": "Polly is",
        "noise_response_2": "Polly is jompus.",
        "noise_prompt_2": "Yumpuses are spicy. impus are yumpuses. Polly is jompus. True or false: Polly is spicy. Let us think step by step.",
        "response_2": "Polly is jompus.",
        "noise_response_3": "Polly is jompus. Jompuses are",
        "noise_prompt_3": "Yumpuses are spicy. Jompuses are Shumpus. Polly is jompus. True or false: Polly is spicy. Let us think step by step.",
        "response_3": "Polly is jompus. Jompuses are",
        "noise_response_4": "Sally is jompus. Jompuses are yumpuses.",
        "noise_prompt_4": "Yumpuses are spicy. Jompuses are yumpuses. Polly is jompus. True or false: Polly is spicy. Let us think step by step.",
        "response_4": "Polly is jompus. Jompuses are yumpuses.",
        "noise_response_5": "Polly is jompus. Jompuses are Vumpus. Polly is",
        "noise_prompt_5": "Yumpuses are spicy. Jompuses are yumpuses. Polly is jompus. True or false: Polly is spicy. Let us think step by step.",
        "response_5": "Polly is jompus. Jompuses are yumpuses. Polly is",
        "noise_response_6": "Polly is jompus. Jompuses are yumpuses. Polly is yumpus.",
        "noise_prompt_6": "Zumpus are spicy. Jompuses are yumpuses. Polly is jompus. True or false: Polly is spicy. Let us think step by step.",
        "response_6": "Polly is jompus. Jompuses are yumpuses. Polly is yumpus.",
        "noise_response_7": "Polly is jompus. Jompuses are yumpuses. Polly is yumpus. Yumpuses are",
        "noise_prompt_7": "Yumpuses are spicy. Jompuses are yumpuses. Polly is jompus. True or false: Polly is spicy. Let us think step by step.",
        "response_7": "Polly is jompus. Jompuses are yumpuses. Polly is yumpus. Yumpuses are",
        "noise_response_8": "Polly is jompus. Jompuses are yumpuses. Rex is yumpus. Yumpuses are spicy.",
        "noise_prompt_8": "Yumpuses are spicy. Jompuses are yumpuses. Polly is jompus. True or false: Polly is spicy. Let us think step by step.",
        "response_8": "Polly is jompus. Jompuses are yumpuses. Polly is yumpus. Yumpuses are spicy.",
        "noise_response_9": "Polly is jompus. Jompuses are yumpuses. Polly is yumpus. Yumpuses are moderate. Polly is",
        "noise_prompt_9": "Yumpuses are spicy. Jompuses are yumpuses. Polly is jompus. True or false: Polly is spicy. Let us think step by step.",
        "response_9": "Polly is jompus. Jompuses are yumpuses. Polly is yumpus. Yumpuses are spicy. Polly is",
        "noise_prompt_10": "Yumpuses are spicy. Jompuses are yumpuses. Polly is jompus. True or false: Polly is spicy. Let us think step by step.",
        "response_10": "Polly is jompus. Jompuses are yumpuses. Polly is yumpus. Yumpuses are spicy. Polly is spicy.",
        "noise_response_10": "Polly is jompus. Jompuses are yumpuses. Polly is yumpus. Yumpuses are spicy. Polly is rainy.",
        "answer_token_id_0": 7713,
        "answer_token_pos_0": 380,
        "answer_token_0": "Pol",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 432,
        "answer_token_pos_1": 383,
        "answer_token_1": "j",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 435,
        "answer_token_pos_2": 387,
        "answer_token_2": "J",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 343,
        "answer_token_pos_3": 391,
        "answer_token_3": "y",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 2043,
        "answer_token_pos_4": 395,
        "answer_token_4": "Pol",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 343,
        "answer_token_pos_5": 398,
        "answer_token_5": "y",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 612,
        "answer_token_pos_6": 402,
        "answer_token_6": "Y",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 805,
        "answer_token_pos_7": 406,
        "answer_token_7": "sp",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 2043,
        "answer_token_pos_8": 410,
        "answer_token_8": "Pol",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 805,
        "answer_token_pos_9": 413,
        "answer_token_9": "sp",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Jompus is wooden. Impus is jompus. Stella is impus.",
        "query": "True or false: Stella is wooden.",
        "answer": "Stella is impus. Impus is jompus. Stella is jompus. Jompus is wooden. Stella is wooden. True",
        "label": "True",
        "prompt": "Jompus is wooden. Impus is jompus. Stella is impus. True or false: Stella is wooden. Let us think step by step.",
        "generated": "Stella is impus. Impus is jompus. Stella is jompus. Jompus is wooden. Stella is wooden. True",
        "noise_response_0": "",
        "noise_prompt_0": "Jompus is wooden. Impus is jompus. Stella is impus. True or false: Sally is wooden. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Stella is",
        "noise_prompt_1": "Jompus is wooden. Impus is jompus. Stella is Zumpus. True or false: Stella is wooden. Let us think step by step.",
        "response_1": "Stella is",
        "noise_response_2": "Stella is impus.",
        "noise_prompt_2": "Jompus is wooden. gorpus is jompus. Stella is impus. True or false: Stella is wooden. Let us think step by step.",
        "response_2": "Stella is impus.",
        "noise_response_3": "Stella is impus. Impus is",
        "noise_prompt_3": "Jompus is wooden. Impus is Yumpus. Stella is impus. True or false: Stella is wooden. Let us think step by step.",
        "response_3": "Stella is impus. Impus is",
        "noise_response_4": "Wren is impus. Impus is jompus.",
        "noise_prompt_4": "Jompus is wooden. Impus is jompus. Stella is impus. True or false: Stella is wooden. Let us think step by step.",
        "response_4": "Stella is impus. Impus is jompus.",
        "noise_response_5": "Stella is impus. Impus is Dumpus. Stella is",
        "noise_prompt_5": "Jompus is wooden. Impus is jompus. Stella is impus. True or false: Stella is wooden. Let us think step by step.",
        "response_5": "Stella is impus. Impus is jompus. Stella is",
        "noise_response_6": "Stella is impus. Impus is jompus. Stella is jompus.",
        "noise_prompt_6": "Yumpus is wooden. Impus is jompus. Stella is impus. True or false: Stella is wooden. Let us think step by step.",
        "response_6": "Stella is impus. Impus is jompus. Stella is jompus.",
        "noise_response_7": "Stella is impus. Impus is jompus. Stella is jompus. Jompus is",
        "noise_prompt_7": "Jompus is wooden. Impus is jompus. Stella is impus. True or false: Stella is amenable. Let us think step by step.",
        "response_7": "Stella is impus. Impus is jompus. Stella is jompus. Jompus is",
        "noise_response_8": "Stella is impus. Impus is jompus. Sam is jompus. Jompus is wooden.",
        "noise_prompt_8": "Jompus is wooden. Impus is jompus. Stella is impus. True or false: Stella is wooden. Let us think step by step.",
        "response_8": "Stella is impus. Impus is jompus. Stella is jompus. Jompus is wooden.",
        "noise_response_9": "Stella is impus. Impus is jompus. Stella is jompus. Jompus is blue. Stella is",
        "noise_prompt_9": "Jompus is wooden. Impus is jompus. Stella is impus. True or false: Stella is wooden. Let us think step by step.",
        "response_9": "Stella is impus. Impus is jompus. Stella is jompus. Jompus is wooden. Stella is",
        "noise_prompt_10": "Jompus is wooden. Impus is jompus. Stella is impus. True or false: Stella is wooden. Let us think step by step.",
        "response_10": "Stella is impus. Impus is jompus. Stella is jompus. Jompus is wooden. Stella is wooden.",
        "noise_response_10": "Stella is impus. Impus is jompus. Stella is jompus. Jompus is wooden. Stella is spicy.",
        "answer_token_id_0": 855,
        "answer_token_pos_0": 380,
        "answer_token_0": "St",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 2411,
        "answer_token_pos_1": 383,
        "answer_token_1": "imp",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 14305,
        "answer_token_pos_2": 387,
        "answer_token_2": "Imp",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 432,
        "answer_token_pos_3": 391,
        "answer_token_3": "j",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 624,
        "answer_token_pos_4": 395,
        "answer_token_4": "St",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 432,
        "answer_token_pos_5": 398,
        "answer_token_5": "j",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 435,
        "answer_token_pos_6": 402,
        "answer_token_6": "J",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 27278,
        "answer_token_pos_7": 406,
        "answer_token_7": "wooden",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 624,
        "answer_token_pos_8": 410,
        "answer_token_8": "St",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 27278,
        "answer_token_pos_9": 413,
        "answer_token_9": "wooden",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Brimpuses are overcast. Shumpus is brimpus. Wren is shumpus.",
        "query": "True or false: Wren is luminous.",
        "answer": "Wren is shumpus. Shumpus is brimpus. Wren is brimpus. Brimpuses are overcast. Wren is overcast. False",
        "label": "False",
        "prompt": "Brimpuses are overcast. Shumpus is brimpus. Wren is shumpus. True or false: Wren is luminous. Let us think step by step.",
        "generated": "Wren is shumpus. Shumpus is brimpus. Wren is brimpus. Brimpuses are overcast. Wren is overcast. False",
        "noise_response_0": "",
        "noise_prompt_0": "Brimpuses are overcast. Shumpus is brimpus. Wren is shumpus. True or false: Polly is luminous. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Wren is",
        "noise_prompt_1": "Brimpuses are overcast. Shumpus is brimpus. Wren is angry. True or false: Wren is luminous. Let us think step by step.",
        "response_1": "Wren is",
        "noise_response_2": "Wren is shumpus.",
        "noise_prompt_2": "Brimpuses are overcast. grimpus is brimpus. Wren is shumpus. True or false: Wren is luminous. Let us think step by step.",
        "response_2": "Wren is shumpus.",
        "noise_response_3": "Wren is shumpus. Shumpus is",
        "noise_prompt_3": "Brimpuses are overcast. Shumpus is amenable. Wren is shumpus. True or false: Wren is luminous. Let us think step by step.",
        "response_3": "Wren is shumpus. Shumpus is",
        "noise_response_4": "Sally is shumpus. Shumpus is brimpus.",
        "noise_prompt_4": "Brimpuses are overcast. Shumpus is brimpus. Wren is shumpus. True or false: Wren is luminous. Let us think step by step.",
        "response_4": "Wren is shumpus. Shumpus is brimpus.",
        "noise_response_5": "Wren is shumpus. Shumpus is spicy. Wren is",
        "noise_prompt_5": "Brimpuses are overcast. Shumpus is brimpus. Wren is shumpus. True or false: Wren is luminous. Let us think step by step.",
        "response_5": "Wren is shumpus. Shumpus is brimpus. Wren is",
        "noise_response_6": "Wren is shumpus. Shumpus is brimpus. Wren is brimpus.",
        "noise_prompt_6": "gorpus are overcast. Shumpus is brimpus. Wren is shumpus. True or false: Wren is luminous. Let us think step by step.",
        "response_6": "Wren is shumpus. Shumpus is brimpus. Wren is brimpus.",
        "noise_response_7": "Wren is shumpus. Shumpus is brimpus. Wren is brimpus. Brimpuses are",
        "noise_prompt_7": "Brimpuses are moderate. Shumpus is brimpus. Wren is shumpus. True or false: Wren is luminous. Let us think step by step.",
        "response_7": "Wren is shumpus. Shumpus is brimpus. Wren is brimpus. Brimpuses are",
        "noise_response_8": "Wren is shumpus. Shumpus is brimpus. Fae is brimpus. Brimpuses are overcast.",
        "noise_prompt_8": "Brimpuses are overcast. Shumpus is brimpus. Wren is shumpus. True or false: Wren is luminous. Let us think step by step.",
        "response_8": "Wren is shumpus. Shumpus is brimpus. Wren is brimpus. Brimpuses are overcast.",
        "noise_response_9": "Wren is shumpus. Shumpus is brimpus. Wren is brimpus. Brimpuses are melodic. Wren is",
        "noise_prompt_9": "Brimpuses are overcast. Shumpus is brimpus. Wren is shumpus. True or false: Wren is luminous. Let us think step by step.",
        "response_9": "Wren is shumpus. Shumpus is brimpus. Wren is brimpus. Brimpuses are overcast. Wren is",
        "noise_prompt_10": "Brimpuses are overcast. Shumpus is brimpus. Wren is shumpus. True or false: Wren is luminous. Let us think step by step.",
        "response_10": "Wren is shumpus. Shumpus is brimpus. Wren is brimpus. Brimpuses are overcast. Wren is overcast.",
        "noise_response_10": "Wren is shumpus. Shumpus is brimpus. Wren is brimpus. Brimpuses are overcast. Wren is large.",
        "answer_token_id_0": 29956,
        "answer_token_pos_0": 380,
        "answer_token_0": "W",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 528,
        "answer_token_pos_1": 383,
        "answer_token_1": "sh",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 1383,
        "answer_token_pos_2": 387,
        "answer_token_2": "Sh",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 1506,
        "answer_token_pos_3": 391,
        "answer_token_3": "br",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 399,
        "answer_token_pos_4": 395,
        "answer_token_4": "W",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 1506,
        "answer_token_pos_5": 398,
        "answer_token_5": "br",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 1771,
        "answer_token_pos_6": 402,
        "answer_token_6": "Br",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 975,
        "answer_token_pos_7": 406,
        "answer_token_7": "over",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 399,
        "answer_token_pos_8": 410,
        "answer_token_8": "W",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 975,
        "answer_token_pos_9": 413,
        "answer_token_9": "over",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Jompus is shy. Sterpus is jompus. Rex is sterpus.",
        "query": "True or false: Rex is fruity.",
        "answer": "Rex is sterpus. Sterpus is jompus. Rex is jompus. Jompus is shy. Rex is shy. False",
        "label": "False",
        "prompt": "Jompus is shy. Sterpus is jompus. Rex is sterpus. True or false: Rex is fruity. Let us think step by step.",
        "generated": "Rex is sterpus. Sterpus is jompus. Rex is jompus. Jompus is shy. Rex is shy. False",
        "noise_response_0": "",
        "noise_prompt_0": "Jompus is shy. Sterpus is jompus. Rex is sterpus. True or false: Fae is fruity. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Rex is",
        "noise_prompt_1": "Jompus is shy. Sterpus is jompus. Rex is Brimpus. True or false: Rex is fruity. Let us think step by step.",
        "response_1": "Rex is",
        "noise_response_2": "Rex is sterpus.",
        "noise_prompt_2": "Jompus is shy. tumpus is jompus. Rex is sterpus. True or false: Rex is fruity. Let us think step by step.",
        "response_2": "Rex is sterpus.",
        "noise_response_3": "Rex is sterpus. Sterpus is",
        "noise_prompt_3": "Jompus is shy. Sterpus is vumpus. Rex is sterpus. True or false: Rex is fruity. Let us think step by step.",
        "response_3": "Rex is sterpus. Sterpus is",
        "noise_response_4": "Sally is sterpus. Sterpus is jompus.",
        "noise_prompt_4": "Jompus is shy. Sterpus is jompus. Rex is sterpus. True or false: Rex is fruity. Let us think step by step.",
        "response_4": "Rex is sterpus. Sterpus is jompus.",
        "noise_response_5": "Rex is sterpus. Sterpus is dumpus. Rex is",
        "noise_prompt_5": "Jompus is shy. Sterpus is jompus. Rex is sterpus. True or false: Rex is fruity. Let us think step by step.",
        "response_5": "Rex is sterpus. Sterpus is jompus. Rex is",
        "noise_response_6": "Rex is sterpus. Sterpus is jompus. Rex is jompus.",
        "noise_prompt_6": "impus is shy. Sterpus is jompus. Rex is sterpus. True or false: Rex is fruity. Let us think step by step.",
        "response_6": "Rex is sterpus. Sterpus is jompus. Rex is jompus.",
        "noise_response_7": "Rex is sterpus. Sterpus is jompus. Rex is jompus. Jompus is",
        "noise_prompt_7": "Jompus is snowy. Sterpus is jompus. Rex is sterpus. True or false: Rex is fruity. Let us think step by step.",
        "response_7": "Rex is sterpus. Sterpus is jompus. Rex is jompus. Jompus is",
        "noise_response_8": "Rex is sterpus. Sterpus is jompus. Sally is jompus. Jompus is shy.",
        "noise_prompt_8": "Jompus is shy. Sterpus is jompus. Rex is sterpus. True or false: Rex is fruity. Let us think step by step.",
        "response_8": "Rex is sterpus. Sterpus is jompus. Rex is jompus. Jompus is shy.",
        "noise_response_9": "Rex is sterpus. Sterpus is jompus. Rex is jompus. Jompus is hot. Rex is",
        "noise_prompt_9": "Jompus is shy. Sterpus is jompus. Rex is sterpus. True or false: Rex is fruity. Let us think step by step.",
        "response_9": "Rex is sterpus. Sterpus is jompus. Rex is jompus. Jompus is shy. Rex is",
        "noise_prompt_10": "Jompus is shy. Sterpus is jompus. Rex is sterpus. True or false: Rex is fruity. Let us think step by step.",
        "response_10": "Rex is sterpus. Sterpus is jompus. Rex is jompus. Jompus is shy. Rex is shy.",
        "noise_response_10": "Rex is sterpus. Sterpus is jompus. Rex is jompus. Jompus is shy. Rex is feisty.",
        "answer_token_id_0": 29934,
        "answer_token_pos_0": 380,
        "answer_token_0": "R",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 16864,
        "answer_token_pos_1": 383,
        "answer_token_1": "ster",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 28588,
        "answer_token_pos_2": 387,
        "answer_token_2": "Ster",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 432,
        "answer_token_pos_3": 391,
        "answer_token_3": "j",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 390,
        "answer_token_pos_4": 395,
        "answer_token_4": "R",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 432,
        "answer_token_pos_5": 398,
        "answer_token_5": "j",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 435,
        "answer_token_pos_6": 402,
        "answer_token_6": "J",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 528,
        "answer_token_pos_7": 406,
        "answer_token_7": "sh",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 390,
        "answer_token_pos_8": 410,
        "answer_token_8": "R",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 528,
        "answer_token_pos_9": 413,
        "answer_token_9": "sh",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Rompuses are muffled. Jompus is rompus. Stella is jompus.",
        "query": "True or false: Stella is snowy.",
        "answer": "Stella is jompus. Jompus is rompus. Stella is rompus. Rompuses are muffled. Stella is muffled. False",
        "label": "False",
        "prompt": "Rompuses are muffled. Jompus is rompus. Stella is jompus. True or false: Stella is snowy. Let us think step by step.",
        "generated": "Stella is jompus. Jompus is rompus. Stella is rompus. Rompuses are muffled. Stella is muffled. False",
        "noise_response_0": "",
        "noise_prompt_0": "Rompuses are muffled. Jompus is rompus. Stella is jompus. True or false: Wren is snowy. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Stella is",
        "noise_prompt_1": "Rompuses are muffled. Jompus is rompus. Stella is Dumpus. True or false: Stella is snowy. Let us think step by step.",
        "response_1": "Stella is",
        "noise_response_2": "Stella is jompus.",
        "noise_prompt_2": "Rompuses are muffled. Zumpus is rompus. Stella is jompus. True or false: Stella is snowy. Let us think step by step.",
        "response_2": "Stella is jompus.",
        "noise_response_3": "Stella is jompus. Jompus is",
        "noise_prompt_3": "Rompuses are muffled. Jompus is Shumpus. Stella is jompus. True or false: Stella is snowy. Let us think step by step.",
        "response_3": "Stella is jompus. Jompus is",
        "noise_response_4": "Wren is jompus. Jompus is rompus.",
        "noise_prompt_4": "Rompuses are muffled. Jompus is rompus. Stella is jompus. True or false: Stella is snowy. Let us think step by step.",
        "response_4": "Stella is jompus. Jompus is rompus.",
        "noise_response_5": "Stella is jompus. Jompus is numpus. Stella is",
        "noise_prompt_5": "Rompuses are muffled. Jompus is rompus. Stella is jompus. True or false: Stella is snowy. Let us think step by step.",
        "response_5": "Stella is jompus. Jompus is rompus. Stella is",
        "noise_response_6": "Stella is jompus. Jompus is rompus. Stella is rompus.",
        "noise_prompt_6": "jompus are muffled. Jompus is rompus. Stella is jompus. True or false: Stella is snowy. Let us think step by step.",
        "response_6": "Stella is jompus. Jompus is rompus. Stella is rompus.",
        "noise_response_7": "Stella is jompus. Jompus is rompus. Stella is rompus. Rompuses are",
        "noise_prompt_7": "Rompuses are sweet. Jompus is rompus. Stella is jompus. True or false: Stella is snowy. Let us think step by step.",
        "response_7": "Stella is jompus. Jompus is rompus. Stella is rompus. Rompuses are",
        "noise_response_8": "Stella is jompus. Jompus is rompus. Rex is rompus. Rompuses are muffled.",
        "noise_prompt_8": "Rompuses are muffled. Jompus is rompus. Stella is jompus. True or false: Stella is snowy. Let us think step by step.",
        "response_8": "Stella is jompus. Jompus is rompus. Stella is rompus. Rompuses are muffled.",
        "noise_response_9": "Stella is jompus. Jompus is rompus. Stella is rompus. Rompuses are snowy. Stella is",
        "noise_prompt_9": "Rompuses are muffled. Jompus is rompus. Stella is jompus. True or false: Stella is snowy. Let us think step by step.",
        "response_9": "Stella is jompus. Jompus is rompus. Stella is rompus. Rompuses are muffled. Stella is",
        "noise_prompt_10": "Rompuses are muffled. Jompus is rompus. Stella is jompus. True or false: Stella is snowy. Let us think step by step.",
        "response_10": "Stella is jompus. Jompus is rompus. Stella is rompus. Rompuses are muffled. Stella is muffled.",
        "noise_response_10": "Stella is jompus. Jompus is rompus. Stella is rompus. Rompuses are muffled. Stella is temperate.",
        "answer_token_id_0": 855,
        "answer_token_pos_0": 380,
        "answer_token_0": "St",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 432,
        "answer_token_pos_1": 383,
        "answer_token_1": "j",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 435,
        "answer_token_pos_2": 387,
        "answer_token_2": "J",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 6017,
        "answer_token_pos_3": 391,
        "answer_token_3": "rom",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 624,
        "answer_token_pos_4": 395,
        "answer_token_4": "St",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 6017,
        "answer_token_pos_5": 398,
        "answer_token_5": "rom",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 6033,
        "answer_token_pos_6": 402,
        "answer_token_6": "Rom",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 286,
        "answer_token_pos_7": 406,
        "answer_token_7": "m",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 624,
        "answer_token_pos_8": 410,
        "answer_token_8": "St",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 286,
        "answer_token_pos_9": 413,
        "answer_token_9": "m",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Vumpus is earthy. Tumpus is vumpus. Sally is tumpus.",
        "query": "True or false: Sally is spicy.",
        "answer": "Sally is tumpus. Tumpus is vumpus. Sally is vumpus. Vumpus is earthy. Sally is earthy. False",
        "label": "False",
        "prompt": "Vumpus is earthy. Tumpus is vumpus. Sally is tumpus. True or false: Sally is spicy. Let us think step by step.",
        "generated": "Sally is tumpus. Tumpus is vumpus. Sally is vumpus. Vumpus is earthy. Sally is earthy. False",
        "noise_response_0": "",
        "noise_prompt_0": "Vumpus is earthy. Tumpus is vumpus. Sally is tumpus. True or false: Polly is spicy. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Sally is",
        "noise_prompt_1": "Vumpus is earthy. Tumpus is vumpus. Sally is shy. True or false: Sally is spicy. Let us think step by step.",
        "response_1": "Sally is",
        "noise_response_2": "Sally is tumpus.",
        "noise_prompt_2": "Vumpus is earthy. tumpus is vumpus. Sally is tumpus. True or false: Sally is spicy. Let us think step by step.",
        "response_2": "Sally is tumpus.",
        "noise_response_3": "Sally is tumpus. Tumpus is",
        "noise_prompt_3": "Vumpus is earthy. Tumpus is Zumpus. Sally is tumpus. True or false: Sally is spicy. Let us think step by step.",
        "response_3": "Sally is tumpus. Tumpus is",
        "noise_response_4": "Sam is tumpus. Tumpus is vumpus.",
        "noise_prompt_4": "Vumpus is earthy. Tumpus is vumpus. Sally is tumpus. True or false: Sally is spicy. Let us think step by step.",
        "response_4": "Sally is tumpus. Tumpus is vumpus.",
        "noise_response_5": "Sally is tumpus. Tumpus is Lorpus. Sally is",
        "noise_prompt_5": "Vumpus is earthy. Tumpus is vumpus. Sally is tumpus. True or false: Sally is spicy. Let us think step by step.",
        "response_5": "Sally is tumpus. Tumpus is vumpus. Sally is",
        "noise_response_6": "Sally is tumpus. Tumpus is vumpus. Sally is vumpus.",
        "noise_prompt_6": "numpus is earthy. Tumpus is vumpus. Sally is tumpus. True or false: Sally is spicy. Let us think step by step.",
        "response_6": "Sally is tumpus. Tumpus is vumpus. Sally is vumpus.",
        "noise_response_7": "Sally is tumpus. Tumpus is vumpus. Sally is vumpus. Vumpus is",
        "noise_prompt_7": "Vumpus is rainy. Tumpus is vumpus. Sally is tumpus. True or false: Sally is spicy. Let us think step by step.",
        "response_7": "Sally is tumpus. Tumpus is vumpus. Sally is vumpus. Vumpus is",
        "noise_response_8": "Sally is tumpus. Tumpus is vumpus. Fae is vumpus. Vumpus is earthy.",
        "noise_prompt_8": "Vumpus is earthy. Tumpus is vumpus. Sally is tumpus. True or false: Sally is spicy. Let us think step by step.",
        "response_8": "Sally is tumpus. Tumpus is vumpus. Sally is vumpus. Vumpus is earthy.",
        "noise_response_9": "Sally is tumpus. Tumpus is vumpus. Sally is vumpus. Vumpus is bright. Sally is",
        "noise_prompt_9": "Vumpus is earthy. Tumpus is vumpus. Sally is tumpus. True or false: Sally is spicy. Let us think step by step.",
        "response_9": "Sally is tumpus. Tumpus is vumpus. Sally is vumpus. Vumpus is earthy. Sally is",
        "noise_prompt_10": "Vumpus is earthy. Tumpus is vumpus. Sally is tumpus. True or false: Sally is spicy. Let us think step by step.",
        "response_10": "Sally is tumpus. Tumpus is vumpus. Sally is vumpus. Vumpus is earthy. Sally is earthy.",
        "noise_response_10": "Sally is tumpus. Tumpus is vumpus. Sally is vumpus. Vumpus is earthy. Sally is dull.",
        "answer_token_id_0": 29903,
        "answer_token_pos_0": 380,
        "answer_token_0": "S",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 260,
        "answer_token_pos_1": 383,
        "answer_token_1": "t",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 323,
        "answer_token_pos_2": 387,
        "answer_token_2": "T",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 325,
        "answer_token_pos_3": 391,
        "answer_token_3": "v",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 317,
        "answer_token_pos_4": 395,
        "answer_token_4": "S",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 325,
        "answer_token_pos_5": 398,
        "answer_token_5": "v",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 478,
        "answer_token_pos_6": 402,
        "answer_token_6": "V",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 8437,
        "answer_token_pos_7": 406,
        "answer_token_7": "earth",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 317,
        "answer_token_pos_8": 410,
        "answer_token_8": "S",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 8437,
        "answer_token_pos_9": 413,
        "answer_token_9": "earth",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Tumpuses are opaque. Rompuses are tumpuses. Stella is rompus.",
        "query": "True or false: Stella is opaque.",
        "answer": "Stella is rompus. Rompuses are tumpuses. Stella is tumpus. Tumpuses are opaque. Stella is opaque. True",
        "label": "True",
        "prompt": "Tumpuses are opaque. Rompuses are tumpuses. Stella is rompus. True or false: Stella is opaque. Let us think step by step.",
        "generated": "Stella is rompus. Rompuses are tumpuses. Stella is tumpus. Tumpuses are opaque. Stella is opaque. True",
        "noise_response_0": "",
        "noise_prompt_0": "Tumpuses are opaque. Rompuses are tumpuses. Stella is rompus. True or false: Sally is opaque. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Stella is",
        "noise_prompt_1": "Tumpuses are opaque. Rompuses are tumpuses. Stella is grimpus. True or false: Stella is opaque. Let us think step by step.",
        "response_1": "Stella is",
        "noise_response_2": "Stella is rompus.",
        "noise_prompt_2": "Tumpuses are opaque. gorpus are tumpuses. Stella is rompus. True or false: Stella is opaque. Let us think step by step.",
        "response_2": "Stella is rompus.",
        "noise_response_3": "Stella is rompus. Rompuses are",
        "noise_prompt_3": "Tumpuses are opaque. Rompuses are blue. Stella is rompus. True or false: Stella is opaque. Let us think step by step.",
        "response_3": "Stella is rompus. Rompuses are",
        "noise_response_4": "Rex is rompus. Rompuses are tumpuses.",
        "noise_prompt_4": "Tumpuses are opaque. Rompuses are tumpuses. Stella is rompus. True or false: Stella is opaque. Let us think step by step.",
        "response_4": "Stella is rompus. Rompuses are tumpuses.",
        "noise_response_5": "Stella is rompus. Rompuses are sweet. Stella is",
        "noise_prompt_5": "Tumpuses are opaque. Rompuses are tumpuses. Stella is rompus. True or false: Stella is opaque. Let us think step by step.",
        "response_5": "Stella is rompus. Rompuses are tumpuses. Stella is",
        "noise_response_6": "Stella is rompus. Rompuses are tumpuses. Stella is tumpus.",
        "noise_prompt_6": "vumpus are opaque. Rompuses are tumpuses. Stella is rompus. True or false: Stella is opaque. Let us think step by step.",
        "response_6": "Stella is rompus. Rompuses are tumpuses. Stella is tumpus.",
        "noise_response_7": "Stella is rompus. Rompuses are tumpuses. Stella is tumpus. Tumpuses are",
        "noise_prompt_7": "Tumpuses are opaque. Rompuses are tumpuses. Stella is rompus. True or false: Stella is loud. Let us think step by step.",
        "response_7": "Stella is rompus. Rompuses are tumpuses. Stella is tumpus. Tumpuses are",
        "noise_response_8": "Stella is rompus. Rompuses are tumpuses. Sam is tumpus. Tumpuses are opaque.",
        "noise_prompt_8": "Tumpuses are opaque. Rompuses are tumpuses. Stella is rompus. True or false: Stella is opaque. Let us think step by step.",
        "response_8": "Stella is rompus. Rompuses are tumpuses. Stella is tumpus. Tumpuses are opaque.",
        "noise_response_9": "Stella is rompus. Rompuses are tumpuses. Stella is tumpus. Tumpuses are hot. Stella is",
        "noise_prompt_9": "Tumpuses are opaque. Rompuses are tumpuses. Stella is rompus. True or false: Stella is opaque. Let us think step by step.",
        "response_9": "Stella is rompus. Rompuses are tumpuses. Stella is tumpus. Tumpuses are opaque. Stella is",
        "noise_prompt_10": "Tumpuses are opaque. Rompuses are tumpuses. Stella is rompus. True or false: Stella is opaque. Let us think step by step.",
        "response_10": "Stella is rompus. Rompuses are tumpuses. Stella is tumpus. Tumpuses are opaque. Stella is opaque.",
        "noise_response_10": "Stella is rompus. Rompuses are tumpuses. Stella is tumpus. Tumpuses are opaque. Stella is spicy.",
        "answer_token_id_0": 855,
        "answer_token_pos_0": 380,
        "answer_token_0": "St",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 6017,
        "answer_token_pos_1": 383,
        "answer_token_1": "rom",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 6033,
        "answer_token_pos_2": 387,
        "answer_token_2": "Rom",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 260,
        "answer_token_pos_3": 391,
        "answer_token_3": "t",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 624,
        "answer_token_pos_4": 395,
        "answer_token_4": "St",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 260,
        "answer_token_pos_5": 398,
        "answer_token_5": "t",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 323,
        "answer_token_pos_6": 402,
        "answer_token_6": "T",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 1015,
        "answer_token_pos_7": 406,
        "answer_token_7": "op",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 624,
        "answer_token_pos_8": 410,
        "answer_token_8": "St",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 1015,
        "answer_token_pos_9": 413,
        "answer_token_9": "op",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Wumpuses are moderate. Grimpus is wumpus. Stella is grimpus.",
        "query": "True or false: Stella is moderate.",
        "answer": "Stella is grimpus. Grimpus is wumpus. Stella is wumpus. Wumpuses are moderate. Stella is moderate. True",
        "label": "True",
        "prompt": "Wumpuses are moderate. Grimpus is wumpus. Stella is grimpus. True or false: Stella is moderate. Let us think step by step.",
        "generated": "Stella is grimpus. Grimpus is wumpus. Stella is wumpus. Wumpuses are moderate. Stella is moderate. True",
        "noise_response_0": "",
        "noise_prompt_0": "Wumpuses are moderate. Grimpus is wumpus. Stella is grimpus. True or false: Sally is moderate. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Stella is",
        "noise_prompt_1": "Wumpuses are moderate. Grimpus is wumpus. Stella is Lempus. True or false: Stella is moderate. Let us think step by step.",
        "response_1": "Stella is",
        "noise_response_2": "Stella is grimpus.",
        "noise_prompt_2": "Wumpuses are moderate. yumpus is wumpus. Stella is grimpus. True or false: Stella is moderate. Let us think step by step.",
        "response_2": "Stella is grimpus.",
        "noise_response_3": "Stella is grimpus. Grimpus is",
        "noise_prompt_3": "Wumpuses are moderate. Grimpus is temperate. Stella is grimpus. True or false: Stella is moderate. Let us think step by step.",
        "response_3": "Stella is grimpus. Grimpus is",
        "noise_response_4": "Wren is grimpus. Grimpus is wumpus.",
        "noise_prompt_4": "Wumpuses are moderate. Grimpus is wumpus. Stella is grimpus. True or false: Stella is moderate. Let us think step by step.",
        "response_4": "Stella is grimpus. Grimpus is wumpus.",
        "noise_response_5": "Stella is grimpus. Grimpus is rainy. Stella is",
        "noise_prompt_5": "Wumpuses are moderate. Grimpus is wumpus. Stella is grimpus. True or false: Stella is moderate. Let us think step by step.",
        "response_5": "Stella is grimpus. Grimpus is wumpus. Stella is",
        "noise_response_6": "Stella is grimpus. Grimpus is wumpus. Stella is wumpus.",
        "noise_prompt_6": "Fae are moderate. Grimpus is wumpus. Stella is grimpus. True or false: Stella is moderate. Let us think step by step.",
        "response_6": "Stella is grimpus. Grimpus is wumpus. Stella is wumpus.",
        "noise_response_7": "Stella is grimpus. Grimpus is wumpus. Stella is wumpus. Wumpuses are",
        "noise_prompt_7": "Wumpuses are moderate. Grimpus is wumpus. Stella is grimpus. True or false: Stella is kind. Let us think step by step.",
        "response_7": "Stella is grimpus. Grimpus is wumpus. Stella is wumpus. Wumpuses are",
        "noise_response_8": "Stella is grimpus. Grimpus is wumpus. Fae is wumpus. Wumpuses are moderate.",
        "noise_prompt_8": "Wumpuses are moderate. Grimpus is wumpus. Stella is grimpus. True or false: Stella is moderate. Let us think step by step.",
        "response_8": "Stella is grimpus. Grimpus is wumpus. Stella is wumpus. Wumpuses are moderate.",
        "noise_response_9": "Stella is grimpus. Grimpus is wumpus. Stella is wumpus. Wumpuses are nervous. Stella is",
        "noise_prompt_9": "Wumpuses are moderate. Grimpus is wumpus. Stella is grimpus. True or false: Stella is moderate. Let us think step by step.",
        "response_9": "Stella is grimpus. Grimpus is wumpus. Stella is wumpus. Wumpuses are moderate. Stella is",
        "noise_prompt_10": "Wumpuses are moderate. Grimpus is wumpus. Stella is grimpus. True or false: Stella is moderate. Let us think step by step.",
        "response_10": "Stella is grimpus. Grimpus is wumpus. Stella is wumpus. Wumpuses are moderate. Stella is moderate.",
        "noise_response_10": "Stella is grimpus. Grimpus is wumpus. Stella is wumpus. Wumpuses are moderate. Stella is wooden.",
        "answer_token_id_0": 855,
        "answer_token_pos_0": 380,
        "answer_token_0": "St",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 867,
        "answer_token_pos_1": 383,
        "answer_token_1": "gr",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 1632,
        "answer_token_pos_2": 387,
        "answer_token_2": "Gr",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 281,
        "answer_token_pos_3": 391,
        "answer_token_3": "w",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 624,
        "answer_token_pos_4": 395,
        "answer_token_4": "St",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 281,
        "answer_token_pos_5": 398,
        "answer_token_5": "w",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 399,
        "answer_token_pos_6": 402,
        "answer_token_6": "W",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 17768,
        "answer_token_pos_7": 406,
        "answer_token_7": "moder",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 624,
        "answer_token_pos_8": 410,
        "answer_token_8": "St",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 17768,
        "answer_token_pos_9": 413,
        "answer_token_9": "moder",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Impus is fast. Vumpuses are impuses. Alex is vumpus.",
        "query": "True or false: Alex is fast.",
        "answer": "Alex is vumpus. Vumpuses are impuses. Alex is impus. Impus is fast. Alex is fast. True",
        "label": "True",
        "prompt": "Impus is fast. Vumpuses are impuses. Alex is vumpus. True or false: Alex is fast. Let us think step by step.",
        "generated": "Alex is vumpus. Vumpuses are impuses. Alex is impus. Impus is fast. Alex is fast. True",
        "noise_response_0": "",
        "noise_prompt_0": "Impus is fast. Vumpuses are impuses. Alex is vumpus. True or false: Sally is fast. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Alex is",
        "noise_prompt_1": "Impus is fast. Vumpuses are impuses. Alex is Tumpus. True or false: Alex is fast. Let us think step by step.",
        "response_1": "Alex is",
        "noise_response_2": "Alex is vumpus.",
        "noise_prompt_2": "Impus is fast. Vumpus are impuses. Alex is vumpus. True or false: Alex is fast. Let us think step by step.",
        "response_2": "Alex is vumpus.",
        "noise_response_3": "Alex is vumpus. Vumpuses are",
        "noise_prompt_3": "Impus is fast. Vumpuses are yumpus. Alex is vumpus. True or false: Alex is fast. Let us think step by step.",
        "response_3": "Alex is vumpus. Vumpuses are",
        "noise_response_4": "Rex is vumpus. Vumpuses are impuses.",
        "noise_prompt_4": "Impus is fast. Vumpuses are impuses. Alex is vumpus. True or false: Alex is fast. Let us think step by step.",
        "response_4": "Alex is vumpus. Vumpuses are impuses.",
        "noise_response_5": "Alex is vumpus. Vumpuses are Rompus. Alex is",
        "noise_prompt_5": "Impus is fast. Vumpuses are impuses. Alex is vumpus. True or false: Alex is fast. Let us think step by step.",
        "response_5": "Alex is vumpus. Vumpuses are impuses. Alex is",
        "noise_response_6": "Alex is vumpus. Vumpuses are impuses. Alex is impus.",
        "noise_prompt_6": "Jompus is fast. Vumpuses are impuses. Alex is vumpus. True or false: Alex is fast. Let us think step by step.",
        "response_6": "Alex is vumpus. Vumpuses are impuses. Alex is impus.",
        "noise_response_7": "Alex is vumpus. Vumpuses are impuses. Alex is impus. Impus is",
        "noise_prompt_7": "Impus is fast. Vumpuses are impuses. Alex is vumpus. True or false: Alex is orange. Let us think step by step.",
        "response_7": "Alex is vumpus. Vumpuses are impuses. Alex is impus. Impus is",
        "noise_response_8": "Alex is vumpus. Vumpuses are impuses. Fae is impus. Impus is fast.",
        "noise_prompt_8": "Impus is fast. Vumpuses are impuses. Alex is vumpus. True or false: Alex is fast. Let us think step by step.",
        "response_8": "Alex is vumpus. Vumpuses are impuses. Alex is impus. Impus is fast.",
        "noise_response_9": "Alex is vumpus. Vumpuses are impuses. Alex is impus. Impus is large. Alex is",
        "noise_prompt_9": "Impus is fast. Vumpuses are impuses. Alex is vumpus. True or false: Alex is fast. Let us think step by step.",
        "response_9": "Alex is vumpus. Vumpuses are impuses. Alex is impus. Impus is fast. Alex is",
        "noise_prompt_10": "Impus is fast. Vumpuses are impuses. Alex is vumpus. True or false: Alex is fast. Let us think step by step.",
        "response_10": "Alex is vumpus. Vumpuses are impuses. Alex is impus. Impus is fast. Alex is fast.",
        "noise_response_10": "Alex is vumpus. Vumpuses are impuses. Alex is impus. Impus is fast. Alex is blue.",
        "answer_token_id_0": 17406,
        "answer_token_pos_0": 380,
        "answer_token_0": "Alex",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 325,
        "answer_token_pos_1": 383,
        "answer_token_1": "v",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 478,
        "answer_token_pos_2": 387,
        "answer_token_2": "V",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 2411,
        "answer_token_pos_3": 391,
        "answer_token_3": "imp",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 4827,
        "answer_token_pos_4": 395,
        "answer_token_4": "Alex",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 2411,
        "answer_token_pos_5": 398,
        "answer_token_5": "imp",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 14305,
        "answer_token_pos_6": 402,
        "answer_token_6": "Imp",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 5172,
        "answer_token_pos_7": 406,
        "answer_token_7": "fast",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 4827,
        "answer_token_pos_8": 410,
        "answer_token_8": "Alex",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 5172,
        "answer_token_pos_9": 413,
        "answer_token_9": "fast",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Vumpuses are dull. Jompuses are vumpuses. Sally is jompus.",
        "query": "True or false: Sally is blue.",
        "answer": "Sally is jompus. Jompuses are vumpuses. Sally is vumpus. Vumpuses are dull. Sally is dull. False",
        "label": "False",
        "prompt": "Vumpuses are dull. Jompuses are vumpuses. Sally is jompus. True or false: Sally is blue. Let us think step by step.",
        "generated": "Sally is jompus. Jompuses are vumpuses. Sally is vumpus. Vumpuses are dull. Sally is dull. False",
        "noise_response_0": "",
        "noise_prompt_0": "Vumpuses are dull. Jompuses are vumpuses. Sally is jompus. True or false: Stella is blue. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Sally is",
        "noise_prompt_1": "Vumpuses are dull. Jompuses are vumpuses. Sally is Zumpus. True or false: Sally is blue. Let us think step by step.",
        "response_1": "Sally is",
        "noise_response_2": "Sally is jompus.",
        "noise_prompt_2": "Vumpuses are dull. Jompus are vumpuses. Sally is jompus. True or false: Sally is blue. Let us think step by step.",
        "response_2": "Sally is jompus.",
        "noise_response_3": "Sally is jompus. Jompuses are",
        "noise_prompt_3": "Vumpuses are dull. Jompuses are dumpus. Sally is jompus. True or false: Sally is blue. Let us think step by step.",
        "response_3": "Sally is jompus. Jompuses are",
        "noise_response_4": "Rex is jompus. Jompuses are vumpuses.",
        "noise_prompt_4": "Vumpuses are dull. Jompuses are vumpuses. Sally is jompus. True or false: Sally is blue. Let us think step by step.",
        "response_4": "Sally is jompus. Jompuses are vumpuses.",
        "noise_response_5": "Sally is jompus. Jompuses are numpus. Sally is",
        "noise_prompt_5": "Vumpuses are dull. Jompuses are vumpuses. Sally is jompus. True or false: Sally is blue. Let us think step by step.",
        "response_5": "Sally is jompus. Jompuses are vumpuses. Sally is",
        "noise_response_6": "Sally is jompus. Jompuses are vumpuses. Sally is vumpus.",
        "noise_prompt_6": "yumpus are dull. Jompuses are vumpuses. Sally is jompus. True or false: Sally is blue. Let us think step by step.",
        "response_6": "Sally is jompus. Jompuses are vumpuses. Sally is vumpus.",
        "noise_response_7": "Sally is jompus. Jompuses are vumpuses. Sally is vumpus. Vumpuses are",
        "noise_prompt_7": "Vumpuses are sour. Jompuses are vumpuses. Sally is jompus. True or false: Sally is blue. Let us think step by step.",
        "response_7": "Sally is jompus. Jompuses are vumpuses. Sally is vumpus. Vumpuses are",
        "noise_response_8": "Sally is jompus. Jompuses are vumpuses. Sam is vumpus. Vumpuses are dull.",
        "noise_prompt_8": "Vumpuses are dull. Jompuses are vumpuses. Sally is jompus. True or false: Sally is blue. Let us think step by step.",
        "response_8": "Sally is jompus. Jompuses are vumpuses. Sally is vumpus. Vumpuses are dull.",
        "noise_response_9": "Sally is jompus. Jompuses are vumpuses. Sally is vumpus. Vumpuses are melodic. Sally is",
        "noise_prompt_9": "Vumpuses are dull. Jompuses are vumpuses. Sally is jompus. True or false: Sally is blue. Let us think step by step.",
        "response_9": "Sally is jompus. Jompuses are vumpuses. Sally is vumpus. Vumpuses are dull. Sally is",
        "noise_prompt_10": "Vumpuses are dull. Jompuses are vumpuses. Sally is jompus. True or false: Sally is blue. Let us think step by step.",
        "response_10": "Sally is jompus. Jompuses are vumpuses. Sally is vumpus. Vumpuses are dull. Sally is dull.",
        "noise_response_10": "Sally is jompus. Jompuses are vumpuses. Sally is vumpus. Vumpuses are dull. Sally is happy.",
        "answer_token_id_0": 29903,
        "answer_token_pos_0": 380,
        "answer_token_0": "S",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 432,
        "answer_token_pos_1": 383,
        "answer_token_1": "j",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 435,
        "answer_token_pos_2": 387,
        "answer_token_2": "J",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 325,
        "answer_token_pos_3": 391,
        "answer_token_3": "v",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 317,
        "answer_token_pos_4": 395,
        "answer_token_4": "S",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 325,
        "answer_token_pos_5": 398,
        "answer_token_5": "v",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 478,
        "answer_token_pos_6": 402,
        "answer_token_6": "V",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 270,
        "answer_token_pos_7": 406,
        "answer_token_7": "d",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 317,
        "answer_token_pos_8": 410,
        "answer_token_8": "S",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 270,
        "answer_token_pos_9": 413,
        "answer_token_9": "d",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Brimpuses are dull. Lempuses are brimpuses. Wren is lempus.",
        "query": "True or false: Wren is windy.",
        "answer": "Wren is lempus. Lempuses are brimpuses. Wren is brimpus. Brimpuses are dull. Wren is dull. False",
        "label": "False",
        "prompt": "Brimpuses are dull. Lempuses are brimpuses. Wren is lempus. True or false: Wren is windy. Let us think step by step.",
        "generated": "Wren is lempus. Lempuses are brimpuses. Wren is brimpus. Brimpuses are dull. Wren is dull. False",
        "noise_response_0": "",
        "noise_prompt_0": "Brimpuses are dull. Lempuses are brimpuses. Wren is lempus. True or false: Max is windy. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Wren is",
        "noise_prompt_1": "Brimpuses are dull. Lempuses are brimpuses. Wren is vumpus. True or false: Wren is windy. Let us think step by step.",
        "response_1": "Wren is",
        "noise_response_2": "Wren is lempus.",
        "noise_prompt_2": "Brimpuses are dull. Lorpus are brimpuses. Wren is lempus. True or false: Wren is windy. Let us think step by step.",
        "response_2": "Wren is lempus.",
        "noise_response_3": "Wren is lempus. Lempuses are",
        "noise_prompt_3": "Brimpuses are dull. Lempuses are fruity. Wren is lempus. True or false: Wren is windy. Let us think step by step.",
        "response_3": "Wren is lempus. Lempuses are",
        "noise_response_4": "Max is lempus. Lempuses are brimpuses.",
        "noise_prompt_4": "Brimpuses are dull. Lempuses are brimpuses. Wren is lempus. True or false: Wren is windy. Let us think step by step.",
        "response_4": "Wren is lempus. Lempuses are brimpuses.",
        "noise_response_5": "Wren is lempus. Lempuses are feisty. Wren is",
        "noise_prompt_5": "Brimpuses are dull. Lempuses are brimpuses. Wren is lempus. True or false: Wren is windy. Let us think step by step.",
        "response_5": "Wren is lempus. Lempuses are brimpuses. Wren is",
        "noise_response_6": "Wren is lempus. Lempuses are brimpuses. Wren is brimpus.",
        "noise_prompt_6": "lempus are dull. Lempuses are brimpuses. Wren is lempus. True or false: Wren is windy. Let us think step by step.",
        "response_6": "Wren is lempus. Lempuses are brimpuses. Wren is brimpus.",
        "noise_response_7": "Wren is lempus. Lempuses are brimpuses. Wren is brimpus. Brimpuses are",
        "noise_prompt_7": "Brimpuses are orange. Lempuses are brimpuses. Wren is lempus. True or false: Wren is windy. Let us think step by step.",
        "response_7": "Wren is lempus. Lempuses are brimpuses. Wren is brimpus. Brimpuses are",
        "noise_response_8": "Wren is lempus. Lempuses are brimpuses. Stella is brimpus. Brimpuses are dull.",
        "noise_prompt_8": "Brimpuses are dull. Lempuses are brimpuses. Wren is lempus. True or false: Wren is windy. Let us think step by step.",
        "response_8": "Wren is lempus. Lempuses are brimpuses. Wren is brimpus. Brimpuses are dull.",
        "noise_response_9": "Wren is lempus. Lempuses are brimpuses. Wren is brimpus. Brimpuses are fruity. Wren is",
        "noise_prompt_9": "Brimpuses are dull. Lempuses are brimpuses. Wren is lempus. True or false: Wren is windy. Let us think step by step.",
        "response_9": "Wren is lempus. Lempuses are brimpuses. Wren is brimpus. Brimpuses are dull. Wren is",
        "noise_prompt_10": "Brimpuses are dull. Lempuses are brimpuses. Wren is lempus. True or false: Wren is windy. Let us think step by step.",
        "response_10": "Wren is lempus. Lempuses are brimpuses. Wren is brimpus. Brimpuses are dull. Wren is dull.",
        "noise_response_10": "Wren is lempus. Lempuses are brimpuses. Wren is brimpus. Brimpuses are dull. Wren is blue.",
        "answer_token_id_0": 29956,
        "answer_token_pos_0": 380,
        "answer_token_0": "W",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 454,
        "answer_token_pos_1": 383,
        "answer_token_1": "le",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 365,
        "answer_token_pos_2": 387,
        "answer_token_2": "L",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 1506,
        "answer_token_pos_3": 391,
        "answer_token_3": "br",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 399,
        "answer_token_pos_4": 395,
        "answer_token_4": "W",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 1506,
        "answer_token_pos_5": 398,
        "answer_token_5": "br",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 1771,
        "answer_token_pos_6": 402,
        "answer_token_6": "Br",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 270,
        "answer_token_pos_7": 406,
        "answer_token_7": "d",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 399,
        "answer_token_pos_8": 410,
        "answer_token_8": "W",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 270,
        "answer_token_pos_9": 413,
        "answer_token_9": "d",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Brimpuses are metallic. Shumpuses are brimpuses. Polly is shumpus.",
        "query": "True or false: Polly is metallic.",
        "answer": "Polly is shumpus. Shumpuses are brimpuses. Polly is brimpus. Brimpuses are metallic. Polly is metallic. True",
        "label": "True",
        "prompt": "Brimpuses are metallic. Shumpuses are brimpuses. Polly is shumpus. True or false: Polly is metallic. Let us think step by step.",
        "generated": "Polly is shumpus. Shumpuses are brimpuses. Polly is brimpus. Brimpuses are metallic. Polly is metallic. True",
        "noise_response_0": "",
        "noise_prompt_0": "Brimpuses are metallic. Shumpuses are brimpuses. Polly is shumpus. True or false: Alex is metallic. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Polly is",
        "noise_prompt_1": "Brimpuses are metallic. Shumpuses are brimpuses. Polly is orange. True or false: Polly is metallic. Let us think step by step.",
        "response_1": "Polly is",
        "noise_response_2": "Polly is shumpus.",
        "noise_prompt_2": "Brimpuses are metallic. numpus are brimpuses. Polly is shumpus. True or false: Polly is metallic. Let us think step by step.",
        "response_2": "Polly is shumpus.",
        "noise_response_3": "Polly is shumpus. Shumpuses are",
        "noise_prompt_3": "Brimpuses are metallic. Shumpuses are feisty. Polly is shumpus. True or false: Polly is metallic. Let us think step by step.",
        "response_3": "Polly is shumpus. Shumpuses are",
        "noise_response_4": "Rex is shumpus. Shumpuses are brimpuses.",
        "noise_prompt_4": "Brimpuses are metallic. Shumpuses are brimpuses. Polly is shumpus. True or false: Polly is metallic. Let us think step by step.",
        "response_4": "Polly is shumpus. Shumpuses are brimpuses.",
        "noise_response_5": "Polly is shumpus. Shumpuses are metallic. Polly is",
        "noise_prompt_5": "Brimpuses are metallic. Shumpuses are brimpuses. Polly is shumpus. True or false: Polly is metallic. Let us think step by step.",
        "response_5": "Polly is shumpus. Shumpuses are brimpuses. Polly is",
        "noise_response_6": "Polly is shumpus. Shumpuses are brimpuses. Polly is brimpus.",
        "noise_prompt_6": "Tumpus are metallic. Shumpuses are brimpuses. Polly is shumpus. True or false: Polly is metallic. Let us think step by step.",
        "response_6": "Polly is shumpus. Shumpuses are brimpuses. Polly is brimpus.",
        "noise_response_7": "Polly is shumpus. Shumpuses are brimpuses. Polly is brimpus. Brimpuses are",
        "noise_prompt_7": "Brimpuses are metallic. Shumpuses are brimpuses. Polly is shumpus. True or false: Polly is floral. Let us think step by step.",
        "response_7": "Polly is shumpus. Shumpuses are brimpuses. Polly is brimpus. Brimpuses are",
        "noise_response_8": "Polly is shumpus. Shumpuses are brimpuses. Wren is brimpus. Brimpuses are metallic.",
        "noise_prompt_8": "Brimpuses are metallic. Shumpuses are brimpuses. Polly is shumpus. True or false: Polly is metallic. Let us think step by step.",
        "response_8": "Polly is shumpus. Shumpuses are brimpuses. Polly is brimpus. Brimpuses are metallic.",
        "noise_response_9": "Polly is shumpus. Shumpuses are brimpuses. Polly is brimpus. Brimpuses are rainy. Polly is",
        "noise_prompt_9": "Brimpuses are metallic. Shumpuses are brimpuses. Polly is shumpus. True or false: Polly is metallic. Let us think step by step.",
        "response_9": "Polly is shumpus. Shumpuses are brimpuses. Polly is brimpus. Brimpuses are metallic. Polly is",
        "noise_prompt_10": "Brimpuses are metallic. Shumpuses are brimpuses. Polly is shumpus. True or false: Polly is metallic. Let us think step by step.",
        "response_10": "Polly is shumpus. Shumpuses are brimpuses. Polly is brimpus. Brimpuses are metallic. Polly is metallic.",
        "noise_response_10": "Polly is shumpus. Shumpuses are brimpuses. Polly is brimpus. Brimpuses are metallic. Polly is bitter.",
        "answer_token_id_0": 7713,
        "answer_token_pos_0": 380,
        "answer_token_0": "Pol",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 528,
        "answer_token_pos_1": 383,
        "answer_token_1": "sh",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 1383,
        "answer_token_pos_2": 387,
        "answer_token_2": "Sh",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 1506,
        "answer_token_pos_3": 391,
        "answer_token_3": "br",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 2043,
        "answer_token_pos_4": 395,
        "answer_token_4": "Pol",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 1506,
        "answer_token_pos_5": 398,
        "answer_token_5": "br",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 1771,
        "answer_token_pos_6": 402,
        "answer_token_6": "Br",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 1539,
        "answer_token_pos_7": 406,
        "answer_token_7": "met",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 2043,
        "answer_token_pos_8": 410,
        "answer_token_8": "Pol",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 1539,
        "answer_token_pos_9": 413,
        "answer_token_9": "met",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Numpus is earthy. Dumpuses are numpuses. Alex is dumpus.",
        "query": "True or false: Alex is earthy.",
        "answer": "Alex is dumpus. Dumpuses are numpuses. Alex is numpus. Numpus is earthy. Alex is earthy. True",
        "label": "True",
        "prompt": "Numpus is earthy. Dumpuses are numpuses. Alex is dumpus. True or false: Alex is earthy. Let us think step by step.",
        "generated": "Alex is dumpus. Dumpuses are numpuses. Alex is numpus. Numpus is earthy. Alex is earthy. True",
        "noise_response_0": "",
        "noise_prompt_0": "Numpus is earthy. Dumpuses are numpuses. Alex is dumpus. True or false: Sally is earthy. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Alex is",
        "noise_prompt_1": "Numpus is earthy. Dumpuses are numpuses. Alex is gorpus. True or false: Alex is earthy. Let us think step by step.",
        "response_1": "Alex is",
        "noise_response_2": "Alex is dumpus.",
        "noise_prompt_2": "Numpus is earthy. Lorpus are numpuses. Alex is dumpus. True or false: Alex is earthy. Let us think step by step.",
        "response_2": "Alex is dumpus.",
        "noise_response_3": "Alex is dumpus. Dumpuses are",
        "noise_prompt_3": "Numpus is earthy. Dumpuses are lorpus. Alex is dumpus. True or false: Alex is earthy. Let us think step by step.",
        "response_3": "Alex is dumpus. Dumpuses are",
        "noise_response_4": "Sam is dumpus. Dumpuses are numpuses.",
        "noise_prompt_4": "Numpus is earthy. Dumpuses are numpuses. Alex is dumpus. True or false: Alex is earthy. Let us think step by step.",
        "response_4": "Alex is dumpus. Dumpuses are numpuses.",
        "noise_response_5": "Alex is dumpus. Dumpuses are Shumpus. Alex is",
        "noise_prompt_5": "Numpus is earthy. Dumpuses are numpuses. Alex is dumpus. True or false: Alex is earthy. Let us think step by step.",
        "response_5": "Alex is dumpus. Dumpuses are numpuses. Alex is",
        "noise_response_6": "Alex is dumpus. Dumpuses are numpuses. Alex is numpus.",
        "noise_prompt_6": "wumpus is earthy. Dumpuses are numpuses. Alex is dumpus. True or false: Alex is earthy. Let us think step by step.",
        "response_6": "Alex is dumpus. Dumpuses are numpuses. Alex is numpus.",
        "noise_response_7": "Alex is dumpus. Dumpuses are numpuses. Alex is numpus. Numpus is",
        "noise_prompt_7": "Numpus is earthy. Dumpuses are numpuses. Alex is dumpus. True or false: Alex is temperate. Let us think step by step.",
        "response_7": "Alex is dumpus. Dumpuses are numpuses. Alex is numpus. Numpus is",
        "noise_response_8": "Alex is dumpus. Dumpuses are numpuses. Rex is numpus. Numpus is earthy.",
        "noise_prompt_8": "Numpus is earthy. Dumpuses are numpuses. Alex is dumpus. True or false: Alex is earthy. Let us think step by step.",
        "response_8": "Alex is dumpus. Dumpuses are numpuses. Alex is numpus. Numpus is earthy.",
        "noise_response_9": "Alex is dumpus. Dumpuses are numpuses. Alex is numpus. Numpus is metallic. Alex is",
        "noise_prompt_9": "Numpus is earthy. Dumpuses are numpuses. Alex is dumpus. True or false: Alex is earthy. Let us think step by step.",
        "response_9": "Alex is dumpus. Dumpuses are numpuses. Alex is numpus. Numpus is earthy. Alex is",
        "noise_prompt_10": "Numpus is earthy. Dumpuses are numpuses. Alex is dumpus. True or false: Alex is earthy. Let us think step by step.",
        "response_10": "Alex is dumpus. Dumpuses are numpuses. Alex is numpus. Numpus is earthy. Alex is earthy.",
        "noise_response_10": "Alex is dumpus. Dumpuses are numpuses. Alex is numpus. Numpus is earthy. Alex is aggressive.",
        "answer_token_id_0": 17406,
        "answer_token_pos_0": 380,
        "answer_token_0": "Alex",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 16766,
        "answer_token_pos_1": 383,
        "answer_token_1": "dump",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 360,
        "answer_token_pos_2": 387,
        "answer_token_2": "D",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 954,
        "answer_token_pos_3": 391,
        "answer_token_3": "num",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 4827,
        "answer_token_pos_4": 395,
        "answer_token_4": "Alex",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 954,
        "answer_token_pos_5": 398,
        "answer_token_5": "num",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 405,
        "answer_token_pos_6": 402,
        "answer_token_6": "N",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 8437,
        "answer_token_pos_7": 406,
        "answer_token_7": "earth",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 4827,
        "answer_token_pos_8": 410,
        "answer_token_8": "Alex",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 8437,
        "answer_token_pos_9": 413,
        "answer_token_9": "earth",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Grimpus is earthy. Vumpus is grimpus. Wren is vumpus.",
        "query": "True or false: Wren is earthy.",
        "answer": "Wren is vumpus. Vumpus is grimpus. Wren is grimpus. Grimpus is earthy. Wren is earthy. True",
        "label": "True",
        "prompt": "Grimpus is earthy. Vumpus is grimpus. Wren is vumpus. True or false: Wren is earthy. Let us think step by step.",
        "generated": "Wren is vumpus. Vumpus is grimpus. Wren is grimpus. Grimpus is earthy. Wren is earthy. True",
        "noise_response_0": "",
        "noise_prompt_0": "Grimpus is earthy. Vumpus is grimpus. Wren is vumpus. True or false: Sam is earthy. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Wren is",
        "noise_prompt_1": "Grimpus is earthy. Vumpus is grimpus. Wren is Shumpus. True or false: Wren is earthy. Let us think step by step.",
        "response_1": "Wren is",
        "noise_response_2": "Wren is vumpus.",
        "noise_prompt_2": "Grimpus is earthy. brimpus is grimpus. Wren is vumpus. True or false: Wren is earthy. Let us think step by step.",
        "response_2": "Wren is vumpus.",
        "noise_response_3": "Wren is vumpus. Vumpus is",
        "noise_prompt_3": "Grimpus is earthy. Vumpus is Numpus. Wren is vumpus. True or false: Wren is earthy. Let us think step by step.",
        "response_3": "Wren is vumpus. Vumpus is",
        "noise_response_4": "Sally is vumpus. Vumpus is grimpus.",
        "noise_prompt_4": "Grimpus is earthy. Vumpus is grimpus. Wren is vumpus. True or false: Wren is earthy. Let us think step by step.",
        "response_4": "Wren is vumpus. Vumpus is grimpus.",
        "noise_response_5": "Wren is vumpus. Vumpus is dumpus. Wren is",
        "noise_prompt_5": "Grimpus is earthy. Vumpus is grimpus. Wren is vumpus. True or false: Wren is earthy. Let us think step by step.",
        "response_5": "Wren is vumpus. Vumpus is grimpus. Wren is",
        "noise_response_6": "Wren is vumpus. Vumpus is grimpus. Wren is grimpus.",
        "noise_prompt_6": "Impus is earthy. Vumpus is grimpus. Wren is vumpus. True or false: Wren is earthy. Let us think step by step.",
        "response_6": "Wren is vumpus. Vumpus is grimpus. Wren is grimpus.",
        "noise_response_7": "Wren is vumpus. Vumpus is grimpus. Wren is grimpus. Grimpus is",
        "noise_prompt_7": "Grimpus is earthy. Vumpus is grimpus. Wren is vumpus. True or false: Wren is large. Let us think step by step.",
        "response_7": "Wren is vumpus. Vumpus is grimpus. Wren is grimpus. Grimpus is",
        "noise_response_8": "Wren is vumpus. Vumpus is grimpus. Alex is grimpus. Grimpus is earthy.",
        "noise_prompt_8": "Grimpus is earthy. Vumpus is grimpus. Wren is vumpus. True or false: Wren is earthy. Let us think step by step.",
        "response_8": "Wren is vumpus. Vumpus is grimpus. Wren is grimpus. Grimpus is earthy.",
        "noise_response_9": "Wren is vumpus. Vumpus is grimpus. Wren is grimpus. Grimpus is fruity. Wren is",
        "noise_prompt_9": "Grimpus is earthy. Vumpus is grimpus. Wren is vumpus. True or false: Wren is earthy. Let us think step by step.",
        "response_9": "Wren is vumpus. Vumpus is grimpus. Wren is grimpus. Grimpus is earthy. Wren is",
        "noise_prompt_10": "Grimpus is earthy. Vumpus is grimpus. Wren is vumpus. True or false: Wren is earthy. Let us think step by step.",
        "response_10": "Wren is vumpus. Vumpus is grimpus. Wren is grimpus. Grimpus is earthy. Wren is earthy.",
        "noise_response_10": "Wren is vumpus. Vumpus is grimpus. Wren is grimpus. Grimpus is earthy. Wren is metallic.",
        "answer_token_id_0": 29956,
        "answer_token_pos_0": 380,
        "answer_token_0": "W",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 325,
        "answer_token_pos_1": 383,
        "answer_token_1": "v",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 478,
        "answer_token_pos_2": 387,
        "answer_token_2": "V",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 867,
        "answer_token_pos_3": 391,
        "answer_token_3": "gr",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 399,
        "answer_token_pos_4": 395,
        "answer_token_4": "W",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 867,
        "answer_token_pos_5": 398,
        "answer_token_5": "gr",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 1632,
        "answer_token_pos_6": 402,
        "answer_token_6": "Gr",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 8437,
        "answer_token_pos_7": 406,
        "answer_token_7": "earth",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 399,
        "answer_token_pos_8": 410,
        "answer_token_8": "W",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 8437,
        "answer_token_pos_9": 413,
        "answer_token_9": "earth",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Impus is windy. Sterpuses are impuses. Fae is sterpus.",
        "query": "True or false: Fae is windy.",
        "answer": "Fae is sterpus. Sterpuses are impuses. Fae is impus. Impus is windy. Fae is windy. True",
        "label": "True",
        "prompt": "Impus is windy. Sterpuses are impuses. Fae is sterpus. True or false: Fae is windy. Let us think step by step.",
        "generated": "Fae is sterpus. Sterpuses are impuses. Fae is impus. Impus is windy. Fae is windy. True",
        "noise_response_0": "",
        "noise_prompt_0": "Impus is windy. Sterpuses are impuses. Fae is sterpus. True or false: Alex is windy. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Fae is",
        "noise_prompt_1": "Impus is windy. Sterpuses are impuses. Fae is Rompus. True or false: Fae is windy. Let us think step by step.",
        "response_1": "Fae is",
        "noise_response_2": "Fae is sterpus.",
        "noise_prompt_2": "Impus is windy. dumpus are impuses. Fae is sterpus. True or false: Fae is windy. Let us think step by step.",
        "response_2": "Fae is sterpus.",
        "noise_response_3": "Fae is sterpus. Sterpuses are",
        "noise_prompt_3": "Impus is windy. Sterpuses are Gorpus. Fae is sterpus. True or false: Fae is windy. Let us think step by step.",
        "response_3": "Fae is sterpus. Sterpuses are",
        "noise_response_4": "Max is sterpus. Sterpuses are impuses.",
        "noise_prompt_4": "Impus is windy. Sterpuses are impuses. Fae is sterpus. True or false: Fae is windy. Let us think step by step.",
        "response_4": "Fae is sterpus. Sterpuses are impuses.",
        "noise_response_5": "Fae is sterpus. Sterpuses are grimpus. Fae is",
        "noise_prompt_5": "Impus is windy. Sterpuses are impuses. Fae is sterpus. True or false: Fae is windy. Let us think step by step.",
        "response_5": "Fae is sterpus. Sterpuses are impuses. Fae is",
        "noise_response_6": "Fae is sterpus. Sterpuses are impuses. Fae is impus.",
        "noise_prompt_6": "grimpus is windy. Sterpuses are impuses. Fae is sterpus. True or false: Fae is windy. Let us think step by step.",
        "response_6": "Fae is sterpus. Sterpuses are impuses. Fae is impus.",
        "noise_response_7": "Fae is sterpus. Sterpuses are impuses. Fae is impus. Impus is",
        "noise_prompt_7": "Impus is windy. Sterpuses are impuses. Fae is sterpus. True or false: Fae is overcast. Let us think step by step.",
        "response_7": "Fae is sterpus. Sterpuses are impuses. Fae is impus. Impus is",
        "noise_response_8": "Fae is sterpus. Sterpuses are impuses. Alex is impus. Impus is windy.",
        "noise_prompt_8": "Impus is windy. Sterpuses are impuses. Fae is sterpus. True or false: Fae is windy. Let us think step by step.",
        "response_8": "Fae is sterpus. Sterpuses are impuses. Fae is impus. Impus is windy.",
        "noise_response_9": "Fae is sterpus. Sterpuses are impuses. Fae is impus. Impus is happy. Fae is",
        "noise_prompt_9": "Impus is windy. Sterpuses are impuses. Fae is sterpus. True or false: Fae is windy. Let us think step by step.",
        "response_9": "Fae is sterpus. Sterpuses are impuses. Fae is impus. Impus is windy. Fae is",
        "noise_prompt_10": "Impus is windy. Sterpuses are impuses. Fae is sterpus. True or false: Fae is windy. Let us think step by step.",
        "response_10": "Fae is sterpus. Sterpuses are impuses. Fae is impus. Impus is windy. Fae is windy.",
        "noise_response_10": "Fae is sterpus. Sterpuses are impuses. Fae is impus. Impus is windy. Fae is snowy.",
        "answer_token_id_0": 29943,
        "answer_token_pos_0": 380,
        "answer_token_0": "F",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 16864,
        "answer_token_pos_1": 383,
        "answer_token_1": "ster",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 28588,
        "answer_token_pos_2": 387,
        "answer_token_2": "Ster",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 2411,
        "answer_token_pos_3": 391,
        "answer_token_3": "imp",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 14305,
        "answer_token_pos_4": 395,
        "answer_token_4": "Imp",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 2411,
        "answer_token_pos_5": 398,
        "answer_token_5": "imp",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 14305,
        "answer_token_pos_6": 402,
        "answer_token_6": "Imp",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 8805,
        "answer_token_pos_7": 406,
        "answer_token_7": "wind",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 383,
        "answer_token_pos_8": 410,
        "answer_token_8": "F",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 8805,
        "answer_token_pos_9": 413,
        "answer_token_9": "wind",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Vumpuses are fruity. Sterpus is vumpus. Max is sterpus.",
        "query": "True or false: Max is fruity.",
        "answer": "Max is sterpus. Sterpus is vumpus. Max is vumpus. Vumpuses are fruity. Max is fruity. True",
        "label": "True",
        "prompt": "Vumpuses are fruity. Sterpus is vumpus. Max is sterpus. True or false: Max is fruity. Let us think step by step.",
        "generated": "Max is sterpus. Sterpus is vumpus. Max is vumpus. Vumpuses are fruity. Max is fruity. True",
        "noise_response_0": "",
        "noise_prompt_0": "Vumpuses are fruity. Sterpus is vumpus. Max is sterpus. True or false: Alex is fruity. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Max is",
        "noise_prompt_1": "Vumpuses are fruity. Sterpus is vumpus. Max is lorpus. True or false: Max is fruity. Let us think step by step.",
        "response_1": "Max is",
        "noise_response_2": "Max is sterpus.",
        "noise_prompt_2": "Vumpuses are fruity. Numpus is vumpus. Max is sterpus. True or false: Max is fruity. Let us think step by step.",
        "response_2": "Max is sterpus.",
        "noise_response_3": "Max is sterpus. Sterpus is",
        "noise_prompt_3": "Vumpuses are fruity. Sterpus is brimpus. Max is sterpus. True or false: Max is fruity. Let us think step by step.",
        "response_3": "Max is sterpus. Sterpus is",
        "noise_response_4": "Sally is sterpus. Sterpus is vumpus.",
        "noise_prompt_4": "Vumpuses are fruity. Sterpus is vumpus. Max is sterpus. True or false: Max is fruity. Let us think step by step.",
        "response_4": "Max is sterpus. Sterpus is vumpus.",
        "noise_response_5": "Max is sterpus. Sterpus is Sterpus. Max is",
        "noise_prompt_5": "Vumpuses are fruity. Sterpus is vumpus. Max is sterpus. True or false: Max is fruity. Let us think step by step.",
        "response_5": "Max is sterpus. Sterpus is vumpus. Max is",
        "noise_response_6": "Max is sterpus. Sterpus is vumpus. Max is vumpus.",
        "noise_prompt_6": "Lorpus are fruity. Sterpus is vumpus. Max is sterpus. True or false: Max is fruity. Let us think step by step.",
        "response_6": "Max is sterpus. Sterpus is vumpus. Max is vumpus.",
        "noise_response_7": "Max is sterpus. Sterpus is vumpus. Max is vumpus. Vumpuses are",
        "noise_prompt_7": "Vumpuses are fruity. Sterpus is vumpus. Max is sterpus. True or false: Max is bitter. Let us think step by step.",
        "response_7": "Max is sterpus. Sterpus is vumpus. Max is vumpus. Vumpuses are",
        "noise_response_8": "Max is sterpus. Sterpus is vumpus. Wren is vumpus. Vumpuses are fruity.",
        "noise_prompt_8": "Vumpuses are fruity. Sterpus is vumpus. Max is sterpus. True or false: Max is fruity. Let us think step by step.",
        "response_8": "Max is sterpus. Sterpus is vumpus. Max is vumpus. Vumpuses are fruity.",
        "noise_response_9": "Max is sterpus. Sterpus is vumpus. Max is vumpus. Vumpuses are bitter. Max is",
        "noise_prompt_9": "Vumpuses are fruity. Sterpus is vumpus. Max is sterpus. True or false: Max is fruity. Let us think step by step.",
        "response_9": "Max is sterpus. Sterpus is vumpus. Max is vumpus. Vumpuses are fruity. Max is",
        "noise_prompt_10": "Vumpuses are fruity. Sterpus is vumpus. Max is sterpus. True or false: Max is fruity. Let us think step by step.",
        "response_10": "Max is sterpus. Sterpus is vumpus. Max is vumpus. Vumpuses are fruity. Max is fruity.",
        "noise_response_10": "Max is sterpus. Sterpus is vumpus. Max is vumpus. Vumpuses are fruity. Max is nervous.",
        "answer_token_id_0": 7976,
        "answer_token_pos_0": 380,
        "answer_token_0": "Max",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 16864,
        "answer_token_pos_1": 383,
        "answer_token_1": "ster",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 28588,
        "answer_token_pos_2": 387,
        "answer_token_2": "Ster",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 325,
        "answer_token_pos_3": 391,
        "answer_token_3": "v",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 5918,
        "answer_token_pos_4": 395,
        "answer_token_4": "Max",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 325,
        "answer_token_pos_5": 398,
        "answer_token_5": "v",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 478,
        "answer_token_pos_6": 402,
        "answer_token_6": "V",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 285,
        "answer_token_pos_7": 406,
        "answer_token_7": "f",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 5918,
        "answer_token_pos_8": 410,
        "answer_token_8": "Max",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 285,
        "answer_token_pos_9": 413,
        "answer_token_9": "f",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Gorpus is fast. Brimpus is gorpus. Rex is brimpus.",
        "query": "True or false: Rex is fast.",
        "answer": "Rex is brimpus. Brimpus is gorpus. Rex is gorpus. Gorpus is fast. Rex is fast. True",
        "label": "True",
        "prompt": "Gorpus is fast. Brimpus is gorpus. Rex is brimpus. True or false: Rex is fast. Let us think step by step.",
        "generated": "Rex is brimpus. Brimpus is gorpus. Rex is gorpus. Gorpus is fast. Rex is fast. True",
        "noise_response_0": "",
        "noise_prompt_0": "Gorpus is fast. Brimpus is gorpus. Rex is brimpus. True or false: Sally is fast. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Rex is",
        "noise_prompt_1": "Gorpus is fast. Brimpus is gorpus. Rex is red. True or false: Rex is fast. Let us think step by step.",
        "response_1": "Rex is",
        "noise_response_2": "Rex is brimpus.",
        "noise_prompt_2": "Gorpus is fast. lorpus is gorpus. Rex is brimpus. True or false: Rex is fast. Let us think step by step.",
        "response_2": "Rex is brimpus.",
        "noise_response_3": "Rex is brimpus. Brimpus is",
        "noise_prompt_3": "Gorpus is fast. Brimpus is Rompus. Rex is brimpus. True or false: Rex is fast. Let us think step by step.",
        "response_3": "Rex is brimpus. Brimpus is",
        "noise_response_4": "Wren is brimpus. Brimpus is gorpus.",
        "noise_prompt_4": "Gorpus is fast. Brimpus is gorpus. Rex is brimpus. True or false: Rex is fast. Let us think step by step.",
        "response_4": "Rex is brimpus. Brimpus is gorpus.",
        "noise_response_5": "Rex is brimpus. Brimpus is yumpus. Rex is",
        "noise_prompt_5": "Gorpus is fast. Brimpus is gorpus. Rex is brimpus. True or false: Rex is fast. Let us think step by step.",
        "response_5": "Rex is brimpus. Brimpus is gorpus. Rex is",
        "noise_response_6": "Rex is brimpus. Brimpus is gorpus. Rex is gorpus.",
        "noise_prompt_6": "impus is fast. Brimpus is gorpus. Rex is brimpus. True or false: Rex is fast. Let us think step by step.",
        "response_6": "Rex is brimpus. Brimpus is gorpus. Rex is gorpus.",
        "noise_response_7": "Rex is brimpus. Brimpus is gorpus. Rex is gorpus. Gorpus is",
        "noise_prompt_7": "Gorpus is fast. Brimpus is gorpus. Rex is brimpus. True or false: Rex is melodic. Let us think step by step.",
        "response_7": "Rex is brimpus. Brimpus is gorpus. Rex is gorpus. Gorpus is",
        "noise_response_8": "Rex is brimpus. Brimpus is gorpus. Polly is gorpus. Gorpus is fast.",
        "noise_prompt_8": "Gorpus is fast. Brimpus is gorpus. Rex is brimpus. True or false: Rex is fast. Let us think step by step.",
        "response_8": "Rex is brimpus. Brimpus is gorpus. Rex is gorpus. Gorpus is fast.",
        "noise_response_9": "Rex is brimpus. Brimpus is gorpus. Rex is gorpus. Gorpus is feisty. Rex is",
        "noise_prompt_9": "Gorpus is fast. Brimpus is gorpus. Rex is brimpus. True or false: Rex is fast. Let us think step by step.",
        "response_9": "Rex is brimpus. Brimpus is gorpus. Rex is gorpus. Gorpus is fast. Rex is",
        "noise_prompt_10": "Gorpus is fast. Brimpus is gorpus. Rex is brimpus. True or false: Rex is fast. Let us think step by step.",
        "response_10": "Rex is brimpus. Brimpus is gorpus. Rex is gorpus. Gorpus is fast. Rex is fast.",
        "noise_response_10": "Rex is brimpus. Brimpus is gorpus. Rex is gorpus. Gorpus is fast. Rex is dull.",
        "answer_token_id_0": 29934,
        "answer_token_pos_0": 380,
        "answer_token_0": "R",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 1506,
        "answer_token_pos_1": 383,
        "answer_token_1": "br",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 1771,
        "answer_token_pos_2": 387,
        "answer_token_2": "Br",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 330,
        "answer_token_pos_3": 391,
        "answer_token_3": "g",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 390,
        "answer_token_pos_4": 395,
        "answer_token_4": "R",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 330,
        "answer_token_pos_5": 398,
        "answer_token_5": "g",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 18686,
        "answer_token_pos_6": 402,
        "answer_token_6": "Gor",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 5172,
        "answer_token_pos_7": 406,
        "answer_token_7": "fast",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 390,
        "answer_token_pos_8": 410,
        "answer_token_8": "R",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 5172,
        "answer_token_pos_9": 413,
        "answer_token_9": "fast",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Sterpuses are small. Gorpus is sterpus. Stella is gorpus.",
        "query": "True or false: Stella is small.",
        "answer": "Stella is gorpus. Gorpus is sterpus. Stella is sterpus. Sterpuses are small. Stella is small. True",
        "label": "True",
        "prompt": "Sterpuses are small. Gorpus is sterpus. Stella is gorpus. True or false: Stella is small. Let us think step by step.",
        "generated": "Stella is gorpus. Gorpus is sterpus. Stella is sterpus. Sterpuses are small. Stella is small. True",
        "noise_response_0": "",
        "noise_prompt_0": "Sterpuses are small. Gorpus is sterpus. Stella is gorpus. True or false: Fae is small. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Stella is",
        "noise_prompt_1": "Sterpuses are small. Gorpus is sterpus. Stella is grimpus. True or false: Stella is small. Let us think step by step.",
        "response_1": "Stella is",
        "noise_response_2": "Stella is gorpus.",
        "noise_prompt_2": "Sterpuses are small. Wumpus is sterpus. Stella is gorpus. True or false: Stella is small. Let us think step by step.",
        "response_2": "Stella is gorpus.",
        "noise_response_3": "Stella is gorpus. Gorpus is",
        "noise_prompt_3": "Sterpuses are small. Gorpus is lempus. Stella is gorpus. True or false: Stella is small. Let us think step by step.",
        "response_3": "Stella is gorpus. Gorpus is",
        "noise_response_4": "Sally is gorpus. Gorpus is sterpus.",
        "noise_prompt_4": "Sterpuses are small. Gorpus is sterpus. Stella is gorpus. True or false: Stella is small. Let us think step by step.",
        "response_4": "Stella is gorpus. Gorpus is sterpus.",
        "noise_response_5": "Stella is gorpus. Gorpus is tumpus. Stella is",
        "noise_prompt_5": "Sterpuses are small. Gorpus is sterpus. Stella is gorpus. True or false: Stella is small. Let us think step by step.",
        "response_5": "Stella is gorpus. Gorpus is sterpus. Stella is",
        "noise_response_6": "Stella is gorpus. Gorpus is sterpus. Stella is sterpus.",
        "noise_prompt_6": "lorpus are small. Gorpus is sterpus. Stella is gorpus. True or false: Stella is small. Let us think step by step.",
        "response_6": "Stella is gorpus. Gorpus is sterpus. Stella is sterpus.",
        "noise_response_7": "Stella is gorpus. Gorpus is sterpus. Stella is sterpus. Sterpuses are",
        "noise_prompt_7": "Sterpuses are small. Gorpus is sterpus. Stella is gorpus. True or false: Stella is bitter. Let us think step by step.",
        "response_7": "Stella is gorpus. Gorpus is sterpus. Stella is sterpus. Sterpuses are",
        "noise_response_8": "Stella is gorpus. Gorpus is sterpus. Stella is sterpus. Stella are small.",
        "noise_prompt_8": "Sterpuses are small. Gorpus is sterpus. Stella is gorpus. True or false: Stella is small. Let us think step by step.",
        "response_8": "Stella is gorpus. Gorpus is sterpus. Stella is sterpus. Sterpuses are small.",
        "noise_response_9": "Stella is gorpus. Gorpus is sterpus. Stella is sterpus. Sterpuses are sour. Stella is",
        "noise_prompt_9": "Sterpuses are small. Gorpus is sterpus. Stella is gorpus. True or false: Stella is small. Let us think step by step.",
        "response_9": "Stella is gorpus. Gorpus is sterpus. Stella is sterpus. Sterpuses are small. Stella is",
        "noise_prompt_10": "Sterpuses are small. Gorpus is sterpus. Stella is gorpus. True or false: Stella is small. Let us think step by step.",
        "response_10": "Stella is gorpus. Gorpus is sterpus. Stella is sterpus. Sterpuses are small. Stella is small.",
        "noise_response_10": "Stella is gorpus. Gorpus is sterpus. Stella is sterpus. Sterpuses are small. Stella is shy.",
        "answer_token_id_0": 855,
        "answer_token_pos_0": 380,
        "answer_token_0": "St",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 330,
        "answer_token_pos_1": 383,
        "answer_token_1": "g",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 18686,
        "answer_token_pos_2": 387,
        "answer_token_2": "Gor",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 16864,
        "answer_token_pos_3": 391,
        "answer_token_3": "ster",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 624,
        "answer_token_pos_4": 395,
        "answer_token_4": "St",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 16864,
        "answer_token_pos_5": 398,
        "answer_token_5": "ster",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 28588,
        "answer_token_pos_6": 402,
        "answer_token_6": "Ster",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 2319,
        "answer_token_pos_7": 406,
        "answer_token_7": "small",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 624,
        "answer_token_pos_8": 410,
        "answer_token_8": "St",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 2319,
        "answer_token_pos_9": 413,
        "answer_token_9": "small",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Brimpuses are cold. Tumpuses are brimpuses. Rex is tumpus.",
        "query": "True or false: Rex is sunny.",
        "answer": "Rex is tumpus. Tumpuses are brimpuses. Rex is brimpus. Brimpuses are cold. Rex is cold. False",
        "label": "False",
        "prompt": "Brimpuses are cold. Tumpuses are brimpuses. Rex is tumpus. True or false: Rex is sunny. Let us think step by step.",
        "generated": "Rex is tumpus. Tumpuses are brimpuses. Rex is brimpus. Brimpuses are cold. Rex is cold. False",
        "noise_response_0": "",
        "noise_prompt_0": "Brimpuses are cold. Tumpuses are brimpuses. Rex is tumpus. True or false: Max is sunny. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Rex is",
        "noise_prompt_1": "Brimpuses are cold. Tumpuses are brimpuses. Rex is bright. True or false: Rex is sunny. Let us think step by step.",
        "response_1": "Rex is",
        "noise_response_2": "Rex is tumpus.",
        "noise_prompt_2": "Brimpuses are cold. shumpus are brimpuses. Rex is tumpus. True or false: Rex is sunny. Let us think step by step.",
        "response_2": "Rex is tumpus.",
        "noise_response_3": "Rex is tumpus. Tumpuses are",
        "noise_prompt_3": "Brimpuses are cold. Tumpuses are bright. Rex is tumpus. True or false: Rex is sunny. Let us think step by step.",
        "response_3": "Rex is tumpus. Tumpuses are",
        "noise_response_4": "Wren is tumpus. Tumpuses are brimpuses.",
        "noise_prompt_4": "Brimpuses are cold. Tumpuses are brimpuses. Rex is tumpus. True or false: Rex is sunny. Let us think step by step.",
        "response_4": "Rex is tumpus. Tumpuses are brimpuses.",
        "noise_response_5": "Rex is tumpus. Tumpuses are cold. Rex is",
        "noise_prompt_5": "Brimpuses are cold. Tumpuses are brimpuses. Rex is tumpus. True or false: Rex is sunny. Let us think step by step.",
        "response_5": "Rex is tumpus. Tumpuses are brimpuses. Rex is",
        "noise_response_6": "Rex is tumpus. Tumpuses are brimpuses. Rex is brimpus.",
        "noise_prompt_6": "numpus are cold. Tumpuses are brimpuses. Rex is tumpus. True or false: Rex is sunny. Let us think step by step.",
        "response_6": "Rex is tumpus. Tumpuses are brimpuses. Rex is brimpus.",
        "noise_response_7": "Rex is tumpus. Tumpuses are brimpuses. Rex is brimpus. Brimpuses are",
        "noise_prompt_7": "Brimpuses are dull. Tumpuses are brimpuses. Rex is tumpus. True or false: Rex is sunny. Let us think step by step.",
        "response_7": "Rex is tumpus. Tumpuses are brimpuses. Rex is brimpus. Brimpuses are",
        "noise_response_8": "Rex is tumpus. Tumpuses are brimpuses. Stella is brimpus. Brimpuses are cold.",
        "noise_prompt_8": "Brimpuses are cold. Tumpuses are brimpuses. Rex is tumpus. True or false: Rex is sunny. Let us think step by step.",
        "response_8": "Rex is tumpus. Tumpuses are brimpuses. Rex is brimpus. Brimpuses are cold.",
        "noise_response_9": "Rex is tumpus. Tumpuses are brimpuses. Rex is brimpus. Brimpuses are fast. Rex is",
        "noise_prompt_9": "Brimpuses are cold. Tumpuses are brimpuses. Rex is tumpus. True or false: Rex is sunny. Let us think step by step.",
        "response_9": "Rex is tumpus. Tumpuses are brimpuses. Rex is brimpus. Brimpuses are cold. Rex is",
        "noise_prompt_10": "Brimpuses are cold. Tumpuses are brimpuses. Rex is tumpus. True or false: Rex is sunny. Let us think step by step.",
        "response_10": "Rex is tumpus. Tumpuses are brimpuses. Rex is brimpus. Brimpuses are cold. Rex is cold.",
        "noise_response_10": "Rex is tumpus. Tumpuses are brimpuses. Rex is brimpus. Brimpuses are cold. Rex is brown.",
        "answer_token_id_0": 29934,
        "answer_token_pos_0": 380,
        "answer_token_0": "R",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 260,
        "answer_token_pos_1": 383,
        "answer_token_1": "t",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 323,
        "answer_token_pos_2": 387,
        "answer_token_2": "T",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 1506,
        "answer_token_pos_3": 391,
        "answer_token_3": "br",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 390,
        "answer_token_pos_4": 395,
        "answer_token_4": "R",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 1506,
        "answer_token_pos_5": 398,
        "answer_token_5": "br",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 1771,
        "answer_token_pos_6": 402,
        "answer_token_6": "Br",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 11220,
        "answer_token_pos_7": 406,
        "answer_token_7": "cold",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 390,
        "answer_token_pos_8": 410,
        "answer_token_8": "R",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 11220,
        "answer_token_pos_9": 413,
        "answer_token_9": "cold",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Rompuses are transparent. Impus is rompus. Stella is impus.",
        "query": "True or false: Stella is transparent.",
        "answer": "Stella is impus. Impus is rompus. Stella is rompus. Rompuses are transparent. Stella is transparent. True",
        "label": "True",
        "prompt": "Rompuses are transparent. Impus is rompus. Stella is impus. True or false: Stella is transparent. Let us think step by step.",
        "generated": "Stella is impus. Impus is rompus. Stella is rompus. Rompuses are transparent. Stella is transparent. True",
        "noise_response_0": "",
        "noise_prompt_0": "Rompuses are transparent. Impus is rompus. Stella is impus. True or false: Sally is transparent. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Stella is",
        "noise_prompt_1": "Rompuses are transparent. Impus is rompus. Stella is numpus. True or false: Stella is transparent. Let us think step by step.",
        "response_1": "Stella is",
        "noise_response_2": "Stella is impus.",
        "noise_prompt_2": "Rompuses are transparent. Numpus is rompus. Stella is impus. True or false: Stella is transparent. Let us think step by step.",
        "response_2": "Stella is impus.",
        "noise_response_3": "Stella is impus. Impus is",
        "noise_prompt_3": "Rompuses are transparent. Impus is sterpus. Stella is impus. True or false: Stella is transparent. Let us think step by step.",
        "response_3": "Stella is impus. Impus is",
        "noise_response_4": "Polly is impus. Impus is rompus.",
        "noise_prompt_4": "Rompuses are transparent. Impus is rompus. Stella is impus. True or false: Stella is transparent. Let us think step by step.",
        "response_4": "Stella is impus. Impus is rompus.",
        "noise_response_5": "Stella is impus. Impus is Sterpus. Stella is",
        "noise_prompt_5": "Rompuses are transparent. Impus is rompus. Stella is impus. True or false: Stella is transparent. Let us think step by step.",
        "response_5": "Stella is impus. Impus is rompus. Stella is",
        "noise_response_6": "Stella is impus. Impus is rompus. Stella is rompus.",
        "noise_prompt_6": "Shumpus are transparent. Impus is rompus. Stella is impus. True or false: Stella is transparent. Let us think step by step.",
        "response_6": "Stella is impus. Impus is rompus. Stella is rompus.",
        "noise_response_7": "Stella is impus. Impus is rompus. Stella is rompus. Rompuses are",
        "noise_prompt_7": "Rompuses are transparent. Impus is rompus. Stella is impus. True or false: Stella is transparent. Let us think step by step.",
        "response_7": "Stella is impus. Impus is rompus. Stella is rompus. Rompuses are",
        "noise_response_8": "Stella is impus. Impus is rompus. Sally is rompus. Rompuses are transparent.",
        "noise_prompt_8": "Rompuses are transparent. Impus is rompus. Stella is impus. True or false: Stella is transparent. Let us think step by step.",
        "response_8": "Stella is impus. Impus is rompus. Stella is rompus. Rompuses are transparent.",
        "noise_response_9": "Stella is impus. Impus is rompus. Stella is rompus. Rompuses are sunny. Stella is",
        "noise_prompt_9": "Rompuses are transparent. Impus is rompus. Stella is impus. True or false: Stella is transparent. Let us think step by step.",
        "response_9": "Stella is impus. Impus is rompus. Stella is rompus. Rompuses are transparent. Stella is",
        "noise_prompt_10": "Rompuses are transparent. Impus is rompus. Stella is impus. True or false: Stella is transparent. Let us think step by step.",
        "response_10": "Stella is impus. Impus is rompus. Stella is rompus. Rompuses are transparent. Stella is transparent.",
        "noise_response_10": "Stella is impus. Impus is rompus. Stella is rompus. Rompuses are transparent. Stella is opaque.",
        "answer_token_id_0": 855,
        "answer_token_pos_0": 380,
        "answer_token_0": "St",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 2411,
        "answer_token_pos_1": 383,
        "answer_token_1": "imp",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 14305,
        "answer_token_pos_2": 387,
        "answer_token_2": "Imp",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 6017,
        "answer_token_pos_3": 391,
        "answer_token_3": "rom",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 6033,
        "answer_token_pos_4": 395,
        "answer_token_4": "Rom",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 6017,
        "answer_token_pos_5": 398,
        "answer_token_5": "rom",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 6033,
        "answer_token_pos_6": 402,
        "answer_token_6": "Rom",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 17772,
        "answer_token_pos_7": 406,
        "answer_token_7": "transparent",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 624,
        "answer_token_pos_8": 410,
        "answer_token_8": "St",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 17772,
        "answer_token_pos_9": 413,
        "answer_token_9": "transparent",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Yumpuses are orange. Sterpuses are yumpuses. Rex is sterpus.",
        "query": "True or false: Rex is orange.",
        "answer": "Rex is sterpus. Sterpuses are yumpuses. Rex is yumpus. Yumpuses are orange. Rex is orange. True",
        "label": "True",
        "prompt": "Yumpuses are orange. Sterpuses are yumpuses. Rex is sterpus. True or false: Rex is orange. Let us think step by step.",
        "generated": "Rex is sterpus. Sterpuses are yumpuses. Rex is yumpus. Yumpuses are orange. Rex is orange. True",
        "noise_response_0": "",
        "noise_prompt_0": "Yumpuses are orange. Sterpuses are yumpuses. Rex is sterpus. True or false: Sally is orange. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Rex is",
        "noise_prompt_1": "Yumpuses are orange. Sterpuses are yumpuses. Rex is Jompus. True or false: Rex is orange. Let us think step by step.",
        "response_1": "Rex is",
        "noise_response_2": "Rex is sterpus.",
        "noise_prompt_2": "Yumpuses are orange. dumpus are yumpuses. Rex is sterpus. True or false: Rex is orange. Let us think step by step.",
        "response_2": "Rex is sterpus.",
        "noise_response_3": "Rex is sterpus. Sterpuses are",
        "noise_prompt_3": "Yumpuses are orange. Sterpuses are tumpus. Rex is sterpus. True or false: Rex is orange. Let us think step by step.",
        "response_3": "Rex is sterpus. Sterpuses are",
        "noise_response_4": "Sally is sterpus. Sterpuses are yumpuses.",
        "noise_prompt_4": "Yumpuses are orange. Sterpuses are yumpuses. Rex is sterpus. True or false: Rex is orange. Let us think step by step.",
        "response_4": "Rex is sterpus. Sterpuses are yumpuses.",
        "noise_response_5": "Rex is sterpus. Sterpuses are Wumpus. Rex is",
        "noise_prompt_5": "Yumpuses are orange. Sterpuses are yumpuses. Rex is sterpus. True or false: Rex is orange. Let us think step by step.",
        "response_5": "Rex is sterpus. Sterpuses are yumpuses. Rex is",
        "noise_response_6": "Rex is sterpus. Sterpuses are yumpuses. Rex is yumpus.",
        "noise_prompt_6": "Lempus are orange. Sterpuses are yumpuses. Rex is sterpus. True or false: Rex is orange. Let us think step by step.",
        "response_6": "Rex is sterpus. Sterpuses are yumpuses. Rex is yumpus.",
        "noise_response_7": "Rex is sterpus. Sterpuses are yumpuses. Rex is yumpus. Yumpuses are",
        "noise_prompt_7": "Yumpuses are orange. Sterpuses are yumpuses. Rex is sterpus. True or false: Rex is sunny. Let us think step by step.",
        "response_7": "Rex is sterpus. Sterpuses are yumpuses. Rex is yumpus. Yumpuses are",
        "noise_response_8": "Rex is sterpus. Sterpuses are yumpuses. Sam is yumpus. Yumpuses are orange.",
        "noise_prompt_8": "Yumpuses are orange. Sterpuses are yumpuses. Rex is sterpus. True or false: Rex is orange. Let us think step by step.",
        "response_8": "Rex is sterpus. Sterpuses are yumpuses. Rex is yumpus. Yumpuses are orange.",
        "noise_response_9": "Rex is sterpus. Sterpuses are yumpuses. Rex is yumpus. Yumpuses are small. Rex is",
        "noise_prompt_9": "Yumpuses are orange. Sterpuses are yumpuses. Rex is sterpus. True or false: Rex is orange. Let us think step by step.",
        "response_9": "Rex is sterpus. Sterpuses are yumpuses. Rex is yumpus. Yumpuses are orange. Rex is",
        "noise_prompt_10": "Yumpuses are orange. Sterpuses are yumpuses. Rex is sterpus. True or false: Rex is orange. Let us think step by step.",
        "response_10": "Rex is sterpus. Sterpuses are yumpuses. Rex is yumpus. Yumpuses are orange. Rex is orange.",
        "noise_response_10": "Rex is sterpus. Sterpuses are yumpuses. Rex is yumpus. Yumpuses are orange. Rex is wooden.",
        "answer_token_id_0": 29934,
        "answer_token_pos_0": 380,
        "answer_token_0": "R",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 16864,
        "answer_token_pos_1": 383,
        "answer_token_1": "ster",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 28588,
        "answer_token_pos_2": 387,
        "answer_token_2": "Ster",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 343,
        "answer_token_pos_3": 391,
        "answer_token_3": "y",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 390,
        "answer_token_pos_4": 395,
        "answer_token_4": "R",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 343,
        "answer_token_pos_5": 398,
        "answer_token_5": "y",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 612,
        "answer_token_pos_6": 402,
        "answer_token_6": "Y",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 24841,
        "answer_token_pos_7": 406,
        "answer_token_7": "orange",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 390,
        "answer_token_pos_8": 410,
        "answer_token_8": "R",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 24841,
        "answer_token_pos_9": 413,
        "answer_token_9": "orange",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Wumpuses are cold. Numpuses are wumpuses. Wren is numpus.",
        "query": "True or false: Wren is cold.",
        "answer": "Wren is numpus. Numpuses are wumpuses. Wren is wumpus. Wumpuses are cold. Wren is cold. True",
        "label": "True",
        "prompt": "Wumpuses are cold. Numpuses are wumpuses. Wren is numpus. True or false: Wren is cold. Let us think step by step.",
        "generated": "Wren is numpus. Numpuses are wumpuses. Wren is wumpus. Wumpuses are cold. Wren is cold. True",
        "noise_response_0": "",
        "noise_prompt_0": "Wumpuses are cold. Numpuses are wumpuses. Wren is numpus. True or false: Sally is cold. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Wren is",
        "noise_prompt_1": "Wumpuses are cold. Numpuses are wumpuses. Wren is Shumpus. True or false: Wren is cold. Let us think step by step.",
        "response_1": "Wren is",
        "noise_response_2": "Wren is numpus.",
        "noise_prompt_2": "Wumpuses are cold. gorpus are wumpuses. Wren is numpus. True or false: Wren is cold. Let us think step by step.",
        "response_2": "Wren is numpus.",
        "noise_response_3": "Wren is numpus. Numpuses are",
        "noise_prompt_3": "Wumpuses are cold. Numpuses are loud. Wren is numpus. True or false: Wren is cold. Let us think step by step.",
        "response_3": "Wren is numpus. Numpuses are",
        "noise_response_4": "Rex is numpus. Numpuses are wumpuses.",
        "noise_prompt_4": "Wumpuses are cold. Numpuses are wumpuses. Wren is numpus. True or false: Wren is cold. Let us think step by step.",
        "response_4": "Wren is numpus. Numpuses are wumpuses.",
        "noise_response_5": "Wren is numpus. Numpuses are temperate. Wren is",
        "noise_prompt_5": "Wumpuses are cold. Numpuses are wumpuses. Wren is numpus. True or false: Wren is cold. Let us think step by step.",
        "response_5": "Wren is numpus. Numpuses are wumpuses. Wren is",
        "noise_response_6": "Wren is numpus. Numpuses are wumpuses. Fae is wumpus.",
        "noise_prompt_6": "Wumpuses are cold. Numpuses are wumpuses. Wren is numpus. True or false: Wren is cold. Let us think step by step.",
        "response_6": "Wren is numpus. Numpuses are wumpuses. Wren is wumpus.",
        "noise_response_7": "Wren is numpus. Numpuses are wumpuses. Wren is wumpus. Wumpuses are",
        "noise_prompt_7": "Wumpuses are cold. Numpuses are wumpuses. Wren is numpus. True or false: Wren is temperate. Let us think step by step.",
        "response_7": "Wren is numpus. Numpuses are wumpuses. Wren is wumpus. Wumpuses are",
        "noise_response_8": "Wren is numpus. Numpuses are wumpuses. Wren is wumpus. Sally are cold.",
        "noise_prompt_8": "Wumpuses are cold. Numpuses are wumpuses. Wren is numpus. True or false: Wren is cold. Let us think step by step.",
        "response_8": "Wren is numpus. Numpuses are wumpuses. Wren is wumpus. Wumpuses are cold.",
        "noise_response_9": "Wren is numpus. Numpuses are wumpuses. Wren is wumpus. Wumpuses are fast. Wren is",
        "noise_prompt_9": "Wumpuses are cold. Numpuses are wumpuses. Wren is numpus. True or false: Wren is cold. Let us think step by step.",
        "response_9": "Wren is numpus. Numpuses are wumpuses. Wren is wumpus. Wumpuses are cold. Wren is",
        "noise_prompt_10": "Wumpuses are cold. Numpuses are wumpuses. Wren is numpus. True or false: Wren is cold. Let us think step by step.",
        "response_10": "Wren is numpus. Numpuses are wumpuses. Wren is wumpus. Wumpuses are cold. Wren is cold.",
        "noise_response_10": "Wren is numpus. Numpuses are wumpuses. Wren is wumpus. Wumpuses are cold. Wren is loud.",
        "answer_token_id_0": 29956,
        "answer_token_pos_0": 380,
        "answer_token_0": "W",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 954,
        "answer_token_pos_1": 383,
        "answer_token_1": "num",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 405,
        "answer_token_pos_2": 387,
        "answer_token_2": "N",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 281,
        "answer_token_pos_3": 391,
        "answer_token_3": "w",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 399,
        "answer_token_pos_4": 395,
        "answer_token_4": "W",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 281,
        "answer_token_pos_5": 398,
        "answer_token_5": "w",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 399,
        "answer_token_pos_6": 402,
        "answer_token_6": "W",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 11220,
        "answer_token_pos_7": 406,
        "answer_token_7": "cold",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 399,
        "answer_token_pos_8": 410,
        "answer_token_8": "W",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 11220,
        "answer_token_pos_9": 413,
        "answer_token_9": "cold",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Wumpuses are discordant. Zumpus is wumpus. Sally is zumpus.",
        "query": "True or false: Sally is overcast.",
        "answer": "Sally is zumpus. Zumpus is wumpus. Sally is wumpus. Wumpuses are discordant. Sally is discordant. False",
        "label": "False",
        "prompt": "Wumpuses are discordant. Zumpus is wumpus. Sally is zumpus. True or false: Sally is overcast. Let us think step by step.",
        "generated": "Sally is zumpus. Zumpus is wumpus. Sally is wumpus. Wumpuses are discordant. Sally is discordant. False",
        "noise_response_0": "",
        "noise_prompt_0": "Wumpuses are discordant. Zumpus is wumpus. Sally is zumpus. True or false: Stella is overcast. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Sally is",
        "noise_prompt_1": "Wumpuses are discordant. Zumpus is wumpus. Sally is numpus. True or false: Sally is overcast. Let us think step by step.",
        "response_1": "Sally is",
        "noise_response_2": "Sally is zumpus.",
        "noise_prompt_2": "Wumpuses are discordant. Jompus is wumpus. Sally is zumpus. True or false: Sally is overcast. Let us think step by step.",
        "response_2": "Sally is zumpus.",
        "noise_response_3": "Sally is zumpus. Zumpus is",
        "noise_prompt_3": "Wumpuses are discordant. Zumpus is large. Sally is zumpus. True or false: Sally is overcast. Let us think step by step.",
        "response_3": "Sally is zumpus. Zumpus is",
        "noise_response_4": "Alex is zumpus. Zumpus is wumpus.",
        "noise_prompt_4": "Wumpuses are discordant. Zumpus is wumpus. Sally is zumpus. True or false: Sally is overcast. Let us think step by step.",
        "response_4": "Sally is zumpus. Zumpus is wumpus.",
        "noise_response_5": "Sally is zumpus. Zumpus is liquid. Sally is",
        "noise_prompt_5": "Wumpuses are discordant. Zumpus is wumpus. Sally is zumpus. True or false: Sally is overcast. Let us think step by step.",
        "response_5": "Sally is zumpus. Zumpus is wumpus. Sally is",
        "noise_response_6": "Sally is zumpus. Zumpus is wumpus. Sally is wumpus.",
        "noise_prompt_6": "Fae are discordant. Zumpus is wumpus. Sally is zumpus. True or false: Sally is overcast. Let us think step by step.",
        "response_6": "Sally is zumpus. Zumpus is wumpus. Sally is wumpus.",
        "noise_response_7": "Sally is zumpus. Zumpus is wumpus. Sally is wumpus. Wumpuses are",
        "noise_prompt_7": "Wumpuses are angry. Zumpus is wumpus. Sally is zumpus. True or false: Sally is overcast. Let us think step by step.",
        "response_7": "Sally is zumpus. Zumpus is wumpus. Sally is wumpus. Wumpuses are",
        "noise_response_8": "Sally is zumpus. Zumpus is wumpus. Polly is wumpus. Wumpuses are discordant.",
        "noise_prompt_8": "Wumpuses are discordant. Zumpus is wumpus. Sally is zumpus. True or false: Sally is overcast. Let us think step by step.",
        "response_8": "Sally is zumpus. Zumpus is wumpus. Sally is wumpus. Wumpuses are discordant.",
        "noise_response_9": "Sally is zumpus. Zumpus is wumpus. Sally is wumpus. Wumpuses are moderate. Sally is",
        "noise_prompt_9": "Wumpuses are discordant. Zumpus is wumpus. Sally is zumpus. True or false: Sally is overcast. Let us think step by step.",
        "response_9": "Sally is zumpus. Zumpus is wumpus. Sally is wumpus. Wumpuses are discordant. Sally is",
        "noise_prompt_10": "Wumpuses are discordant. Zumpus is wumpus. Sally is zumpus. True or false: Sally is overcast. Let us think step by step.",
        "response_10": "Sally is zumpus. Zumpus is wumpus. Sally is wumpus. Wumpuses are discordant. Sally is discordant.",
        "noise_response_10": "Sally is zumpus. Zumpus is wumpus. Sally is wumpus. Wumpuses are discordant. Sally is blue.",
        "answer_token_id_0": 29903,
        "answer_token_pos_0": 380,
        "answer_token_0": "S",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 3356,
        "answer_token_pos_1": 383,
        "answer_token_1": "zum",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 796,
        "answer_token_pos_2": 387,
        "answer_token_2": "Z",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 281,
        "answer_token_pos_3": 391,
        "answer_token_3": "w",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 317,
        "answer_token_pos_4": 395,
        "answer_token_4": "S",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 281,
        "answer_token_pos_5": 398,
        "answer_token_5": "w",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 399,
        "answer_token_pos_6": 402,
        "answer_token_6": "W",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 2313,
        "answer_token_pos_7": 406,
        "answer_token_7": "disc",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 317,
        "answer_token_pos_8": 410,
        "answer_token_8": "S",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 2313,
        "answer_token_pos_9": 413,
        "answer_token_9": "disc",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Numpuses are sweet. Lempus is numpus. Alex is lempus.",
        "query": "True or false: Alex is sweet.",
        "answer": "Alex is lempus. Lempus is numpus. Alex is numpus. Numpuses are sweet. Alex is sweet. True",
        "label": "True",
        "prompt": "Numpuses are sweet. Lempus is numpus. Alex is lempus. True or false: Alex is sweet. Let us think step by step.",
        "generated": "Alex is lempus. Lempus is numpus. Alex is numpus. Numpuses are sweet. Alex is sweet. True",
        "noise_response_0": "",
        "noise_prompt_0": "Numpuses are sweet. Lempus is numpus. Alex is lempus. True or false: Rex is sweet. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Alex is",
        "noise_prompt_1": "Numpuses are sweet. Lempus is numpus. Alex is numpus. True or false: Alex is sweet. Let us think step by step.",
        "response_1": "Alex is",
        "noise_response_2": "Alex is lempus.",
        "noise_prompt_2": "Numpuses are sweet. lorpus is numpus. Alex is lempus. True or false: Alex is sweet. Let us think step by step.",
        "response_2": "Alex is lempus.",
        "noise_response_3": "Alex is lempus. Lempus is",
        "noise_prompt_3": "Numpuses are sweet. Lempus is Rompus. Alex is lempus. True or false: Alex is sweet. Let us think step by step.",
        "response_3": "Alex is lempus. Lempus is",
        "noise_response_4": "Stella is lempus. Lempus is numpus.",
        "noise_prompt_4": "Numpuses are sweet. Lempus is numpus. Alex is lempus. True or false: Alex is sweet. Let us think step by step.",
        "response_4": "Alex is lempus. Lempus is numpus.",
        "noise_response_5": "Alex is lempus. Lempus is Impus. Alex is",
        "noise_prompt_5": "Numpuses are sweet. Lempus is numpus. Alex is lempus. True or false: Alex is sweet. Let us think step by step.",
        "response_5": "Alex is lempus. Lempus is numpus. Alex is",
        "noise_response_6": "Alex is lempus. Lempus is numpus. Alex is numpus.",
        "noise_prompt_6": "wumpus are sweet. Lempus is numpus. Alex is lempus. True or false: Alex is sweet. Let us think step by step.",
        "response_6": "Alex is lempus. Lempus is numpus. Alex is numpus.",
        "noise_response_7": "Alex is lempus. Lempus is numpus. Alex is numpus. Numpuses are",
        "noise_prompt_7": "Numpuses are sweet. Lempus is numpus. Alex is lempus. True or false: Alex is feisty. Let us think step by step.",
        "response_7": "Alex is lempus. Lempus is numpus. Alex is numpus. Numpuses are",
        "noise_response_8": "Alex is lempus. Lempus is numpus. Max is numpus. Numpuses are sweet.",
        "noise_prompt_8": "Numpuses are sweet. Lempus is numpus. Alex is lempus. True or false: Alex is sweet. Let us think step by step.",
        "response_8": "Alex is lempus. Lempus is numpus. Alex is numpus. Numpuses are sweet.",
        "noise_response_9": "Alex is lempus. Lempus is numpus. Alex is numpus. Numpuses are amenable. Alex is",
        "noise_prompt_9": "Numpuses are sweet. Lempus is numpus. Alex is lempus. True or false: Alex is sweet. Let us think step by step.",
        "response_9": "Alex is lempus. Lempus is numpus. Alex is numpus. Numpuses are sweet. Alex is",
        "noise_prompt_10": "Numpuses are sweet. Lempus is numpus. Alex is lempus. True or false: Alex is sweet. Let us think step by step.",
        "response_10": "Alex is lempus. Lempus is numpus. Alex is numpus. Numpuses are sweet. Alex is sweet.",
        "noise_response_10": "Alex is lempus. Lempus is numpus. Alex is numpus. Numpuses are sweet. Alex is large.",
        "answer_token_id_0": 17406,
        "answer_token_pos_0": 380,
        "answer_token_0": "Alex",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 454,
        "answer_token_pos_1": 383,
        "answer_token_1": "le",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 365,
        "answer_token_pos_2": 387,
        "answer_token_2": "L",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 954,
        "answer_token_pos_3": 391,
        "answer_token_3": "num",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 405,
        "answer_token_pos_4": 395,
        "answer_token_4": "N",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 954,
        "answer_token_pos_5": 398,
        "answer_token_5": "num",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 405,
        "answer_token_pos_6": 402,
        "answer_token_6": "N",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 14225,
        "answer_token_pos_7": 406,
        "answer_token_7": "sweet",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 4827,
        "answer_token_pos_8": 410,
        "answer_token_8": "Alex",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 14225,
        "answer_token_pos_9": 413,
        "answer_token_9": "sweet",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Wumpus is luminous. Sterpuses are wumpuses. Max is sterpus.",
        "query": "True or false: Max is luminous.",
        "answer": "Max is sterpus. Sterpuses are wumpuses. Max is wumpus. Wumpus is luminous. Max is luminous. True",
        "label": "True",
        "prompt": "Wumpus is luminous. Sterpuses are wumpuses. Max is sterpus. True or false: Max is luminous. Let us think step by step.",
        "generated": "Max is sterpus. Sterpuses are wumpuses. Max is wumpus. Wumpus is luminous. Max is luminous. True",
        "noise_response_0": "",
        "noise_prompt_0": "Wumpus is luminous. Sterpuses are wumpuses. Max is sterpus. True or false: Wren is luminous. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Max is",
        "noise_prompt_1": "Wumpus is luminous. Sterpuses are wumpuses. Max is lorpus. True or false: Max is luminous. Let us think step by step.",
        "response_1": "Max is",
        "noise_response_2": "Max is sterpus.",
        "noise_prompt_2": "Wumpus is luminous. Lempus are wumpuses. Max is sterpus. True or false: Max is luminous. Let us think step by step.",
        "response_2": "Max is sterpus.",
        "noise_response_3": "Max is sterpus. Sterpuses are",
        "noise_prompt_3": "Wumpus is luminous. Sterpuses are luminous. Max is sterpus. True or false: Max is luminous. Let us think step by step.",
        "response_3": "Max is sterpus. Sterpuses are",
        "noise_response_4": "Fae is sterpus. Sterpuses are wumpuses.",
        "noise_prompt_4": "Wumpus is luminous. Sterpuses are wumpuses. Max is sterpus. True or false: Max is luminous. Let us think step by step.",
        "response_4": "Max is sterpus. Sterpuses are wumpuses.",
        "noise_response_5": "Max is sterpus. Sterpuses are sweet. Max is",
        "noise_prompt_5": "Wumpus is luminous. Sterpuses are wumpuses. Max is sterpus. True or false: Max is luminous. Let us think step by step.",
        "response_5": "Max is sterpus. Sterpuses are wumpuses. Max is",
        "noise_response_6": "Max is sterpus. Sterpuses are wumpuses. Max is wumpus.",
        "noise_prompt_6": "Sam is luminous. Sterpuses are wumpuses. Max is sterpus. True or false: Max is luminous. Let us think step by step.",
        "response_6": "Max is sterpus. Sterpuses are wumpuses. Max is wumpus.",
        "noise_response_7": "Max is sterpus. Sterpuses are wumpuses. Max is wumpus. Wumpus is",
        "noise_prompt_7": "Wumpus is luminous. Sterpuses are wumpuses. Max is sterpus. True or false: Max is sour. Let us think step by step.",
        "response_7": "Max is sterpus. Sterpuses are wumpuses. Max is wumpus. Wumpus is",
        "noise_response_8": "Max is sterpus. Sterpuses are wumpuses. Stella is wumpus. Wumpus is luminous.",
        "noise_prompt_8": "Wumpus is luminous. Sterpuses are wumpuses. Max is sterpus. True or false: Max is luminous. Let us think step by step.",
        "response_8": "Max is sterpus. Sterpuses are wumpuses. Max is wumpus. Wumpus is luminous.",
        "noise_response_9": "Max is sterpus. Sterpuses are wumpuses. Max is wumpus. Wumpus is aggressive. Max is",
        "noise_prompt_9": "Wumpus is luminous. Sterpuses are wumpuses. Max is sterpus. True or false: Max is luminous. Let us think step by step.",
        "response_9": "Max is sterpus. Sterpuses are wumpuses. Max is wumpus. Wumpus is luminous. Max is",
        "noise_prompt_10": "Wumpus is luminous. Sterpuses are wumpuses. Max is sterpus. True or false: Max is luminous. Let us think step by step.",
        "response_10": "Max is sterpus. Sterpuses are wumpuses. Max is wumpus. Wumpus is luminous. Max is luminous.",
        "noise_response_10": "Max is sterpus. Sterpuses are wumpuses. Max is wumpus. Wumpus is luminous. Max is cold.",
        "answer_token_id_0": 7976,
        "answer_token_pos_0": 380,
        "answer_token_0": "Max",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 16864,
        "answer_token_pos_1": 383,
        "answer_token_1": "ster",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 28588,
        "answer_token_pos_2": 387,
        "answer_token_2": "Ster",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 281,
        "answer_token_pos_3": 391,
        "answer_token_3": "w",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 5918,
        "answer_token_pos_4": 395,
        "answer_token_4": "Max",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 281,
        "answer_token_pos_5": 398,
        "answer_token_5": "w",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 399,
        "answer_token_pos_6": 402,
        "answer_token_6": "W",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 301,
        "answer_token_pos_7": 406,
        "answer_token_7": "l",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 5918,
        "answer_token_pos_8": 410,
        "answer_token_8": "Max",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 301,
        "answer_token_pos_9": 413,
        "answer_token_9": "l",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Lorpus is windy. Zumpus is lorpus. Max is zumpus.",
        "query": "True or false: Max is windy.",
        "answer": "Max is zumpus. Zumpus is lorpus. Max is lorpus. Lorpus is windy. Max is windy. True",
        "label": "True",
        "prompt": "Lorpus is windy. Zumpus is lorpus. Max is zumpus. True or false: Max is windy. Let us think step by step.",
        "generated": "Max is zumpus. Zumpus is lorpus. Max is lorpus. Lorpus is windy. Max is windy. True",
        "noise_response_0": "",
        "noise_prompt_0": "Lorpus is windy. Zumpus is lorpus. Max is zumpus. True or false: Fae is windy. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Max is",
        "noise_prompt_1": "Lorpus is windy. Zumpus is lorpus. Max is wumpus. True or false: Max is windy. Let us think step by step.",
        "response_1": "Max is",
        "noise_response_2": "Max is zumpus.",
        "noise_prompt_2": "Lorpus is windy. lempus is lorpus. Max is zumpus. True or false: Max is windy. Let us think step by step.",
        "response_2": "Max is zumpus.",
        "noise_response_3": "Max is zumpus. Zumpus is",
        "noise_prompt_3": "Lorpus is windy. Zumpus is floral. Max is zumpus. True or false: Max is windy. Let us think step by step.",
        "response_3": "Max is zumpus. Zumpus is",
        "noise_response_4": "Fae is zumpus. Zumpus is lorpus.",
        "noise_prompt_4": "Lorpus is windy. Zumpus is lorpus. Max is zumpus. True or false: Max is windy. Let us think step by step.",
        "response_4": "Max is zumpus. Zumpus is lorpus.",
        "noise_response_5": "Max is zumpus. Zumpus is sweet. Max is",
        "noise_prompt_5": "Lorpus is windy. Zumpus is lorpus. Max is zumpus. True or false: Max is windy. Let us think step by step.",
        "response_5": "Max is zumpus. Zumpus is lorpus. Max is",
        "noise_response_6": "Max is zumpus. Zumpus is lorpus. Max is lorpus.",
        "noise_prompt_6": "Gorpus is windy. Zumpus is lorpus. Max is zumpus. True or false: Max is windy. Let us think step by step.",
        "response_6": "Max is zumpus. Zumpus is lorpus. Max is lorpus.",
        "noise_response_7": "Max is zumpus. Zumpus is lorpus. Max is lorpus. Lorpus is",
        "noise_prompt_7": "Lorpus is windy. Zumpus is lorpus. Max is zumpus. True or false: Max is fruity. Let us think step by step.",
        "response_7": "Max is zumpus. Zumpus is lorpus. Max is lorpus. Lorpus is",
        "noise_response_8": "Max is zumpus. Zumpus is lorpus. Alex is lorpus. Lorpus is windy.",
        "noise_prompt_8": "Lorpus is windy. Zumpus is lorpus. Max is zumpus. True or false: Max is windy. Let us think step by step.",
        "response_8": "Max is zumpus. Zumpus is lorpus. Max is lorpus. Lorpus is windy.",
        "noise_response_9": "Max is zumpus. Zumpus is lorpus. Max is lorpus. Lorpus is amenable. Max is",
        "noise_prompt_9": "Lorpus is windy. Zumpus is lorpus. Max is zumpus. True or false: Max is windy. Let us think step by step.",
        "response_9": "Max is zumpus. Zumpus is lorpus. Max is lorpus. Lorpus is windy. Max is",
        "noise_prompt_10": "Lorpus is windy. Zumpus is lorpus. Max is zumpus. True or false: Max is windy. Let us think step by step.",
        "response_10": "Max is zumpus. Zumpus is lorpus. Max is lorpus. Lorpus is windy. Max is windy.",
        "noise_response_10": "Max is zumpus. Zumpus is lorpus. Max is lorpus. Lorpus is windy. Max is moderate.",
        "answer_token_id_0": 7976,
        "answer_token_pos_0": 380,
        "answer_token_0": "Max",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 3356,
        "answer_token_pos_1": 383,
        "answer_token_1": "zum",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 796,
        "answer_token_pos_2": 387,
        "answer_token_2": "Z",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 301,
        "answer_token_pos_3": 391,
        "answer_token_3": "l",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 5918,
        "answer_token_pos_4": 395,
        "answer_token_4": "Max",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 301,
        "answer_token_pos_5": 398,
        "answer_token_5": "l",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 10980,
        "answer_token_pos_6": 402,
        "answer_token_6": "Lor",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 8805,
        "answer_token_pos_7": 406,
        "answer_token_7": "wind",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 5918,
        "answer_token_pos_8": 410,
        "answer_token_8": "Max",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 8805,
        "answer_token_pos_9": 413,
        "answer_token_9": "wind",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Lorpus is slow. Grimpus is lorpus. Stella is grimpus.",
        "query": "True or false: Stella is slow.",
        "answer": "Stella is grimpus. Grimpus is lorpus. Stella is lorpus. Lorpus is slow. Stella is slow. True",
        "label": "True",
        "prompt": "Lorpus is slow. Grimpus is lorpus. Stella is grimpus. True or false: Stella is slow. Let us think step by step.",
        "generated": "Stella is grimpus. Grimpus is lorpus. Stella is lorpus. Lorpus is slow. Stella is slow. True",
        "noise_response_0": "",
        "noise_prompt_0": "Lorpus is slow. Grimpus is lorpus. Stella is grimpus. True or false: Max is slow. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Stella is",
        "noise_prompt_1": "Lorpus is slow. Grimpus is lorpus. Stella is Grimpus. True or false: Stella is slow. Let us think step by step.",
        "response_1": "Stella is",
        "noise_response_2": "Stella is grimpus.",
        "noise_prompt_2": "Lorpus is slow. Tumpus is lorpus. Stella is grimpus. True or false: Stella is slow. Let us think step by step.",
        "response_2": "Stella is grimpus.",
        "noise_response_3": "Stella is grimpus. Grimpus is",
        "noise_prompt_3": "Lorpus is slow. Grimpus is aggressive. Stella is grimpus. True or false: Stella is slow. Let us think step by step.",
        "response_3": "Stella is grimpus. Grimpus is",
        "noise_response_4": "Max is grimpus. Grimpus is lorpus.",
        "noise_prompt_4": "Lorpus is slow. Grimpus is lorpus. Stella is grimpus. True or false: Stella is slow. Let us think step by step.",
        "response_4": "Stella is grimpus. Grimpus is lorpus.",
        "noise_response_5": "Stella is grimpus. Grimpus is bright. Stella is",
        "noise_prompt_5": "Lorpus is slow. Grimpus is lorpus. Stella is grimpus. True or false: Stella is slow. Let us think step by step.",
        "response_5": "Stella is grimpus. Grimpus is lorpus. Stella is",
        "noise_response_6": "Stella is grimpus. Grimpus is lorpus. Stella is lorpus.",
        "noise_prompt_6": "Numpus is slow. Grimpus is lorpus. Stella is grimpus. True or false: Stella is slow. Let us think step by step.",
        "response_6": "Stella is grimpus. Grimpus is lorpus. Stella is lorpus.",
        "noise_response_7": "Stella is grimpus. Grimpus is lorpus. Stella is lorpus. Lorpus is",
        "noise_prompt_7": "Lorpus is slow. Grimpus is lorpus. Stella is grimpus. True or false: Stella is overcast. Let us think step by step.",
        "response_7": "Stella is grimpus. Grimpus is lorpus. Stella is lorpus. Lorpus is",
        "noise_response_8": "Stella is grimpus. Grimpus is lorpus. Rex is lorpus. Lorpus is slow.",
        "noise_prompt_8": "Lorpus is slow. Grimpus is lorpus. Stella is grimpus. True or false: Stella is slow. Let us think step by step.",
        "response_8": "Stella is grimpus. Grimpus is lorpus. Stella is lorpus. Lorpus is slow.",
        "noise_response_9": "Stella is grimpus. Grimpus is lorpus. Stella is lorpus. Lorpus is spicy. Stella is",
        "noise_prompt_9": "Lorpus is slow. Grimpus is lorpus. Stella is grimpus. True or false: Stella is slow. Let us think step by step.",
        "response_9": "Stella is grimpus. Grimpus is lorpus. Stella is lorpus. Lorpus is slow. Stella is",
        "noise_prompt_10": "Lorpus is slow. Grimpus is lorpus. Stella is grimpus. True or false: Stella is slow. Let us think step by step.",
        "response_10": "Stella is grimpus. Grimpus is lorpus. Stella is lorpus. Lorpus is slow. Stella is slow.",
        "noise_response_10": "Stella is grimpus. Grimpus is lorpus. Stella is lorpus. Lorpus is slow. Stella is aggressive.",
        "answer_token_id_0": 855,
        "answer_token_pos_0": 380,
        "answer_token_0": "St",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 867,
        "answer_token_pos_1": 383,
        "answer_token_1": "gr",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 1632,
        "answer_token_pos_2": 387,
        "answer_token_2": "Gr",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 301,
        "answer_token_pos_3": 391,
        "answer_token_3": "l",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 624,
        "answer_token_pos_4": 395,
        "answer_token_4": "St",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 301,
        "answer_token_pos_5": 398,
        "answer_token_5": "l",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 10980,
        "answer_token_pos_6": 402,
        "answer_token_6": "Lor",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 5232,
        "answer_token_pos_7": 406,
        "answer_token_7": "slow",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 624,
        "answer_token_pos_8": 410,
        "answer_token_8": "St",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 5232,
        "answer_token_pos_9": 413,
        "answer_token_9": "slow",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Tumpus is cold. Lempuses are tumpuses. Alex is lempus.",
        "query": "True or false: Alex is cold.",
        "answer": "Alex is lempus. Lempuses are tumpuses. Alex is tumpus. Tumpus is cold. Alex is cold. True",
        "label": "True",
        "prompt": "Tumpus is cold. Lempuses are tumpuses. Alex is lempus. True or false: Alex is cold. Let us think step by step.",
        "generated": "Alex is lempus. Lempuses are tumpuses. Alex is tumpus. Tumpus is cold. Alex is cold. True",
        "noise_response_0": "",
        "noise_prompt_0": "Tumpus is cold. Lempuses are tumpuses. Alex is lempus. True or false: Wren is cold. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Alex is",
        "noise_prompt_1": "Tumpus is cold. Lempuses are tumpuses. Alex is Lempus. True or false: Alex is cold. Let us think step by step.",
        "response_1": "Alex is",
        "noise_response_2": "Alex is lempus.",
        "noise_prompt_2": "Tumpus is cold. brimpus are tumpuses. Alex is lempus. True or false: Alex is cold. Let us think step by step.",
        "response_2": "Alex is lempus.",
        "noise_response_3": "Alex is lempus. Lempuses are",
        "noise_prompt_3": "Tumpus is cold. Lempuses are temperate. Alex is lempus. True or false: Alex is cold. Let us think step by step.",
        "response_3": "Alex is lempus. Lempuses are",
        "noise_response_4": "Sam is lempus. Lempuses are tumpuses.",
        "noise_prompt_4": "Tumpus is cold. Lempuses are tumpuses. Alex is lempus. True or false: Alex is cold. Let us think step by step.",
        "response_4": "Alex is lempus. Lempuses are tumpuses.",
        "noise_response_5": "Alex is lempus. Lempuses are amenable. Alex is",
        "noise_prompt_5": "Tumpus is cold. Lempuses are tumpuses. Alex is lempus. True or false: Alex is cold. Let us think step by step.",
        "response_5": "Alex is lempus. Lempuses are tumpuses. Alex is",
        "noise_response_6": "Alex is lempus. Lempuses are tumpuses. Alex is tumpus.",
        "noise_prompt_6": "Jompus is cold. Lempuses are tumpuses. Alex is lempus. True or false: Alex is cold. Let us think step by step.",
        "response_6": "Alex is lempus. Lempuses are tumpuses. Alex is tumpus.",
        "noise_response_7": "Alex is lempus. Lempuses are tumpuses. Alex is tumpus. Tumpus is",
        "noise_prompt_7": "Tumpus is cold. Lempuses are tumpuses. Alex is lempus. True or false: Alex is liquid. Let us think step by step.",
        "response_7": "Alex is lempus. Lempuses are tumpuses. Alex is tumpus. Tumpus is",
        "noise_response_8": "Alex is lempus. Lempuses are tumpuses. Fae is tumpus. Tumpus is cold.",
        "noise_prompt_8": "Tumpus is cold. Lempuses are tumpuses. Alex is lempus. True or false: Alex is cold. Let us think step by step.",
        "response_8": "Alex is lempus. Lempuses are tumpuses. Alex is tumpus. Tumpus is cold.",
        "noise_response_9": "Alex is lempus. Lempuses are tumpuses. Alex is tumpus. Tumpus is luminous. Alex is",
        "noise_prompt_9": "Tumpus is cold. Lempuses are tumpuses. Alex is lempus. True or false: Alex is cold. Let us think step by step.",
        "response_9": "Alex is lempus. Lempuses are tumpuses. Alex is tumpus. Tumpus is cold. Alex is",
        "noise_prompt_10": "Tumpus is cold. Lempuses are tumpuses. Alex is lempus. True or false: Alex is cold. Let us think step by step.",
        "response_10": "Alex is lempus. Lempuses are tumpuses. Alex is tumpus. Tumpus is cold. Alex is cold.",
        "noise_response_10": "Alex is lempus. Lempuses are tumpuses. Alex is tumpus. Tumpus is cold. Alex is hot.",
        "answer_token_id_0": 17406,
        "answer_token_pos_0": 380,
        "answer_token_0": "Alex",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 454,
        "answer_token_pos_1": 383,
        "answer_token_1": "le",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 365,
        "answer_token_pos_2": 387,
        "answer_token_2": "L",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 260,
        "answer_token_pos_3": 391,
        "answer_token_3": "t",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 4827,
        "answer_token_pos_4": 395,
        "answer_token_4": "Alex",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 260,
        "answer_token_pos_5": 398,
        "answer_token_5": "t",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 323,
        "answer_token_pos_6": 402,
        "answer_token_6": "T",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 11220,
        "answer_token_pos_7": 406,
        "answer_token_7": "cold",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 4827,
        "answer_token_pos_8": 410,
        "answer_token_8": "Alex",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 11220,
        "answer_token_pos_9": 413,
        "answer_token_9": "cold",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Brimpuses are melodic. Vumpuses are brimpuses. Sam is vumpus.",
        "query": "True or false: Sam is melodic.",
        "answer": "Sam is vumpus. Vumpuses are brimpuses. Sam is brimpus. Brimpuses are melodic. Sam is melodic. True",
        "label": "True",
        "prompt": "Brimpuses are melodic. Vumpuses are brimpuses. Sam is vumpus. True or false: Sam is melodic. Let us think step by step.",
        "generated": "Sam is vumpus. Vumpuses are brimpuses. Sam is brimpus. Brimpuses are melodic. Sam is melodic. True",
        "noise_response_0": "",
        "noise_prompt_0": "Brimpuses are melodic. Vumpuses are brimpuses. Sam is vumpus. True or false: Alex is melodic. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Sam is",
        "noise_prompt_1": "Brimpuses are melodic. Vumpuses are brimpuses. Sam is Brimpus. True or false: Sam is melodic. Let us think step by step.",
        "response_1": "Sam is",
        "noise_response_2": "Sam is vumpus.",
        "noise_prompt_2": "Brimpuses are melodic. Numpus are brimpuses. Sam is vumpus. True or false: Sam is melodic. Let us think step by step.",
        "response_2": "Sam is vumpus.",
        "noise_response_3": "Sam is vumpus. Vumpuses are",
        "noise_prompt_3": "Brimpuses are melodic. Vumpuses are bright. Sam is vumpus. True or false: Sam is melodic. Let us think step by step.",
        "response_3": "Sam is vumpus. Vumpuses are",
        "noise_response_4": "Fae is vumpus. Vumpuses are brimpuses.",
        "noise_prompt_4": "Brimpuses are melodic. Vumpuses are brimpuses. Sam is vumpus. True or false: Sam is melodic. Let us think step by step.",
        "response_4": "Sam is vumpus. Vumpuses are brimpuses.",
        "noise_response_5": "Sam is vumpus. Vumpuses are shy. Sam is",
        "noise_prompt_5": "Brimpuses are melodic. Vumpuses are brimpuses. Sam is vumpus. True or false: Sam is melodic. Let us think step by step.",
        "response_5": "Sam is vumpus. Vumpuses are brimpuses. Sam is",
        "noise_response_6": "Sam is vumpus. Vumpuses are brimpuses. Sam is brimpus.",
        "noise_prompt_6": "zumpus are melodic. Vumpuses are brimpuses. Sam is vumpus. True or false: Sam is melodic. Let us think step by step.",
        "response_6": "Sam is vumpus. Vumpuses are brimpuses. Sam is brimpus.",
        "noise_response_7": "Sam is vumpus. Vumpuses are brimpuses. Sam is brimpus. Brimpuses are",
        "noise_prompt_7": "Brimpuses are melodic. Vumpuses are brimpuses. Sam is vumpus. True or false: Sam is blue. Let us think step by step.",
        "response_7": "Sam is vumpus. Vumpuses are brimpuses. Sam is brimpus. Brimpuses are",
        "noise_response_8": "Sam is vumpus. Vumpuses are brimpuses. Max is brimpus. Brimpuses are melodic.",
        "noise_prompt_8": "Brimpuses are melodic. Vumpuses are brimpuses. Sam is vumpus. True or false: Sam is melodic. Let us think step by step.",
        "response_8": "Sam is vumpus. Vumpuses are brimpuses. Sam is brimpus. Brimpuses are melodic.",
        "noise_response_9": "Sam is vumpus. Vumpuses are brimpuses. Sam is brimpus. Brimpuses are temperate. Sam is",
        "noise_prompt_9": "Brimpuses are melodic. Vumpuses are brimpuses. Sam is vumpus. True or false: Sam is melodic. Let us think step by step.",
        "response_9": "Sam is vumpus. Vumpuses are brimpuses. Sam is brimpus. Brimpuses are melodic. Sam is",
        "noise_prompt_10": "Brimpuses are melodic. Vumpuses are brimpuses. Sam is vumpus. True or false: Sam is melodic. Let us think step by step.",
        "response_10": "Sam is vumpus. Vumpuses are brimpuses. Sam is brimpus. Brimpuses are melodic. Sam is melodic.",
        "noise_response_10": "Sam is vumpus. Vumpuses are brimpuses. Sam is brimpus. Brimpuses are melodic. Sam is wooden.",
        "answer_token_id_0": 22966,
        "answer_token_pos_0": 380,
        "answer_token_0": "Sam",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 325,
        "answer_token_pos_1": 383,
        "answer_token_1": "v",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 478,
        "answer_token_pos_2": 387,
        "answer_token_2": "V",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 1506,
        "answer_token_pos_3": 391,
        "answer_token_3": "br",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 3685,
        "answer_token_pos_4": 395,
        "answer_token_4": "Sam",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 1506,
        "answer_token_pos_5": 398,
        "answer_token_5": "br",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 1771,
        "answer_token_pos_6": 402,
        "answer_token_6": "Br",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 9232,
        "answer_token_pos_7": 406,
        "answer_token_7": "mel",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 3685,
        "answer_token_pos_8": 410,
        "answer_token_8": "Sam",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 9232,
        "answer_token_pos_9": 413,
        "answer_token_9": "mel",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Lempuses are slow. Zumpuses are lempuses. Max is zumpus.",
        "query": "True or false: Max is blue.",
        "answer": "Max is zumpus. Zumpuses are lempuses. Max is lempus. Lempuses are slow. Max is slow. False",
        "label": "False",
        "prompt": "Lempuses are slow. Zumpuses are lempuses. Max is zumpus. True or false: Max is blue. Let us think step by step.",
        "generated": "Max is zumpus. Zumpuses are lempuses. Max is lempus. Lempuses are slow. Max is slow. False",
        "noise_response_0": "",
        "noise_prompt_0": "Lempuses are slow. Zumpuses are lempuses. Max is zumpus. True or false: Sam is blue. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Max is",
        "noise_prompt_1": "Lempuses are slow. Zumpuses are lempuses. Max is Numpus. True or false: Max is blue. Let us think step by step.",
        "response_1": "Max is",
        "noise_response_2": "Max is zumpus.",
        "noise_prompt_2": "Lempuses are slow. gorpus are lempuses. Max is zumpus. True or false: Max is blue. Let us think step by step.",
        "response_2": "Max is zumpus.",
        "noise_response_3": "Max is zumpus. Zumpuses are",
        "noise_prompt_3": "Lempuses are slow. Zumpuses are Shumpus. Max is zumpus. True or false: Max is blue. Let us think step by step.",
        "response_3": "Max is zumpus. Zumpuses are",
        "noise_response_4": "Wren is zumpus. Zumpuses are lempuses.",
        "noise_prompt_4": "Lempuses are slow. Zumpuses are lempuses. Max is zumpus. True or false: Max is blue. Let us think step by step.",
        "response_4": "Max is zumpus. Zumpuses are lempuses.",
        "noise_response_5": "Max is zumpus. Zumpuses are grimpus. Max is",
        "noise_prompt_5": "Lempuses are slow. Zumpuses are lempuses. Max is zumpus. True or false: Max is blue. Let us think step by step.",
        "response_5": "Max is zumpus. Zumpuses are lempuses. Max is",
        "noise_response_6": "Max is zumpus. Zumpuses are lempuses. Max is lempus.",
        "noise_prompt_6": "Shumpus are slow. Zumpuses are lempuses. Max is zumpus. True or false: Max is blue. Let us think step by step.",
        "response_6": "Max is zumpus. Zumpuses are lempuses. Max is lempus.",
        "noise_response_7": "Max is zumpus. Zumpuses are lempuses. Max is lempus. Lempuses are",
        "noise_prompt_7": "Lempuses are dull. Zumpuses are lempuses. Max is zumpus. True or false: Max is blue. Let us think step by step.",
        "response_7": "Max is zumpus. Zumpuses are lempuses. Max is lempus. Lempuses are",
        "noise_response_8": "Max is zumpus. Zumpuses are lempuses. Rex is lempus. Lempuses are slow.",
        "noise_prompt_8": "Lempuses are slow. Zumpuses are lempuses. Max is zumpus. True or false: Max is blue. Let us think step by step.",
        "response_8": "Max is zumpus. Zumpuses are lempuses. Max is lempus. Lempuses are slow.",
        "noise_response_9": "Max is zumpus. Zumpuses are lempuses. Max is lempus. Lempuses are temperate. Max is",
        "noise_prompt_9": "Lempuses are slow. Zumpuses are lempuses. Max is zumpus. True or false: Max is blue. Let us think step by step.",
        "response_9": "Max is zumpus. Zumpuses are lempuses. Max is lempus. Lempuses are slow. Max is",
        "noise_prompt_10": "Lempuses are slow. Zumpuses are lempuses. Max is zumpus. True or false: Max is blue. Let us think step by step.",
        "response_10": "Max is zumpus. Zumpuses are lempuses. Max is lempus. Lempuses are slow. Max is slow.",
        "noise_response_10": "Max is zumpus. Zumpuses are lempuses. Max is lempus. Lempuses are slow. Max is kind.",
        "answer_token_id_0": 29931,
        "answer_token_pos_0": 380,
        "answer_token_0": "L",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 3356,
        "answer_token_pos_1": 383,
        "answer_token_1": "zum",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 796,
        "answer_token_pos_2": 387,
        "answer_token_2": "Z",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 5232,
        "answer_token_pos_3": 391,
        "answer_token_3": "slow",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 365,
        "answer_token_pos_4": 395,
        "answer_token_4": "L",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 454,
        "answer_token_pos_5": 398,
        "answer_token_5": "le",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 365,
        "answer_token_pos_6": 402,
        "answer_token_6": "L",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 5232,
        "answer_token_pos_7": 406,
        "answer_token_7": "slow",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 5918,
        "answer_token_pos_8": 410,
        "answer_token_8": "Max",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 5232,
        "answer_token_pos_9": 413,
        "answer_token_9": "slow",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Tumpus is discordant. Jompus is tumpus. Polly is jompus.",
        "query": "True or false: Polly is sunny.",
        "answer": "Polly is jompus. Jompus is tumpus. Polly is tumpus. Tumpus is discordant. Polly is discordant. False",
        "label": "False",
        "prompt": "Tumpus is discordant. Jompus is tumpus. Polly is jompus. True or false: Polly is sunny. Let us think step by step.",
        "generated": "Polly is jompus. Jompus is tumpus. Polly is tumpus. Tumpus is discordant. Polly is discordant. False",
        "noise_response_0": "",
        "noise_prompt_0": "Tumpus is discordant. Jompus is tumpus. Polly is jompus. True or false: Sam is sunny. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Polly is",
        "noise_prompt_1": "Tumpus is discordant. Jompus is tumpus. Polly is rompus. True or false: Polly is sunny. Let us think step by step.",
        "response_1": "Polly is",
        "noise_response_2": "Polly is jompus.",
        "noise_prompt_2": "Tumpus is discordant. lorpus is tumpus. Polly is jompus. True or false: Polly is sunny. Let us think step by step.",
        "response_2": "Polly is jompus.",
        "noise_response_3": "Polly is jompus. Jompus is",
        "noise_prompt_3": "Tumpus is discordant. Jompus is temperate. Polly is jompus. True or false: Polly is sunny. Let us think step by step.",
        "response_3": "Polly is jompus. Jompus is",
        "noise_response_4": "Fae is jompus. Jompus is tumpus.",
        "noise_prompt_4": "Tumpus is discordant. Jompus is tumpus. Polly is jompus. True or false: Polly is sunny. Let us think step by step.",
        "response_4": "Polly is jompus. Jompus is tumpus.",
        "noise_response_5": "Polly is jompus. Jompus is transparent. Polly is",
        "noise_prompt_5": "Tumpus is discordant. Jompus is tumpus. Polly is jompus. True or false: Polly is sunny. Let us think step by step.",
        "response_5": "Polly is jompus. Jompus is tumpus. Polly is",
        "noise_response_6": "Polly is jompus. Jompus is tumpus. Polly is tumpus.",
        "noise_prompt_6": "Sterpus is discordant. Jompus is tumpus. Polly is jompus. True or false: Polly is sunny. Let us think step by step.",
        "response_6": "Polly is jompus. Jompus is tumpus. Polly is tumpus.",
        "noise_response_7": "Polly is jompus. Jompus is tumpus. Polly is tumpus. Tumpus is",
        "noise_prompt_7": "Tumpus is bitter. Jompus is tumpus. Polly is jompus. True or false: Polly is sunny. Let us think step by step.",
        "response_7": "Polly is jompus. Jompus is tumpus. Polly is tumpus. Tumpus is",
        "noise_response_8": "Polly is jompus. Jompus is tumpus. Wren is tumpus. Tumpus is discordant.",
        "noise_prompt_8": "Tumpus is discordant. Jompus is tumpus. Polly is jompus. True or false: Polly is sunny. Let us think step by step.",
        "response_8": "Polly is jompus. Jompus is tumpus. Polly is tumpus. Tumpus is discordant.",
        "noise_response_9": "Polly is jompus. Jompus is tumpus. Polly is tumpus. Tumpus is shy. Polly is",
        "noise_prompt_9": "Tumpus is discordant. Jompus is tumpus. Polly is jompus. True or false: Polly is sunny. Let us think step by step.",
        "response_9": "Polly is jompus. Jompus is tumpus. Polly is tumpus. Tumpus is discordant. Polly is",
        "noise_prompt_10": "Tumpus is discordant. Jompus is tumpus. Polly is jompus. True or false: Polly is sunny. Let us think step by step.",
        "response_10": "Polly is jompus. Jompus is tumpus. Polly is tumpus. Tumpus is discordant. Polly is discordant.",
        "noise_response_10": "Polly is jompus. Jompus is tumpus. Polly is tumpus. Tumpus is discordant. Polly is small.",
        "answer_token_id_0": 7713,
        "answer_token_pos_0": 380,
        "answer_token_0": "Pol",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 432,
        "answer_token_pos_1": 383,
        "answer_token_1": "j",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 435,
        "answer_token_pos_2": 387,
        "answer_token_2": "J",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 260,
        "answer_token_pos_3": 391,
        "answer_token_3": "t",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 2043,
        "answer_token_pos_4": 395,
        "answer_token_4": "Pol",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 260,
        "answer_token_pos_5": 398,
        "answer_token_5": "t",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 323,
        "answer_token_pos_6": 402,
        "answer_token_6": "T",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 2313,
        "answer_token_pos_7": 406,
        "answer_token_7": "disc",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 2043,
        "answer_token_pos_8": 410,
        "answer_token_8": "Pol",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 2313,
        "answer_token_pos_9": 413,
        "answer_token_9": "disc",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Gorpuses are luminous. Lorpus is gorpus. Fae is lorpus.",
        "query": "True or false: Fae is luminous.",
        "answer": "Fae is lorpus. Lorpus is gorpus. Fae is gorpus. Gorpuses are luminous. Fae is luminous. True",
        "label": "True",
        "prompt": "Gorpuses are luminous. Lorpus is gorpus. Fae is lorpus. True or false: Fae is luminous. Let us think step by step.",
        "generated": "Fae is lorpus. Lorpus is gorpus. Fae is gorpus. Gorpuses are luminous. Fae is luminous. True",
        "noise_response_0": "",
        "noise_prompt_0": "Gorpuses are luminous. Lorpus is gorpus. Fae is lorpus. True or false: Sally is luminous. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Fae is",
        "noise_prompt_1": "Gorpuses are luminous. Lorpus is gorpus. Fae is lorpus. True or false: Fae is floral. Let us think step by step.",
        "response_1": "Fae is",
        "noise_response_2": "Fae is lorpus.",
        "noise_prompt_2": "Gorpuses are luminous. numpus is gorpus. Fae is lorpus. True or false: Fae is luminous. Let us think step by step.",
        "response_2": "Fae is lorpus.",
        "noise_response_3": "Fae is lorpus. Lorpus is",
        "noise_prompt_3": "Gorpuses are luminous. Lorpus is tumpus. Fae is lorpus. True or false: Fae is luminous. Let us think step by step.",
        "response_3": "Fae is lorpus. Lorpus is",
        "noise_response_4": "Polly is lorpus. Lorpus is gorpus.",
        "noise_prompt_4": "Gorpuses are luminous. Lorpus is gorpus. Fae is lorpus. True or false: Fae is luminous. Let us think step by step.",
        "response_4": "Fae is lorpus. Lorpus is gorpus.",
        "noise_response_5": "Fae is lorpus. Lorpus is Yumpus. Fae is",
        "noise_prompt_5": "Gorpuses are luminous. Lorpus is gorpus. Fae is lorpus. True or false: Fae is luminous. Let us think step by step.",
        "response_5": "Fae is lorpus. Lorpus is gorpus. Fae is",
        "noise_response_6": "Fae is lorpus. Lorpus is gorpus. Fae is gorpus.",
        "noise_prompt_6": "Gorpus are luminous. Lorpus is gorpus. Fae is lorpus. True or false: Fae is luminous. Let us think step by step.",
        "response_6": "Fae is lorpus. Lorpus is gorpus. Fae is gorpus.",
        "noise_response_7": "Fae is shy. Lorpus is gorpus. Fae is gorpus. Gorpuses are",
        "noise_prompt_7": "Gorpuses are luminous. Lorpus is gorpus. Fae is lorpus. True or false: Fae is luminous. Let us think step by step.",
        "response_7": "Fae is lorpus. Lorpus is gorpus. Fae is gorpus. Gorpuses are",
        "noise_response_8": "Fae is lorpus. Lorpus is gorpus. Sally is gorpus. Gorpuses are luminous.",
        "noise_prompt_8": "Gorpuses are luminous. Lorpus is gorpus. Fae is lorpus. True or false: Fae is luminous. Let us think step by step.",
        "response_8": "Fae is lorpus. Lorpus is gorpus. Fae is gorpus. Gorpuses are luminous.",
        "noise_response_9": "Fae is lorpus. Lorpus is gorpus. Fae is gorpus. Gorpuses are feisty. Fae is",
        "noise_prompt_9": "Gorpuses are luminous. Lorpus is gorpus. Fae is lorpus. True or false: Fae is luminous. Let us think step by step.",
        "response_9": "Fae is lorpus. Lorpus is gorpus. Fae is gorpus. Gorpuses are luminous. Fae is",
        "noise_prompt_10": "Gorpuses are luminous. Lorpus is gorpus. Fae is lorpus. True or false: Fae is luminous. Let us think step by step.",
        "response_10": "Fae is lorpus. Lorpus is gorpus. Fae is gorpus. Gorpuses are luminous. Fae is luminous.",
        "noise_response_10": "Fae is lorpus. Lorpus is gorpus. Fae is gorpus. Gorpuses are luminous. Fae is mean.",
        "answer_token_id_0": 29943,
        "answer_token_pos_0": 380,
        "answer_token_0": "F",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 301,
        "answer_token_pos_1": 383,
        "answer_token_1": "l",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 10980,
        "answer_token_pos_2": 387,
        "answer_token_2": "Lor",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 330,
        "answer_token_pos_3": 391,
        "answer_token_3": "g",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 383,
        "answer_token_pos_4": 395,
        "answer_token_4": "F",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 330,
        "answer_token_pos_5": 398,
        "answer_token_5": "g",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 18686,
        "answer_token_pos_6": 402,
        "answer_token_6": "Gor",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 301,
        "answer_token_pos_7": 406,
        "answer_token_7": "l",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 383,
        "answer_token_pos_8": 410,
        "answer_token_8": "F",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 301,
        "answer_token_pos_9": 413,
        "answer_token_9": "l",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Grimpus is angry. Zumpus is grimpus. Rex is zumpus.",
        "query": "True or false: Rex is moderate.",
        "answer": "Rex is zumpus. Zumpus is grimpus. Rex is grimpus. Grimpus is angry. Rex is angry. False",
        "label": "False",
        "prompt": "Grimpus is angry. Zumpus is grimpus. Rex is zumpus. True or false: Rex is moderate. Let us think step by step.",
        "generated": "Rex is zumpus. Zumpus is grimpus. Rex is grimpus. Grimpus is angry. Rex is angry. False",
        "noise_response_0": "",
        "noise_prompt_0": "Grimpus is angry. Zumpus is grimpus. Rex is zumpus. True or false: Polly is moderate. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Rex is",
        "noise_prompt_1": "Grimpus is angry. Zumpus is grimpus. Rex is numpus. True or false: Rex is moderate. Let us think step by step.",
        "response_1": "Rex is",
        "noise_response_2": "Rex is zumpus.",
        "noise_prompt_2": "Grimpus is angry. lorpus is grimpus. Rex is zumpus. True or false: Rex is moderate. Let us think step by step.",
        "response_2": "Rex is zumpus.",
        "noise_response_3": "Rex is zumpus. Zumpus is",
        "noise_prompt_3": "Grimpus is angry. Zumpus is gorpus. Rex is zumpus. True or false: Rex is moderate. Let us think step by step.",
        "response_3": "Rex is zumpus. Zumpus is",
        "noise_response_4": "Max is zumpus. Zumpus is grimpus.",
        "noise_prompt_4": "Grimpus is angry. Zumpus is grimpus. Rex is zumpus. True or false: Rex is moderate. Let us think step by step.",
        "response_4": "Rex is zumpus. Zumpus is grimpus.",
        "noise_response_5": "Rex is zumpus. Zumpus is Jompus. Rex is",
        "noise_prompt_5": "Grimpus is angry. Zumpus is grimpus. Rex is zumpus. True or false: Rex is moderate. Let us think step by step.",
        "response_5": "Rex is zumpus. Zumpus is grimpus. Rex is",
        "noise_response_6": "Rex is zumpus. Zumpus is grimpus. Rex is grimpus.",
        "noise_prompt_6": "dumpus is angry. Zumpus is grimpus. Rex is zumpus. True or false: Rex is moderate. Let us think step by step.",
        "response_6": "Rex is zumpus. Zumpus is grimpus. Rex is grimpus.",
        "noise_response_7": "Rex is zumpus. Zumpus is grimpus. Rex is grimpus. Grimpus is",
        "noise_prompt_7": "Grimpus is large. Zumpus is grimpus. Rex is zumpus. True or false: Rex is moderate. Let us think step by step.",
        "response_7": "Rex is zumpus. Zumpus is grimpus. Rex is grimpus. Grimpus is",
        "noise_response_8": "Rex is zumpus. Zumpus is grimpus. Sally is grimpus. Grimpus is angry.",
        "noise_prompt_8": "Grimpus is angry. Zumpus is grimpus. Rex is zumpus. True or false: Rex is moderate. Let us think step by step.",
        "response_8": "Rex is zumpus. Zumpus is grimpus. Rex is grimpus. Grimpus is angry.",
        "noise_response_9": "Rex is zumpus. Zumpus is grimpus. Rex is grimpus. Grimpus is sweet. Rex is",
        "noise_prompt_9": "Grimpus is angry. Zumpus is grimpus. Rex is zumpus. True or false: Rex is moderate. Let us think step by step.",
        "response_9": "Rex is zumpus. Zumpus is grimpus. Rex is grimpus. Grimpus is angry. Rex is",
        "noise_prompt_10": "Grimpus is angry. Zumpus is grimpus. Rex is zumpus. True or false: Rex is moderate. Let us think step by step.",
        "response_10": "Rex is zumpus. Zumpus is grimpus. Rex is grimpus. Grimpus is angry. Rex is angry.",
        "noise_response_10": "Rex is zumpus. Zumpus is grimpus. Rex is grimpus. Grimpus is angry. Rex is luminous.",
        "answer_token_id_0": 29934,
        "answer_token_pos_0": 380,
        "answer_token_0": "R",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 3356,
        "answer_token_pos_1": 383,
        "answer_token_1": "zum",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 796,
        "answer_token_pos_2": 387,
        "answer_token_2": "Z",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 867,
        "answer_token_pos_3": 391,
        "answer_token_3": "gr",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 390,
        "answer_token_pos_4": 395,
        "answer_token_4": "R",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 867,
        "answer_token_pos_5": 398,
        "answer_token_5": "gr",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 1632,
        "answer_token_pos_6": 402,
        "answer_token_6": "Gr",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 26230,
        "answer_token_pos_7": 406,
        "answer_token_7": "angry",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 390,
        "answer_token_pos_8": 410,
        "answer_token_8": "R",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 17768,
        "answer_token_pos_9": 413,
        "answer_token_9": "moder",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Impus is fruity. Shumpus is impus. Polly is shumpus.",
        "query": "True or false: Polly is fruity.",
        "answer": "Polly is shumpus. Shumpus is impus. Polly is impus. Impus is fruity. Polly is fruity. True",
        "label": "True",
        "prompt": "Impus is fruity. Shumpus is impus. Polly is shumpus. True or false: Polly is fruity. Let us think step by step.",
        "generated": "Polly is shumpus. Shumpus is impus. Polly is impus. Impus is fruity. Polly is fruity. True",
        "noise_response_0": "",
        "noise_prompt_0": "Impus is fruity. Shumpus is impus. Polly is shumpus. True or false: Wren is fruity. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Polly is",
        "noise_prompt_1": "Impus is fruity. Shumpus is impus. Polly is small. True or false: Polly is fruity. Let us think step by step.",
        "response_1": "Polly is",
        "noise_response_2": "Polly is shumpus.",
        "noise_prompt_2": "Impus is fruity. Vumpus is impus. Polly is shumpus. True or false: Polly is fruity. Let us think step by step.",
        "response_2": "Polly is shumpus.",
        "noise_response_3": "Polly is shumpus. Shumpus is",
        "noise_prompt_3": "Impus is fruity. Shumpus is Lempus. Polly is shumpus. True or false: Polly is fruity. Let us think step by step.",
        "response_3": "Polly is shumpus. Shumpus is",
        "noise_response_4": "Sally is shumpus. Shumpus is impus.",
        "noise_prompt_4": "Impus is fruity. Shumpus is impus. Polly is shumpus. True or false: Polly is fruity. Let us think step by step.",
        "response_4": "Polly is shumpus. Shumpus is impus.",
        "noise_response_5": "Polly is shumpus. Shumpus is lorpus. Polly is",
        "noise_prompt_5": "Impus is fruity. Shumpus is impus. Polly is shumpus. True or false: Polly is fruity. Let us think step by step.",
        "response_5": "Polly is shumpus. Shumpus is impus. Polly is",
        "noise_response_6": "Polly is shumpus. Shumpus is impus. Polly is impus.",
        "noise_prompt_6": "sterpus is fruity. Shumpus is impus. Polly is shumpus. True or false: Polly is fruity. Let us think step by step.",
        "response_6": "Polly is shumpus. Shumpus is impus. Polly is impus.",
        "noise_response_7": "Polly is shumpus. Shumpus is impus. Polly is impus. Impus is",
        "noise_prompt_7": "Impus is fruity. Shumpus is impus. Polly is shumpus. True or false: Polly is melodic. Let us think step by step.",
        "response_7": "Polly is shumpus. Shumpus is impus. Polly is impus. Impus is",
        "noise_response_8": "Polly is shumpus. Shumpus is impus. Fae is impus. Impus is fruity.",
        "noise_prompt_8": "Impus is fruity. Shumpus is impus. Polly is shumpus. True or false: Polly is fruity. Let us think step by step.",
        "response_8": "Polly is shumpus. Shumpus is impus. Polly is impus. Impus is fruity.",
        "noise_response_9": "Polly is shumpus. Shumpus is impus. Polly is impus. Impus is angry. Polly is",
        "noise_prompt_9": "Impus is fruity. Shumpus is impus. Polly is shumpus. True or false: Polly is fruity. Let us think step by step.",
        "response_9": "Polly is shumpus. Shumpus is impus. Polly is impus. Impus is fruity. Polly is",
        "noise_prompt_10": "Impus is fruity. Shumpus is impus. Polly is shumpus. True or false: Polly is fruity. Let us think step by step.",
        "response_10": "Polly is shumpus. Shumpus is impus. Polly is impus. Impus is fruity. Polly is fruity.",
        "noise_response_10": "Polly is shumpus. Shumpus is impus. Polly is impus. Impus is fruity. Polly is floral.",
        "answer_token_id_0": 7713,
        "answer_token_pos_0": 380,
        "answer_token_0": "Pol",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 528,
        "answer_token_pos_1": 383,
        "answer_token_1": "sh",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 1383,
        "answer_token_pos_2": 387,
        "answer_token_2": "Sh",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 2411,
        "answer_token_pos_3": 391,
        "answer_token_3": "imp",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 2043,
        "answer_token_pos_4": 395,
        "answer_token_4": "Pol",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 2411,
        "answer_token_pos_5": 398,
        "answer_token_5": "imp",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 14305,
        "answer_token_pos_6": 402,
        "answer_token_6": "Imp",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 285,
        "answer_token_pos_7": 406,
        "answer_token_7": "f",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 2043,
        "answer_token_pos_8": 410,
        "answer_token_8": "Pol",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 285,
        "answer_token_pos_9": 413,
        "answer_token_9": "f",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Dumpuses are overcast. Impus is dumpus. Sally is impus.",
        "query": "True or false: Sally is overcast.",
        "answer": "Sally is impus. Impus is dumpus. Sally is dumpus. Dumpuses are overcast. Sally is overcast. True",
        "label": "True",
        "prompt": "Dumpuses are overcast. Impus is dumpus. Sally is impus. True or false: Sally is overcast. Let us think step by step.",
        "generated": "Sally is impus. Impus is dumpus. Sally is dumpus. Dumpuses are overcast. Sally is overcast. True",
        "noise_response_0": "",
        "noise_prompt_0": "Dumpuses are overcast. Impus is dumpus. Sally is impus. True or false: Stella is overcast. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Sally is",
        "noise_prompt_1": "Dumpuses are overcast. Impus is dumpus. Sally is Impus. True or false: Sally is overcast. Let us think step by step.",
        "response_1": "Sally is",
        "noise_response_2": "Sally is impus.",
        "noise_prompt_2": "Dumpuses are overcast. numpus is dumpus. Sally is impus. True or false: Sally is overcast. Let us think step by step.",
        "response_2": "Sally is impus.",
        "noise_response_3": "Sally is impus. Impus is",
        "noise_prompt_3": "Dumpuses are overcast. Impus is rompus. Sally is impus. True or false: Sally is overcast. Let us think step by step.",
        "response_3": "Sally is impus. Impus is",
        "noise_response_4": "Fae is impus. Impus is dumpus.",
        "noise_prompt_4": "Dumpuses are overcast. Impus is dumpus. Sally is impus. True or false: Sally is overcast. Let us think step by step.",
        "response_4": "Sally is impus. Impus is dumpus.",
        "noise_response_5": "Sally is impus. Impus is jompus. Sally is",
        "noise_prompt_5": "Dumpuses are overcast. Impus is dumpus. Sally is impus. True or false: Sally is overcast. Let us think step by step.",
        "response_5": "Sally is impus. Impus is dumpus. Sally is",
        "noise_response_6": "Sally is impus. Impus is dumpus. Sally is dumpus.",
        "noise_prompt_6": "Dumpus are overcast. Impus is dumpus. Sally is impus. True or false: Sally is overcast. Let us think step by step.",
        "response_6": "Sally is impus. Impus is dumpus. Sally is dumpus.",
        "noise_response_7": "Sally is impus. Impus is dumpus. Sally is dumpus. Dumpuses are",
        "noise_prompt_7": "Dumpuses are overcast. Impus is dumpus. Sally is impus. True or false: Sally is melodic. Let us think step by step.",
        "response_7": "Sally is impus. Impus is dumpus. Sally is dumpus. Dumpuses are",
        "noise_response_8": "Sally is impus. Impus is dumpus. Polly is dumpus. Dumpuses are overcast.",
        "noise_prompt_8": "Dumpuses are overcast. Impus is dumpus. Sally is impus. True or false: Sally is overcast. Let us think step by step.",
        "response_8": "Sally is impus. Impus is dumpus. Sally is dumpus. Dumpuses are overcast.",
        "noise_response_9": "Sally is impus. Impus is dumpus. Sally is dumpus. Dumpuses are hot. Sally is",
        "noise_prompt_9": "Dumpuses are overcast. Impus is dumpus. Sally is impus. True or false: Sally is overcast. Let us think step by step.",
        "response_9": "Sally is impus. Impus is dumpus. Sally is dumpus. Dumpuses are overcast. Sally is",
        "noise_prompt_10": "Dumpuses are overcast. Impus is dumpus. Sally is impus. True or false: Sally is overcast. Let us think step by step.",
        "response_10": "Sally is impus. Impus is dumpus. Sally is dumpus. Dumpuses are overcast. Sally is overcast.",
        "noise_response_10": "Sally is impus. Impus is dumpus. Sally is dumpus. Dumpuses are overcast. Sally is sweet.",
        "answer_token_id_0": 29903,
        "answer_token_pos_0": 380,
        "answer_token_0": "S",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 2411,
        "answer_token_pos_1": 383,
        "answer_token_1": "imp",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 14305,
        "answer_token_pos_2": 387,
        "answer_token_2": "Imp",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 16766,
        "answer_token_pos_3": 391,
        "answer_token_3": "dump",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 317,
        "answer_token_pos_4": 395,
        "answer_token_4": "S",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 16766,
        "answer_token_pos_5": 398,
        "answer_token_5": "dump",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 360,
        "answer_token_pos_6": 402,
        "answer_token_6": "D",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 975,
        "answer_token_pos_7": 406,
        "answer_token_7": "over",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 317,
        "answer_token_pos_8": 410,
        "answer_token_8": "S",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 975,
        "answer_token_pos_9": 413,
        "answer_token_9": "over",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Tumpuses are small. Brimpuses are tumpuses. Rex is brimpus.",
        "query": "True or false: Rex is small.",
        "answer": "Rex is brimpus. Brimpuses are tumpuses. Rex is tumpus. Tumpuses are small. Rex is small. True",
        "label": "True",
        "prompt": "Tumpuses are small. Brimpuses are tumpuses. Rex is brimpus. True or false: Rex is small. Let us think step by step.",
        "generated": "Rex is brimpus. Brimpuses are tumpuses. Rex is tumpus. Tumpuses are small. Rex is small. True",
        "noise_response_0": "",
        "noise_prompt_0": "Tumpuses are small. Brimpuses are tumpuses. Rex is brimpus. True or false: Alex is small. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Rex is",
        "noise_prompt_1": "Tumpuses are small. Brimpuses are tumpuses. Rex is transparent. True or false: Rex is small. Let us think step by step.",
        "response_1": "Rex is",
        "noise_response_2": "Rex is brimpus.",
        "noise_prompt_2": "Tumpuses are small. lempus are tumpuses. Rex is brimpus. True or false: Rex is small. Let us think step by step.",
        "response_2": "Rex is brimpus.",
        "noise_response_3": "Rex is brimpus. Brimpuses are",
        "noise_prompt_3": "Tumpuses are small. Brimpuses are fast. Rex is brimpus. True or false: Rex is small. Let us think step by step.",
        "response_3": "Rex is brimpus. Brimpuses are",
        "noise_response_4": "Sally is brimpus. Brimpuses are tumpuses.",
        "noise_prompt_4": "Tumpuses are small. Brimpuses are tumpuses. Rex is brimpus. True or false: Rex is small. Let us think step by step.",
        "response_4": "Rex is brimpus. Brimpuses are tumpuses.",
        "noise_response_5": "Rex is brimpus. Brimpuses are kind. Rex is",
        "noise_prompt_5": "Tumpuses are small. Brimpuses are tumpuses. Rex is brimpus. True or false: Rex is small. Let us think step by step.",
        "response_5": "Rex is brimpus. Brimpuses are tumpuses. Rex is",
        "noise_response_6": "Rex is brimpus. Brimpuses are tumpuses. Rex is tumpus.",
        "noise_prompt_6": "zumpus are small. Brimpuses are tumpuses. Rex is brimpus. True or false: Rex is small. Let us think step by step.",
        "response_6": "Rex is brimpus. Brimpuses are tumpuses. Rex is tumpus.",
        "noise_response_7": "Rex is brimpus. Brimpuses are tumpuses. Rex is tumpus. Tumpuses are",
        "noise_prompt_7": "Tumpuses are small. Brimpuses are tumpuses. Rex is brimpus. True or false: Rex is fruity. Let us think step by step.",
        "response_7": "Rex is brimpus. Brimpuses are tumpuses. Rex is tumpus. Tumpuses are",
        "noise_response_8": "Rex is brimpus. Brimpuses are tumpuses. Sam is tumpus. Tumpuses are small.",
        "noise_prompt_8": "Tumpuses are small. Brimpuses are tumpuses. Rex is brimpus. True or false: Rex is small. Let us think step by step.",
        "response_8": "Rex is brimpus. Brimpuses are tumpuses. Rex is tumpus. Tumpuses are small.",
        "noise_response_9": "Rex is brimpus. Brimpuses are tumpuses. Rex is tumpus. Tumpuses are dull. Rex is",
        "noise_prompt_9": "Tumpuses are small. Brimpuses are tumpuses. Rex is brimpus. True or false: Rex is small. Let us think step by step.",
        "response_9": "Rex is brimpus. Brimpuses are tumpuses. Rex is tumpus. Tumpuses are small. Rex is",
        "noise_prompt_10": "Tumpuses are small. Brimpuses are tumpuses. Rex is brimpus. True or false: Rex is small. Let us think step by step.",
        "response_10": "Rex is brimpus. Brimpuses are tumpuses. Rex is tumpus. Tumpuses are small. Rex is small.",
        "noise_response_10": "Rex is brimpus. Brimpuses are tumpuses. Rex is tumpus. Tumpuses are small. Rex is transparent.",
        "answer_token_id_0": 29934,
        "answer_token_pos_0": 380,
        "answer_token_0": "R",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 1506,
        "answer_token_pos_1": 383,
        "answer_token_1": "br",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 1771,
        "answer_token_pos_2": 387,
        "answer_token_2": "Br",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 260,
        "answer_token_pos_3": 391,
        "answer_token_3": "t",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 390,
        "answer_token_pos_4": 395,
        "answer_token_4": "R",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 260,
        "answer_token_pos_5": 398,
        "answer_token_5": "t",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 323,
        "answer_token_pos_6": 402,
        "answer_token_6": "T",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 2319,
        "answer_token_pos_7": 406,
        "answer_token_7": "small",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 390,
        "answer_token_pos_8": 410,
        "answer_token_8": "R",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 2319,
        "answer_token_pos_9": 413,
        "answer_token_9": "small",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Grimpuses are dull. Jompus is grimpus. Fae is jompus.",
        "query": "True or false: Fae is transparent.",
        "answer": "Fae is jompus. Jompus is grimpus. Fae is grimpus. Grimpuses are dull. Fae is dull. False",
        "label": "False",
        "prompt": "Grimpuses are dull. Jompus is grimpus. Fae is jompus. True or false: Fae is transparent. Let us think step by step.",
        "generated": "Fae is jompus. Jompus is grimpus. Fae is grimpus. Grimpuses are dull. Fae is dull. False",
        "noise_response_0": "",
        "noise_prompt_0": "Grimpuses are dull. Jompus is grimpus. Fae is jompus. True or false: Alex is transparent. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Fae is",
        "noise_prompt_1": "Grimpuses are dull. Jompus is grimpus. Fae is Shumpus. True or false: Fae is transparent. Let us think step by step.",
        "response_1": "Fae is",
        "noise_response_2": "Fae is jompus.",
        "noise_prompt_2": "Grimpuses are dull. Rompus is grimpus. Fae is jompus. True or false: Fae is transparent. Let us think step by step.",
        "response_2": "Fae is jompus.",
        "noise_response_3": "Fae is jompus. Jompus is",
        "noise_prompt_3": "Grimpuses are dull. Jompus is Sterpus. Fae is jompus. True or false: Fae is transparent. Let us think step by step.",
        "response_3": "Fae is jompus. Jompus is",
        "noise_response_4": "Rex is jompus. Jompus is grimpus.",
        "noise_prompt_4": "Grimpuses are dull. Jompus is grimpus. Fae is jompus. True or false: Fae is transparent. Let us think step by step.",
        "response_4": "Fae is jompus. Jompus is grimpus.",
        "noise_response_5": "Fae is jompus. Jompus is Zumpus. Fae is",
        "noise_prompt_5": "Grimpuses are dull. Jompus is grimpus. Fae is jompus. True or false: Fae is transparent. Let us think step by step.",
        "response_5": "Fae is jompus. Jompus is grimpus. Fae is",
        "noise_response_6": "Fae is jompus. Jompus is grimpus. Fae is grimpus.",
        "noise_prompt_6": "Wumpus are dull. Jompus is grimpus. Fae is jompus. True or false: Fae is transparent. Let us think step by step.",
        "response_6": "Fae is jompus. Jompus is grimpus. Fae is grimpus.",
        "noise_response_7": "Fae is jompus. Jompus is grimpus. Fae is grimpus. Grimpuses are",
        "noise_prompt_7": "Grimpuses are moderate. Jompus is grimpus. Fae is jompus. True or false: Fae is transparent. Let us think step by step.",
        "response_7": "Fae is jompus. Jompus is grimpus. Fae is grimpus. Grimpuses are",
        "noise_response_8": "Fae is jompus. Jompus is grimpus. Max is grimpus. Grimpuses are dull.",
        "noise_prompt_8": "Grimpuses are dull. Jompus is grimpus. Fae is jompus. True or false: Fae is transparent. Let us think step by step.",
        "response_8": "Fae is jompus. Jompus is grimpus. Fae is grimpus. Grimpuses are dull.",
        "noise_response_9": "Fae is jompus. Jompus is grimpus. Fae is grimpus. Grimpuses are sunny. Fae is",
        "noise_prompt_9": "Grimpuses are dull. Jompus is grimpus. Fae is jompus. True or false: Fae is transparent. Let us think step by step.",
        "response_9": "Fae is jompus. Jompus is grimpus. Fae is grimpus. Grimpuses are dull. Fae is",
        "noise_prompt_10": "Grimpuses are dull. Jompus is grimpus. Fae is jompus. True or false: Fae is transparent. Let us think step by step.",
        "response_10": "Fae is jompus. Jompus is grimpus. Fae is grimpus. Grimpuses are dull. Fae is dull.",
        "noise_response_10": "Fae is jompus. Jompus is grimpus. Fae is grimpus. Grimpuses are dull. Fae is angry.",
        "answer_token_id_0": 29943,
        "answer_token_pos_0": 380,
        "answer_token_0": "F",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 432,
        "answer_token_pos_1": 383,
        "answer_token_1": "j",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 435,
        "answer_token_pos_2": 387,
        "answer_token_2": "J",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 867,
        "answer_token_pos_3": 391,
        "answer_token_3": "gr",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 383,
        "answer_token_pos_4": 395,
        "answer_token_4": "F",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 867,
        "answer_token_pos_5": 398,
        "answer_token_5": "gr",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 1632,
        "answer_token_pos_6": 402,
        "answer_token_6": "Gr",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 270,
        "answer_token_pos_7": 406,
        "answer_token_7": "d",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 383,
        "answer_token_pos_8": 410,
        "answer_token_8": "F",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 270,
        "answer_token_pos_9": 413,
        "answer_token_9": "d",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Wumpuses are earthy. Gorpus is wumpus. Sam is gorpus.",
        "query": "True or false: Sam is earthy.",
        "answer": "Sam is gorpus. Gorpus is wumpus. Sam is wumpus. Wumpuses are earthy. Sam is earthy. True",
        "label": "True",
        "prompt": "Wumpuses are earthy. Gorpus is wumpus. Sam is gorpus. True or false: Sam is earthy. Let us think step by step.",
        "generated": "Sam is gorpus. Gorpus is wumpus. Sam is wumpus. Wumpuses are earthy. Sam is earthy. True",
        "noise_response_0": "",
        "noise_prompt_0": "Wumpuses are earthy. Gorpus is wumpus. Sam is gorpus. True or false: Fae is earthy. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Sam is",
        "noise_prompt_1": "Wumpuses are earthy. Gorpus is wumpus. Sam is Gorpus. True or false: Sam is earthy. Let us think step by step.",
        "response_1": "Sam is",
        "noise_response_2": "Sam is gorpus.",
        "noise_prompt_2": "Wumpuses are earthy. Shumpus is wumpus. Sam is gorpus. True or false: Sam is earthy. Let us think step by step.",
        "response_2": "Sam is gorpus.",
        "noise_response_3": "Sam is gorpus. Gorpus is",
        "noise_prompt_3": "Wumpuses are earthy. Gorpus is bitter. Sam is gorpus. True or false: Sam is earthy. Let us think step by step.",
        "response_3": "Sam is gorpus. Gorpus is",
        "noise_response_4": "Polly is gorpus. Gorpus is wumpus.",
        "noise_prompt_4": "Wumpuses are earthy. Gorpus is wumpus. Sam is gorpus. True or false: Sam is earthy. Let us think step by step.",
        "response_4": "Sam is gorpus. Gorpus is wumpus.",
        "noise_response_5": "Sam is gorpus. Gorpus is luminous. Sam is",
        "noise_prompt_5": "Wumpuses are earthy. Gorpus is wumpus. Sam is gorpus. True or false: Sam is earthy. Let us think step by step.",
        "response_5": "Sam is gorpus. Gorpus is wumpus. Sam is",
        "noise_response_6": "Sam is gorpus. Gorpus is wumpus. Sam is wumpus.",
        "noise_prompt_6": "Wren are earthy. Gorpus is wumpus. Sam is gorpus. True or false: Sam is earthy. Let us think step by step.",
        "response_6": "Sam is gorpus. Gorpus is wumpus. Sam is wumpus.",
        "noise_response_7": "Sam is gorpus. Gorpus is wumpus. Sam is wumpus. Wumpuses are",
        "noise_prompt_7": "Wumpuses are earthy. Gorpus is wumpus. Sam is gorpus. True or false: Sam is angry. Let us think step by step.",
        "response_7": "Sam is gorpus. Gorpus is wumpus. Sam is wumpus. Wumpuses are",
        "noise_response_8": "Sam is gorpus. Gorpus is wumpus. Max is wumpus. Wumpuses are earthy.",
        "noise_prompt_8": "Wumpuses are earthy. Gorpus is wumpus. Sam is gorpus. True or false: Sam is earthy. Let us think step by step.",
        "response_8": "Sam is gorpus. Gorpus is wumpus. Sam is wumpus. Wumpuses are earthy.",
        "noise_response_9": "Sam is gorpus. Gorpus is wumpus. Sam is wumpus. Wumpuses are hot. Sam is",
        "noise_prompt_9": "Wumpuses are earthy. Gorpus is wumpus. Sam is gorpus. True or false: Sam is earthy. Let us think step by step.",
        "response_9": "Sam is gorpus. Gorpus is wumpus. Sam is wumpus. Wumpuses are earthy. Sam is",
        "noise_prompt_10": "Wumpuses are earthy. Gorpus is wumpus. Sam is gorpus. True or false: Sam is earthy. Let us think step by step.",
        "response_10": "Sam is gorpus. Gorpus is wumpus. Sam is wumpus. Wumpuses are earthy. Sam is earthy.",
        "noise_response_10": "Sam is gorpus. Gorpus is wumpus. Sam is wumpus. Wumpuses are earthy. Sam is small.",
        "answer_token_id_0": 22966,
        "answer_token_pos_0": 380,
        "answer_token_0": "Sam",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 330,
        "answer_token_pos_1": 383,
        "answer_token_1": "g",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 18686,
        "answer_token_pos_2": 387,
        "answer_token_2": "Gor",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 281,
        "answer_token_pos_3": 391,
        "answer_token_3": "w",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 18686,
        "answer_token_pos_4": 395,
        "answer_token_4": "Gor",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 281,
        "answer_token_pos_5": 398,
        "answer_token_5": "w",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 399,
        "answer_token_pos_6": 402,
        "answer_token_6": "W",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 8437,
        "answer_token_pos_7": 406,
        "answer_token_7": "earth",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 3685,
        "answer_token_pos_8": 410,
        "answer_token_8": "Sam",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 8437,
        "answer_token_pos_9": 413,
        "answer_token_9": "earth",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Lempuses are rainy. Gorpus is lempus. Alex is gorpus.",
        "query": "True or false: Alex is rainy.",
        "answer": "Alex is gorpus. Gorpus is lempus. Alex is lempus. Lempuses are rainy. Alex is rainy. True",
        "label": "True",
        "prompt": "Lempuses are rainy. Gorpus is lempus. Alex is gorpus. True or false: Alex is rainy. Let us think step by step.",
        "generated": "Alex is gorpus. Gorpus is lempus. Alex is lempus. Lempuses are rainy. Alex is rainy. True",
        "noise_response_0": "",
        "noise_prompt_0": "Lempuses are rainy. Gorpus is lempus. Alex is gorpus. True or false: Rex is rainy. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Alex is",
        "noise_prompt_1": "Lempuses are rainy. Gorpus is lempus. Alex is Shumpus. True or false: Alex is rainy. Let us think step by step.",
        "response_1": "Alex is",
        "noise_response_2": "Alex is gorpus.",
        "noise_prompt_2": "Lempuses are rainy. Tumpus is lempus. Alex is gorpus. True or false: Alex is rainy. Let us think step by step.",
        "response_2": "Alex is gorpus.",
        "noise_response_3": "Alex is gorpus. Gorpus is",
        "noise_prompt_3": "Lempuses are rainy. Gorpus is Shumpus. Alex is gorpus. True or false: Alex is rainy. Let us think step by step.",
        "response_3": "Alex is gorpus. Gorpus is",
        "noise_response_4": "Fae is gorpus. Gorpus is lempus.",
        "noise_prompt_4": "Lempuses are rainy. Gorpus is lempus. Alex is gorpus. True or false: Alex is rainy. Let us think step by step.",
        "response_4": "Alex is gorpus. Gorpus is lempus.",
        "noise_response_5": "Alex is gorpus. Gorpus is Rompus. Alex is",
        "noise_prompt_5": "Lempuses are rainy. Gorpus is lempus. Alex is gorpus. True or false: Alex is rainy. Let us think step by step.",
        "response_5": "Alex is gorpus. Gorpus is lempus. Alex is",
        "noise_response_6": "Alex is gorpus. Gorpus is lempus. Alex is lempus.",
        "noise_prompt_6": "Yumpus are rainy. Gorpus is lempus. Alex is gorpus. True or false: Alex is rainy. Let us think step by step.",
        "response_6": "Alex is gorpus. Gorpus is lempus. Alex is lempus.",
        "noise_response_7": "Alex is gorpus. Gorpus is lempus. Alex is lempus. Lempuses are",
        "noise_prompt_7": "Lempuses are rainy. Gorpus is lempus. Alex is gorpus. True or false: Alex is slow. Let us think step by step.",
        "response_7": "Alex is gorpus. Gorpus is lempus. Alex is lempus. Lempuses are",
        "noise_response_8": "Alex is gorpus. Gorpus is lempus. Sally is lempus. Lempuses are rainy.",
        "noise_prompt_8": "Lempuses are rainy. Gorpus is lempus. Alex is gorpus. True or false: Alex is rainy. Let us think step by step.",
        "response_8": "Alex is gorpus. Gorpus is lempus. Alex is lempus. Lempuses are rainy.",
        "noise_response_9": "Alex is gorpus. Gorpus is lempus. Alex is lempus. Lempuses are shy. Alex is",
        "noise_prompt_9": "Lempuses are rainy. Gorpus is lempus. Alex is gorpus. True or false: Alex is rainy. Let us think step by step.",
        "response_9": "Alex is gorpus. Gorpus is lempus. Alex is lempus. Lempuses are rainy. Alex is",
        "noise_prompt_10": "Lempuses are rainy. Gorpus is lempus. Alex is gorpus. True or false: Alex is rainy. Let us think step by step.",
        "response_10": "Alex is gorpus. Gorpus is lempus. Alex is lempus. Lempuses are rainy. Alex is rainy.",
        "noise_response_10": "Alex is gorpus. Gorpus is lempus. Alex is lempus. Lempuses are rainy. Alex is liquid.",
        "answer_token_id_0": 17406,
        "answer_token_pos_0": 380,
        "answer_token_0": "Alex",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 330,
        "answer_token_pos_1": 383,
        "answer_token_1": "g",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 18686,
        "answer_token_pos_2": 387,
        "answer_token_2": "Gor",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 454,
        "answer_token_pos_3": 391,
        "answer_token_3": "le",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 365,
        "answer_token_pos_4": 395,
        "answer_token_4": "L",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 454,
        "answer_token_pos_5": 398,
        "answer_token_5": "le",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 365,
        "answer_token_pos_6": 402,
        "answer_token_6": "L",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 1153,
        "answer_token_pos_7": 406,
        "answer_token_7": "ra",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 4827,
        "answer_token_pos_8": 410,
        "answer_token_8": "Alex",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 1153,
        "answer_token_pos_9": 413,
        "answer_token_9": "ra",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Gorpuses are discordant. Sterpus is gorpus. Fae is sterpus.",
        "query": "True or false: Fae is metallic.",
        "answer": "Fae is sterpus. Sterpus is gorpus. Fae is gorpus. Gorpuses are discordant. Fae is discordant. False",
        "label": "False",
        "prompt": "Gorpuses are discordant. Sterpus is gorpus. Fae is sterpus. True or false: Fae is metallic. Let us think step by step.",
        "generated": "Fae is sterpus. Sterpus is gorpus. Fae is gorpus. Gorpuses are discordant. Fae is discordant. False",
        "noise_response_0": "",
        "noise_prompt_0": "Gorpuses are discordant. Sterpus is gorpus. Fae is sterpus. True or false: Polly is metallic. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Fae is",
        "noise_prompt_1": "Gorpuses are discordant. Sterpus is gorpus. Fae is lorpus. True or false: Fae is metallic. Let us think step by step.",
        "response_1": "Fae is",
        "noise_response_2": "Fae is sterpus.",
        "noise_prompt_2": "Gorpuses are discordant. Lorpus is gorpus. Fae is sterpus. True or false: Fae is metallic. Let us think step by step.",
        "response_2": "Fae is sterpus.",
        "noise_response_3": "Fae is sterpus. Sterpus is",
        "noise_prompt_3": "Gorpuses are discordant. Sterpus is Grimpus. Fae is sterpus. True or false: Fae is metallic. Let us think step by step.",
        "response_3": "Fae is sterpus. Sterpus is",
        "noise_response_4": "Polly is sterpus. Sterpus is gorpus.",
        "noise_prompt_4": "Gorpuses are discordant. Sterpus is gorpus. Fae is sterpus. True or false: Fae is metallic. Let us think step by step.",
        "response_4": "Fae is sterpus. Sterpus is gorpus.",
        "noise_response_5": "Fae is sterpus. Sterpus is dumpus. Fae is",
        "noise_prompt_5": "Gorpuses are discordant. Sterpus is gorpus. Fae is sterpus. True or false: Fae is metallic. Let us think step by step.",
        "response_5": "Fae is sterpus. Sterpus is gorpus. Fae is",
        "noise_response_6": "Fae is sterpus. Sterpus is gorpus. Fae is gorpus.",
        "noise_prompt_6": "brimpus are discordant. Sterpus is gorpus. Fae is sterpus. True or false: Fae is metallic. Let us think step by step.",
        "response_6": "Fae is sterpus. Sterpus is gorpus. Fae is gorpus.",
        "noise_response_7": "Fae is sterpus. Sterpus is gorpus. Fae is gorpus. Gorpuses are",
        "noise_prompt_7": "Gorpuses are shy. Sterpus is gorpus. Fae is sterpus. True or false: Fae is metallic. Let us think step by step.",
        "response_7": "Fae is sterpus. Sterpus is gorpus. Fae is gorpus. Gorpuses are",
        "noise_response_8": "Fae is sterpus. Sterpus is gorpus. Sally is gorpus. Gorpuses are discordant.",
        "noise_prompt_8": "Gorpuses are discordant. Sterpus is gorpus. Fae is sterpus. True or false: Fae is metallic. Let us think step by step.",
        "response_8": "Fae is sterpus. Sterpus is gorpus. Fae is gorpus. Gorpuses are discordant.",
        "noise_response_9": "Fae is sterpus. Sterpus is gorpus. Fae is gorpus. Gorpuses are snowy. Fae is",
        "noise_prompt_9": "Gorpuses are discordant. Sterpus is gorpus. Fae is sterpus. True or false: Fae is metallic. Let us think step by step.",
        "response_9": "Fae is sterpus. Sterpus is gorpus. Fae is gorpus. Gorpuses are discordant. Fae is",
        "noise_prompt_10": "Gorpuses are discordant. Sterpus is gorpus. Fae is sterpus. True or false: Fae is metallic. Let us think step by step.",
        "response_10": "Fae is sterpus. Sterpus is gorpus. Fae is gorpus. Gorpuses are discordant. Fae is discordant.",
        "noise_response_10": "Fae is sterpus. Sterpus is gorpus. Fae is gorpus. Gorpuses are discordant. Fae is windy.",
        "answer_token_id_0": 29943,
        "answer_token_pos_0": 380,
        "answer_token_0": "F",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 16864,
        "answer_token_pos_1": 383,
        "answer_token_1": "ster",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 28588,
        "answer_token_pos_2": 387,
        "answer_token_2": "Ster",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 330,
        "answer_token_pos_3": 391,
        "answer_token_3": "g",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 383,
        "answer_token_pos_4": 395,
        "answer_token_4": "F",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 330,
        "answer_token_pos_5": 398,
        "answer_token_5": "g",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 18686,
        "answer_token_pos_6": 402,
        "answer_token_6": "Gor",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 2313,
        "answer_token_pos_7": 406,
        "answer_token_7": "disc",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 383,
        "answer_token_pos_8": 410,
        "answer_token_8": "F",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 2313,
        "answer_token_pos_9": 413,
        "answer_token_9": "disc",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Gorpuses are mean. Wumpus is gorpus. Max is wumpus.",
        "query": "True or false: Max is mean.",
        "answer": "Max is wumpus. Wumpus is gorpus. Max is gorpus. Gorpuses are mean. Max is mean. True",
        "label": "True",
        "prompt": "Gorpuses are mean. Wumpus is gorpus. Max is wumpus. True or false: Max is mean. Let us think step by step.",
        "generated": "Max is wumpus. Wumpus is gorpus. Max is gorpus. Gorpuses are mean. Max is mean. True",
        "noise_response_0": "",
        "noise_prompt_0": "Gorpuses are mean. Wumpus is gorpus. Max is wumpus. True or false: Fae is mean. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Max is",
        "noise_prompt_1": "Gorpuses are mean. Wumpus is gorpus. Max is red. True or false: Max is mean. Let us think step by step.",
        "response_1": "Max is",
        "noise_response_2": "Max is wumpus.",
        "noise_prompt_2": "Gorpuses are mean. Stella is gorpus. Max is wumpus. True or false: Max is mean. Let us think step by step.",
        "response_2": "Max is wumpus.",
        "noise_response_3": "Max is wumpus. Wumpus is",
        "noise_prompt_3": "Gorpuses are mean. Wumpus is Grimpus. Max is wumpus. True or false: Max is mean. Let us think step by step.",
        "response_3": "Max is wumpus. Wumpus is",
        "noise_response_4": "Stella is wumpus. Wumpus is gorpus.",
        "noise_prompt_4": "Gorpuses are mean. Wumpus is gorpus. Max is wumpus. True or false: Max is mean. Let us think step by step.",
        "response_4": "Max is wumpus. Wumpus is gorpus.",
        "noise_response_5": "Max is wumpus. Wumpus is Wumpus. Max is",
        "noise_prompt_5": "Gorpuses are mean. Wumpus is gorpus. Max is wumpus. True or false: Max is mean. Let us think step by step.",
        "response_5": "Max is wumpus. Wumpus is gorpus. Max is",
        "noise_response_6": "Max is wumpus. Wumpus is gorpus. Max is gorpus.",
        "noise_prompt_6": "Yumpus are mean. Wumpus is gorpus. Max is wumpus. True or false: Max is mean. Let us think step by step.",
        "response_6": "Max is wumpus. Wumpus is gorpus. Max is gorpus.",
        "noise_response_7": "Max is wumpus. Wumpus is gorpus. Max is gorpus. Gorpuses are",
        "noise_prompt_7": "Gorpuses are mean. Wumpus is gorpus. Max is wumpus. True or false: Max is muffled. Let us think step by step.",
        "response_7": "Max is wumpus. Wumpus is gorpus. Max is gorpus. Gorpuses are",
        "noise_response_8": "Max is wumpus. Wumpus is gorpus. Alex is gorpus. Gorpuses are mean.",
        "noise_prompt_8": "Gorpuses are mean. Wumpus is gorpus. Max is wumpus. True or false: Max is mean. Let us think step by step.",
        "response_8": "Max is wumpus. Wumpus is gorpus. Max is gorpus. Gorpuses are mean.",
        "noise_response_9": "Max is wumpus. Wumpus is gorpus. Max is gorpus. Gorpuses are feisty. Max is",
        "noise_prompt_9": "Gorpuses are mean. Wumpus is gorpus. Max is wumpus. True or false: Max is mean. Let us think step by step.",
        "response_9": "Max is wumpus. Wumpus is gorpus. Max is gorpus. Gorpuses are mean. Max is",
        "noise_prompt_10": "Gorpuses are mean. Wumpus is gorpus. Max is wumpus. True or false: Max is mean. Let us think step by step.",
        "response_10": "Max is wumpus. Wumpus is gorpus. Max is gorpus. Gorpuses are mean. Max is mean.",
        "noise_response_10": "Max is wumpus. Wumpus is gorpus. Max is gorpus. Gorpuses are mean. Max is floral.",
        "answer_token_id_0": 7976,
        "answer_token_pos_0": 380,
        "answer_token_0": "Max",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 281,
        "answer_token_pos_1": 383,
        "answer_token_1": "w",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 399,
        "answer_token_pos_2": 387,
        "answer_token_2": "W",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 330,
        "answer_token_pos_3": 391,
        "answer_token_3": "g",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 18686,
        "answer_token_pos_4": 395,
        "answer_token_4": "Gor",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 330,
        "answer_token_pos_5": 398,
        "answer_token_5": "g",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 18686,
        "answer_token_pos_6": 402,
        "answer_token_6": "Gor",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 2099,
        "answer_token_pos_7": 406,
        "answer_token_7": "mean",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 5918,
        "answer_token_pos_8": 410,
        "answer_token_8": "Max",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 2099,
        "answer_token_pos_9": 413,
        "answer_token_9": "mean",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Zumpuses are muffled. Wumpus is zumpus. Fae is wumpus.",
        "query": "True or false: Fae is angry.",
        "answer": "Fae is wumpus. Wumpus is zumpus. Fae is zumpus. Zumpuses are muffled. Fae is muffled. False",
        "label": "False",
        "prompt": "Zumpuses are muffled. Wumpus is zumpus. Fae is wumpus. True or false: Fae is angry. Let us think step by step.",
        "generated": "Fae is wumpus. Wumpus is zumpus. Fae is zumpus. Zumpuses are muffled. Fae is muffled. False",
        "noise_response_0": "",
        "noise_prompt_0": "Zumpuses are muffled. Wumpus is zumpus. Fae is wumpus. True or false: Stella is angry. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Fae is",
        "noise_prompt_1": "Zumpuses are muffled. Wumpus is zumpus. Fae is liquid. True or false: Fae is angry. Let us think step by step.",
        "response_1": "Fae is",
        "noise_response_2": "Fae is wumpus.",
        "noise_prompt_2": "Zumpuses are muffled. Stella is zumpus. Fae is wumpus. True or false: Fae is angry. Let us think step by step.",
        "response_2": "Fae is wumpus.",
        "noise_response_3": "Fae is wumpus. Wumpus is",
        "noise_prompt_3": "Zumpuses are muffled. Wumpus is Tumpus. Fae is wumpus. True or false: Fae is angry. Let us think step by step.",
        "response_3": "Fae is wumpus. Wumpus is",
        "noise_response_4": "Sally is wumpus. Wumpus is zumpus.",
        "noise_prompt_4": "Zumpuses are muffled. Wumpus is zumpus. Fae is wumpus. True or false: Fae is angry. Let us think step by step.",
        "response_4": "Fae is wumpus. Wumpus is zumpus.",
        "noise_response_5": "Fae is wumpus. Wumpus is Wumpus. Fae is",
        "noise_prompt_5": "Zumpuses are muffled. Wumpus is zumpus. Fae is wumpus. True or false: Fae is angry. Let us think step by step.",
        "response_5": "Fae is wumpus. Wumpus is zumpus. Fae is",
        "noise_response_6": "Fae is wumpus. Wumpus is zumpus. Fae is zumpus.",
        "noise_prompt_6": "tumpus are muffled. Wumpus is zumpus. Fae is wumpus. True or false: Fae is angry. Let us think step by step.",
        "response_6": "Fae is wumpus. Wumpus is zumpus. Fae is zumpus.",
        "noise_response_7": "Fae is wumpus. Wumpus is zumpus. Fae is zumpus. Zumpuses are",
        "noise_prompt_7": "Zumpuses are windy. Wumpus is zumpus. Fae is wumpus. True or false: Fae is angry. Let us think step by step.",
        "response_7": "Fae is wumpus. Wumpus is zumpus. Fae is zumpus. Zumpuses are",
        "noise_response_8": "Fae is wumpus. Wumpus is zumpus. Polly is zumpus. Zumpuses are muffled.",
        "noise_prompt_8": "Zumpuses are muffled. Wumpus is zumpus. Fae is wumpus. True or false: Fae is angry. Let us think step by step.",
        "response_8": "Fae is wumpus. Wumpus is zumpus. Fae is zumpus. Zumpuses are muffled.",
        "noise_response_9": "Fae is wumpus. Wumpus is zumpus. Fae is zumpus. Zumpuses are sunny. Fae is",
        "noise_prompt_9": "Zumpuses are muffled. Wumpus is zumpus. Fae is wumpus. True or false: Fae is angry. Let us think step by step.",
        "response_9": "Fae is wumpus. Wumpus is zumpus. Fae is zumpus. Zumpuses are muffled. Fae is",
        "noise_prompt_10": "Zumpuses are muffled. Wumpus is zumpus. Fae is wumpus. True or false: Fae is angry. Let us think step by step.",
        "response_10": "Fae is wumpus. Wumpus is zumpus. Fae is zumpus. Zumpuses are muffled. Fae is muffled.",
        "noise_response_10": "Fae is wumpus. Wumpus is zumpus. Fae is zumpus. Zumpuses are muffled. Fae is hot.",
        "answer_token_id_0": 29943,
        "answer_token_pos_0": 380,
        "answer_token_0": "F",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 281,
        "answer_token_pos_1": 383,
        "answer_token_1": "w",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 399,
        "answer_token_pos_2": 387,
        "answer_token_2": "W",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 3356,
        "answer_token_pos_3": 391,
        "answer_token_3": "zum",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 383,
        "answer_token_pos_4": 395,
        "answer_token_4": "F",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 3356,
        "answer_token_pos_5": 398,
        "answer_token_5": "zum",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 796,
        "answer_token_pos_6": 402,
        "answer_token_6": "Z",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 286,
        "answer_token_pos_7": 406,
        "answer_token_7": "m",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 383,
        "answer_token_pos_8": 410,
        "answer_token_8": "F",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 286,
        "answer_token_pos_9": 413,
        "answer_token_9": "m",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Gorpuses are sweet. Impus is gorpus. Stella is impus.",
        "query": "True or false: Stella is sweet.",
        "answer": "Stella is impus. Impus is gorpus. Stella is gorpus. Gorpuses are sweet. Stella is sweet. True",
        "label": "True",
        "prompt": "Gorpuses are sweet. Impus is gorpus. Stella is impus. True or false: Stella is sweet. Let us think step by step.",
        "generated": "Stella is impus. Impus is gorpus. Stella is gorpus. Gorpuses are sweet. Stella is sweet. True",
        "noise_response_0": "",
        "noise_prompt_0": "Gorpuses are sweet. Impus is gorpus. Stella is impus. True or false: Wren is sweet. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Stella is",
        "noise_prompt_1": "Gorpuses are sweet. Impus is gorpus. Stella is Sterpus. True or false: Stella is sweet. Let us think step by step.",
        "response_1": "Stella is",
        "noise_response_2": "Stella is impus.",
        "noise_prompt_2": "Gorpuses are sweet. Lempus is gorpus. Stella is impus. True or false: Stella is sweet. Let us think step by step.",
        "response_2": "Stella is impus.",
        "noise_response_3": "Stella is impus. Impus is",
        "noise_prompt_3": "Gorpuses are sweet. Impus is jompus. Stella is impus. True or false: Stella is sweet. Let us think step by step.",
        "response_3": "Stella is impus. Impus is",
        "noise_response_4": "Rex is impus. Impus is gorpus.",
        "noise_prompt_4": "Gorpuses are sweet. Impus is gorpus. Stella is impus. True or false: Stella is sweet. Let us think step by step.",
        "response_4": "Stella is impus. Impus is gorpus.",
        "noise_response_5": "Stella is impus. Impus is grimpus. Stella is",
        "noise_prompt_5": "Gorpuses are sweet. Impus is gorpus. Stella is impus. True or false: Stella is sweet. Let us think step by step.",
        "response_5": "Stella is impus. Impus is gorpus. Stella is",
        "noise_response_6": "Stella is impus. Impus is gorpus. Stella is gorpus.",
        "noise_prompt_6": "lorpus are sweet. Impus is gorpus. Stella is impus. True or false: Stella is sweet. Let us think step by step.",
        "response_6": "Stella is impus. Impus is gorpus. Stella is gorpus.",
        "noise_response_7": "Stella is impus. Impus is gorpus. Stella is gorpus. Gorpuses are",
        "noise_prompt_7": "Gorpuses are sweet. Impus is gorpus. Stella is impus. True or false: Stella is loud. Let us think step by step.",
        "response_7": "Stella is impus. Impus is gorpus. Stella is gorpus. Gorpuses are",
        "noise_response_8": "Stella is impus. Impus is gorpus. Sally is gorpus. Gorpuses are sweet.",
        "noise_prompt_8": "Gorpuses are sweet. Impus is gorpus. Stella is impus. True or false: Stella is sweet. Let us think step by step.",
        "response_8": "Stella is impus. Impus is gorpus. Stella is gorpus. Gorpuses are sweet.",
        "noise_response_9": "Stella is impus. Impus is gorpus. Stella is gorpus. Gorpuses are blue. Stella is",
        "noise_prompt_9": "Gorpuses are sweet. Impus is gorpus. Stella is impus. True or false: Stella is sweet. Let us think step by step.",
        "response_9": "Stella is impus. Impus is gorpus. Stella is gorpus. Gorpuses are sweet. Stella is",
        "noise_prompt_10": "Gorpuses are sweet. Impus is gorpus. Stella is impus. True or false: Stella is sweet. Let us think step by step.",
        "response_10": "Stella is impus. Impus is gorpus. Stella is gorpus. Gorpuses are sweet. Stella is sweet.",
        "noise_response_10": "Stella is impus. Impus is gorpus. Stella is gorpus. Gorpuses are sweet. Stella is nervous.",
        "answer_token_id_0": 855,
        "answer_token_pos_0": 380,
        "answer_token_0": "St",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 2411,
        "answer_token_pos_1": 383,
        "answer_token_1": "imp",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 14305,
        "answer_token_pos_2": 387,
        "answer_token_2": "Imp",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 330,
        "answer_token_pos_3": 391,
        "answer_token_3": "g",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 624,
        "answer_token_pos_4": 395,
        "answer_token_4": "St",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 330,
        "answer_token_pos_5": 398,
        "answer_token_5": "g",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 18686,
        "answer_token_pos_6": 402,
        "answer_token_6": "Gor",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 14225,
        "answer_token_pos_7": 406,
        "answer_token_7": "sweet",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 624,
        "answer_token_pos_8": 410,
        "answer_token_8": "St",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 14225,
        "answer_token_pos_9": 413,
        "answer_token_9": "sweet",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Vumpus is brown. Numpus is vumpus. Sam is numpus.",
        "query": "True or false: Sam is brown.",
        "answer": "Sam is numpus. Numpus is vumpus. Sam is vumpus. Vumpus is brown. Sam is brown. True",
        "label": "True",
        "prompt": "Vumpus is brown. Numpus is vumpus. Sam is numpus. True or false: Sam is brown. Let us think step by step.",
        "generated": "Sam is numpus. Numpus is vumpus. Sam is vumpus. Vumpus is brown. Sam is brown. True",
        "noise_response_0": "",
        "noise_prompt_0": "Vumpus is brown. Numpus is vumpus. Sam is numpus. True or false: Rex is brown. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Sam is",
        "noise_prompt_1": "Vumpus is brown. Numpus is vumpus. Sam is lempus. True or false: Sam is brown. Let us think step by step.",
        "response_1": "Sam is",
        "noise_response_2": "Sam is numpus.",
        "noise_prompt_2": "Vumpus is brown. Tumpus is vumpus. Sam is numpus. True or false: Sam is brown. Let us think step by step.",
        "response_2": "Sam is numpus.",
        "noise_response_3": "Sam is numpus. Numpus is",
        "noise_prompt_3": "Vumpus is brown. Numpus is Dumpus. Sam is numpus. True or false: Sam is brown. Let us think step by step.",
        "response_3": "Sam is numpus. Numpus is",
        "noise_response_4": "Max is numpus. Numpus is vumpus.",
        "noise_prompt_4": "Vumpus is brown. Numpus is vumpus. Sam is numpus. True or false: Sam is brown. Let us think step by step.",
        "response_4": "Sam is numpus. Numpus is vumpus.",
        "noise_response_5": "Sam is numpus. Numpus is Dumpus. Sam is",
        "noise_prompt_5": "Vumpus is brown. Numpus is vumpus. Sam is numpus. True or false: Sam is brown. Let us think step by step.",
        "response_5": "Sam is numpus. Numpus is vumpus. Sam is",
        "noise_response_6": "Sam is numpus. Numpus is vumpus. Sam is vumpus.",
        "noise_prompt_6": "Dumpus is brown. Numpus is vumpus. Sam is numpus. True or false: Sam is brown. Let us think step by step.",
        "response_6": "Sam is numpus. Numpus is vumpus. Sam is vumpus.",
        "noise_response_7": "Sam is numpus. Numpus is vumpus. Sam is vumpus. Vumpus is",
        "noise_prompt_7": "Vumpus is brown. Numpus is vumpus. Sam is numpus. True or false: Sam is dull. Let us think step by step.",
        "response_7": "Sam is numpus. Numpus is vumpus. Sam is vumpus. Vumpus is",
        "noise_response_8": "Sam is numpus. Numpus is vumpus. Alex is vumpus. Vumpus is brown.",
        "noise_prompt_8": "Vumpus is brown. Numpus is vumpus. Sam is numpus. True or false: Sam is brown. Let us think step by step.",
        "response_8": "Sam is numpus. Numpus is vumpus. Sam is vumpus. Vumpus is brown.",
        "noise_response_9": "Sam is numpus. Numpus is vumpus. Sam is vumpus. Vumpus is moderate. Sam is",
        "noise_prompt_9": "Vumpus is brown. Numpus is vumpus. Sam is numpus. True or false: Sam is brown. Let us think step by step.",
        "response_9": "Sam is numpus. Numpus is vumpus. Sam is vumpus. Vumpus is brown. Sam is",
        "noise_prompt_10": "Vumpus is brown. Numpus is vumpus. Sam is numpus. True or false: Sam is brown. Let us think step by step.",
        "response_10": "Sam is numpus. Numpus is vumpus. Sam is vumpus. Vumpus is brown. Sam is brown.",
        "noise_response_10": "Sam is numpus. Numpus is vumpus. Sam is vumpus. Vumpus is brown. Sam is floral.",
        "answer_token_id_0": 22966,
        "answer_token_pos_0": 380,
        "answer_token_0": "Sam",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 954,
        "answer_token_pos_1": 383,
        "answer_token_1": "num",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 405,
        "answer_token_pos_2": 387,
        "answer_token_2": "N",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 325,
        "answer_token_pos_3": 391,
        "answer_token_3": "v",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 478,
        "answer_token_pos_4": 395,
        "answer_token_4": "V",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 325,
        "answer_token_pos_5": 398,
        "answer_token_5": "v",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 478,
        "answer_token_pos_6": 402,
        "answer_token_6": "V",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 17354,
        "answer_token_pos_7": 406,
        "answer_token_7": "brown",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 3685,
        "answer_token_pos_8": 410,
        "answer_token_8": "Sam",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 17354,
        "answer_token_pos_9": 413,
        "answer_token_9": "brown",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Lempuses are cold. Brimpus is lempus. Sally is brimpus.",
        "query": "True or false: Sally is cold.",
        "answer": "Sally is brimpus. Brimpus is lempus. Sally is lempus. Lempuses are cold. Sally is cold. True",
        "label": "True",
        "prompt": "Lempuses are cold. Brimpus is lempus. Sally is brimpus. True or false: Sally is cold. Let us think step by step.",
        "generated": "Sally is brimpus. Brimpus is lempus. Sally is lempus. Lempuses are cold. Sally is cold. True",
        "noise_response_0": "",
        "noise_prompt_0": "Lempuses are cold. Brimpus is lempus. Sally is brimpus. True or false: Wren is cold. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Sally is",
        "noise_prompt_1": "Lempuses are cold. Brimpus is lempus. Sally is overcast. True or false: Sally is cold. Let us think step by step.",
        "response_1": "Sally is",
        "noise_response_2": "Sally is brimpus.",
        "noise_prompt_2": "Lempuses are cold. grimpus is lempus. Sally is brimpus. True or false: Sally is cold. Let us think step by step.",
        "response_2": "Sally is brimpus.",
        "noise_response_3": "Sally is brimpus. Brimpus is",
        "noise_prompt_3": "Lempuses are cold. Brimpus is Grimpus. Sally is brimpus. True or false: Sally is cold. Let us think step by step.",
        "response_3": "Sally is brimpus. Brimpus is",
        "noise_response_4": "Fae is brimpus. Brimpus is lempus.",
        "noise_prompt_4": "Lempuses are cold. Brimpus is lempus. Sally is brimpus. True or false: Sally is cold. Let us think step by step.",
        "response_4": "Sally is brimpus. Brimpus is lempus.",
        "noise_response_5": "Sally is brimpus. Brimpus is Impus. Sally is",
        "noise_prompt_5": "Lempuses are cold. Brimpus is lempus. Sally is brimpus. True or false: Sally is cold. Let us think step by step.",
        "response_5": "Sally is brimpus. Brimpus is lempus. Sally is",
        "noise_response_6": "Sally is brimpus. Brimpus is lempus. Sally is lempus.",
        "noise_prompt_6": "Vumpus are cold. Brimpus is lempus. Sally is brimpus. True or false: Sally is cold. Let us think step by step.",
        "response_6": "Sally is brimpus. Brimpus is lempus. Sally is lempus.",
        "noise_response_7": "Sally is brimpus. Brimpus is lempus. Sally is lempus. Lempuses are",
        "noise_prompt_7": "Lempuses are cold. Brimpus is lempus. Sally is brimpus. True or false: Sally is mean. Let us think step by step.",
        "response_7": "Sally is brimpus. Brimpus is lempus. Sally is lempus. Lempuses are",
        "noise_response_8": "Sally is brimpus. Brimpus is lempus. Wren is lempus. Lempuses are cold.",
        "noise_prompt_8": "Lempuses are cold. Brimpus is lempus. Sally is brimpus. True or false: Sally is cold. Let us think step by step.",
        "response_8": "Sally is brimpus. Brimpus is lempus. Sally is lempus. Lempuses are cold.",
        "noise_response_9": "Sally is brimpus. Brimpus is lempus. Sally is lempus. Lempuses are discordant. Sally is",
        "noise_prompt_9": "Lempuses are cold. Brimpus is lempus. Sally is brimpus. True or false: Sally is cold. Let us think step by step.",
        "response_9": "Sally is brimpus. Brimpus is lempus. Sally is lempus. Lempuses are cold. Sally is",
        "noise_prompt_10": "Lempuses are cold. Brimpus is lempus. Sally is brimpus. True or false: Sally is cold. Let us think step by step.",
        "response_10": "Sally is brimpus. Brimpus is lempus. Sally is lempus. Lempuses are cold. Sally is cold.",
        "noise_response_10": "Sally is brimpus. Brimpus is lempus. Sally is lempus. Lempuses are cold. Sally is feisty.",
        "answer_token_id_0": 29903,
        "answer_token_pos_0": 380,
        "answer_token_0": "S",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 1506,
        "answer_token_pos_1": 383,
        "answer_token_1": "br",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 1771,
        "answer_token_pos_2": 387,
        "answer_token_2": "Br",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 454,
        "answer_token_pos_3": 391,
        "answer_token_3": "le",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 317,
        "answer_token_pos_4": 395,
        "answer_token_4": "S",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 454,
        "answer_token_pos_5": 398,
        "answer_token_5": "le",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 365,
        "answer_token_pos_6": 402,
        "answer_token_6": "L",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 11220,
        "answer_token_pos_7": 406,
        "answer_token_7": "cold",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 317,
        "answer_token_pos_8": 410,
        "answer_token_8": "S",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 451,
        "answer_token_pos_9": 413,
        "answer_token_9": "not",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Shumpuses are amenable. Impus is shumpus. Stella is impus.",
        "query": "True or false: Stella is amenable.",
        "answer": "Stella is impus. Impus is shumpus. Stella is shumpus. Shumpuses are amenable. Stella is amenable. True",
        "label": "True",
        "prompt": "Shumpuses are amenable. Impus is shumpus. Stella is impus. True or false: Stella is amenable. Let us think step by step.",
        "generated": "Stella is impus. Impus is shumpus. Stella is shumpus. Shumpuses are amenable. Stella is amenable. True",
        "noise_response_0": "",
        "noise_prompt_0": "Shumpuses are amenable. Impus is shumpus. Stella is impus. True or false: Wren is amenable. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Stella is",
        "noise_prompt_1": "Shumpuses are amenable. Impus is shumpus. Stella is sterpus. True or false: Stella is amenable. Let us think step by step.",
        "response_1": "Stella is",
        "noise_response_2": "Stella is impus.",
        "noise_prompt_2": "Shumpuses are amenable. Tumpus is shumpus. Stella is impus. True or false: Stella is amenable. Let us think step by step.",
        "response_2": "Stella is impus.",
        "noise_response_3": "Stella is impus. Impus is",
        "noise_prompt_3": "Shumpuses are amenable. Impus is small. Stella is impus. True or false: Stella is amenable. Let us think step by step.",
        "response_3": "Stella is impus. Impus is",
        "noise_response_4": "Sally is impus. Impus is shumpus.",
        "noise_prompt_4": "Shumpuses are amenable. Impus is shumpus. Stella is impus. True or false: Stella is amenable. Let us think step by step.",
        "response_4": "Stella is impus. Impus is shumpus.",
        "noise_response_5": "Stella is impus. Impus is melodic. Stella is",
        "noise_prompt_5": "Shumpuses are amenable. Impus is shumpus. Stella is impus. True or false: Stella is amenable. Let us think step by step.",
        "response_5": "Stella is impus. Impus is shumpus. Stella is",
        "noise_response_6": "Stella is impus. Impus is shumpus. Stella is shumpus.",
        "noise_prompt_6": "impus are amenable. Impus is shumpus. Stella is impus. True or false: Stella is amenable. Let us think step by step.",
        "response_6": "Stella is impus. Impus is shumpus. Stella is shumpus.",
        "noise_response_7": "Stella is impus. Impus is shumpus. Stella is shumpus. Shumpuses are",
        "noise_prompt_7": "Shumpuses are amenable. Impus is shumpus. Stella is impus. True or false: Stella is hot. Let us think step by step.",
        "response_7": "Stella is impus. Impus is shumpus. Stella is shumpus. Shumpuses are",
        "noise_response_8": "Stella is impus. Impus is shumpus. Fae is shumpus. Shumpuses are amenable.",
        "noise_prompt_8": "Shumpuses are amenable. Impus is shumpus. Stella is impus. True or false: Stella is amenable. Let us think step by step.",
        "response_8": "Stella is impus. Impus is shumpus. Stella is shumpus. Shumpuses are amenable.",
        "noise_response_9": "Stella is impus. Impus is shumpus. Stella is shumpus. Shumpuses are brown. Stella is",
        "noise_prompt_9": "Shumpuses are amenable. Impus is shumpus. Stella is impus. True or false: Stella is amenable. Let us think step by step.",
        "response_9": "Stella is impus. Impus is shumpus. Stella is shumpus. Shumpuses are amenable. Stella is",
        "noise_prompt_10": "Shumpuses are amenable. Impus is shumpus. Stella is impus. True or false: Stella is amenable. Let us think step by step.",
        "response_10": "Stella is impus. Impus is shumpus. Stella is shumpus. Shumpuses are amenable. Stella is amenable.",
        "noise_response_10": "Stella is impus. Impus is shumpus. Stella is shumpus. Shumpuses are amenable. Stella is sunny.",
        "answer_token_id_0": 855,
        "answer_token_pos_0": 380,
        "answer_token_0": "St",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 2411,
        "answer_token_pos_1": 383,
        "answer_token_1": "imp",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 14305,
        "answer_token_pos_2": 387,
        "answer_token_2": "Imp",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 528,
        "answer_token_pos_3": 391,
        "answer_token_3": "sh",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 624,
        "answer_token_pos_4": 395,
        "answer_token_4": "St",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 528,
        "answer_token_pos_5": 398,
        "answer_token_5": "sh",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 1383,
        "answer_token_pos_6": 402,
        "answer_token_6": "Sh",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 626,
        "answer_token_pos_7": 406,
        "answer_token_7": "am",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 624,
        "answer_token_pos_8": 410,
        "answer_token_8": "St",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 626,
        "answer_token_pos_9": 413,
        "answer_token_9": "am",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Lempuses are moderate. Dumpuses are lempuses. Stella is dumpus.",
        "query": "True or false: Stella is moderate.",
        "answer": "Stella is dumpus. Dumpuses are lempuses. Stella is lempus. Lempuses are moderate. Stella is moderate. True",
        "label": "True",
        "prompt": "Lempuses are moderate. Dumpuses are lempuses. Stella is dumpus. True or false: Stella is moderate. Let us think step by step.",
        "generated": "Stella is dumpus. Dumpuses are lempuses. Stella is lempus. Lempuses are moderate. Stella is moderate. True",
        "noise_response_0": "",
        "noise_prompt_0": "Lempuses are moderate. Dumpuses are lempuses. Stella is dumpus. True or false: Sam is moderate. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Stella is",
        "noise_prompt_1": "Lempuses are moderate. Dumpuses are lempuses. Stella is dumpus. True or false: Stella is moderate. Let us think step by step.",
        "response_1": "Stella is",
        "noise_response_2": "Stella is dumpus.",
        "noise_prompt_2": "Lempuses are moderate. dumpus are lempuses. Stella is dumpus. True or false: Stella is moderate. Let us think step by step.",
        "response_2": "Stella is dumpus.",
        "noise_response_3": "Stella is dumpus. Dumpuses are",
        "noise_prompt_3": "Lempuses are moderate. Dumpuses are Rompus. Stella is dumpus. True or false: Stella is moderate. Let us think step by step.",
        "response_3": "Stella is dumpus. Dumpuses are",
        "noise_response_4": "Wren is dumpus. Dumpuses are lempuses.",
        "noise_prompt_4": "Lempuses are moderate. Dumpuses are lempuses. Stella is dumpus. True or false: Stella is moderate. Let us think step by step.",
        "response_4": "Stella is dumpus. Dumpuses are lempuses.",
        "noise_response_5": "Stella is dumpus. Dumpuses are Grimpus. Stella is",
        "noise_prompt_5": "Lempuses are moderate. Dumpuses are lempuses. Stella is dumpus. True or false: Stella is moderate. Let us think step by step.",
        "response_5": "Stella is dumpus. Dumpuses are lempuses. Stella is",
        "noise_response_6": "Stella is dumpus. Dumpuses are lempuses. Stella is lempus.",
        "noise_prompt_6": "lorpus are moderate. Dumpuses are lempuses. Stella is dumpus. True or false: Stella is moderate. Let us think step by step.",
        "response_6": "Stella is dumpus. Dumpuses are lempuses. Stella is lempus.",
        "noise_response_7": "Stella is dumpus. Dumpuses are lempuses. Stella is lempus. Lempuses are",
        "noise_prompt_7": "Lempuses are moderate. Dumpuses are lempuses. Stella is dumpus. True or false: Stella is sweet. Let us think step by step.",
        "response_7": "Stella is dumpus. Dumpuses are lempuses. Stella is lempus. Lempuses are",
        "noise_response_8": "Stella is dumpus. Dumpuses are lempuses. Rex is lempus. Lempuses are moderate.",
        "noise_prompt_8": "Lempuses are moderate. Dumpuses are lempuses. Stella is dumpus. True or false: Stella is moderate. Let us think step by step.",
        "response_8": "Stella is dumpus. Dumpuses are lempuses. Stella is lempus. Lempuses are moderate.",
        "noise_response_9": "Stella is dumpus. Dumpuses are lempuses. Stella is lempus. Lempuses are large. Stella is",
        "noise_prompt_9": "Lempuses are moderate. Dumpuses are lempuses. Stella is dumpus. True or false: Stella is moderate. Let us think step by step.",
        "response_9": "Stella is dumpus. Dumpuses are lempuses. Stella is lempus. Lempuses are moderate. Stella is",
        "noise_prompt_10": "Lempuses are moderate. Dumpuses are lempuses. Stella is dumpus. True or false: Stella is moderate. Let us think step by step.",
        "response_10": "Stella is dumpus. Dumpuses are lempuses. Stella is lempus. Lempuses are moderate. Stella is moderate.",
        "noise_response_10": "Stella is dumpus. Dumpuses are lempuses. Stella is lempus. Lempuses are moderate. Stella is windy.",
        "answer_token_id_0": 855,
        "answer_token_pos_0": 380,
        "answer_token_0": "St",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 16766,
        "answer_token_pos_1": 383,
        "answer_token_1": "dump",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 360,
        "answer_token_pos_2": 387,
        "answer_token_2": "D",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 454,
        "answer_token_pos_3": 391,
        "answer_token_3": "le",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 624,
        "answer_token_pos_4": 395,
        "answer_token_4": "St",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 454,
        "answer_token_pos_5": 398,
        "answer_token_5": "le",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 365,
        "answer_token_pos_6": 402,
        "answer_token_6": "L",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 17768,
        "answer_token_pos_7": 406,
        "answer_token_7": "moder",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 624,
        "answer_token_pos_8": 410,
        "answer_token_8": "St",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 17768,
        "answer_token_pos_9": 413,
        "answer_token_9": "moder",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Lorpuses are small. Shumpus is lorpus. Alex is shumpus.",
        "query": "True or false: Alex is small.",
        "answer": "Alex is shumpus. Shumpus is lorpus. Alex is lorpus. Lorpuses are small. Alex is small. True",
        "label": "True",
        "prompt": "Lorpuses are small. Shumpus is lorpus. Alex is shumpus. True or false: Alex is small. Let us think step by step.",
        "generated": "Alex is shumpus. Shumpus is lorpus. Alex is lorpus. Lorpuses are small. Alex is small. True",
        "noise_response_0": "",
        "noise_prompt_0": "Lorpuses are small. Shumpus is lorpus. Alex is shumpus. True or false: Wren is small. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Alex is",
        "noise_prompt_1": "Lorpuses are small. Shumpus is lorpus. Alex is sour. True or false: Alex is small. Let us think step by step.",
        "response_1": "Alex is",
        "noise_response_2": "Alex is shumpus.",
        "noise_prompt_2": "Lorpuses are small. Impus is lorpus. Alex is shumpus. True or false: Alex is small. Let us think step by step.",
        "response_2": "Alex is shumpus.",
        "noise_response_3": "Alex is shumpus. Shumpus is",
        "noise_prompt_3": "Lorpuses are small. Shumpus is windy. Alex is shumpus. True or false: Alex is small. Let us think step by step.",
        "response_3": "Alex is shumpus. Shumpus is",
        "noise_response_4": "Fae is shumpus. Shumpus is lorpus.",
        "noise_prompt_4": "Lorpuses are small. Shumpus is lorpus. Alex is shumpus. True or false: Alex is small. Let us think step by step.",
        "response_4": "Alex is shumpus. Shumpus is lorpus.",
        "noise_response_5": "Alex is shumpus. Shumpus is kind. Alex is",
        "noise_prompt_5": "Lorpuses are small. Shumpus is lorpus. Alex is shumpus. True or false: Alex is small. Let us think step by step.",
        "response_5": "Alex is shumpus. Shumpus is lorpus. Alex is",
        "noise_response_6": "Alex is shumpus. Shumpus is lorpus. Alex is lorpus.",
        "noise_prompt_6": "numpus are small. Shumpus is lorpus. Alex is shumpus. True or false: Alex is small. Let us think step by step.",
        "response_6": "Alex is shumpus. Shumpus is lorpus. Alex is lorpus.",
        "noise_response_7": "Alex is shumpus. Shumpus is lorpus. Alex is lorpus. Lorpuses are",
        "noise_prompt_7": "Lorpuses are small. Shumpus is lorpus. Alex is shumpus. True or false: Alex is shy. Let us think step by step.",
        "response_7": "Alex is shumpus. Shumpus is lorpus. Alex is lorpus. Lorpuses are",
        "noise_response_8": "Alex is shumpus. Shumpus is lorpus. Fae is lorpus. Lorpuses are small.",
        "noise_prompt_8": "Lorpuses are small. Shumpus is lorpus. Alex is shumpus. True or false: Alex is small. Let us think step by step.",
        "response_8": "Alex is shumpus. Shumpus is lorpus. Alex is lorpus. Lorpuses are small.",
        "noise_response_9": "Alex is shumpus. Shumpus is lorpus. Alex is lorpus. Lorpuses are red. Alex is",
        "noise_prompt_9": "Lorpuses are small. Shumpus is lorpus. Alex is shumpus. True or false: Alex is small. Let us think step by step.",
        "response_9": "Alex is shumpus. Shumpus is lorpus. Alex is lorpus. Lorpuses are small. Alex is",
        "noise_prompt_10": "Lorpuses are small. Shumpus is lorpus. Alex is shumpus. True or false: Alex is small. Let us think step by step.",
        "response_10": "Alex is shumpus. Shumpus is lorpus. Alex is lorpus. Lorpuses are small. Alex is small.",
        "noise_response_10": "Alex is shumpus. Shumpus is lorpus. Alex is lorpus. Lorpuses are small. Alex is kind.",
        "answer_token_id_0": 17406,
        "answer_token_pos_0": 380,
        "answer_token_0": "Alex",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 528,
        "answer_token_pos_1": 383,
        "answer_token_1": "sh",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 1383,
        "answer_token_pos_2": 387,
        "answer_token_2": "Sh",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 301,
        "answer_token_pos_3": 391,
        "answer_token_3": "l",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 10980,
        "answer_token_pos_4": 395,
        "answer_token_4": "Lor",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 301,
        "answer_token_pos_5": 398,
        "answer_token_5": "l",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 10980,
        "answer_token_pos_6": 402,
        "answer_token_6": "Lor",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 2319,
        "answer_token_pos_7": 406,
        "answer_token_7": "small",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 4827,
        "answer_token_pos_8": 410,
        "answer_token_8": "Alex",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 2319,
        "answer_token_pos_9": 413,
        "answer_token_9": "small",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Sterpus is temperate. Numpus is sterpus. Fae is numpus.",
        "query": "True or false: Fae is temperate.",
        "answer": "Fae is numpus. Numpus is sterpus. Fae is sterpus. Sterpus is temperate. Fae is temperate. True",
        "label": "True",
        "prompt": "Sterpus is temperate. Numpus is sterpus. Fae is numpus. True or false: Fae is temperate. Let us think step by step.",
        "generated": "Fae is numpus. Numpus is sterpus. Fae is sterpus. Sterpus is temperate. Fae is temperate. True",
        "noise_response_0": "",
        "noise_prompt_0": "Sterpus is temperate. Numpus is sterpus. Fae is numpus. True or false: Sam is temperate. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Fae is",
        "noise_prompt_1": "Sterpus is temperate. Numpus is sterpus. Fae is dumpus. True or false: Fae is temperate. Let us think step by step.",
        "response_1": "Fae is",
        "noise_response_2": "Fae is numpus.",
        "noise_prompt_2": "Sterpus is temperate. lempus is sterpus. Fae is numpus. True or false: Fae is temperate. Let us think step by step.",
        "response_2": "Fae is numpus.",
        "noise_response_3": "Fae is numpus. Numpus is",
        "noise_prompt_3": "Sterpus is temperate. Numpus is Lorpus. Fae is numpus. True or false: Fae is temperate. Let us think step by step.",
        "response_3": "Fae is numpus. Numpus is",
        "noise_response_4": "Alex is numpus. Numpus is sterpus.",
        "noise_prompt_4": "Sterpus is temperate. Numpus is sterpus. Fae is numpus. True or false: Fae is temperate. Let us think step by step.",
        "response_4": "Fae is numpus. Numpus is sterpus.",
        "noise_response_5": "Fae is numpus. Numpus is wumpus. Fae is",
        "noise_prompt_5": "Sterpus is temperate. Numpus is sterpus. Fae is numpus. True or false: Fae is temperate. Let us think step by step.",
        "response_5": "Fae is numpus. Numpus is sterpus. Fae is",
        "noise_response_6": "Fae is numpus. Numpus is sterpus. Fae is sterpus.",
        "noise_prompt_6": "vumpus is temperate. Numpus is sterpus. Fae is numpus. True or false: Fae is temperate. Let us think step by step.",
        "response_6": "Fae is numpus. Numpus is sterpus. Fae is sterpus.",
        "noise_response_7": "Fae is numpus. Numpus is sterpus. Fae is sterpus. Sterpus is",
        "noise_prompt_7": "Sterpus is temperate. Numpus is sterpus. Fae is numpus. True or false: Fae is mean. Let us think step by step.",
        "response_7": "Fae is numpus. Numpus is sterpus. Fae is sterpus. Sterpus is",
        "noise_response_8": "Fae is numpus. Numpus is sterpus. Stella is sterpus. Sterpus is temperate.",
        "noise_prompt_8": "Sterpus is temperate. Numpus is sterpus. Fae is numpus. True or false: Fae is temperate. Let us think step by step.",
        "response_8": "Fae is numpus. Numpus is sterpus. Fae is sterpus. Sterpus is temperate.",
        "noise_response_9": "Fae is numpus. Numpus is sterpus. Fae is sterpus. Sterpus is small. Fae is",
        "noise_prompt_9": "Sterpus is temperate. Numpus is sterpus. Fae is numpus. True or false: Fae is temperate. Let us think step by step.",
        "response_9": "Fae is numpus. Numpus is sterpus. Fae is sterpus. Sterpus is temperate. Fae is",
        "noise_prompt_10": "Sterpus is temperate. Numpus is sterpus. Fae is numpus. True or false: Fae is temperate. Let us think step by step.",
        "response_10": "Fae is numpus. Numpus is sterpus. Fae is sterpus. Sterpus is temperate. Fae is temperate.",
        "noise_response_10": "Fae is numpus. Numpus is sterpus. Fae is sterpus. Sterpus is temperate. Fae is moderate.",
        "answer_token_id_0": 29943,
        "answer_token_pos_0": 380,
        "answer_token_0": "F",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 954,
        "answer_token_pos_1": 383,
        "answer_token_1": "num",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 405,
        "answer_token_pos_2": 387,
        "answer_token_2": "N",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 16864,
        "answer_token_pos_3": 391,
        "answer_token_3": "ster",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 383,
        "answer_token_pos_4": 395,
        "answer_token_4": "F",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 16864,
        "answer_token_pos_5": 398,
        "answer_token_5": "ster",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 28588,
        "answer_token_pos_6": 402,
        "answer_token_6": "Ster",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 6238,
        "answer_token_pos_7": 406,
        "answer_token_7": "temper",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 383,
        "answer_token_pos_8": 410,
        "answer_token_8": "F",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 6238,
        "answer_token_pos_9": 413,
        "answer_token_9": "temper",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Vumpuses are aggressive. Numpus is vumpus. Sally is numpus.",
        "query": "True or false: Sally is aggressive.",
        "answer": "Sally is numpus. Numpus is vumpus. Sally is vumpus. Vumpuses are aggressive. Sally is aggressive. True",
        "label": "True",
        "prompt": "Vumpuses are aggressive. Numpus is vumpus. Sally is numpus. True or false: Sally is aggressive. Let us think step by step.",
        "generated": "Sally is numpus. Numpus is vumpus. Sally is vumpus. Vumpuses are aggressive. Sally is aggressive. True",
        "noise_response_0": "",
        "noise_prompt_0": "Vumpuses are aggressive. Numpus is vumpus. Sally is numpus. True or false: Sam is aggressive. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Sally is",
        "noise_prompt_1": "Vumpuses are aggressive. Numpus is vumpus. Sally is dumpus. True or false: Sally is aggressive. Let us think step by step.",
        "response_1": "Sally is",
        "noise_response_2": "Sally is numpus.",
        "noise_prompt_2": "Vumpuses are aggressive. Rompus is vumpus. Sally is numpus. True or false: Sally is aggressive. Let us think step by step.",
        "response_2": "Sally is numpus.",
        "noise_response_3": "Sally is numpus. Numpus is",
        "noise_prompt_3": "Vumpuses are aggressive. Numpus is gorpus. Sally is numpus. True or false: Sally is aggressive. Let us think step by step.",
        "response_3": "Sally is numpus. Numpus is",
        "noise_response_4": "Rex is numpus. Numpus is vumpus.",
        "noise_prompt_4": "Vumpuses are aggressive. Numpus is vumpus. Sally is numpus. True or false: Sally is aggressive. Let us think step by step.",
        "response_4": "Sally is numpus. Numpus is vumpus.",
        "noise_response_5": "Sally is numpus. Numpus is Vumpus. Sally is",
        "noise_prompt_5": "Vumpuses are aggressive. Numpus is vumpus. Sally is numpus. True or false: Sally is aggressive. Let us think step by step.",
        "response_5": "Sally is numpus. Numpus is vumpus. Sally is",
        "noise_response_6": "Sally is numpus. Numpus is vumpus. Sally is vumpus.",
        "noise_prompt_6": "Gorpus are aggressive. Numpus is vumpus. Sally is numpus. True or false: Sally is aggressive. Let us think step by step.",
        "response_6": "Sally is numpus. Numpus is vumpus. Sally is vumpus.",
        "noise_response_7": "Sally is numpus. Numpus is vumpus. Sally is vumpus. Vumpuses are",
        "noise_prompt_7": "Vumpuses are aggressive. Numpus is vumpus. Sally is numpus. True or false: Sally is windy. Let us think step by step.",
        "response_7": "Sally is numpus. Numpus is vumpus. Sally is vumpus. Vumpuses are",
        "noise_response_8": "Sally is numpus. Numpus is vumpus. Stella is vumpus. Vumpuses are aggressive.",
        "noise_prompt_8": "Vumpuses are aggressive. Numpus is vumpus. Sally is numpus. True or false: Sally is aggressive. Let us think step by step.",
        "response_8": "Sally is numpus. Numpus is vumpus. Sally is vumpus. Vumpuses are aggressive.",
        "noise_response_9": "Sally is numpus. Numpus is vumpus. Sally is vumpus. Vumpuses are mean. Sally is",
        "noise_prompt_9": "Vumpuses are aggressive. Numpus is vumpus. Sally is numpus. True or false: Sally is aggressive. Let us think step by step.",
        "response_9": "Sally is numpus. Numpus is vumpus. Sally is vumpus. Vumpuses are aggressive. Sally is",
        "noise_prompt_10": "Vumpuses are aggressive. Numpus is vumpus. Sally is numpus. True or false: Sally is aggressive. Let us think step by step.",
        "response_10": "Sally is numpus. Numpus is vumpus. Sally is vumpus. Vumpuses are aggressive. Sally is aggressive.",
        "noise_response_10": "Sally is numpus. Numpus is vumpus. Sally is vumpus. Vumpuses are aggressive. Sally is sour.",
        "answer_token_id_0": 29903,
        "answer_token_pos_0": 380,
        "answer_token_0": "S",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 954,
        "answer_token_pos_1": 383,
        "answer_token_1": "num",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 405,
        "answer_token_pos_2": 387,
        "answer_token_2": "N",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 325,
        "answer_token_pos_3": 391,
        "answer_token_3": "v",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 317,
        "answer_token_pos_4": 395,
        "answer_token_4": "S",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 325,
        "answer_token_pos_5": 398,
        "answer_token_5": "v",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 478,
        "answer_token_pos_6": 402,
        "answer_token_6": "V",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 946,
        "answer_token_pos_7": 406,
        "answer_token_7": "ag",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 317,
        "answer_token_pos_8": 410,
        "answer_token_8": "S",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 946,
        "answer_token_pos_9": 413,
        "answer_token_9": "ag",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Shumpuses are liquid. Brimpuses are shumpuses. Stella is brimpus.",
        "query": "True or false: Stella is liquid.",
        "answer": "Stella is brimpus. Brimpuses are shumpuses. Stella is shumpus. Shumpuses are liquid. Stella is liquid. True",
        "label": "True",
        "prompt": "Shumpuses are liquid. Brimpuses are shumpuses. Stella is brimpus. True or false: Stella is liquid. Let us think step by step.",
        "generated": "Stella is brimpus. Brimpuses are shumpuses. Stella is shumpus. Shumpuses are liquid. Stella is liquid. True",
        "noise_response_0": "",
        "noise_prompt_0": "Shumpuses are liquid. Brimpuses are shumpuses. Stella is brimpus. True or false: Max is liquid. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Stella is",
        "noise_prompt_1": "Shumpuses are liquid. Brimpuses are shumpuses. Stella is sweet. True or false: Stella is liquid. Let us think step by step.",
        "response_1": "Stella is",
        "noise_response_2": "Stella is brimpus.",
        "noise_prompt_2": "Shumpuses are liquid. Zumpus are shumpuses. Stella is brimpus. True or false: Stella is liquid. Let us think step by step.",
        "response_2": "Stella is brimpus.",
        "noise_response_3": "Stella is brimpus. Brimpuses are",
        "noise_prompt_3": "Shumpuses are liquid. Brimpuses are blue. Stella is brimpus. True or false: Stella is liquid. Let us think step by step.",
        "response_3": "Stella is brimpus. Brimpuses are",
        "noise_response_4": "Alex is brimpus. Brimpuses are shumpuses.",
        "noise_prompt_4": "Shumpuses are liquid. Brimpuses are shumpuses. Stella is brimpus. True or false: Stella is liquid. Let us think step by step.",
        "response_4": "Stella is brimpus. Brimpuses are shumpuses.",
        "noise_response_5": "Stella is brimpus. Brimpuses are cold. Stella is",
        "noise_prompt_5": "Shumpuses are liquid. Brimpuses are shumpuses. Stella is brimpus. True or false: Stella is liquid. Let us think step by step.",
        "response_5": "Stella is brimpus. Brimpuses are shumpuses. Stella is",
        "noise_response_6": "Stella is brimpus. Brimpuses are shumpuses. Stella is shumpus.",
        "noise_prompt_6": "yumpus are liquid. Brimpuses are shumpuses. Stella is brimpus. True or false: Stella is liquid. Let us think step by step.",
        "response_6": "Stella is brimpus. Brimpuses are shumpuses. Stella is shumpus.",
        "noise_response_7": "Stella is brimpus. Brimpuses are shumpuses. Stella is shumpus. Shumpuses are",
        "noise_prompt_7": "Shumpuses are liquid. Brimpuses are shumpuses. Stella is brimpus. True or false: Stella is rainy. Let us think step by step.",
        "response_7": "Stella is brimpus. Brimpuses are shumpuses. Stella is shumpus. Shumpuses are",
        "noise_response_8": "Stella is brimpus. Brimpuses are shumpuses. Fae is shumpus. Shumpuses are liquid.",
        "noise_prompt_8": "Shumpuses are liquid. Brimpuses are shumpuses. Stella is brimpus. True or false: Stella is liquid. Let us think step by step.",
        "response_8": "Stella is brimpus. Brimpuses are shumpuses. Stella is shumpus. Shumpuses are liquid.",
        "noise_response_9": "Stella is brimpus. Brimpuses are shumpuses. Stella is shumpus. Shumpuses are wooden. Stella is",
        "noise_prompt_9": "Shumpuses are liquid. Brimpuses are shumpuses. Stella is brimpus. True or false: Stella is liquid. Let us think step by step.",
        "response_9": "Stella is brimpus. Brimpuses are shumpuses. Stella is shumpus. Shumpuses are liquid. Stella is",
        "noise_prompt_10": "Shumpuses are liquid. Brimpuses are shumpuses. Stella is brimpus. True or false: Stella is liquid. Let us think step by step.",
        "response_10": "Stella is brimpus. Brimpuses are shumpuses. Stella is shumpus. Shumpuses are liquid. Stella is liquid.",
        "noise_response_10": "Stella is brimpus. Brimpuses are shumpuses. Stella is shumpus. Shumpuses are liquid. Stella is discordant.",
        "answer_token_id_0": 855,
        "answer_token_pos_0": 380,
        "answer_token_0": "St",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 1506,
        "answer_token_pos_1": 383,
        "answer_token_1": "br",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 1771,
        "answer_token_pos_2": 387,
        "answer_token_2": "Br",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 528,
        "answer_token_pos_3": 391,
        "answer_token_3": "sh",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 624,
        "answer_token_pos_4": 395,
        "answer_token_4": "St",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 528,
        "answer_token_pos_5": 398,
        "answer_token_5": "sh",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 1383,
        "answer_token_pos_6": 402,
        "answer_token_6": "Sh",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 23904,
        "answer_token_pos_7": 406,
        "answer_token_7": "liquid",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 624,
        "answer_token_pos_8": 410,
        "answer_token_8": "St",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 23904,
        "answer_token_pos_9": 413,
        "answer_token_9": "liquid",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Tumpus is feisty. Impus is tumpus. Alex is impus.",
        "query": "True or false: Alex is feisty.",
        "answer": "Alex is impus. Impus is tumpus. Alex is tumpus. Tumpus is feisty. Alex is feisty. True",
        "label": "True",
        "prompt": "Tumpus is feisty. Impus is tumpus. Alex is impus. True or false: Alex is feisty. Let us think step by step.",
        "generated": "Alex is impus. Impus is tumpus. Alex is tumpus. Tumpus is feisty. Alex is feisty. True",
        "noise_response_0": "",
        "noise_prompt_0": "Tumpus is feisty. Impus is tumpus. Alex is impus. True or false: Wren is feisty. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Alex is",
        "noise_prompt_1": "Tumpus is feisty. Impus is tumpus. Alex is Zumpus. True or false: Alex is feisty. Let us think step by step.",
        "response_1": "Alex is",
        "noise_response_2": "Alex is impus.",
        "noise_prompt_2": "Tumpus is feisty. wumpus is tumpus. Alex is impus. True or false: Alex is feisty. Let us think step by step.",
        "response_2": "Alex is impus.",
        "noise_response_3": "Alex is impus. Impus is",
        "noise_prompt_3": "Tumpus is feisty. Impus is muffled. Alex is impus. True or false: Alex is feisty. Let us think step by step.",
        "response_3": "Alex is impus. Impus is",
        "noise_response_4": "Wren is impus. Impus is tumpus.",
        "noise_prompt_4": "Tumpus is feisty. Impus is tumpus. Alex is impus. True or false: Alex is feisty. Let us think step by step.",
        "response_4": "Alex is impus. Impus is tumpus.",
        "noise_response_5": "Alex is impus. Impus is luminous. Alex is",
        "noise_prompt_5": "Tumpus is feisty. Impus is tumpus. Alex is impus. True or false: Alex is feisty. Let us think step by step.",
        "response_5": "Alex is impus. Impus is tumpus. Alex is",
        "noise_response_6": "Alex is impus. Impus is tumpus. Alex is tumpus.",
        "noise_prompt_6": "Sterpus is feisty. Impus is tumpus. Alex is impus. True or false: Alex is feisty. Let us think step by step.",
        "response_6": "Alex is impus. Impus is tumpus. Alex is tumpus.",
        "noise_response_7": "Alex is impus. Impus is tumpus. Alex is tumpus. Tumpus is",
        "noise_prompt_7": "Tumpus is feisty. Impus is tumpus. Alex is impus. True or false: Alex is snowy. Let us think step by step.",
        "response_7": "Alex is impus. Impus is tumpus. Alex is tumpus. Tumpus is",
        "noise_response_8": "Alex is impus. Impus is tumpus. Wren is tumpus. Tumpus is feisty.",
        "noise_prompt_8": "Tumpus is feisty. Impus is tumpus. Alex is impus. True or false: Alex is feisty. Let us think step by step.",
        "response_8": "Alex is impus. Impus is tumpus. Alex is tumpus. Tumpus is feisty.",
        "noise_response_9": "Alex is impus. Impus is tumpus. Alex is tumpus. Tumpus is floral. Alex is",
        "noise_prompt_9": "Tumpus is feisty. Impus is tumpus. Alex is impus. True or false: Alex is feisty. Let us think step by step.",
        "response_9": "Alex is impus. Impus is tumpus. Alex is tumpus. Tumpus is feisty. Alex is",
        "noise_prompt_10": "Tumpus is feisty. Impus is tumpus. Alex is impus. True or false: Alex is feisty. Let us think step by step.",
        "response_10": "Alex is impus. Impus is tumpus. Alex is tumpus. Tumpus is feisty. Alex is feisty.",
        "noise_response_10": "Alex is impus. Impus is tumpus. Alex is tumpus. Tumpus is feisty. Alex is hot.",
        "answer_token_id_0": 17406,
        "answer_token_pos_0": 380,
        "answer_token_0": "Alex",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 2411,
        "answer_token_pos_1": 383,
        "answer_token_1": "imp",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 14305,
        "answer_token_pos_2": 387,
        "answer_token_2": "Imp",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 260,
        "answer_token_pos_3": 391,
        "answer_token_3": "t",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 4827,
        "answer_token_pos_4": 395,
        "answer_token_4": "Alex",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 260,
        "answer_token_pos_5": 398,
        "answer_token_5": "t",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 323,
        "answer_token_pos_6": 402,
        "answer_token_6": "T",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 1238,
        "answer_token_pos_7": 406,
        "answer_token_7": "fe",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 4827,
        "answer_token_pos_8": 410,
        "answer_token_8": "Alex",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 1238,
        "answer_token_pos_9": 413,
        "answer_token_9": "fe",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Dumpus is fast. Rompus is dumpus. Max is rompus.",
        "query": "True or false: Max is fast.",
        "answer": "Max is rompus. Rompus is dumpus. Max is dumpus. Dumpus is fast. Max is fast. True",
        "label": "True",
        "prompt": "Dumpus is fast. Rompus is dumpus. Max is rompus. True or false: Max is fast. Let us think step by step.",
        "generated": "Max is rompus. Rompus is dumpus. Max is dumpus. Dumpus is fast. Max is fast. True",
        "noise_response_0": "",
        "noise_prompt_0": "Dumpus is fast. Rompus is dumpus. Max is rompus. True or false: Rex is fast. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Max is",
        "noise_prompt_1": "Dumpus is fast. Rompus is dumpus. Max is rompus. True or false: Max is fast. Let us think step by step.",
        "response_1": "Max is",
        "noise_response_2": "Max is rompus.",
        "noise_prompt_2": "Dumpus is fast. jompus is dumpus. Max is rompus. True or false: Max is fast. Let us think step by step.",
        "response_2": "Max is rompus.",
        "noise_response_3": "Max is rompus. Rompus is",
        "noise_prompt_3": "Dumpus is fast. Rompus is grimpus. Max is rompus. True or false: Max is fast. Let us think step by step.",
        "response_3": "Max is rompus. Rompus is",
        "noise_response_4": "Fae is rompus. Rompus is dumpus.",
        "noise_prompt_4": "Dumpus is fast. Rompus is dumpus. Max is rompus. True or false: Max is fast. Let us think step by step.",
        "response_4": "Max is rompus. Rompus is dumpus.",
        "noise_response_5": "Max is rompus. Rompus is yumpus. Max is",
        "noise_prompt_5": "Dumpus is fast. Rompus is dumpus. Max is rompus. True or false: Max is fast. Let us think step by step.",
        "response_5": "Max is rompus. Rompus is dumpus. Max is",
        "noise_response_6": "Max is rompus. Rompus is dumpus. Max is dumpus.",
        "noise_prompt_6": "Rompus is fast. Rompus is dumpus. Max is rompus. True or false: Max is fast. Let us think step by step.",
        "response_6": "Max is rompus. Rompus is dumpus. Max is dumpus.",
        "noise_response_7": "Max is rompus. Rompus is dumpus. Max is dumpus. Dumpus is",
        "noise_prompt_7": "Dumpus is fast. Rompus is dumpus. Max is rompus. True or false: Max is fast. Let us think step by step.",
        "response_7": "Max is rompus. Rompus is dumpus. Max is dumpus. Dumpus is",
        "noise_response_8": "Max is rompus. Rompus is dumpus. Rex is dumpus. Dumpus is fast.",
        "noise_prompt_8": "Dumpus is fast. Rompus is dumpus. Max is rompus. True or false: Max is fast. Let us think step by step.",
        "response_8": "Max is rompus. Rompus is dumpus. Max is dumpus. Dumpus is fast.",
        "noise_response_9": "Max is rompus. Rompus is dumpus. Max is dumpus. Dumpus is brown. Max is",
        "noise_prompt_9": "Dumpus is fast. Rompus is dumpus. Max is rompus. True or false: Max is fast. Let us think step by step.",
        "response_9": "Max is rompus. Rompus is dumpus. Max is dumpus. Dumpus is fast. Max is",
        "noise_prompt_10": "Dumpus is fast. Rompus is dumpus. Max is rompus. True or false: Max is fast. Let us think step by step.",
        "response_10": "Max is rompus. Rompus is dumpus. Max is dumpus. Dumpus is fast. Max is fast.",
        "noise_response_10": "Max is rompus. Rompus is dumpus. Max is dumpus. Dumpus is fast. Max is luminous.",
        "answer_token_id_0": 7976,
        "answer_token_pos_0": 380,
        "answer_token_0": "Max",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 16766,
        "answer_token_pos_1": 383,
        "answer_token_1": "dump",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 6033,
        "answer_token_pos_2": 387,
        "answer_token_2": "Rom",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 16766,
        "answer_token_pos_3": 391,
        "answer_token_3": "dump",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 5918,
        "answer_token_pos_4": 395,
        "answer_token_4": "Max",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 16766,
        "answer_token_pos_5": 398,
        "answer_token_5": "dump",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 360,
        "answer_token_pos_6": 402,
        "answer_token_6": "D",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 5172,
        "answer_token_pos_7": 406,
        "answer_token_7": "fast",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 5918,
        "answer_token_pos_8": 410,
        "answer_token_8": "Max",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 5172,
        "answer_token_pos_9": 413,
        "answer_token_9": "fast",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Grimpus is windy. Tumpus is grimpus. Max is tumpus.",
        "query": "True or false: Max is windy.",
        "answer": "Max is tumpus. Tumpus is grimpus. Max is grimpus. Grimpus is windy. Max is windy. True",
        "label": "True",
        "prompt": "Grimpus is windy. Tumpus is grimpus. Max is tumpus. True or false: Max is windy. Let us think step by step.",
        "generated": "Max is tumpus. Tumpus is grimpus. Max is grimpus. Grimpus is windy. Max is windy. True",
        "noise_response_0": "",
        "noise_prompt_0": "Grimpus is windy. Tumpus is grimpus. Max is tumpus. True or false: Alex is windy. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Max is",
        "noise_prompt_1": "Grimpus is windy. Tumpus is grimpus. Max is dull. True or false: Max is windy. Let us think step by step.",
        "response_1": "Max is",
        "noise_response_2": "Max is tumpus.",
        "noise_prompt_2": "Grimpus is windy. yumpus is grimpus. Max is tumpus. True or false: Max is windy. Let us think step by step.",
        "response_2": "Max is tumpus.",
        "noise_response_3": "Max is tumpus. Tumpus is",
        "noise_prompt_3": "Grimpus is windy. Tumpus is Shumpus. Max is tumpus. True or false: Max is windy. Let us think step by step.",
        "response_3": "Max is tumpus. Tumpus is",
        "noise_response_4": "Polly is tumpus. Tumpus is grimpus.",
        "noise_prompt_4": "Grimpus is windy. Tumpus is grimpus. Max is tumpus. True or false: Max is windy. Let us think step by step.",
        "response_4": "Max is tumpus. Tumpus is grimpus.",
        "noise_response_5": "Max is tumpus. Tumpus is grimpus. Max is",
        "noise_prompt_5": "Grimpus is windy. Tumpus is rompus. Max is tumpus. True or false: Max is windy. Let us think step by step.",
        "response_5": "Max is tumpus. Tumpus is grimpus. Max is",
        "noise_response_6": "Max is tumpus. Tumpus is grimpus. Max is grimpus.",
        "noise_prompt_6": "rompus is windy. Tumpus is grimpus. Max is tumpus. True or false: Max is windy. Let us think step by step.",
        "response_6": "Max is tumpus. Tumpus is grimpus. Max is grimpus.",
        "noise_response_7": "Max is tumpus. Tumpus is grimpus. Max is grimpus. Grimpus is",
        "noise_prompt_7": "Grimpus is windy. Tumpus is grimpus. Max is tumpus. True or false: Max is feisty. Let us think step by step.",
        "response_7": "Max is tumpus. Tumpus is grimpus. Max is grimpus. Grimpus is",
        "noise_response_8": "Max is tumpus. Tumpus is grimpus. Rex is grimpus. Grimpus is windy.",
        "noise_prompt_8": "Grimpus is windy. Tumpus is grimpus. Max is tumpus. True or false: Max is windy. Let us think step by step.",
        "response_8": "Max is tumpus. Tumpus is grimpus. Max is grimpus. Grimpus is windy.",
        "noise_response_9": "Max is tumpus. Tumpus is grimpus. Max is grimpus. Grimpus is brown. Max is",
        "noise_prompt_9": "Grimpus is windy. Tumpus is grimpus. Max is tumpus. True or false: Max is windy. Let us think step by step.",
        "response_9": "Max is tumpus. Tumpus is grimpus. Max is grimpus. Grimpus is windy. Max is",
        "noise_prompt_10": "Grimpus is windy. Tumpus is grimpus. Max is tumpus. True or false: Max is windy. Let us think step by step.",
        "response_10": "Max is tumpus. Tumpus is grimpus. Max is grimpus. Grimpus is windy. Max is windy.",
        "noise_response_10": "Max is tumpus. Tumpus is grimpus. Max is grimpus. Grimpus is windy. Max is bright.",
        "answer_token_id_0": 7976,
        "answer_token_pos_0": 380,
        "answer_token_0": "Max",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 260,
        "answer_token_pos_1": 383,
        "answer_token_1": "t",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 323,
        "answer_token_pos_2": 387,
        "answer_token_2": "T",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 867,
        "answer_token_pos_3": 391,
        "answer_token_3": "gr",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 5918,
        "answer_token_pos_4": 395,
        "answer_token_4": "Max",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 867,
        "answer_token_pos_5": 398,
        "answer_token_5": "gr",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 1632,
        "answer_token_pos_6": 402,
        "answer_token_6": "Gr",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 8805,
        "answer_token_pos_7": 406,
        "answer_token_7": "wind",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 5918,
        "answer_token_pos_8": 410,
        "answer_token_8": "Max",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 8805,
        "answer_token_pos_9": 413,
        "answer_token_9": "wind",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Jompuses are kind. Shumpus is jompus. Sam is shumpus.",
        "query": "True or false: Sam is kind.",
        "answer": "Sam is shumpus. Shumpus is jompus. Sam is jompus. Jompuses are kind. Sam is kind. True",
        "label": "True",
        "prompt": "Jompuses are kind. Shumpus is jompus. Sam is shumpus. True or false: Sam is kind. Let us think step by step.",
        "generated": "Sam is shumpus. Shumpus is jompus. Sam is jompus. Jompuses are kind. Sam is kind. True",
        "noise_response_0": "",
        "noise_prompt_0": "Jompuses are kind. Shumpus is jompus. Sam is shumpus. True or false: Wren is kind. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Sam is",
        "noise_prompt_1": "Jompuses are kind. Shumpus is jompus. Sam is small. True or false: Sam is kind. Let us think step by step.",
        "response_1": "Sam is",
        "noise_response_2": "Sam is shumpus.",
        "noise_prompt_2": "Jompuses are kind. Brimpus is jompus. Sam is shumpus. True or false: Sam is kind. Let us think step by step.",
        "response_2": "Sam is shumpus.",
        "noise_response_3": "Sam is shumpus. Shumpus is",
        "noise_prompt_3": "Jompuses are kind. Shumpus is Vumpus. Sam is shumpus. True or false: Sam is kind. Let us think step by step.",
        "response_3": "Sam is shumpus. Shumpus is",
        "noise_response_4": "Rex is shumpus. Shumpus is jompus.",
        "noise_prompt_4": "Jompuses are kind. Shumpus is jompus. Sam is shumpus. True or false: Sam is kind. Let us think step by step.",
        "response_4": "Sam is shumpus. Shumpus is jompus.",
        "noise_response_5": "Sam is shumpus. Shumpus is Shumpus. Sam is",
        "noise_prompt_5": "Jompuses are kind. Shumpus is jompus. Sam is shumpus. True or false: Sam is kind. Let us think step by step.",
        "response_5": "Sam is shumpus. Shumpus is jompus. Sam is",
        "noise_response_6": "Sam is shumpus. Shumpus is jompus. Sam is jompus.",
        "noise_prompt_6": "wumpus are kind. Shumpus is jompus. Sam is shumpus. True or false: Sam is kind. Let us think step by step.",
        "response_6": "Sam is shumpus. Shumpus is jompus. Sam is jompus.",
        "noise_response_7": "Sam is shumpus. Shumpus is jompus. Sam is jompus. Jompuses are",
        "noise_prompt_7": "Jompuses are kind. Shumpus is jompus. Sam is shumpus. True or false: Sam is floral. Let us think step by step.",
        "response_7": "Sam is shumpus. Shumpus is jompus. Sam is jompus. Jompuses are",
        "noise_response_8": "Sam is shumpus. Shumpus is jompus. Wren is jompus. Jompuses are kind.",
        "noise_prompt_8": "Jompuses are kind. Shumpus is jompus. Sam is shumpus. True or false: Sam is kind. Let us think step by step.",
        "response_8": "Sam is shumpus. Shumpus is jompus. Sam is jompus. Jompuses are kind.",
        "noise_response_9": "Sam is shumpus. Shumpus is jompus. Sam is jompus. Jompuses are dull. Sam is",
        "noise_prompt_9": "Jompuses are kind. Shumpus is jompus. Sam is shumpus. True or false: Sam is kind. Let us think step by step.",
        "response_9": "Sam is shumpus. Shumpus is jompus. Sam is jompus. Jompuses are kind. Sam is",
        "noise_prompt_10": "Jompuses are kind. Shumpus is jompus. Sam is shumpus. True or false: Sam is kind. Let us think step by step.",
        "response_10": "Sam is shumpus. Shumpus is jompus. Sam is jompus. Jompuses are kind. Sam is kind.",
        "noise_response_10": "Sam is shumpus. Shumpus is jompus. Sam is jompus. Jompuses are kind. Sam is blue.",
        "answer_token_id_0": 22966,
        "answer_token_pos_0": 380,
        "answer_token_0": "Sam",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 528,
        "answer_token_pos_1": 383,
        "answer_token_1": "sh",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 1383,
        "answer_token_pos_2": 387,
        "answer_token_2": "Sh",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 432,
        "answer_token_pos_3": 391,
        "answer_token_3": "j",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 3685,
        "answer_token_pos_4": 395,
        "answer_token_4": "Sam",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 432,
        "answer_token_pos_5": 398,
        "answer_token_5": "j",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 435,
        "answer_token_pos_6": 402,
        "answer_token_6": "J",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 2924,
        "answer_token_pos_7": 406,
        "answer_token_7": "kind",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 3685,
        "answer_token_pos_8": 410,
        "answer_token_8": "Sam",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 2924,
        "answer_token_pos_9": 413,
        "answer_token_9": "kind",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Jompuses are overcast. Wumpus is jompus. Polly is wumpus.",
        "query": "True or false: Polly is muffled.",
        "answer": "Polly is wumpus. Wumpus is jompus. Polly is jompus. Jompuses are overcast. Polly is overcast. False",
        "label": "False",
        "prompt": "Jompuses are overcast. Wumpus is jompus. Polly is wumpus. True or false: Polly is muffled. Let us think step by step.",
        "generated": "Polly is wumpus. Wumpus is jompus. Polly is jompus. Jompuses are overcast. Polly is overcast. False",
        "noise_response_0": "",
        "noise_prompt_0": "Jompuses are overcast. Wumpus is jompus. Polly is wumpus. True or false: Max is muffled. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Polly is",
        "noise_prompt_1": "Jompuses are overcast. Wumpus is jompus. Polly is blue. True or false: Polly is muffled. Let us think step by step.",
        "response_1": "Polly is",
        "noise_response_2": "Polly is wumpus.",
        "noise_prompt_2": "Jompuses are overcast. Wren is jompus. Polly is wumpus. True or false: Polly is muffled. Let us think step by step.",
        "response_2": "Polly is wumpus.",
        "noise_response_3": "Polly is wumpus. Wumpus is",
        "noise_prompt_3": "Jompuses are overcast. Wumpus is gorpus. Polly is wumpus. True or false: Polly is muffled. Let us think step by step.",
        "response_3": "Polly is wumpus. Wumpus is",
        "noise_response_4": "Alex is wumpus. Wumpus is jompus.",
        "noise_prompt_4": "Jompuses are overcast. Wumpus is jompus. Polly is wumpus. True or false: Polly is muffled. Let us think step by step.",
        "response_4": "Polly is wumpus. Wumpus is jompus.",
        "noise_response_5": "Polly is wumpus. Wumpus is tumpus. Polly is",
        "noise_prompt_5": "Jompuses are overcast. Wumpus is jompus. Polly is wumpus. True or false: Polly is muffled. Let us think step by step.",
        "response_5": "Polly is wumpus. Wumpus is jompus. Polly is",
        "noise_response_6": "Polly is wumpus. Wumpus is jompus. Polly is jompus.",
        "noise_prompt_6": "grimpus are overcast. Wumpus is jompus. Polly is wumpus. True or false: Polly is muffled. Let us think step by step.",
        "response_6": "Polly is wumpus. Wumpus is jompus. Polly is jompus.",
        "noise_response_7": "Polly is wumpus. Wumpus is jompus. Polly is jompus. Jompuses are",
        "noise_prompt_7": "Jompuses are snowy. Wumpus is jompus. Polly is wumpus. True or false: Polly is muffled. Let us think step by step.",
        "response_7": "Polly is wumpus. Wumpus is jompus. Polly is jompus. Jompuses are",
        "noise_response_8": "Polly is wumpus. Wumpus is jompus. Fae is jompus. Jompuses are overcast.",
        "noise_prompt_8": "Jompuses are overcast. Wumpus is jompus. Polly is wumpus. True or false: Polly is muffled. Let us think step by step.",
        "response_8": "Polly is wumpus. Wumpus is jompus. Polly is jompus. Jompuses are overcast.",
        "noise_response_9": "Polly is wumpus. Wumpus is jompus. Polly is jompus. Jompuses are aggressive. Polly is",
        "noise_prompt_9": "Jompuses are overcast. Wumpus is jompus. Polly is wumpus. True or false: Polly is muffled. Let us think step by step.",
        "response_9": "Polly is wumpus. Wumpus is jompus. Polly is jompus. Jompuses are overcast. Polly is",
        "noise_prompt_10": "Jompuses are overcast. Wumpus is jompus. Polly is wumpus. True or false: Polly is muffled. Let us think step by step.",
        "response_10": "Polly is wumpus. Wumpus is jompus. Polly is jompus. Jompuses are overcast. Polly is overcast.",
        "noise_response_10": "Polly is wumpus. Wumpus is jompus. Polly is jompus. Jompuses are overcast. Polly is moderate.",
        "answer_token_id_0": 7713,
        "answer_token_pos_0": 380,
        "answer_token_0": "Pol",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 281,
        "answer_token_pos_1": 383,
        "answer_token_1": "w",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 399,
        "answer_token_pos_2": 387,
        "answer_token_2": "W",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 432,
        "answer_token_pos_3": 391,
        "answer_token_3": "j",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 2043,
        "answer_token_pos_4": 395,
        "answer_token_4": "Pol",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 432,
        "answer_token_pos_5": 398,
        "answer_token_5": "j",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 435,
        "answer_token_pos_6": 402,
        "answer_token_6": "J",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 975,
        "answer_token_pos_7": 406,
        "answer_token_7": "over",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 2043,
        "answer_token_pos_8": 410,
        "answer_token_8": "Pol",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 975,
        "answer_token_pos_9": 413,
        "answer_token_9": "over",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Brimpuses are cold. Lempuses are brimpuses. Alex is lempus.",
        "query": "True or false: Alex is sour.",
        "answer": "Alex is lempus. Lempuses are brimpuses. Alex is brimpus. Brimpuses are cold. Alex is cold. False",
        "label": "False",
        "prompt": "Brimpuses are cold. Lempuses are brimpuses. Alex is lempus. True or false: Alex is sour. Let us think step by step.",
        "generated": "Alex is lempus. Lempuses are brimpuses. Alex is brimpus. Brimpuses are cold. Alex is cold. False",
        "noise_response_0": "",
        "noise_prompt_0": "Brimpuses are cold. Lempuses are brimpuses. Alex is lempus. True or false: Sam is sour. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Alex is",
        "noise_prompt_1": "Brimpuses are cold. Lempuses are brimpuses. Alex is Vumpus. True or false: Alex is sour. Let us think step by step.",
        "response_1": "Alex is",
        "noise_response_2": "Alex is lempus.",
        "noise_prompt_2": "Brimpuses are cold. impus are brimpuses. Alex is lempus. True or false: Alex is sour. Let us think step by step.",
        "response_2": "Alex is lempus.",
        "noise_response_3": "Alex is lempus. Lempuses are",
        "noise_prompt_3": "Brimpuses are cold. Lempuses are sweet. Alex is lempus. True or false: Alex is sour. Let us think step by step.",
        "response_3": "Alex is lempus. Lempuses are",
        "noise_response_4": "Polly is lempus. Lempuses are brimpuses.",
        "noise_prompt_4": "Brimpuses are cold. Lempuses are brimpuses. Alex is lempus. True or false: Alex is sour. Let us think step by step.",
        "response_4": "Alex is lempus. Lempuses are brimpuses.",
        "noise_response_5": "Alex is lempus. Lempuses are luminous. Alex is",
        "noise_prompt_5": "Brimpuses are cold. Lempuses are brimpuses. Alex is lempus. True or false: Alex is sour. Let us think step by step.",
        "response_5": "Alex is lempus. Lempuses are brimpuses. Alex is",
        "noise_response_6": "Alex is lempus. Lempuses are brimpuses. Alex is brimpus.",
        "noise_prompt_6": "lorpus are cold. Lempuses are brimpuses. Alex is lempus. True or false: Alex is sour. Let us think step by step.",
        "response_6": "Alex is lempus. Lempuses are brimpuses. Alex is brimpus.",
        "noise_response_7": "Alex is lempus. Lempuses are brimpuses. Alex is brimpus. Brimpuses are",
        "noise_prompt_7": "Brimpuses are happy. Lempuses are brimpuses. Alex is lempus. True or false: Alex is sour. Let us think step by step.",
        "response_7": "Alex is lempus. Lempuses are brimpuses. Alex is brimpus. Brimpuses are",
        "noise_response_8": "Alex is lempus. Lempuses are brimpuses. Polly is brimpus. Brimpuses are cold.",
        "noise_prompt_8": "Brimpuses are cold. Lempuses are brimpuses. Alex is lempus. True or false: Alex is sour. Let us think step by step.",
        "response_8": "Alex is lempus. Lempuses are brimpuses. Alex is brimpus. Brimpuses are cold.",
        "noise_response_9": "Alex is lempus. Lempuses are brimpuses. Alex is brimpus. Brimpuses are hot. Alex is",
        "noise_prompt_9": "Brimpuses are cold. Lempuses are brimpuses. Alex is lempus. True or false: Alex is sour. Let us think step by step.",
        "response_9": "Alex is lempus. Lempuses are brimpuses. Alex is brimpus. Brimpuses are cold. Alex is",
        "noise_prompt_10": "Brimpuses are cold. Lempuses are brimpuses. Alex is lempus. True or false: Alex is sour. Let us think step by step.",
        "response_10": "Alex is lempus. Lempuses are brimpuses. Alex is brimpus. Brimpuses are cold. Alex is cold.",
        "noise_response_10": "Alex is lempus. Lempuses are brimpuses. Alex is brimpus. Brimpuses are cold. Alex is opaque.",
        "answer_token_id_0": 17406,
        "answer_token_pos_0": 380,
        "answer_token_0": "Alex",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 454,
        "answer_token_pos_1": 383,
        "answer_token_1": "le",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 365,
        "answer_token_pos_2": 387,
        "answer_token_2": "L",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 1506,
        "answer_token_pos_3": 391,
        "answer_token_3": "br",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 4827,
        "answer_token_pos_4": 395,
        "answer_token_4": "Alex",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 1506,
        "answer_token_pos_5": 398,
        "answer_token_5": "br",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 1771,
        "answer_token_pos_6": 402,
        "answer_token_6": "Br",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 11220,
        "answer_token_pos_7": 406,
        "answer_token_7": "cold",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 4827,
        "answer_token_pos_8": 410,
        "answer_token_8": "Alex",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 11220,
        "answer_token_pos_9": 413,
        "answer_token_9": "cold",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Grimpuses are temperate. Vumpuses are grimpuses. Fae is vumpus.",
        "query": "True or false: Fae is transparent.",
        "answer": "Fae is vumpus. Vumpuses are grimpuses. Fae is grimpus. Grimpuses are temperate. Fae is temperate. False",
        "label": "False",
        "prompt": "Grimpuses are temperate. Vumpuses are grimpuses. Fae is vumpus. True or false: Fae is transparent. Let us think step by step.",
        "generated": "Fae is vumpus. Vumpuses are grimpuses. Fae is grimpus. Grimpuses are temperate. Fae is temperate. False",
        "noise_response_0": "",
        "noise_prompt_0": "Grimpuses are temperate. Vumpuses are grimpuses. Fae is vumpus. True or false: Alex is transparent. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Fae is",
        "noise_prompt_1": "Grimpuses are temperate. Vumpuses are grimpuses. Fae is Shumpus. True or false: Fae is transparent. Let us think step by step.",
        "response_1": "Fae is",
        "noise_response_2": "Fae is vumpus.",
        "noise_prompt_2": "Grimpuses are temperate. Vumpus are grimpuses. Fae is vumpus. True or false: Fae is transparent. Let us think step by step.",
        "response_2": "Fae is vumpus.",
        "noise_response_3": "Fae is vumpus. Vumpuses are",
        "noise_prompt_3": "Grimpuses are temperate. Vumpuses are zumpus. Fae is vumpus. True or false: Fae is transparent. Let us think step by step.",
        "response_3": "Fae is vumpus. Vumpuses are",
        "noise_response_4": "Sally is vumpus. Vumpuses are grimpuses.",
        "noise_prompt_4": "Grimpuses are temperate. Vumpuses are grimpuses. Fae is vumpus. True or false: Fae is transparent. Let us think step by step.",
        "response_4": "Fae is vumpus. Vumpuses are grimpuses.",
        "noise_response_5": "Fae is vumpus. Vumpuses are grimpus. Fae is",
        "noise_prompt_5": "Grimpuses are temperate. Vumpuses are grimpuses. Fae is vumpus. True or false: Fae is transparent. Let us think step by step.",
        "response_5": "Fae is vumpus. Vumpuses are grimpuses. Fae is",
        "noise_response_6": "Fae is vumpus. Vumpuses are grimpuses. Fae is grimpus.",
        "noise_prompt_6": "Impus are temperate. Vumpuses are grimpuses. Fae is vumpus. True or false: Fae is transparent. Let us think step by step.",
        "response_6": "Fae is vumpus. Vumpuses are grimpuses. Fae is grimpus.",
        "noise_response_7": "Fae is vumpus. Vumpuses are grimpuses. Fae is grimpus. Grimpuses are",
        "noise_prompt_7": "Grimpuses are overcast. Vumpuses are grimpuses. Fae is vumpus. True or false: Fae is transparent. Let us think step by step.",
        "response_7": "Fae is vumpus. Vumpuses are grimpuses. Fae is grimpus. Grimpuses are",
        "noise_response_8": "Fae is vumpus. Vumpuses are grimpuses. Sam is grimpus. Grimpuses are temperate.",
        "noise_prompt_8": "Grimpuses are temperate. Vumpuses are grimpuses. Fae is vumpus. True or false: Fae is transparent. Let us think step by step.",
        "response_8": "Fae is vumpus. Vumpuses are grimpuses. Fae is grimpus. Grimpuses are temperate.",
        "noise_response_9": "Fae is vumpus. Vumpuses are grimpuses. Fae is grimpus. Grimpuses are melodic. Fae is",
        "noise_prompt_9": "Grimpuses are temperate. Vumpuses are grimpuses. Fae is vumpus. True or false: Fae is transparent. Let us think step by step.",
        "response_9": "Fae is vumpus. Vumpuses are grimpuses. Fae is grimpus. Grimpuses are temperate. Fae is",
        "noise_prompt_10": "Grimpuses are temperate. Vumpuses are grimpuses. Fae is vumpus. True or false: Fae is transparent. Let us think step by step.",
        "response_10": "Fae is vumpus. Vumpuses are grimpuses. Fae is grimpus. Grimpuses are temperate. Fae is temperate.",
        "noise_response_10": "Fae is vumpus. Vumpuses are grimpuses. Fae is grimpus. Grimpuses are temperate. Fae is feisty.",
        "answer_token_id_0": 29943,
        "answer_token_pos_0": 380,
        "answer_token_0": "F",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 325,
        "answer_token_pos_1": 383,
        "answer_token_1": "v",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 478,
        "answer_token_pos_2": 387,
        "answer_token_2": "V",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 867,
        "answer_token_pos_3": 391,
        "answer_token_3": "gr",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 383,
        "answer_token_pos_4": 395,
        "answer_token_4": "F",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 867,
        "answer_token_pos_5": 398,
        "answer_token_5": "gr",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 1632,
        "answer_token_pos_6": 402,
        "answer_token_6": "Gr",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 6238,
        "answer_token_pos_7": 406,
        "answer_token_7": "temper",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 383,
        "answer_token_pos_8": 410,
        "answer_token_8": "F",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 6238,
        "answer_token_pos_9": 413,
        "answer_token_9": "temper",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Tumpus is opaque. Vumpuses are tumpuses. Alex is vumpus.",
        "query": "True or false: Alex is opaque.",
        "answer": "Alex is vumpus. Vumpuses are tumpuses. Alex is tumpus. Tumpus is opaque. Alex is opaque. True",
        "label": "True",
        "prompt": "Tumpus is opaque. Vumpuses are tumpuses. Alex is vumpus. True or false: Alex is opaque. Let us think step by step.",
        "generated": "Alex is vumpus. Vumpuses are tumpuses. Alex is tumpus. Tumpus is opaque. Alex is opaque. True",
        "noise_response_0": "",
        "noise_prompt_0": "Tumpus is opaque. Vumpuses are tumpuses. Alex is vumpus. True or false: Fae is opaque. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Alex is",
        "noise_prompt_1": "Tumpus is opaque. Vumpuses are tumpuses. Alex is gorpus. True or false: Alex is opaque. Let us think step by step.",
        "response_1": "Alex is",
        "noise_response_2": "Alex is vumpus.",
        "noise_prompt_2": "Tumpus is opaque. Yumpus are tumpuses. Alex is vumpus. True or false: Alex is opaque. Let us think step by step.",
        "response_2": "Alex is vumpus.",
        "noise_response_3": "Alex is vumpus. Vumpuses are",
        "noise_prompt_3": "Tumpus is opaque. Vumpuses are sweet. Alex is vumpus. True or false: Alex is opaque. Let us think step by step.",
        "response_3": "Alex is vumpus. Vumpuses are",
        "noise_response_4": "Fae is vumpus. Vumpuses are tumpuses.",
        "noise_prompt_4": "Tumpus is opaque. Vumpuses are tumpuses. Alex is vumpus. True or false: Alex is opaque. Let us think step by step.",
        "response_4": "Alex is vumpus. Vumpuses are tumpuses.",
        "noise_response_5": "Alex is vumpus. Vumpuses are metallic. Alex is",
        "noise_prompt_5": "Tumpus is opaque. Vumpuses are tumpuses. Alex is vumpus. True or false: Alex is opaque. Let us think step by step.",
        "response_5": "Alex is vumpus. Vumpuses are tumpuses. Alex is",
        "noise_response_6": "Alex is vumpus. Vumpuses are tumpuses. Alex is tumpus.",
        "noise_prompt_6": "Jompus is opaque. Vumpuses are tumpuses. Alex is vumpus. True or false: Alex is opaque. Let us think step by step.",
        "response_6": "Alex is vumpus. Vumpuses are tumpuses. Alex is tumpus.",
        "noise_response_7": "Alex is vumpus. Vumpuses are tumpuses. Alex is tumpus. Tumpus is",
        "noise_prompt_7": "Tumpus is opaque. Vumpuses are tumpuses. Alex is vumpus. True or false: Alex is metallic. Let us think step by step.",
        "response_7": "Alex is vumpus. Vumpuses are tumpuses. Alex is tumpus. Tumpus is",
        "noise_response_8": "Alex is vumpus. Vumpuses are tumpuses. Rex is tumpus. Tumpus is opaque.",
        "noise_prompt_8": "Tumpus is opaque. Vumpuses are tumpuses. Alex is vumpus. True or false: Alex is opaque. Let us think step by step.",
        "response_8": "Alex is vumpus. Vumpuses are tumpuses. Alex is tumpus. Tumpus is opaque.",
        "noise_response_9": "Alex is vumpus. Vumpuses are tumpuses. Alex is tumpus. Tumpus is cold. Alex is",
        "noise_prompt_9": "Tumpus is opaque. Vumpuses are tumpuses. Alex is vumpus. True or false: Alex is opaque. Let us think step by step.",
        "response_9": "Alex is vumpus. Vumpuses are tumpuses. Alex is tumpus. Tumpus is opaque. Alex is",
        "noise_prompt_10": "Tumpus is opaque. Vumpuses are tumpuses. Alex is vumpus. True or false: Alex is opaque. Let us think step by step.",
        "response_10": "Alex is vumpus. Vumpuses are tumpuses. Alex is tumpus. Tumpus is opaque. Alex is opaque.",
        "noise_response_10": "Alex is vumpus. Vumpuses are tumpuses. Alex is tumpus. Tumpus is opaque. Alex is brown.",
        "answer_token_id_0": 17406,
        "answer_token_pos_0": 380,
        "answer_token_0": "Alex",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 325,
        "answer_token_pos_1": 383,
        "answer_token_1": "v",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 478,
        "answer_token_pos_2": 387,
        "answer_token_2": "V",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 260,
        "answer_token_pos_3": 391,
        "answer_token_3": "t",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 4827,
        "answer_token_pos_4": 395,
        "answer_token_4": "Alex",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 260,
        "answer_token_pos_5": 398,
        "answer_token_5": "t",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 323,
        "answer_token_pos_6": 402,
        "answer_token_6": "T",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 1015,
        "answer_token_pos_7": 406,
        "answer_token_7": "op",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 4827,
        "answer_token_pos_8": 410,
        "answer_token_8": "Alex",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 1015,
        "answer_token_pos_9": 413,
        "answer_token_9": "op",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Wumpuses are sweet. Vumpus is wumpus. Sally is vumpus.",
        "query": "True or false: Sally is sweet.",
        "answer": "Sally is vumpus. Vumpus is wumpus. Sally is wumpus. Wumpuses are sweet. Sally is sweet. True",
        "label": "True",
        "prompt": "Wumpuses are sweet. Vumpus is wumpus. Sally is vumpus. True or false: Sally is sweet. Let us think step by step.",
        "generated": "Sally is vumpus. Vumpus is wumpus. Sally is wumpus. Wumpuses are sweet. Sally is sweet. True",
        "noise_response_0": "",
        "noise_prompt_0": "Wumpuses are sweet. Vumpus is wumpus. Sally is vumpus. True or false: Fae is sweet. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Sally is",
        "noise_prompt_1": "Wumpuses are sweet. Vumpus is wumpus. Sally is impus. True or false: Sally is sweet. Let us think step by step.",
        "response_1": "Sally is",
        "noise_response_2": "Sally is vumpus.",
        "noise_prompt_2": "Wumpuses are sweet. Tumpus is wumpus. Sally is vumpus. True or false: Sally is sweet. Let us think step by step.",
        "response_2": "Sally is vumpus.",
        "noise_response_3": "Sally is vumpus. Vumpus is",
        "noise_prompt_3": "Wumpuses are sweet. Vumpus is melodic. Sally is vumpus. True or false: Sally is sweet. Let us think step by step.",
        "response_3": "Sally is vumpus. Vumpus is",
        "noise_response_4": "Alex is vumpus. Vumpus is wumpus.",
        "noise_prompt_4": "Wumpuses are sweet. Vumpus is wumpus. Sally is vumpus. True or false: Sally is sweet. Let us think step by step.",
        "response_4": "Sally is vumpus. Vumpus is wumpus.",
        "noise_response_5": "Sally is vumpus. Vumpus is mean. Sally is",
        "noise_prompt_5": "Wumpuses are sweet. Vumpus is wumpus. Sally is vumpus. True or false: Sally is sweet. Let us think step by step.",
        "response_5": "Sally is vumpus. Vumpus is wumpus. Sally is",
        "noise_response_6": "Sally is vumpus. Vumpus is wumpus. Sally is wumpus.",
        "noise_prompt_6": "Polly are sweet. Vumpus is wumpus. Sally is vumpus. True or false: Sally is sweet. Let us think step by step.",
        "response_6": "Sally is vumpus. Vumpus is wumpus. Sally is wumpus.",
        "noise_response_7": "Sally is vumpus. Vumpus is wumpus. Sally is wumpus. Wumpuses are",
        "noise_prompt_7": "Wumpuses are sweet. Vumpus is wumpus. Sally is vumpus. True or false: Sally is sour. Let us think step by step.",
        "response_7": "Sally is vumpus. Vumpus is wumpus. Sally is wumpus. Wumpuses are",
        "noise_response_8": "Sally is vumpus. Vumpus is wumpus. Sam is wumpus. Wumpuses are sweet.",
        "noise_prompt_8": "Wumpuses are sweet. Vumpus is wumpus. Sally is vumpus. True or false: Sally is sweet. Let us think step by step.",
        "response_8": "Sally is vumpus. Vumpus is wumpus. Sally is wumpus. Wumpuses are sweet.",
        "noise_response_9": "Sally is vumpus. Vumpus is wumpus. Sally is wumpus. Wumpuses are aggressive. Sally is",
        "noise_prompt_9": "Wumpuses are sweet. Vumpus is wumpus. Sally is vumpus. True or false: Sally is sweet. Let us think step by step.",
        "response_9": "Sally is vumpus. Vumpus is wumpus. Sally is wumpus. Wumpuses are sweet. Sally is",
        "noise_prompt_10": "Wumpuses are sweet. Vumpus is wumpus. Sally is vumpus. True or false: Sally is sweet. Let us think step by step.",
        "response_10": "Sally is vumpus. Vumpus is wumpus. Sally is wumpus. Wumpuses are sweet. Sally is sweet.",
        "noise_response_10": "Sally is vumpus. Vumpus is wumpus. Sally is wumpus. Wumpuses are sweet. Sally is small.",
        "answer_token_id_0": 29903,
        "answer_token_pos_0": 380,
        "answer_token_0": "S",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 325,
        "answer_token_pos_1": 383,
        "answer_token_1": "v",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 478,
        "answer_token_pos_2": 387,
        "answer_token_2": "V",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 281,
        "answer_token_pos_3": 391,
        "answer_token_3": "w",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 317,
        "answer_token_pos_4": 395,
        "answer_token_4": "S",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 281,
        "answer_token_pos_5": 398,
        "answer_token_5": "w",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 399,
        "answer_token_pos_6": 402,
        "answer_token_6": "W",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 14225,
        "answer_token_pos_7": 406,
        "answer_token_7": "sweet",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 317,
        "answer_token_pos_8": 410,
        "answer_token_8": "S",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 14225,
        "answer_token_pos_9": 413,
        "answer_token_9": "sweet",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Lorpuses are moderate. Grimpus is lorpus. Stella is grimpus.",
        "query": "True or false: Stella is moderate.",
        "answer": "Stella is grimpus. Grimpus is lorpus. Stella is lorpus. Lorpuses are moderate. Stella is moderate. True",
        "label": "True",
        "prompt": "Lorpuses are moderate. Grimpus is lorpus. Stella is grimpus. True or false: Stella is moderate. Let us think step by step.",
        "generated": "Stella is grimpus. Grimpus is lorpus. Stella is lorpus. Lorpuses are moderate. Stella is moderate. True",
        "noise_response_0": "",
        "noise_prompt_0": "Lorpuses are moderate. Grimpus is lorpus. Stella is grimpus. True or false: Polly is moderate. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Stella is",
        "noise_prompt_1": "Lorpuses are moderate. Grimpus is lorpus. Stella is numpus. True or false: Stella is moderate. Let us think step by step.",
        "response_1": "Stella is",
        "noise_response_2": "Stella is grimpus.",
        "noise_prompt_2": "Lorpuses are moderate. sterpus is lorpus. Stella is grimpus. True or false: Stella is moderate. Let us think step by step.",
        "response_2": "Stella is grimpus.",
        "noise_response_3": "Stella is grimpus. Grimpus is",
        "noise_prompt_3": "Lorpuses are moderate. Grimpus is feisty. Stella is grimpus. True or false: Stella is moderate. Let us think step by step.",
        "response_3": "Stella is grimpus. Grimpus is",
        "noise_response_4": "Polly is grimpus. Grimpus is lorpus.",
        "noise_prompt_4": "Lorpuses are moderate. Grimpus is lorpus. Stella is grimpus. True or false: Stella is moderate. Let us think step by step.",
        "response_4": "Stella is grimpus. Grimpus is lorpus.",
        "noise_response_5": "Stella is grimpus. Grimpus is moderate. Stella is",
        "noise_prompt_5": "Lorpuses are moderate. Grimpus is lorpus. Stella is grimpus. True or false: Stella is moderate. Let us think step by step.",
        "response_5": "Stella is grimpus. Grimpus is lorpus. Stella is",
        "noise_response_6": "Stella is grimpus. Grimpus is lorpus. Stella is lorpus.",
        "noise_prompt_6": "shumpus are moderate. Grimpus is lorpus. Stella is grimpus. True or false: Stella is moderate. Let us think step by step.",
        "response_6": "Stella is grimpus. Grimpus is lorpus. Stella is lorpus.",
        "noise_response_7": "Stella is grimpus. Grimpus is lorpus. Stella is lorpus. Lorpuses are",
        "noise_prompt_7": "Lorpuses are moderate. Grimpus is lorpus. Stella is grimpus. True or false: Stella is rainy. Let us think step by step.",
        "response_7": "Stella is grimpus. Grimpus is lorpus. Stella is lorpus. Lorpuses are",
        "noise_response_8": "Stella is grimpus. Grimpus is lorpus. Fae is lorpus. Lorpuses are moderate.",
        "noise_prompt_8": "Lorpuses are moderate. Grimpus is lorpus. Stella is grimpus. True or false: Stella is moderate. Let us think step by step.",
        "response_8": "Stella is grimpus. Grimpus is lorpus. Stella is lorpus. Lorpuses are moderate.",
        "noise_response_9": "Stella is grimpus. Grimpus is lorpus. Stella is lorpus. Lorpuses are fast. Stella is",
        "noise_prompt_9": "Lorpuses are moderate. Grimpus is lorpus. Stella is grimpus. True or false: Stella is moderate. Let us think step by step.",
        "response_9": "Stella is grimpus. Grimpus is lorpus. Stella is lorpus. Lorpuses are moderate. Stella is",
        "noise_prompt_10": "Lorpuses are moderate. Grimpus is lorpus. Stella is grimpus. True or false: Stella is moderate. Let us think step by step.",
        "response_10": "Stella is grimpus. Grimpus is lorpus. Stella is lorpus. Lorpuses are moderate. Stella is moderate.",
        "noise_response_10": "Stella is grimpus. Grimpus is lorpus. Stella is lorpus. Lorpuses are moderate. Stella is hot.",
        "answer_token_id_0": 855,
        "answer_token_pos_0": 380,
        "answer_token_0": "St",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 867,
        "answer_token_pos_1": 383,
        "answer_token_1": "gr",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 1632,
        "answer_token_pos_2": 387,
        "answer_token_2": "Gr",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 301,
        "answer_token_pos_3": 391,
        "answer_token_3": "l",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 624,
        "answer_token_pos_4": 395,
        "answer_token_4": "St",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 301,
        "answer_token_pos_5": 398,
        "answer_token_5": "l",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 10980,
        "answer_token_pos_6": 402,
        "answer_token_6": "Lor",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 17768,
        "answer_token_pos_7": 406,
        "answer_token_7": "moder",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 624,
        "answer_token_pos_8": 410,
        "answer_token_8": "St",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 17768,
        "answer_token_pos_9": 413,
        "answer_token_9": "moder",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Gorpuses are shy. Sterpus is gorpus. Max is sterpus.",
        "query": "True or false: Max is shy.",
        "answer": "Max is sterpus. Sterpus is gorpus. Max is gorpus. Gorpuses are shy. Max is shy. True",
        "label": "True",
        "prompt": "Gorpuses are shy. Sterpus is gorpus. Max is sterpus. True or false: Max is shy. Let us think step by step.",
        "generated": "Max is sterpus. Sterpus is gorpus. Max is gorpus. Gorpuses are shy. Max is shy. True",
        "noise_response_0": "",
        "noise_prompt_0": "Gorpuses are shy. Sterpus is gorpus. Max is sterpus. True or false: Polly is shy. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Max is",
        "noise_prompt_1": "Gorpuses are shy. Sterpus is gorpus. Max is numpus. True or false: Max is shy. Let us think step by step.",
        "response_1": "Max is",
        "noise_response_2": "Max is sterpus.",
        "noise_prompt_2": "Gorpuses are shy. gorpus is gorpus. Max is sterpus. True or false: Max is shy. Let us think step by step.",
        "response_2": "Max is sterpus.",
        "noise_response_3": "Max is sterpus. Sterpus is",
        "noise_prompt_3": "Gorpuses are shy. Sterpus is Sterpus. Max is sterpus. True or false: Max is shy. Let us think step by step.",
        "response_3": "Max is sterpus. Sterpus is",
        "noise_response_4": "Sam is sterpus. Sterpus is gorpus.",
        "noise_prompt_4": "Gorpuses are shy. Sterpus is gorpus. Max is sterpus. True or false: Max is shy. Let us think step by step.",
        "response_4": "Max is sterpus. Sterpus is gorpus.",
        "noise_response_5": "Max is sterpus. Sterpus is Rompus. Max is",
        "noise_prompt_5": "Gorpuses are shy. Sterpus is gorpus. Max is sterpus. True or false: Max is shy. Let us think step by step.",
        "response_5": "Max is sterpus. Sterpus is gorpus. Max is",
        "noise_response_6": "Max is sterpus. Sterpus is gorpus. Max is gorpus.",
        "noise_prompt_6": "brimpus are shy. Sterpus is gorpus. Max is sterpus. True or false: Max is shy. Let us think step by step.",
        "response_6": "Max is sterpus. Sterpus is gorpus. Max is gorpus.",
        "noise_response_7": "Max is sterpus. Sterpus is gorpus. Max is gorpus. Gorpuses are",
        "noise_prompt_7": "Gorpuses are shy. Sterpus is gorpus. Max is sterpus. True or false: Max is overcast. Let us think step by step.",
        "response_7": "Max is sterpus. Sterpus is gorpus. Max is gorpus. Gorpuses are",
        "noise_response_8": "Max is sterpus. Sterpus is gorpus. Rex is gorpus. Gorpuses are shy.",
        "noise_prompt_8": "Gorpuses are shy. Sterpus is gorpus. Max is sterpus. True or false: Max is shy. Let us think step by step.",
        "response_8": "Max is sterpus. Sterpus is gorpus. Max is gorpus. Gorpuses are shy.",
        "noise_response_9": "Max is sterpus. Sterpus is gorpus. Max is gorpus. Gorpuses are moderate. Max is",
        "noise_prompt_9": "Gorpuses are shy. Sterpus is gorpus. Max is sterpus. True or false: Max is shy. Let us think step by step.",
        "response_9": "Max is sterpus. Sterpus is gorpus. Max is gorpus. Gorpuses are shy. Max is",
        "noise_prompt_10": "Gorpuses are shy. Sterpus is gorpus. Max is sterpus. True or false: Max is shy. Let us think step by step.",
        "response_10": "Max is sterpus. Sterpus is gorpus. Max is gorpus. Gorpuses are shy. Max is shy.",
        "noise_response_10": "Max is sterpus. Sterpus is gorpus. Max is gorpus. Gorpuses are shy. Max is brown.",
        "answer_token_id_0": 29903,
        "answer_token_pos_0": 380,
        "answer_token_0": "S",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 16864,
        "answer_token_pos_1": 383,
        "answer_token_1": "ster",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 28588,
        "answer_token_pos_2": 387,
        "answer_token_2": "Ster",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 330,
        "answer_token_pos_3": 391,
        "answer_token_3": "g",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 18686,
        "answer_token_pos_4": 395,
        "answer_token_4": "Gor",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 330,
        "answer_token_pos_5": 398,
        "answer_token_5": "g",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 18686,
        "answer_token_pos_6": 402,
        "answer_token_6": "Gor",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 528,
        "answer_token_pos_7": 406,
        "answer_token_7": "sh",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 5918,
        "answer_token_pos_8": 410,
        "answer_token_8": "Max",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 528,
        "answer_token_pos_9": 413,
        "answer_token_9": "sh",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Grimpus is moderate. Shumpuses are grimpuses. Alex is shumpus.",
        "query": "True or false: Alex is moderate.",
        "answer": "Alex is shumpus. Shumpuses are grimpuses. Alex is grimpus. Grimpus is moderate. Alex is moderate. True",
        "label": "True",
        "prompt": "Grimpus is moderate. Shumpuses are grimpuses. Alex is shumpus. True or false: Alex is moderate. Let us think step by step.",
        "generated": "Alex is shumpus. Shumpuses are grimpuses. Alex is grimpus. Grimpus is moderate. Alex is moderate. True",
        "noise_response_0": "",
        "noise_prompt_0": "Grimpus is moderate. Shumpuses are grimpuses. Alex is shumpus. True or false: Sally is moderate. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Alex is",
        "noise_prompt_1": "Grimpus is moderate. Shumpuses are grimpuses. Alex is rainy. True or false: Alex is moderate. Let us think step by step.",
        "response_1": "Alex is",
        "noise_response_2": "Alex is shumpus.",
        "noise_prompt_2": "Grimpus is moderate. shumpus are grimpuses. Alex is shumpus. True or false: Alex is moderate. Let us think step by step.",
        "response_2": "Alex is shumpus.",
        "noise_response_3": "Alex is shumpus. Shumpuses are",
        "noise_prompt_3": "Grimpus is moderate. Shumpuses are Numpus. Alex is shumpus. True or false: Alex is moderate. Let us think step by step.",
        "response_3": "Alex is shumpus. Shumpuses are",
        "noise_response_4": "Sally is shumpus. Shumpuses are grimpuses.",
        "noise_prompt_4": "Grimpus is moderate. Shumpuses are grimpuses. Alex is shumpus. True or false: Alex is moderate. Let us think step by step.",
        "response_4": "Alex is shumpus. Shumpuses are grimpuses.",
        "noise_response_5": "Alex is shumpus. Shumpuses are impus. Alex is",
        "noise_prompt_5": "Grimpus is moderate. Shumpuses are grimpuses. Alex is shumpus. True or false: Alex is moderate. Let us think step by step.",
        "response_5": "Alex is shumpus. Shumpuses are grimpuses. Alex is",
        "noise_response_6": "Alex is shumpus. Shumpuses are grimpuses. Alex is grimpus.",
        "noise_prompt_6": "Shumpus is moderate. Shumpuses are grimpuses. Alex is shumpus. True or false: Alex is moderate. Let us think step by step.",
        "response_6": "Alex is shumpus. Shumpuses are grimpuses. Alex is grimpus.",
        "noise_response_7": "Alex is shumpus. Shumpuses are grimpuses. Alex is grimpus. Grimpus is",
        "noise_prompt_7": "Grimpus is moderate. Shumpuses are grimpuses. Alex is shumpus. True or false: Alex is spicy. Let us think step by step.",
        "response_7": "Alex is shumpus. Shumpuses are grimpuses. Alex is grimpus. Grimpus is",
        "noise_response_8": "Alex is shumpus. Shumpuses are grimpuses. Sam is grimpus. Grimpus is moderate.",
        "noise_prompt_8": "Grimpus is moderate. Shumpuses are grimpuses. Alex is shumpus. True or false: Alex is moderate. Let us think step by step.",
        "response_8": "Alex is shumpus. Shumpuses are grimpuses. Alex is grimpus. Grimpus is moderate.",
        "noise_response_9": "Alex is shumpus. Shumpuses are grimpuses. Alex is grimpus. Grimpus is kind. Alex is",
        "noise_prompt_9": "Grimpus is moderate. Shumpuses are grimpuses. Alex is shumpus. True or false: Alex is moderate. Let us think step by step.",
        "response_9": "Alex is shumpus. Shumpuses are grimpuses. Alex is grimpus. Grimpus is moderate. Alex is",
        "noise_prompt_10": "Grimpus is moderate. Shumpuses are grimpuses. Alex is shumpus. True or false: Alex is moderate. Let us think step by step.",
        "response_10": "Alex is shumpus. Shumpuses are grimpuses. Alex is grimpus. Grimpus is moderate. Alex is moderate.",
        "noise_response_10": "Alex is shumpus. Shumpuses are grimpuses. Alex is grimpus. Grimpus is moderate. Alex is opaque.",
        "answer_token_id_0": 17406,
        "answer_token_pos_0": 380,
        "answer_token_0": "Alex",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 528,
        "answer_token_pos_1": 383,
        "answer_token_1": "sh",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 1383,
        "answer_token_pos_2": 387,
        "answer_token_2": "Sh",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 867,
        "answer_token_pos_3": 391,
        "answer_token_3": "gr",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 4827,
        "answer_token_pos_4": 395,
        "answer_token_4": "Alex",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 867,
        "answer_token_pos_5": 398,
        "answer_token_5": "gr",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 1632,
        "answer_token_pos_6": 402,
        "answer_token_6": "Gr",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 17768,
        "answer_token_pos_7": 406,
        "answer_token_7": "moder",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 4827,
        "answer_token_pos_8": 410,
        "answer_token_8": "Alex",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 17768,
        "answer_token_pos_9": 413,
        "answer_token_9": "moder",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Impuses are small. Vumpuses are impuses. Rex is vumpus.",
        "query": "True or false: Rex is small.",
        "answer": "Rex is vumpus. Vumpuses are impuses. Rex is impus. Impuses are small. Rex is small. True",
        "label": "True",
        "prompt": "Impuses are small. Vumpuses are impuses. Rex is vumpus. True or false: Rex is small. Let us think step by step.",
        "generated": "Rex is vumpus. Vumpuses are impuses. Rex is impus. Impuses are small. Rex is small. True",
        "noise_response_0": "",
        "noise_prompt_0": "Impuses are small. Vumpuses are impuses. Rex is vumpus. True or false: Sam is small. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Rex is",
        "noise_prompt_1": "Impuses are small. Vumpuses are impuses. Rex is sterpus. True or false: Rex is small. Let us think step by step.",
        "response_1": "Rex is",
        "noise_response_2": "Rex is vumpus.",
        "noise_prompt_2": "Impuses are small. Brimpus are impuses. Rex is vumpus. True or false: Rex is small. Let us think step by step.",
        "response_2": "Rex is vumpus.",
        "noise_response_3": "Rex is vumpus. Vumpuses are",
        "noise_prompt_3": "Impuses are small. Vumpuses are sterpus. Rex is vumpus. True or false: Rex is small. Let us think step by step.",
        "response_3": "Rex is vumpus. Vumpuses are",
        "noise_response_4": "Stella is vumpus. Vumpuses are impuses.",
        "noise_prompt_4": "Impuses are small. Vumpuses are impuses. Rex is vumpus. True or false: Rex is small. Let us think step by step.",
        "response_4": "Rex is vumpus. Vumpuses are impuses.",
        "noise_response_5": "Rex is vumpus. Vumpuses are Zumpus. Rex is",
        "noise_prompt_5": "Impuses are small. Vumpuses are impuses. Rex is vumpus. True or false: Rex is small. Let us think step by step.",
        "response_5": "Rex is vumpus. Vumpuses are impuses. Rex is",
        "noise_response_6": "Rex is vumpus. Vumpuses are impuses. Rex is impus.",
        "noise_prompt_6": "Yumpus are small. Vumpuses are impuses. Rex is vumpus. True or false: Rex is small. Let us think step by step.",
        "response_6": "Rex is vumpus. Vumpuses are impuses. Rex is impus.",
        "noise_response_7": "Rex is vumpus. Vumpuses are impuses. Rex is impus. Impuses are",
        "noise_prompt_7": "Impuses are small. Vumpuses are impuses. Rex is vumpus. True or false: Rex is shy. Let us think step by step.",
        "response_7": "Rex is vumpus. Vumpuses are impuses. Rex is impus. Impuses are",
        "noise_response_8": "Rex is vumpus. Vumpuses are impuses. Polly is impus. Impuses are small.",
        "noise_prompt_8": "Impuses are small. Vumpuses are impuses. Rex is vumpus. True or false: Rex is small. Let us think step by step.",
        "response_8": "Rex is vumpus. Vumpuses are impuses. Rex is impus. Impuses are small.",
        "noise_response_9": "Rex is vumpus. Vumpuses are impuses. Rex is impus. Impuses are dull. Rex is",
        "noise_prompt_9": "Impuses are small. Vumpuses are impuses. Rex is vumpus. True or false: Rex is small. Let us think step by step.",
        "response_9": "Rex is vumpus. Vumpuses are impuses. Rex is impus. Impuses are small. Rex is",
        "noise_prompt_10": "Impuses are small. Vumpuses are impuses. Rex is vumpus. True or false: Rex is small. Let us think step by step.",
        "response_10": "Rex is vumpus. Vumpuses are impuses. Rex is impus. Impuses are small. Rex is small.",
        "noise_response_10": "Rex is vumpus. Vumpuses are impuses. Rex is impus. Impuses are small. Rex is mean.",
        "answer_token_id_0": 29934,
        "answer_token_pos_0": 380,
        "answer_token_0": "R",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 325,
        "answer_token_pos_1": 383,
        "answer_token_1": "v",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 478,
        "answer_token_pos_2": 387,
        "answer_token_2": "V",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 2411,
        "answer_token_pos_3": 391,
        "answer_token_3": "imp",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 390,
        "answer_token_pos_4": 395,
        "answer_token_4": "R",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 2411,
        "answer_token_pos_5": 398,
        "answer_token_5": "imp",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 14305,
        "answer_token_pos_6": 402,
        "answer_token_6": "Imp",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 2319,
        "answer_token_pos_7": 406,
        "answer_token_7": "small",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 390,
        "answer_token_pos_8": 410,
        "answer_token_8": "R",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 2319,
        "answer_token_pos_9": 413,
        "answer_token_9": "small",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Zumpuses are melodic. Gorpus is zumpus. Fae is gorpus.",
        "query": "True or false: Fae is melodic.",
        "answer": "Fae is gorpus. Gorpus is zumpus. Fae is zumpus. Zumpuses are melodic. Fae is melodic. True",
        "label": "True",
        "prompt": "Zumpuses are melodic. Gorpus is zumpus. Fae is gorpus. True or false: Fae is melodic. Let us think step by step.",
        "generated": "Fae is gorpus. Gorpus is zumpus. Fae is zumpus. Zumpuses are melodic. Fae is melodic. True",
        "noise_response_0": "",
        "noise_prompt_0": "Zumpuses are melodic. Gorpus is zumpus. Fae is gorpus. True or false: Max is melodic. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Fae is",
        "noise_prompt_1": "Zumpuses are melodic. Gorpus is zumpus. Fae is Wumpus. True or false: Fae is melodic. Let us think step by step.",
        "response_1": "Fae is",
        "noise_response_2": "Fae is gorpus.",
        "noise_prompt_2": "Zumpuses are melodic. Impus is zumpus. Fae is gorpus. True or false: Fae is melodic. Let us think step by step.",
        "response_2": "Fae is gorpus.",
        "noise_response_3": "Fae is gorpus. Gorpus is",
        "noise_prompt_3": "Zumpuses are melodic. Gorpus is vumpus. Fae is gorpus. True or false: Fae is melodic. Let us think step by step.",
        "response_3": "Fae is gorpus. Gorpus is",
        "noise_response_4": "Stella is gorpus. Gorpus is zumpus.",
        "noise_prompt_4": "Zumpuses are melodic. Gorpus is zumpus. Fae is gorpus. True or false: Fae is melodic. Let us think step by step.",
        "response_4": "Fae is gorpus. Gorpus is zumpus.",
        "noise_response_5": "Fae is gorpus. Gorpus is brimpus. Fae is",
        "noise_prompt_5": "Zumpuses are melodic. Gorpus is zumpus. Fae is gorpus. True or false: Fae is melodic. Let us think step by step.",
        "response_5": "Fae is gorpus. Gorpus is zumpus. Fae is",
        "noise_response_6": "Fae is gorpus. Gorpus is zumpus. Fae is zumpus.",
        "noise_prompt_6": "Vumpus are melodic. Gorpus is zumpus. Fae is gorpus. True or false: Fae is melodic. Let us think step by step.",
        "response_6": "Fae is gorpus. Gorpus is zumpus. Fae is zumpus.",
        "noise_response_7": "Fae is gorpus. Gorpus is zumpus. Fae is zumpus. Zumpuses are",
        "noise_prompt_7": "Zumpuses are melodic. Gorpus is zumpus. Fae is gorpus. True or false: Fae is slow. Let us think step by step.",
        "response_7": "Fae is gorpus. Gorpus is zumpus. Fae is zumpus. Zumpuses are",
        "noise_response_8": "Fae is gorpus. Gorpus is zumpus. Alex is zumpus. Zumpuses are melodic.",
        "noise_prompt_8": "Zumpuses are melodic. Gorpus is zumpus. Fae is gorpus. True or false: Fae is melodic. Let us think step by step.",
        "response_8": "Fae is gorpus. Gorpus is zumpus. Fae is zumpus. Zumpuses are melodic.",
        "noise_response_9": "Fae is gorpus. Gorpus is zumpus. Fae is zumpus. Zumpuses are sweet. Fae is",
        "noise_prompt_9": "Zumpuses are melodic. Gorpus is zumpus. Fae is gorpus. True or false: Fae is melodic. Let us think step by step.",
        "response_9": "Fae is gorpus. Gorpus is zumpus. Fae is zumpus. Zumpuses are melodic. Fae is",
        "noise_prompt_10": "Zumpuses are melodic. Gorpus is zumpus. Fae is gorpus. True or false: Fae is melodic. Let us think step by step.",
        "response_10": "Fae is gorpus. Gorpus is zumpus. Fae is zumpus. Zumpuses are melodic. Fae is melodic.",
        "noise_response_10": "Fae is gorpus. Gorpus is zumpus. Fae is zumpus. Zumpuses are melodic. Fae is slow.",
        "answer_token_id_0": 29943,
        "answer_token_pos_0": 380,
        "answer_token_0": "F",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 330,
        "answer_token_pos_1": 383,
        "answer_token_1": "g",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 18686,
        "answer_token_pos_2": 387,
        "answer_token_2": "Gor",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 3356,
        "answer_token_pos_3": 391,
        "answer_token_3": "zum",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 383,
        "answer_token_pos_4": 395,
        "answer_token_4": "F",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 3356,
        "answer_token_pos_5": 398,
        "answer_token_5": "zum",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 796,
        "answer_token_pos_6": 402,
        "answer_token_6": "Z",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 9232,
        "answer_token_pos_7": 406,
        "answer_token_7": "mel",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 383,
        "answer_token_pos_8": 410,
        "answer_token_8": "F",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 9232,
        "answer_token_pos_9": 413,
        "answer_token_9": "mel",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Vumpus is kind. Numpus is vumpus. Sally is numpus.",
        "query": "True or false: Sally is kind.",
        "answer": "Sally is numpus. Numpus is vumpus. Sally is vumpus. Vumpus is kind. Sally is kind. True",
        "label": "True",
        "prompt": "Vumpus is kind. Numpus is vumpus. Sally is numpus. True or false: Sally is kind. Let us think step by step.",
        "generated": "Sally is numpus. Numpus is vumpus. Sally is vumpus. Vumpus is kind. Sally is kind. True",
        "noise_response_0": "",
        "noise_prompt_0": "Vumpus is kind. Numpus is vumpus. Sally is numpus. True or false: Stella is kind. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Sally is",
        "noise_prompt_1": "Vumpus is kind. Numpus is vumpus. Sally is Tumpus. True or false: Sally is kind. Let us think step by step.",
        "response_1": "Sally is",
        "noise_response_2": "Sally is numpus.",
        "noise_prompt_2": "Vumpus is kind. shumpus is vumpus. Sally is numpus. True or false: Sally is kind. Let us think step by step.",
        "response_2": "Sally is numpus.",
        "noise_response_3": "Sally is numpus. Numpus is",
        "noise_prompt_3": "Vumpus is kind. Numpus is Shumpus. Sally is numpus. True or false: Sally is kind. Let us think step by step.",
        "response_3": "Sally is numpus. Numpus is",
        "noise_response_4": "Fae is numpus. Numpus is vumpus.",
        "noise_prompt_4": "Vumpus is kind. Numpus is vumpus. Sally is numpus. True or false: Sally is kind. Let us think step by step.",
        "response_4": "Sally is numpus. Numpus is vumpus.",
        "noise_response_5": "Sally is numpus. Numpus is numpus. Sally is",
        "noise_prompt_5": "Vumpus is kind. Numpus is vumpus. Sally is numpus. True or false: Sally is kind. Let us think step by step.",
        "response_5": "Sally is numpus. Numpus is vumpus. Sally is",
        "noise_response_6": "Sally is numpus. Numpus is vumpus. Sally is vumpus.",
        "noise_prompt_6": "jompus is kind. Numpus is vumpus. Sally is numpus. True or false: Sally is kind. Let us think step by step.",
        "response_6": "Sally is numpus. Numpus is vumpus. Sally is vumpus.",
        "noise_response_7": "Sally is numpus. Numpus is vumpus. Sally is vumpus. Vumpus is",
        "noise_prompt_7": "Vumpus is kind. Numpus is vumpus. Sally is numpus. True or false: Sally is happy. Let us think step by step.",
        "response_7": "Sally is numpus. Numpus is vumpus. Sally is vumpus. Vumpus is",
        "noise_response_8": "Sally is numpus. Numpus is vumpus. Max is vumpus. Vumpus is kind.",
        "noise_prompt_8": "Vumpus is kind. Numpus is vumpus. Sally is numpus. True or false: Sally is kind. Let us think step by step.",
        "response_8": "Sally is numpus. Numpus is vumpus. Sally is vumpus. Vumpus is kind.",
        "noise_response_9": "Sally is numpus. Numpus is vumpus. Sally is vumpus. Vumpus is metallic. Sally is",
        "noise_prompt_9": "Vumpus is kind. Numpus is vumpus. Sally is numpus. True or false: Sally is kind. Let us think step by step.",
        "response_9": "Sally is numpus. Numpus is vumpus. Sally is vumpus. Vumpus is kind. Sally is",
        "noise_prompt_10": "Vumpus is kind. Numpus is vumpus. Sally is numpus. True or false: Sally is kind. Let us think step by step.",
        "response_10": "Sally is numpus. Numpus is vumpus. Sally is vumpus. Vumpus is kind. Sally is kind.",
        "noise_response_10": "Sally is numpus. Numpus is vumpus. Sally is vumpus. Vumpus is kind. Sally is shy.",
        "answer_token_id_0": 29903,
        "answer_token_pos_0": 380,
        "answer_token_0": "S",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 954,
        "answer_token_pos_1": 383,
        "answer_token_1": "num",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 405,
        "answer_token_pos_2": 387,
        "answer_token_2": "N",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 325,
        "answer_token_pos_3": 391,
        "answer_token_3": "v",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 317,
        "answer_token_pos_4": 395,
        "answer_token_4": "S",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 325,
        "answer_token_pos_5": 398,
        "answer_token_5": "v",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 478,
        "answer_token_pos_6": 402,
        "answer_token_6": "V",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 2924,
        "answer_token_pos_7": 406,
        "answer_token_7": "kind",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 317,
        "answer_token_pos_8": 410,
        "answer_token_8": "S",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 2924,
        "answer_token_pos_9": 413,
        "answer_token_9": "kind",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Dumpus is discordant. Impus is dumpus. Fae is impus.",
        "query": "True or false: Fae is opaque.",
        "answer": "Fae is impus. Impus is dumpus. Fae is dumpus. Dumpus is discordant. Fae is discordant. False",
        "label": "False",
        "prompt": "Dumpus is discordant. Impus is dumpus. Fae is impus. True or false: Fae is opaque. Let us think step by step.",
        "generated": "Fae is impus. Impus is dumpus. Fae is dumpus. Dumpus is discordant. Fae is discordant. False",
        "noise_response_0": "",
        "noise_prompt_0": "Dumpus is discordant. Impus is dumpus. Fae is impus. True or false: Sally is opaque. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Fae is",
        "noise_prompt_1": "Dumpus is discordant. Impus is dumpus. Fae is Grimpus. True or false: Fae is opaque. Let us think step by step.",
        "response_1": "Fae is",
        "noise_response_2": "Fae is impus.",
        "noise_prompt_2": "Dumpus is discordant. rompus is dumpus. Fae is impus. True or false: Fae is opaque. Let us think step by step.",
        "response_2": "Fae is impus.",
        "noise_response_3": "Fae is impus. Impus is",
        "noise_prompt_3": "Dumpus is discordant. Impus is impus. Fae is impus. True or false: Fae is opaque. Let us think step by step.",
        "response_3": "Fae is impus. Impus is",
        "noise_response_4": "Rex is impus. Impus is dumpus.",
        "noise_prompt_4": "Dumpus is discordant. Impus is dumpus. Fae is impus. True or false: Fae is opaque. Let us think step by step.",
        "response_4": "Fae is impus. Impus is dumpus.",
        "noise_response_5": "Fae is impus. Impus is Gorpus. Fae is",
        "noise_prompt_5": "Dumpus is discordant. Impus is dumpus. Fae is impus. True or false: Fae is opaque. Let us think step by step.",
        "response_5": "Fae is impus. Impus is dumpus. Fae is",
        "noise_response_6": "Fae is impus. Impus is dumpus. Fae is dumpus.",
        "noise_prompt_6": "Numpus is discordant. Impus is dumpus. Fae is impus. True or false: Fae is opaque. Let us think step by step.",
        "response_6": "Fae is impus. Impus is dumpus. Fae is dumpus.",
        "noise_response_7": "Fae is impus. Impus is dumpus. Fae is dumpus. Dumpus is",
        "noise_prompt_7": "Dumpus is amenable. Impus is dumpus. Fae is impus. True or false: Fae is opaque. Let us think step by step.",
        "response_7": "Fae is impus. Impus is dumpus. Fae is dumpus. Dumpus is",
        "noise_response_8": "Fae is impus. Impus is dumpus. Alex is dumpus. Dumpus is discordant.",
        "noise_prompt_8": "Dumpus is discordant. Impus is dumpus. Fae is impus. True or false: Fae is opaque. Let us think step by step.",
        "response_8": "Fae is impus. Impus is dumpus. Fae is dumpus. Dumpus is discordant.",
        "noise_response_9": "Fae is impus. Impus is dumpus. Fae is dumpus. Dumpus is melodic. Fae is",
        "noise_prompt_9": "Dumpus is discordant. Impus is dumpus. Fae is impus. True or false: Fae is opaque. Let us think step by step.",
        "response_9": "Fae is impus. Impus is dumpus. Fae is dumpus. Dumpus is discordant. Fae is",
        "noise_prompt_10": "Dumpus is discordant. Impus is dumpus. Fae is impus. True or false: Fae is opaque. Let us think step by step.",
        "response_10": "Fae is impus. Impus is dumpus. Fae is dumpus. Dumpus is discordant. Fae is discordant.",
        "noise_response_10": "Fae is impus. Impus is dumpus. Fae is dumpus. Dumpus is discordant. Fae is luminous.",
        "answer_token_id_0": 29943,
        "answer_token_pos_0": 380,
        "answer_token_0": "F",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 2411,
        "answer_token_pos_1": 383,
        "answer_token_1": "imp",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 14305,
        "answer_token_pos_2": 387,
        "answer_token_2": "Imp",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 16766,
        "answer_token_pos_3": 391,
        "answer_token_3": "dump",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 383,
        "answer_token_pos_4": 395,
        "answer_token_4": "F",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 16766,
        "answer_token_pos_5": 398,
        "answer_token_5": "dump",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 360,
        "answer_token_pos_6": 402,
        "answer_token_6": "D",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 2313,
        "answer_token_pos_7": 406,
        "answer_token_7": "disc",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 383,
        "answer_token_pos_8": 410,
        "answer_token_8": "F",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 2313,
        "answer_token_pos_9": 413,
        "answer_token_9": "disc",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Brimpuses are transparent. Sterpus is brimpus. Stella is sterpus.",
        "query": "True or false: Stella is transparent.",
        "answer": "Stella is sterpus. Sterpus is brimpus. Stella is brimpus. Brimpuses are transparent. Stella is transparent. True",
        "label": "True",
        "prompt": "Brimpuses are transparent. Sterpus is brimpus. Stella is sterpus. True or false: Stella is transparent. Let us think step by step.",
        "generated": "Stella is sterpus. Sterpus is brimpus. Stella is brimpus. Brimpuses are transparent. Stella is transparent. True",
        "noise_response_0": "",
        "noise_prompt_0": "Brimpuses are transparent. Sterpus is brimpus. Stella is sterpus. True or false: Max is transparent. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Stella is",
        "noise_prompt_1": "Brimpuses are transparent. Sterpus is brimpus. Stella is zumpus. True or false: Stella is transparent. Let us think step by step.",
        "response_1": "Stella is",
        "noise_response_2": "Stella is sterpus.",
        "noise_prompt_2": "Brimpuses are transparent. Tumpus is brimpus. Stella is sterpus. True or false: Stella is transparent. Let us think step by step.",
        "response_2": "Stella is sterpus.",
        "noise_response_3": "Stella is sterpus. Sterpus is",
        "noise_prompt_3": "Brimpuses are transparent. Sterpus is floral. Stella is sterpus. True or false: Stella is transparent. Let us think step by step.",
        "response_3": "Stella is sterpus. Sterpus is",
        "noise_response_4": "Stella is sterpus. Wren is brimpus.",
        "noise_prompt_4": "Brimpuses are transparent. Sterpus is brimpus. Stella is sterpus. True or false: Stella is transparent. Let us think step by step.",
        "response_4": "Stella is sterpus. Sterpus is brimpus.",
        "noise_response_5": "Stella is sterpus. Sterpus is liquid. Stella is",
        "noise_prompt_5": "Brimpuses are transparent. Sterpus is brimpus. Stella is sterpus. True or false: Stella is transparent. Let us think step by step.",
        "response_5": "Stella is sterpus. Sterpus is brimpus. Stella is",
        "noise_response_6": "Stella is sterpus. Sterpus is brimpus. Stella is brimpus.",
        "noise_prompt_6": "Brimpus are transparent. Sterpus is brimpus. Stella is sterpus. True or false: Stella is transparent. Let us think step by step.",
        "response_6": "Stella is sterpus. Sterpus is brimpus. Stella is brimpus.",
        "noise_response_7": "Stella is sterpus. Sterpus is brimpus. Stella is brimpus. Brimpuses are",
        "noise_prompt_7": "Brimpuses are transparent. Sterpus is brimpus. Stella is sterpus. True or false: Stella is overcast. Let us think step by step.",
        "response_7": "Stella is sterpus. Sterpus is brimpus. Stella is brimpus. Brimpuses are",
        "noise_response_8": "Stella is sterpus. Sterpus is brimpus. Rex is brimpus. Brimpuses are transparent.",
        "noise_prompt_8": "Brimpuses are transparent. Sterpus is brimpus. Stella is sterpus. True or false: Stella is transparent. Let us think step by step.",
        "response_8": "Stella is sterpus. Sterpus is brimpus. Stella is brimpus. Brimpuses are transparent.",
        "noise_response_9": "Stella is sterpus. Sterpus is brimpus. Stella is brimpus. Brimpuses are snowy. Stella is",
        "noise_prompt_9": "Brimpuses are transparent. Sterpus is brimpus. Stella is sterpus. True or false: Stella is transparent. Let us think step by step.",
        "response_9": "Stella is sterpus. Sterpus is brimpus. Stella is brimpus. Brimpuses are transparent. Stella is",
        "noise_prompt_10": "Brimpuses are transparent. Sterpus is brimpus. Stella is sterpus. True or false: Stella is transparent. Let us think step by step.",
        "response_10": "Stella is sterpus. Sterpus is brimpus. Stella is brimpus. Brimpuses are transparent. Stella is transparent.",
        "noise_response_10": "Stella is sterpus. Sterpus is brimpus. Stella is brimpus. Brimpuses are transparent. Stella is dull.",
        "answer_token_id_0": 855,
        "answer_token_pos_0": 380,
        "answer_token_0": "St",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 16864,
        "answer_token_pos_1": 383,
        "answer_token_1": "ster",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 28588,
        "answer_token_pos_2": 387,
        "answer_token_2": "Ster",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 1506,
        "answer_token_pos_3": 391,
        "answer_token_3": "br",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 624,
        "answer_token_pos_4": 395,
        "answer_token_4": "St",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 1506,
        "answer_token_pos_5": 398,
        "answer_token_5": "br",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 1771,
        "answer_token_pos_6": 402,
        "answer_token_6": "Br",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 17772,
        "answer_token_pos_7": 406,
        "answer_token_7": "transparent",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 624,
        "answer_token_pos_8": 410,
        "answer_token_8": "St",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 17772,
        "answer_token_pos_9": 413,
        "answer_token_9": "transparent",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Grimpus is luminous. Sterpuses are grimpuses. Fae is sterpus.",
        "query": "True or false: Fae is luminous.",
        "answer": "Fae is sterpus. Sterpuses are grimpuses. Fae is grimpus. Grimpus is luminous. Fae is luminous. True",
        "label": "True",
        "prompt": "Grimpus is luminous. Sterpuses are grimpuses. Fae is sterpus. True or false: Fae is luminous. Let us think step by step.",
        "generated": "Fae is sterpus. Sterpuses are grimpuses. Fae is grimpus. Grimpus is luminous. Fae is luminous. True",
        "noise_response_0": "",
        "noise_prompt_0": "Grimpus is luminous. Sterpuses are grimpuses. Fae is sterpus. True or false: Polly is luminous. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Fae is",
        "noise_prompt_1": "Grimpus is luminous. Sterpuses are grimpuses. Fae is Impus. True or false: Fae is luminous. Let us think step by step.",
        "response_1": "Fae is",
        "noise_response_2": "Fae is sterpus.",
        "noise_prompt_2": "Grimpus is luminous. impus are grimpuses. Fae is sterpus. True or false: Fae is luminous. Let us think step by step.",
        "response_2": "Fae is sterpus.",
        "noise_response_3": "Fae is sterpus. Sterpuses are",
        "noise_prompt_3": "Grimpus is luminous. Sterpuses are numpus. Fae is sterpus. True or false: Fae is luminous. Let us think step by step.",
        "response_3": "Fae is sterpus. Sterpuses are",
        "noise_response_4": "Alex is sterpus. Sterpuses are grimpuses.",
        "noise_prompt_4": "Grimpus is luminous. Sterpuses are grimpuses. Fae is sterpus. True or false: Fae is luminous. Let us think step by step.",
        "response_4": "Fae is sterpus. Sterpuses are grimpuses.",
        "noise_response_5": "Fae is sterpus. Sterpuses are dumpus. Fae is",
        "noise_prompt_5": "Grimpus is luminous. Sterpuses are grimpuses. Fae is sterpus. True or false: Fae is luminous. Let us think step by step.",
        "response_5": "Fae is sterpus. Sterpuses are grimpuses. Fae is",
        "noise_response_6": "Fae is sterpus. Sterpuses are grimpuses. Fae is grimpus.",
        "noise_prompt_6": "dumpus is luminous. Sterpuses are grimpuses. Fae is sterpus. True or false: Fae is luminous. Let us think step by step.",
        "response_6": "Fae is sterpus. Sterpuses are grimpuses. Fae is grimpus.",
        "noise_response_7": "Fae is sterpus. Sterpuses are grimpuses. Fae is grimpus. Grimpus is",
        "noise_prompt_7": "Grimpus is luminous. Sterpuses are grimpuses. Fae is sterpus. True or false: Fae is happy. Let us think step by step.",
        "response_7": "Fae is sterpus. Sterpuses are grimpuses. Fae is grimpus. Grimpus is",
        "noise_response_8": "Fae is sterpus. Sterpuses are grimpuses. Sally is grimpus. Grimpus is luminous.",
        "noise_prompt_8": "Grimpus is luminous. Sterpuses are grimpuses. Fae is sterpus. True or false: Fae is luminous. Let us think step by step.",
        "response_8": "Fae is sterpus. Sterpuses are grimpuses. Fae is grimpus. Grimpus is luminous.",
        "noise_response_9": "Fae is sterpus. Sterpuses are grimpuses. Fae is grimpus. Grimpus is aggressive. Fae is",
        "noise_prompt_9": "Grimpus is luminous. Sterpuses are grimpuses. Fae is sterpus. True or false: Fae is luminous. Let us think step by step.",
        "response_9": "Fae is sterpus. Sterpuses are grimpuses. Fae is grimpus. Grimpus is luminous. Fae is",
        "noise_prompt_10": "Grimpus is luminous. Sterpuses are grimpuses. Fae is sterpus. True or false: Fae is luminous. Let us think step by step.",
        "response_10": "Fae is sterpus. Sterpuses are grimpuses. Fae is grimpus. Grimpus is luminous. Fae is luminous.",
        "noise_response_10": "Fae is sterpus. Sterpuses are grimpuses. Fae is grimpus. Grimpus is luminous. Fae is shy.",
        "answer_token_id_0": 29943,
        "answer_token_pos_0": 380,
        "answer_token_0": "F",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 16864,
        "answer_token_pos_1": 383,
        "answer_token_1": "ster",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 28588,
        "answer_token_pos_2": 387,
        "answer_token_2": "Ster",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 867,
        "answer_token_pos_3": 391,
        "answer_token_3": "gr",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 383,
        "answer_token_pos_4": 395,
        "answer_token_4": "F",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 867,
        "answer_token_pos_5": 398,
        "answer_token_5": "gr",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 1632,
        "answer_token_pos_6": 402,
        "answer_token_6": "Gr",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 301,
        "answer_token_pos_7": 406,
        "answer_token_7": "l",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 383,
        "answer_token_pos_8": 410,
        "answer_token_8": "F",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 301,
        "answer_token_pos_9": 413,
        "answer_token_9": "l",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Vumpus is small. Sterpuses are vumpuses. Rex is sterpus.",
        "query": "True or false: Rex is small.",
        "answer": "Rex is sterpus. Sterpuses are vumpuses. Rex is vumpus. Vumpus is small. Rex is small. True",
        "label": "True",
        "prompt": "Vumpus is small. Sterpuses are vumpuses. Rex is sterpus. True or false: Rex is small. Let us think step by step.",
        "generated": "Rex is sterpus. Sterpuses are vumpuses. Rex is vumpus. Vumpus is small. Rex is small. True",
        "noise_response_0": "",
        "noise_prompt_0": "Vumpus is small. Sterpuses are vumpuses. Rex is sterpus. True or false: Max is small. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Rex is",
        "noise_prompt_1": "Vumpus is small. Sterpuses are vumpuses. Rex is numpus. True or false: Rex is small. Let us think step by step.",
        "response_1": "Rex is",
        "noise_response_2": "Rex is sterpus.",
        "noise_prompt_2": "Vumpus is small. Brimpus are vumpuses. Rex is sterpus. True or false: Rex is small. Let us think step by step.",
        "response_2": "Rex is sterpus.",
        "noise_response_3": "Rex is sterpus. Sterpuses are",
        "noise_prompt_3": "Vumpus is small. Sterpuses are Jompus. Rex is sterpus. True or false: Rex is small. Let us think step by step.",
        "response_3": "Rex is sterpus. Sterpuses are",
        "noise_response_4": "Stella is sterpus. Sterpuses are vumpuses.",
        "noise_prompt_4": "Vumpus is small. Sterpuses are vumpuses. Rex is sterpus. True or false: Rex is small. Let us think step by step.",
        "response_4": "Rex is sterpus. Sterpuses are vumpuses.",
        "noise_response_5": "Rex is sterpus. Sterpuses are wumpus. Rex is",
        "noise_prompt_5": "Vumpus is small. Sterpuses are vumpuses. Rex is sterpus. True or false: Rex is small. Let us think step by step.",
        "response_5": "Rex is sterpus. Sterpuses are vumpuses. Rex is",
        "noise_response_6": "Rex is sterpus. Sterpuses are vumpuses. Rex is vumpus.",
        "noise_prompt_6": "Brimpus is small. Sterpuses are vumpuses. Rex is sterpus. True or false: Rex is small. Let us think step by step.",
        "response_6": "Rex is sterpus. Sterpuses are vumpuses. Rex is vumpus.",
        "noise_response_7": "Rex is sterpus. Sterpuses are vumpuses. Rex is vumpus. Vumpus is",
        "noise_prompt_7": "Vumpus is small. Sterpuses are vumpuses. Rex is sterpus. True or false: Rex is wooden. Let us think step by step.",
        "response_7": "Rex is sterpus. Sterpuses are vumpuses. Rex is vumpus. Vumpus is",
        "noise_response_8": "Rex is sterpus. Sterpuses are vumpuses. Fae is vumpus. Vumpus is small.",
        "noise_prompt_8": "Vumpus is small. Sterpuses are vumpuses. Rex is sterpus. True or false: Rex is small. Let us think step by step.",
        "response_8": "Rex is sterpus. Sterpuses are vumpuses. Rex is vumpus. Vumpus is small.",
        "noise_response_9": "Rex is sterpus. Sterpuses are vumpuses. Rex is vumpus. Vumpus is angry. Rex is",
        "noise_prompt_9": "Vumpus is small. Sterpuses are vumpuses. Rex is sterpus. True or false: Rex is small. Let us think step by step.",
        "response_9": "Rex is sterpus. Sterpuses are vumpuses. Rex is vumpus. Vumpus is small. Rex is",
        "noise_prompt_10": "Vumpus is small. Sterpuses are vumpuses. Rex is sterpus. True or false: Rex is small. Let us think step by step.",
        "response_10": "Rex is sterpus. Sterpuses are vumpuses. Rex is vumpus. Vumpus is small. Rex is small.",
        "noise_response_10": "Rex is sterpus. Sterpuses are vumpuses. Rex is vumpus. Vumpus is small. Rex is brown.",
        "answer_token_id_0": 29934,
        "answer_token_pos_0": 380,
        "answer_token_0": "R",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 16864,
        "answer_token_pos_1": 383,
        "answer_token_1": "ster",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 28588,
        "answer_token_pos_2": 387,
        "answer_token_2": "Ster",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 325,
        "answer_token_pos_3": 391,
        "answer_token_3": "v",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 478,
        "answer_token_pos_4": 395,
        "answer_token_4": "V",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 325,
        "answer_token_pos_5": 398,
        "answer_token_5": "v",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 478,
        "answer_token_pos_6": 402,
        "answer_token_6": "V",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 2319,
        "answer_token_pos_7": 406,
        "answer_token_7": "small",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 390,
        "answer_token_pos_8": 410,
        "answer_token_8": "R",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 2319,
        "answer_token_pos_9": 413,
        "answer_token_9": "small",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Jompus is sour. Vumpus is jompus. Sam is vumpus.",
        "query": "True or false: Sam is sour.",
        "answer": "Sam is vumpus. Vumpus is jompus. Sam is jompus. Jompus is sour. Sam is sour. True",
        "label": "True",
        "prompt": "Jompus is sour. Vumpus is jompus. Sam is vumpus. True or false: Sam is sour. Let us think step by step.",
        "generated": "Sam is vumpus. Vumpus is jompus. Sam is jompus. Jompus is sour. Sam is sour. True",
        "noise_response_0": "",
        "noise_prompt_0": "Jompus is sour. Vumpus is jompus. Sam is vumpus. True or false: Rex is sour. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Sam is",
        "noise_prompt_1": "Jompus is sour. Vumpus is jompus. Sam is impus. True or false: Sam is sour. Let us think step by step.",
        "response_1": "Sam is",
        "noise_response_2": "Sam is vumpus.",
        "noise_prompt_2": "Jompus is sour. rompus is jompus. Sam is vumpus. True or false: Sam is sour. Let us think step by step.",
        "response_2": "Sam is vumpus.",
        "noise_response_3": "Sam is vumpus. Vumpus is",
        "noise_prompt_3": "Jompus is sour. Vumpus is rompus. Sam is vumpus. True or false: Sam is sour. Let us think step by step.",
        "response_3": "Sam is vumpus. Vumpus is",
        "noise_response_4": "Rex is vumpus. Vumpus is jompus.",
        "noise_prompt_4": "Jompus is sour. Vumpus is jompus. Sam is vumpus. True or false: Sam is sour. Let us think step by step.",
        "response_4": "Sam is vumpus. Vumpus is jompus.",
        "noise_response_5": "Sam is vumpus. Vumpus is Shumpus. Sam is",
        "noise_prompt_5": "Jompus is sour. Vumpus is jompus. Sam is vumpus. True or false: Sam is sour. Let us think step by step.",
        "response_5": "Sam is vumpus. Vumpus is jompus. Sam is",
        "noise_response_6": "Sam is vumpus. Vumpus is jompus. Sam is jompus.",
        "noise_prompt_6": "Shumpus is sour. Vumpus is jompus. Sam is vumpus. True or false: Sam is sour. Let us think step by step.",
        "response_6": "Sam is vumpus. Vumpus is jompus. Sam is jompus.",
        "noise_response_7": "Sam is vumpus. Vumpus is jompus. Sam is jompus. Jompus is",
        "noise_prompt_7": "Jompus is sour. Vumpus is jompus. Sam is vumpus. True or false: Sam is metallic. Let us think step by step.",
        "response_7": "Sam is vumpus. Vumpus is jompus. Sam is jompus. Jompus is",
        "noise_response_8": "Sam is vumpus. Vumpus is jompus. Max is jompus. Jompus is sour.",
        "noise_prompt_8": "Jompus is sour. Vumpus is jompus. Sam is vumpus. True or false: Sam is sour. Let us think step by step.",
        "response_8": "Sam is vumpus. Vumpus is jompus. Sam is jompus. Jompus is sour.",
        "noise_response_9": "Sam is vumpus. Vumpus is jompus. Sam is jompus. Jompus is small. Sam is",
        "noise_prompt_9": "Jompus is sour. Vumpus is jompus. Sam is vumpus. True or false: Sam is sour. Let us think step by step.",
        "response_9": "Sam is vumpus. Vumpus is jompus. Sam is jompus. Jompus is sour. Sam is",
        "noise_prompt_10": "Jompus is sour. Vumpus is jompus. Sam is vumpus. True or false: Sam is sour. Let us think step by step.",
        "response_10": "Sam is vumpus. Vumpus is jompus. Sam is jompus. Jompus is sour. Sam is sour.",
        "noise_response_10": "Sam is vumpus. Vumpus is jompus. Sam is jompus. Jompus is sour. Sam is blue.",
        "answer_token_id_0": 22966,
        "answer_token_pos_0": 380,
        "answer_token_0": "Sam",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 325,
        "answer_token_pos_1": 383,
        "answer_token_1": "v",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 478,
        "answer_token_pos_2": 387,
        "answer_token_2": "V",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 432,
        "answer_token_pos_3": 391,
        "answer_token_3": "j",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 3685,
        "answer_token_pos_4": 395,
        "answer_token_4": "Sam",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 432,
        "answer_token_pos_5": 398,
        "answer_token_5": "j",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 435,
        "answer_token_pos_6": 402,
        "answer_token_6": "J",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 269,
        "answer_token_pos_7": 406,
        "answer_token_7": "s",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 3685,
        "answer_token_pos_8": 410,
        "answer_token_8": "Sam",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 269,
        "answer_token_pos_9": 413,
        "answer_token_9": "s",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Yumpuses are bright. Zumpus is yumpus. Rex is zumpus.",
        "query": "True or false: Rex is bright.",
        "answer": "Rex is zumpus. Zumpus is yumpus. Rex is yumpus. Yumpuses are bright. Rex is bright. True",
        "label": "True",
        "prompt": "Yumpuses are bright. Zumpus is yumpus. Rex is zumpus. True or false: Rex is bright. Let us think step by step.",
        "generated": "Rex is zumpus. Zumpus is yumpus. Rex is yumpus. Yumpuses are bright. Rex is bright. True",
        "noise_response_0": "",
        "noise_prompt_0": "Yumpuses are bright. Zumpus is yumpus. Rex is zumpus. True or false: Alex is bright. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Rex is",
        "noise_prompt_1": "Yumpuses are bright. Zumpus is yumpus. Rex is Lorpus. True or false: Rex is bright. Let us think step by step.",
        "response_1": "Rex is",
        "noise_response_2": "Rex is zumpus.",
        "noise_prompt_2": "Yumpuses are bright. rompus is yumpus. Rex is zumpus. True or false: Rex is bright. Let us think step by step.",
        "response_2": "Rex is zumpus.",
        "noise_response_3": "Rex is zumpus. Zumpus is",
        "noise_prompt_3": "Yumpuses are bright. Zumpus is numpus. Rex is zumpus. True or false: Rex is bright. Let us think step by step.",
        "response_3": "Rex is zumpus. Zumpus is",
        "noise_response_4": "Stella is zumpus. Zumpus is yumpus.",
        "noise_prompt_4": "Yumpuses are bright. Zumpus is yumpus. Rex is zumpus. True or false: Rex is bright. Let us think step by step.",
        "response_4": "Rex is zumpus. Zumpus is yumpus.",
        "noise_response_5": "Rex is zumpus. Zumpus is wumpus. Rex is",
        "noise_prompt_5": "Yumpuses are bright. Zumpus is yumpus. Rex is zumpus. True or false: Rex is bright. Let us think step by step.",
        "response_5": "Rex is zumpus. Zumpus is yumpus. Rex is",
        "noise_response_6": "Rex is zumpus. Zumpus is yumpus. Rex is yumpus.",
        "noise_prompt_6": "Sterpus are bright. Zumpus is yumpus. Rex is zumpus. True or false: Rex is bright. Let us think step by step.",
        "response_6": "Rex is zumpus. Zumpus is yumpus. Rex is yumpus.",
        "noise_response_7": "Rex is zumpus. Zumpus is yumpus. Rex is yumpus. Yumpuses are",
        "noise_prompt_7": "Yumpuses are bright. Zumpus is yumpus. Rex is zumpus. True or false: Rex is discordant. Let us think step by step.",
        "response_7": "Rex is zumpus. Zumpus is yumpus. Rex is yumpus. Yumpuses are",
        "noise_response_8": "Rex is zumpus. Zumpus is yumpus. Fae is yumpus. Yumpuses are bright.",
        "noise_prompt_8": "Yumpuses are bright. Zumpus is yumpus. Rex is zumpus. True or false: Rex is bright. Let us think step by step.",
        "response_8": "Rex is zumpus. Zumpus is yumpus. Rex is yumpus. Yumpuses are bright.",
        "noise_response_9": "Rex is zumpus. Zumpus is yumpus. Rex is yumpus. Yumpuses are happy. Rex is",
        "noise_prompt_9": "Yumpuses are bright. Zumpus is yumpus. Rex is zumpus. True or false: Rex is bright. Let us think step by step.",
        "response_9": "Rex is zumpus. Zumpus is yumpus. Rex is yumpus. Yumpuses are bright. Rex is",
        "noise_prompt_10": "Yumpuses are bright. Zumpus is yumpus. Rex is zumpus. True or false: Rex is bright. Let us think step by step.",
        "response_10": "Rex is zumpus. Zumpus is yumpus. Rex is yumpus. Yumpuses are bright. Rex is bright.",
        "noise_response_10": "Rex is zumpus. Zumpus is yumpus. Rex is yumpus. Yumpuses are bright. Rex is sour.",
        "answer_token_id_0": 29934,
        "answer_token_pos_0": 380,
        "answer_token_0": "R",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 3356,
        "answer_token_pos_1": 383,
        "answer_token_1": "zum",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 796,
        "answer_token_pos_2": 387,
        "answer_token_2": "Z",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 343,
        "answer_token_pos_3": 391,
        "answer_token_3": "y",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 390,
        "answer_token_pos_4": 395,
        "answer_token_4": "R",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 343,
        "answer_token_pos_5": 398,
        "answer_token_5": "y",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 612,
        "answer_token_pos_6": 402,
        "answer_token_6": "Y",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 11785,
        "answer_token_pos_7": 406,
        "answer_token_7": "bright",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 390,
        "answer_token_pos_8": 410,
        "answer_token_8": "R",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 11785,
        "answer_token_pos_9": 413,
        "answer_token_9": "bright",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Lorpuses are temperate. Wumpus is lorpus. Sally is wumpus.",
        "query": "True or false: Sally is temperate.",
        "answer": "Sally is wumpus. Wumpus is lorpus. Sally is lorpus. Lorpuses are temperate. Sally is temperate. True",
        "label": "True",
        "prompt": "Lorpuses are temperate. Wumpus is lorpus. Sally is wumpus. True or false: Sally is temperate. Let us think step by step.",
        "generated": "Sally is wumpus. Wumpus is lorpus. Sally is lorpus. Lorpuses are temperate. Sally is temperate. True",
        "noise_response_0": "",
        "noise_prompt_0": "Lorpuses are temperate. Wumpus is lorpus. Sally is wumpus. True or false: Sam is temperate. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Sally is",
        "noise_prompt_1": "Lorpuses are temperate. Wumpus is lorpus. Sally is muffled. True or false: Sally is temperate. Let us think step by step.",
        "response_1": "Sally is",
        "noise_response_2": "Sally is wumpus.",
        "noise_prompt_2": "Lorpuses are temperate. Sam is lorpus. Sally is wumpus. True or false: Sally is temperate. Let us think step by step.",
        "response_2": "Sally is wumpus.",
        "noise_response_3": "Sally is wumpus. Wumpus is",
        "noise_prompt_3": "Lorpuses are temperate. Wumpus is melodic. Sally is wumpus. True or false: Sally is temperate. Let us think step by step.",
        "response_3": "Sally is wumpus. Wumpus is",
        "noise_response_4": "Sam is wumpus. Wumpus is lorpus.",
        "noise_prompt_4": "Lorpuses are temperate. Wumpus is lorpus. Sally is wumpus. True or false: Sally is temperate. Let us think step by step.",
        "response_4": "Sally is wumpus. Wumpus is lorpus.",
        "noise_response_5": "Sally is wumpus. Wumpus is shy. Sally is",
        "noise_prompt_5": "Lorpuses are temperate. Wumpus is lorpus. Sally is wumpus. True or false: Sally is temperate. Let us think step by step.",
        "response_5": "Sally is wumpus. Wumpus is lorpus. Sally is",
        "noise_response_6": "Sally is wumpus. Wumpus is lorpus. Sally is lorpus.",
        "noise_prompt_6": "lorpus are temperate. Wumpus is lorpus. Sally is wumpus. True or false: Sally is temperate. Let us think step by step.",
        "response_6": "Sally is wumpus. Wumpus is lorpus. Sally is lorpus.",
        "noise_response_7": "Sally is wumpus. Wumpus is lorpus. Sally is lorpus. Lorpuses are",
        "noise_prompt_7": "Lorpuses are temperate. Wumpus is lorpus. Sally is wumpus. True or false: Sally is brown. Let us think step by step.",
        "response_7": "Sally is wumpus. Wumpus is lorpus. Sally is lorpus. Lorpuses are",
        "noise_response_8": "Sally is wumpus. Wumpus is lorpus. Alex is lorpus. Lorpuses are temperate.",
        "noise_prompt_8": "Lorpuses are temperate. Wumpus is lorpus. Sally is wumpus. True or false: Sally is temperate. Let us think step by step.",
        "response_8": "Sally is wumpus. Wumpus is lorpus. Sally is lorpus. Lorpuses are temperate.",
        "noise_response_9": "Sally is wumpus. Wumpus is lorpus. Sally is lorpus. Lorpuses are liquid. Sally is",
        "noise_prompt_9": "Lorpuses are temperate. Wumpus is lorpus. Sally is wumpus. True or false: Sally is temperate. Let us think step by step.",
        "response_9": "Sally is wumpus. Wumpus is lorpus. Sally is lorpus. Lorpuses are temperate. Sally is",
        "noise_prompt_10": "Lorpuses are temperate. Wumpus is lorpus. Sally is wumpus. True or false: Sally is temperate. Let us think step by step.",
        "response_10": "Sally is wumpus. Wumpus is lorpus. Sally is lorpus. Lorpuses are temperate. Sally is temperate.",
        "noise_response_10": "Sally is wumpus. Wumpus is lorpus. Sally is lorpus. Lorpuses are temperate. Sally is moderate.",
        "answer_token_id_0": 29903,
        "answer_token_pos_0": 380,
        "answer_token_0": "S",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 281,
        "answer_token_pos_1": 383,
        "answer_token_1": "w",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 399,
        "answer_token_pos_2": 387,
        "answer_token_2": "W",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 301,
        "answer_token_pos_3": 391,
        "answer_token_3": "l",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 317,
        "answer_token_pos_4": 395,
        "answer_token_4": "S",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 301,
        "answer_token_pos_5": 398,
        "answer_token_5": "l",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 10980,
        "answer_token_pos_6": 402,
        "answer_token_6": "Lor",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 6238,
        "answer_token_pos_7": 406,
        "answer_token_7": "temper",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 317,
        "answer_token_pos_8": 410,
        "answer_token_8": "S",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 6238,
        "answer_token_pos_9": 413,
        "answer_token_9": "temper",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Wumpus is dull. Vumpuses are wumpuses. Sally is vumpus.",
        "query": "True or false: Sally is fruity.",
        "answer": "Sally is vumpus. Vumpuses are wumpuses. Sally is wumpus. Wumpus is dull. Sally is dull. False",
        "label": "False",
        "prompt": "Wumpus is dull. Vumpuses are wumpuses. Sally is vumpus. True or false: Sally is fruity. Let us think step by step.",
        "generated": "Sally is vumpus. Vumpuses are wumpuses. Sally is wumpus. Wumpus is dull. Sally is dull. False",
        "noise_response_0": "",
        "noise_prompt_0": "Wumpus is dull. Vumpuses are wumpuses. Sally is vumpus. True or false: Max is fruity. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Sally is",
        "noise_prompt_1": "Wumpus is dull. Vumpuses are wumpuses. Sally is Impus. True or false: Sally is fruity. Let us think step by step.",
        "response_1": "Sally is",
        "noise_response_2": "Sally is vumpus.",
        "noise_prompt_2": "Wumpus is dull. Grimpus are wumpuses. Sally is vumpus. True or false: Sally is fruity. Let us think step by step.",
        "response_2": "Sally is vumpus.",
        "noise_response_3": "Sally is vumpus. Vumpuses are",
        "noise_prompt_3": "Wumpus is dull. Vumpuses are bright. Sally is vumpus. True or false: Sally is fruity. Let us think step by step.",
        "response_3": "Sally is vumpus. Vumpuses are",
        "noise_response_4": "Stella is vumpus. Vumpuses are wumpuses.",
        "noise_prompt_4": "Wumpus is dull. Vumpuses are wumpuses. Sally is vumpus. True or false: Sally is fruity. Let us think step by step.",
        "response_4": "Sally is vumpus. Vumpuses are wumpuses.",
        "noise_response_5": "Sally is vumpus. Vumpuses are rainy. Sally is",
        "noise_prompt_5": "Wumpus is dull. Vumpuses are wumpuses. Sally is vumpus. True or false: Sally is fruity. Let us think step by step.",
        "response_5": "Sally is vumpus. Vumpuses are wumpuses. Sally is",
        "noise_response_6": "Sally is vumpus. Vumpuses are wumpuses. Sally is wumpus.",
        "noise_prompt_6": "Polly is dull. Vumpuses are wumpuses. Sally is vumpus. True or false: Sally is fruity. Let us think step by step.",
        "response_6": "Sally is vumpus. Vumpuses are wumpuses. Sally is wumpus.",
        "noise_response_7": "Sally is vumpus. Vumpuses are wumpuses. Sally is wumpus. Wumpus is",
        "noise_prompt_7": "Wumpus is large. Vumpuses are wumpuses. Sally is vumpus. True or false: Sally is fruity. Let us think step by step.",
        "response_7": "Sally is vumpus. Vumpuses are wumpuses. Sally is wumpus. Wumpus is",
        "noise_response_8": "Sally is vumpus. Vumpuses are wumpuses. Rex is wumpus. Wumpus is dull.",
        "noise_prompt_8": "Wumpus is dull. Vumpuses are wumpuses. Sally is vumpus. True or false: Sally is fruity. Let us think step by step.",
        "response_8": "Sally is vumpus. Vumpuses are wumpuses. Sally is wumpus. Wumpus is dull.",
        "noise_response_9": "Sally is vumpus. Vumpuses are wumpuses. Sally is wumpus. Wumpus is metallic. Sally is",
        "noise_prompt_9": "Wumpus is dull. Vumpuses are wumpuses. Sally is vumpus. True or false: Sally is fruity. Let us think step by step.",
        "response_9": "Sally is vumpus. Vumpuses are wumpuses. Sally is wumpus. Wumpus is dull. Sally is",
        "noise_prompt_10": "Wumpus is dull. Vumpuses are wumpuses. Sally is vumpus. True or false: Sally is fruity. Let us think step by step.",
        "response_10": "Sally is vumpus. Vumpuses are wumpuses. Sally is wumpus. Wumpus is dull. Sally is dull.",
        "noise_response_10": "Sally is vumpus. Vumpuses are wumpuses. Sally is wumpus. Wumpus is dull. Sally is fast.",
        "answer_token_id_0": 29903,
        "answer_token_pos_0": 380,
        "answer_token_0": "S",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 325,
        "answer_token_pos_1": 383,
        "answer_token_1": "v",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 478,
        "answer_token_pos_2": 387,
        "answer_token_2": "V",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 281,
        "answer_token_pos_3": 391,
        "answer_token_3": "w",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 317,
        "answer_token_pos_4": 395,
        "answer_token_4": "S",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 281,
        "answer_token_pos_5": 398,
        "answer_token_5": "w",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 399,
        "answer_token_pos_6": 402,
        "answer_token_6": "W",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 270,
        "answer_token_pos_7": 406,
        "answer_token_7": "d",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 317,
        "answer_token_pos_8": 410,
        "answer_token_8": "S",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 270,
        "answer_token_pos_9": 413,
        "answer_token_9": "d",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Yumpuses are large. Lempus is yumpus. Fae is lempus.",
        "query": "True or false: Fae is large.",
        "answer": "Fae is lempus. Lempus is yumpus. Fae is yumpus. Yumpuses are large. Fae is large. True",
        "label": "True",
        "prompt": "Yumpuses are large. Lempus is yumpus. Fae is lempus. True or false: Fae is large. Let us think step by step.",
        "generated": "Fae is lempus. Lempus is yumpus. Fae is yumpus. Yumpuses are large. Fae is large. True",
        "noise_response_0": "",
        "noise_prompt_0": "Yumpuses are large. Lempus is yumpus. Fae is lempus. True or false: Stella is large. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Fae is",
        "noise_prompt_1": "Yumpuses are large. Lempus is yumpus. Fae is Vumpus. True or false: Fae is large. Let us think step by step.",
        "response_1": "Fae is",
        "noise_response_2": "Fae is lempus.",
        "noise_prompt_2": "Yumpuses are large. impus is yumpus. Fae is lempus. True or false: Fae is large. Let us think step by step.",
        "response_2": "Fae is lempus.",
        "noise_response_3": "Fae is lempus. Lempus is",
        "noise_prompt_3": "Yumpuses are large. Lempus is Jompus. Fae is lempus. True or false: Fae is large. Let us think step by step.",
        "response_3": "Fae is lempus. Lempus is",
        "noise_response_4": "Sally is lempus. Lempus is yumpus.",
        "noise_prompt_4": "Yumpuses are large. Lempus is yumpus. Fae is lempus. True or false: Fae is large. Let us think step by step.",
        "response_4": "Fae is lempus. Lempus is yumpus.",
        "noise_response_5": "Fae is lempus. Lempus is dumpus. Fae is",
        "noise_prompt_5": "Yumpuses are large. Lempus is yumpus. Fae is lempus. True or false: Fae is large. Let us think step by step.",
        "response_5": "Fae is lempus. Lempus is yumpus. Fae is",
        "noise_response_6": "Fae is lempus. Lempus is yumpus. Fae is yumpus.",
        "noise_prompt_6": "gorpus are large. Lempus is yumpus. Fae is lempus. True or false: Fae is large. Let us think step by step.",
        "response_6": "Fae is lempus. Lempus is yumpus. Fae is yumpus.",
        "noise_response_7": "Fae is lempus. Lempus is yumpus. Fae is yumpus. Yumpuses are",
        "noise_prompt_7": "Yumpuses are large. Lempus is yumpus. Fae is lempus. True or false: Fae is melodic. Let us think step by step.",
        "response_7": "Fae is lempus. Lempus is yumpus. Fae is yumpus. Yumpuses are",
        "noise_response_8": "Fae is lempus. Lempus is yumpus. Sam is yumpus. Yumpuses are large.",
        "noise_prompt_8": "Yumpuses are large. Lempus is yumpus. Fae is lempus. True or false: Fae is large. Let us think step by step.",
        "response_8": "Fae is lempus. Lempus is yumpus. Fae is yumpus. Yumpuses are large.",
        "noise_response_9": "Fae is lempus. Lempus is yumpus. Fae is yumpus. Yumpuses are slow. Fae is",
        "noise_prompt_9": "Yumpuses are large. Lempus is yumpus. Fae is lempus. True or false: Fae is large. Let us think step by step.",
        "response_9": "Fae is lempus. Lempus is yumpus. Fae is yumpus. Yumpuses are large. Fae is",
        "noise_prompt_10": "Yumpuses are large. Lempus is yumpus. Fae is lempus. True or false: Fae is large. Let us think step by step.",
        "response_10": "Fae is lempus. Lempus is yumpus. Fae is yumpus. Yumpuses are large. Fae is large.",
        "noise_response_10": "Fae is lempus. Lempus is yumpus. Fae is yumpus. Yumpuses are large. Fae is metallic.",
        "answer_token_id_0": 29943,
        "answer_token_pos_0": 380,
        "answer_token_0": "F",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 454,
        "answer_token_pos_1": 383,
        "answer_token_1": "le",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 365,
        "answer_token_pos_2": 387,
        "answer_token_2": "L",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 343,
        "answer_token_pos_3": 391,
        "answer_token_3": "y",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 383,
        "answer_token_pos_4": 395,
        "answer_token_4": "F",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 343,
        "answer_token_pos_5": 398,
        "answer_token_5": "y",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 612,
        "answer_token_pos_6": 402,
        "answer_token_6": "Y",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 2919,
        "answer_token_pos_7": 406,
        "answer_token_7": "large",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 383,
        "answer_token_pos_8": 410,
        "answer_token_8": "F",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 2919,
        "answer_token_pos_9": 413,
        "answer_token_9": "large",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Jompus is transparent. Dumpus is jompus. Fae is dumpus.",
        "query": "True or false: Fae is transparent.",
        "answer": "Fae is dumpus. Dumpus is jompus. Fae is jompus. Jompus is transparent. Fae is transparent. True",
        "label": "True",
        "prompt": "Jompus is transparent. Dumpus is jompus. Fae is dumpus. True or false: Fae is transparent. Let us think step by step.",
        "generated": "Fae is dumpus. Dumpus is jompus. Fae is jompus. Jompus is transparent. Fae is transparent. True",
        "noise_response_0": "",
        "noise_prompt_0": "Jompus is transparent. Dumpus is jompus. Fae is dumpus. True or false: Stella is transparent. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Fae is",
        "noise_prompt_1": "Jompus is transparent. Dumpus is jompus. Fae is tumpus. True or false: Fae is transparent. Let us think step by step.",
        "response_1": "Fae is",
        "noise_response_2": "Fae is dumpus.",
        "noise_prompt_2": "Jompus is transparent. Numpus is jompus. Fae is dumpus. True or false: Fae is transparent. Let us think step by step.",
        "response_2": "Fae is dumpus.",
        "noise_response_3": "Fae is dumpus. Dumpus is",
        "noise_prompt_3": "Jompus is transparent. Dumpus is zumpus. Fae is dumpus. True or false: Fae is transparent. Let us think step by step.",
        "response_3": "Fae is dumpus. Dumpus is",
        "noise_response_4": "Sally is dumpus. Dumpus is jompus.",
        "noise_prompt_4": "Jompus is transparent. Dumpus is jompus. Fae is dumpus. True or false: Fae is transparent. Let us think step by step.",
        "response_4": "Fae is dumpus. Dumpus is jompus.",
        "noise_response_5": "Fae is dumpus. Dumpus is zumpus. Fae is",
        "noise_prompt_5": "Jompus is transparent. Dumpus is jompus. Fae is dumpus. True or false: Fae is transparent. Let us think step by step.",
        "response_5": "Fae is dumpus. Dumpus is jompus. Fae is",
        "noise_response_6": "Fae is dumpus. Dumpus is jompus. Fae is jompus.",
        "noise_prompt_6": "Lempus is transparent. Dumpus is jompus. Fae is dumpus. True or false: Fae is transparent. Let us think step by step.",
        "response_6": "Fae is dumpus. Dumpus is jompus. Fae is jompus.",
        "noise_response_7": "Fae is dumpus. Dumpus is jompus. Fae is jompus. Jompus is",
        "noise_prompt_7": "Jompus is transparent. Dumpus is jompus. Fae is dumpus. True or false: Fae is wooden. Let us think step by step.",
        "response_7": "Fae is dumpus. Dumpus is jompus. Fae is jompus. Jompus is",
        "noise_response_8": "Fae is dumpus. Dumpus is jompus. Polly is jompus. Jompus is transparent.",
        "noise_prompt_8": "Jompus is transparent. Dumpus is jompus. Fae is dumpus. True or false: Fae is transparent. Let us think step by step.",
        "response_8": "Fae is dumpus. Dumpus is jompus. Fae is jompus. Jompus is transparent.",
        "noise_response_9": "Fae is dumpus. Dumpus is jompus. Fae is jompus. Jompus is sour. Fae is",
        "noise_prompt_9": "Jompus is transparent. Dumpus is jompus. Fae is dumpus. True or false: Fae is transparent. Let us think step by step.",
        "response_9": "Fae is dumpus. Dumpus is jompus. Fae is jompus. Jompus is transparent. Fae is",
        "noise_prompt_10": "Jompus is transparent. Dumpus is jompus. Fae is dumpus. True or false: Fae is transparent. Let us think step by step.",
        "response_10": "Fae is dumpus. Dumpus is jompus. Fae is jompus. Jompus is transparent. Fae is transparent.",
        "noise_response_10": "Fae is dumpus. Dumpus is jompus. Fae is jompus. Jompus is transparent. Fae is feisty.",
        "answer_token_id_0": 29943,
        "answer_token_pos_0": 380,
        "answer_token_0": "F",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 16766,
        "answer_token_pos_1": 383,
        "answer_token_1": "dump",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 360,
        "answer_token_pos_2": 387,
        "answer_token_2": "D",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 432,
        "answer_token_pos_3": 391,
        "answer_token_3": "j",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 383,
        "answer_token_pos_4": 395,
        "answer_token_4": "F",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 432,
        "answer_token_pos_5": 398,
        "answer_token_5": "j",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 435,
        "answer_token_pos_6": 402,
        "answer_token_6": "J",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 17772,
        "answer_token_pos_7": 406,
        "answer_token_7": "transparent",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 383,
        "answer_token_pos_8": 410,
        "answer_token_8": "F",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 17772,
        "answer_token_pos_9": 413,
        "answer_token_9": "transparent",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Jompuses are orange. Lempus is jompus. Stella is lempus.",
        "query": "True or false: Stella is orange.",
        "answer": "Stella is lempus. Lempus is jompus. Stella is jompus. Jompuses are orange. Stella is orange. True",
        "label": "True",
        "prompt": "Jompuses are orange. Lempus is jompus. Stella is lempus. True or false: Stella is orange. Let us think step by step.",
        "generated": "Stella is lempus. Lempus is jompus. Stella is jompus. Jompuses are orange. Stella is orange. True",
        "noise_response_0": "",
        "noise_prompt_0": "Jompuses are orange. Lempus is jompus. Stella is lempus. True or false: Polly is orange. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Stella is",
        "noise_prompt_1": "Jompuses are orange. Lempus is jompus. Stella is Impus. True or false: Stella is orange. Let us think step by step.",
        "response_1": "Stella is",
        "noise_response_2": "Stella is lempus.",
        "noise_prompt_2": "Jompuses are orange. impus is jompus. Stella is lempus. True or false: Stella is orange. Let us think step by step.",
        "response_2": "Stella is lempus.",
        "noise_response_3": "Stella is lempus. Lempus is",
        "noise_prompt_3": "Jompuses are orange. Lempus is Gorpus. Stella is lempus. True or false: Stella is orange. Let us think step by step.",
        "response_3": "Stella is lempus. Lempus is",
        "noise_response_4": "Wren is lempus. Lempus is jompus.",
        "noise_prompt_4": "Jompuses are orange. Lempus is jompus. Stella is lempus. True or false: Stella is orange. Let us think step by step.",
        "response_4": "Stella is lempus. Lempus is jompus.",
        "noise_response_5": "Stella is lempus. Lempus is gorpus. Stella is",
        "noise_prompt_5": "Jompuses are orange. Lempus is jompus. Stella is lempus. True or false: Stella is orange. Let us think step by step.",
        "response_5": "Stella is lempus. Lempus is jompus. Stella is",
        "noise_response_6": "Stella is lempus. Lempus is jompus. Stella is jompus.",
        "noise_prompt_6": "dumpus are orange. Lempus is jompus. Stella is lempus. True or false: Stella is orange. Let us think step by step.",
        "response_6": "Stella is lempus. Lempus is jompus. Stella is jompus.",
        "noise_response_7": "Stella is lempus. Lempus is jompus. Stella is jompus. Jompuses are",
        "noise_prompt_7": "Jompuses are orange. Lempus is jompus. Stella is lempus. True or false: Stella is happy. Let us think step by step.",
        "response_7": "Stella is lempus. Lempus is jompus. Stella is jompus. Jompuses are",
        "noise_response_8": "Stella is lempus. Lempus is jompus. Rex is jompus. Jompuses are orange.",
        "noise_prompt_8": "Jompuses are orange. Lempus is jompus. Stella is lempus. True or false: Stella is orange. Let us think step by step.",
        "response_8": "Stella is lempus. Lempus is jompus. Stella is jompus. Jompuses are orange.",
        "noise_response_9": "Stella is lempus. Lempus is jompus. Stella is jompus. Jompuses are angry. Stella is",
        "noise_prompt_9": "Jompuses are orange. Lempus is jompus. Stella is lempus. True or false: Stella is orange. Let us think step by step.",
        "response_9": "Stella is lempus. Lempus is jompus. Stella is jompus. Jompuses are orange. Stella is",
        "noise_prompt_10": "Jompuses are orange. Lempus is jompus. Stella is lempus. True or false: Stella is orange. Let us think step by step.",
        "response_10": "Stella is lempus. Lempus is jompus. Stella is jompus. Jompuses are orange. Stella is orange.",
        "noise_response_10": "Stella is lempus. Lempus is jompus. Stella is jompus. Jompuses are orange. Stella is discordant.",
        "answer_token_id_0": 855,
        "answer_token_pos_0": 380,
        "answer_token_0": "St",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 454,
        "answer_token_pos_1": 383,
        "answer_token_1": "le",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 365,
        "answer_token_pos_2": 387,
        "answer_token_2": "L",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 432,
        "answer_token_pos_3": 391,
        "answer_token_3": "j",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 624,
        "answer_token_pos_4": 395,
        "answer_token_4": "St",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 432,
        "answer_token_pos_5": 398,
        "answer_token_5": "j",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 435,
        "answer_token_pos_6": 402,
        "answer_token_6": "J",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 24841,
        "answer_token_pos_7": 406,
        "answer_token_7": "orange",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 624,
        "answer_token_pos_8": 410,
        "answer_token_8": "St",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 24841,
        "answer_token_pos_9": 413,
        "answer_token_9": "orange",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Sterpuses are fast. Brimpus is sterpus. Wren is brimpus.",
        "query": "True or false: Wren is fast.",
        "answer": "Wren is brimpus. Brimpus is sterpus. Wren is sterpus. Sterpuses are fast. Wren is fast. True",
        "label": "True",
        "prompt": "Sterpuses are fast. Brimpus is sterpus. Wren is brimpus. True or false: Wren is fast. Let us think step by step.",
        "generated": "Wren is brimpus. Brimpus is sterpus. Wren is sterpus. Sterpuses are fast. Wren is fast. True",
        "noise_response_0": "",
        "noise_prompt_0": "Sterpuses are fast. Brimpus is sterpus. Wren is brimpus. True or false: Max is fast. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Wren is",
        "noise_prompt_1": "Sterpuses are fast. Brimpus is sterpus. Wren is small. True or false: Wren is fast. Let us think step by step.",
        "response_1": "Wren is",
        "noise_response_2": "Wren is brimpus.",
        "noise_prompt_2": "Sterpuses are fast. vumpus is sterpus. Wren is brimpus. True or false: Wren is fast. Let us think step by step.",
        "response_2": "Wren is brimpus.",
        "noise_response_3": "Wren is brimpus. Brimpus is",
        "noise_prompt_3": "Sterpuses are fast. Brimpus is lorpus. Wren is brimpus. True or false: Wren is fast. Let us think step by step.",
        "response_3": "Wren is brimpus. Brimpus is",
        "noise_response_4": "Sally is brimpus. Brimpus is sterpus.",
        "noise_prompt_4": "Sterpuses are fast. Brimpus is sterpus. Wren is brimpus. True or false: Wren is fast. Let us think step by step.",
        "response_4": "Wren is brimpus. Brimpus is sterpus.",
        "noise_response_5": "Wren is brimpus. Brimpus is Rompus. Wren is",
        "noise_prompt_5": "Sterpuses are fast. Brimpus is sterpus. Wren is brimpus. True or false: Wren is fast. Let us think step by step.",
        "response_5": "Wren is brimpus. Brimpus is sterpus. Wren is",
        "noise_response_6": "Wren is brimpus. Brimpus is sterpus. Wren is sterpus.",
        "noise_prompt_6": "Sterpus are fast. Brimpus is sterpus. Wren is brimpus. True or false: Wren is fast. Let us think step by step.",
        "response_6": "Wren is brimpus. Brimpus is sterpus. Wren is sterpus.",
        "noise_response_7": "Wren is brimpus. Brimpus is sterpus. Wren is sterpus. Sterpuses are",
        "noise_prompt_7": "Sterpuses are fast. Brimpus is sterpus. Wren is brimpus. True or false: Wren is orange. Let us think step by step.",
        "response_7": "Wren is brimpus. Brimpus is sterpus. Wren is sterpus. Sterpuses are",
        "noise_response_8": "Wren is brimpus. Brimpus is sterpus. Sam is sterpus. Sterpuses are fast.",
        "noise_prompt_8": "Sterpuses are fast. Brimpus is sterpus. Wren is brimpus. True or false: Wren is fast. Let us think step by step.",
        "response_8": "Wren is brimpus. Brimpus is sterpus. Wren is sterpus. Sterpuses are fast.",
        "noise_response_9": "Wren is brimpus. Brimpus is sterpus. Wren is sterpus. Sterpuses are nervous. Wren is",
        "noise_prompt_9": "Sterpuses are fast. Brimpus is sterpus. Wren is brimpus. True or false: Wren is fast. Let us think step by step.",
        "response_9": "Wren is brimpus. Brimpus is sterpus. Wren is sterpus. Sterpuses are fast. Wren is",
        "noise_prompt_10": "Sterpuses are fast. Brimpus is sterpus. Wren is brimpus. True or false: Wren is fast. Let us think step by step.",
        "response_10": "Wren is brimpus. Brimpus is sterpus. Wren is sterpus. Sterpuses are fast. Wren is fast.",
        "noise_response_10": "Wren is brimpus. Brimpus is sterpus. Wren is sterpus. Sterpuses are fast. Wren is floral.",
        "answer_token_id_0": 29956,
        "answer_token_pos_0": 380,
        "answer_token_0": "W",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 1506,
        "answer_token_pos_1": 383,
        "answer_token_1": "br",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 1771,
        "answer_token_pos_2": 387,
        "answer_token_2": "Br",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 16864,
        "answer_token_pos_3": 391,
        "answer_token_3": "ster",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 399,
        "answer_token_pos_4": 395,
        "answer_token_4": "W",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 16864,
        "answer_token_pos_5": 398,
        "answer_token_5": "ster",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 28588,
        "answer_token_pos_6": 402,
        "answer_token_6": "Ster",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 5172,
        "answer_token_pos_7": 406,
        "answer_token_7": "fast",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 399,
        "answer_token_pos_8": 410,
        "answer_token_8": "W",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 5172,
        "answer_token_pos_9": 413,
        "answer_token_9": "fast",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Tumpuses are blue. Lempuses are tumpuses. Sam is lempus.",
        "query": "True or false: Sam is blue.",
        "answer": "Sam is lempus. Lempuses are tumpuses. Sam is tumpus. Tumpuses are blue. Sam is blue. True",
        "label": "True",
        "prompt": "Tumpuses are blue. Lempuses are tumpuses. Sam is lempus. True or false: Sam is blue. Let us think step by step.",
        "generated": "Sam is lempus. Lempuses are tumpuses. Sam is tumpus. Tumpuses are blue. Sam is blue. True",
        "noise_response_0": "",
        "noise_prompt_0": "Tumpuses are blue. Lempuses are tumpuses. Sam is lempus. True or false: Stella is blue. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Sam is",
        "noise_prompt_1": "Tumpuses are blue. Lempuses are tumpuses. Sam is lempus. True or false: Sam is blue. Let us think step by step.",
        "response_1": "Sam is",
        "noise_response_2": "Sam is lempus.",
        "noise_prompt_2": "Tumpuses are blue. Lempus are tumpuses. Sam is lempus. True or false: Sam is blue. Let us think step by step.",
        "response_2": "Sam is lempus.",
        "noise_response_3": "Sam is lempus. Lempuses are",
        "noise_prompt_3": "Tumpuses are blue. Lempuses are dull. Sam is lempus. True or false: Sam is blue. Let us think step by step.",
        "response_3": "Sam is lempus. Lempuses are",
        "noise_response_4": "Sally is lempus. Lempuses are tumpuses.",
        "noise_prompt_4": "Tumpuses are blue. Lempuses are tumpuses. Sam is lempus. True or false: Sam is blue. Let us think step by step.",
        "response_4": "Sam is lempus. Lempuses are tumpuses.",
        "noise_response_5": "Sam is lempus. Lempuses are sweet. Sam is",
        "noise_prompt_5": "Tumpuses are blue. Lempuses are tumpuses. Sam is lempus. True or false: Sam is blue. Let us think step by step.",
        "response_5": "Sam is lempus. Lempuses are tumpuses. Sam is",
        "noise_response_6": "Sam is lempus. Lempuses are tumpuses. Sam is tumpus.",
        "noise_prompt_6": "Lempus are blue. Lempuses are tumpuses. Sam is lempus. True or false: Sam is blue. Let us think step by step.",
        "response_6": "Sam is lempus. Lempuses are tumpuses. Sam is tumpus.",
        "noise_response_7": "Sam is lempus. Lempuses are tumpuses. Sam is tumpus. Tumpuses are",
        "noise_prompt_7": "Tumpuses are blue. Lempuses are tumpuses. Sam is lempus. True or false: Sam is muffled. Let us think step by step.",
        "response_7": "Sam is lempus. Lempuses are tumpuses. Sam is tumpus. Tumpuses are",
        "noise_response_8": "Sam is lempus. Lempuses are tumpuses. Stella is tumpus. Tumpuses are blue.",
        "noise_prompt_8": "Tumpuses are blue. Lempuses are tumpuses. Sam is lempus. True or false: Sam is blue. Let us think step by step.",
        "response_8": "Sam is lempus. Lempuses are tumpuses. Sam is tumpus. Tumpuses are blue.",
        "noise_response_9": "Sam is lempus. Lempuses are tumpuses. Sam is tumpus. Tumpuses are liquid. Sam is",
        "noise_prompt_9": "Tumpuses are blue. Lempuses are tumpuses. Sam is lempus. True or false: Sam is blue. Let us think step by step.",
        "response_9": "Sam is lempus. Lempuses are tumpuses. Sam is tumpus. Tumpuses are blue. Sam is",
        "noise_prompt_10": "Tumpuses are blue. Lempuses are tumpuses. Sam is lempus. True or false: Sam is blue. Let us think step by step.",
        "response_10": "Sam is lempus. Lempuses are tumpuses. Sam is tumpus. Tumpuses are blue. Sam is blue.",
        "noise_response_10": "Sam is lempus. Lempuses are tumpuses. Sam is tumpus. Tumpuses are blue. Sam is mean.",
        "answer_token_id_0": 22966,
        "answer_token_pos_0": 380,
        "answer_token_0": "Sam",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 454,
        "answer_token_pos_1": 383,
        "answer_token_1": "le",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 365,
        "answer_token_pos_2": 387,
        "answer_token_2": "L",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 260,
        "answer_token_pos_3": 391,
        "answer_token_3": "t",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 3685,
        "answer_token_pos_4": 395,
        "answer_token_4": "Sam",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 260,
        "answer_token_pos_5": 398,
        "answer_token_5": "t",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 323,
        "answer_token_pos_6": 402,
        "answer_token_6": "T",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 7254,
        "answer_token_pos_7": 406,
        "answer_token_7": "blue",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 3685,
        "answer_token_pos_8": 410,
        "answer_token_8": "Sam",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 7254,
        "answer_token_pos_9": 413,
        "answer_token_9": "blue",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Wumpuses are spicy. Rompus is wumpus. Stella is rompus.",
        "query": "True or false: Stella is spicy.",
        "answer": "Stella is rompus. Rompus is wumpus. Stella is wumpus. Wumpuses are spicy. Stella is spicy. True",
        "label": "True",
        "prompt": "Wumpuses are spicy. Rompus is wumpus. Stella is rompus. True or false: Stella is spicy. Let us think step by step.",
        "generated": "Stella is rompus. Rompus is wumpus. Stella is wumpus. Wumpuses are spicy. Stella is spicy. True",
        "noise_response_0": "",
        "noise_prompt_0": "Wumpuses are spicy. Rompus is wumpus. Stella is rompus. True or false: Fae is spicy. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Stella is",
        "noise_prompt_1": "Wumpuses are spicy. Rompus is wumpus. Stella is Zumpus. True or false: Stella is spicy. Let us think step by step.",
        "response_1": "Stella is",
        "noise_response_2": "Stella is rompus.",
        "noise_prompt_2": "Wumpuses are spicy. Zumpus is wumpus. Stella is rompus. True or false: Stella is spicy. Let us think step by step.",
        "response_2": "Stella is rompus.",
        "noise_response_3": "Stella is rompus. Rompus is",
        "noise_prompt_3": "Wumpuses are spicy. Rompus is cold. Stella is rompus. True or false: Stella is spicy. Let us think step by step.",
        "response_3": "Stella is rompus. Rompus is",
        "noise_response_4": "Fae is rompus. Rompus is wumpus.",
        "noise_prompt_4": "Wumpuses are spicy. Rompus is wumpus. Stella is rompus. True or false: Stella is spicy. Let us think step by step.",
        "response_4": "Stella is rompus. Rompus is wumpus.",
        "noise_response_5": "Stella is rompus. Rompus is blue. Stella is",
        "noise_prompt_5": "Wumpuses are spicy. Rompus is wumpus. Stella is rompus. True or false: Stella is spicy. Let us think step by step.",
        "response_5": "Stella is rompus. Rompus is wumpus. Stella is",
        "noise_response_6": "Stella is rompus. Rompus is wumpus. Stella is wumpus.",
        "noise_prompt_6": "Sam are spicy. Rompus is wumpus. Stella is rompus. True or false: Stella is spicy. Let us think step by step.",
        "response_6": "Stella is rompus. Rompus is wumpus. Stella is wumpus.",
        "noise_response_7": "Stella is rompus. Rompus is wumpus. Stella is wumpus. Wumpuses are",
        "noise_prompt_7": "Wumpuses are spicy. Rompus is wumpus. Stella is rompus. True or false: Stella is liquid. Let us think step by step.",
        "response_7": "Stella is rompus. Rompus is wumpus. Stella is wumpus. Wumpuses are",
        "noise_response_8": "Stella is rompus. Rompus is wumpus. Rex is wumpus. Wumpuses are spicy.",
        "noise_prompt_8": "Wumpuses are spicy. Rompus is wumpus. Stella is rompus. True or false: Stella is spicy. Let us think step by step.",
        "response_8": "Stella is rompus. Rompus is wumpus. Stella is wumpus. Wumpuses are spicy.",
        "noise_response_9": "Stella is rompus. Rompus is wumpus. Stella is wumpus. Wumpuses are rainy. Stella is",
        "noise_prompt_9": "Wumpuses are spicy. Rompus is wumpus. Stella is rompus. True or false: Stella is spicy. Let us think step by step.",
        "response_9": "Stella is rompus. Rompus is wumpus. Stella is wumpus. Wumpuses are spicy. Stella is",
        "noise_prompt_10": "Wumpuses are spicy. Rompus is wumpus. Stella is rompus. True or false: Stella is spicy. Let us think step by step.",
        "response_10": "Stella is rompus. Rompus is wumpus. Stella is wumpus. Wumpuses are spicy. Stella is spicy.",
        "noise_response_10": "Stella is rompus. Rompus is wumpus. Stella is wumpus. Wumpuses are spicy. Stella is transparent.",
        "answer_token_id_0": 855,
        "answer_token_pos_0": 380,
        "answer_token_0": "St",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 6017,
        "answer_token_pos_1": 383,
        "answer_token_1": "rom",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 6033,
        "answer_token_pos_2": 387,
        "answer_token_2": "Rom",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 281,
        "answer_token_pos_3": 391,
        "answer_token_3": "w",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 624,
        "answer_token_pos_4": 395,
        "answer_token_4": "St",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 281,
        "answer_token_pos_5": 398,
        "answer_token_5": "w",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 399,
        "answer_token_pos_6": 402,
        "answer_token_6": "W",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 805,
        "answer_token_pos_7": 406,
        "answer_token_7": "sp",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 624,
        "answer_token_pos_8": 410,
        "answer_token_8": "St",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 805,
        "answer_token_pos_9": 413,
        "answer_token_9": "sp",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Zumpuses are bitter. Lorpus is zumpus. Sally is lorpus.",
        "query": "True or false: Sally is moderate.",
        "answer": "Sally is lorpus. Lorpus is zumpus. Sally is zumpus. Zumpuses are bitter. Sally is bitter. False",
        "label": "False",
        "prompt": "Zumpuses are bitter. Lorpus is zumpus. Sally is lorpus. True or false: Sally is moderate. Let us think step by step.",
        "generated": "Sally is lorpus. Lorpus is zumpus. Sally is zumpus. Zumpuses are bitter. Sally is bitter. False",
        "noise_response_0": "",
        "noise_prompt_0": "Zumpuses are bitter. Lorpus is zumpus. Sally is lorpus. True or false: Stella is moderate. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Sally is",
        "noise_prompt_1": "Zumpuses are bitter. Lorpus is zumpus. Sally is luminous. True or false: Sally is moderate. Let us think step by step.",
        "response_1": "Sally is",
        "noise_response_2": "Sally is lorpus.",
        "noise_prompt_2": "Zumpuses are bitter. Yumpus is zumpus. Sally is lorpus. True or false: Sally is moderate. Let us think step by step.",
        "response_2": "Sally is lorpus.",
        "noise_response_3": "Sally is lorpus. Lorpus is",
        "noise_prompt_3": "Zumpuses are bitter. Lorpus is grimpus. Sally is lorpus. True or false: Sally is moderate. Let us think step by step.",
        "response_3": "Sally is lorpus. Lorpus is",
        "noise_response_4": "Polly is lorpus. Lorpus is zumpus.",
        "noise_prompt_4": "Zumpuses are bitter. Lorpus is zumpus. Sally is lorpus. True or false: Sally is moderate. Let us think step by step.",
        "response_4": "Sally is lorpus. Lorpus is zumpus.",
        "noise_response_5": "Sally is lorpus. Lorpus is Dumpus. Sally is",
        "noise_prompt_5": "Zumpuses are bitter. Lorpus is zumpus. Sally is lorpus. True or false: Sally is moderate. Let us think step by step.",
        "response_5": "Sally is lorpus. Lorpus is zumpus. Sally is",
        "noise_response_6": "Sally is lorpus. Lorpus is zumpus. Sally is zumpus.",
        "noise_prompt_6": "vumpus are bitter. Lorpus is zumpus. Sally is lorpus. True or false: Sally is moderate. Let us think step by step.",
        "response_6": "Sally is lorpus. Lorpus is zumpus. Sally is zumpus.",
        "noise_response_7": "Sally is lorpus. Lorpus is zumpus. Sally is zumpus. Zumpuses are",
        "noise_prompt_7": "Zumpuses are metallic. Lorpus is zumpus. Sally is lorpus. True or false: Sally is moderate. Let us think step by step.",
        "response_7": "Sally is lorpus. Lorpus is zumpus. Sally is zumpus. Zumpuses are",
        "noise_response_8": "Sally is lorpus. Lorpus is zumpus. Stella is zumpus. Zumpuses are bitter.",
        "noise_prompt_8": "Zumpuses are bitter. Lorpus is zumpus. Sally is lorpus. True or false: Sally is moderate. Let us think step by step.",
        "response_8": "Sally is lorpus. Lorpus is zumpus. Sally is zumpus. Zumpuses are bitter.",
        "noise_response_9": "Sally is lorpus. Lorpus is zumpus. Sally is zumpus. Zumpuses are earthy. Sally is",
        "noise_prompt_9": "Zumpuses are bitter. Lorpus is zumpus. Sally is lorpus. True or false: Sally is moderate. Let us think step by step.",
        "response_9": "Sally is lorpus. Lorpus is zumpus. Sally is zumpus. Zumpuses are bitter. Sally is",
        "noise_prompt_10": "Zumpuses are bitter. Lorpus is zumpus. Sally is lorpus. True or false: Sally is moderate. Let us think step by step.",
        "response_10": "Sally is lorpus. Lorpus is zumpus. Sally is zumpus. Zumpuses are bitter. Sally is bitter.",
        "noise_response_10": "Sally is lorpus. Lorpus is zumpus. Sally is zumpus. Zumpuses are bitter. Sally is melodic.",
        "answer_token_id_0": 29903,
        "answer_token_pos_0": 380,
        "answer_token_0": "S",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 301,
        "answer_token_pos_1": 383,
        "answer_token_1": "l",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 10980,
        "answer_token_pos_2": 387,
        "answer_token_2": "Lor",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 3356,
        "answer_token_pos_3": 391,
        "answer_token_3": "zum",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 317,
        "answer_token_pos_4": 395,
        "answer_token_4": "S",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 3356,
        "answer_token_pos_5": 398,
        "answer_token_5": "zum",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 796,
        "answer_token_pos_6": 402,
        "answer_token_6": "Z",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 22773,
        "answer_token_pos_7": 406,
        "answer_token_7": "bitter",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 317,
        "answer_token_pos_8": 410,
        "answer_token_8": "S",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 22773,
        "answer_token_pos_9": 413,
        "answer_token_9": "bitter",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Tumpuses are orange. Zumpus is tumpus. Sam is zumpus.",
        "query": "True or false: Sam is orange.",
        "answer": "Sam is zumpus. Zumpus is tumpus. Sam is tumpus. Tumpuses are orange. Sam is orange. True",
        "label": "True",
        "prompt": "Tumpuses are orange. Zumpus is tumpus. Sam is zumpus. True or false: Sam is orange. Let us think step by step.",
        "generated": "Sam is zumpus. Zumpus is tumpus. Sam is tumpus. Tumpuses are orange. Sam is orange. True",
        "noise_response_0": "",
        "noise_prompt_0": "Tumpuses are orange. Zumpus is tumpus. Sam is zumpus. True or false: Rex is orange. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Sam is",
        "noise_prompt_1": "Tumpuses are orange. Zumpus is tumpus. Sam is sterpus. True or false: Sam is orange. Let us think step by step.",
        "response_1": "Sam is",
        "noise_response_2": "Sam is zumpus.",
        "noise_prompt_2": "Tumpuses are orange. Shumpus is tumpus. Sam is zumpus. True or false: Sam is orange. Let us think step by step.",
        "response_2": "Sam is zumpus.",
        "noise_response_3": "Sam is zumpus. Zumpus is",
        "noise_prompt_3": "Tumpuses are orange. Zumpus is slow. Sam is zumpus. True or false: Sam is orange. Let us think step by step.",
        "response_3": "Sam is zumpus. Zumpus is",
        "noise_response_4": "Polly is zumpus. Zumpus is tumpus.",
        "noise_prompt_4": "Tumpuses are orange. Zumpus is tumpus. Sam is zumpus. True or false: Sam is orange. Let us think step by step.",
        "response_4": "Sam is zumpus. Zumpus is tumpus.",
        "noise_response_5": "Sam is zumpus. Zumpus is happy. Sam is",
        "noise_prompt_5": "Tumpuses are orange. Zumpus is tumpus. Sam is zumpus. True or false: Sam is orange. Let us think step by step.",
        "response_5": "Sam is zumpus. Zumpus is tumpus. Sam is",
        "noise_response_6": "Sam is zumpus. Zumpus is tumpus. Sam is tumpus.",
        "noise_prompt_6": "gorpus are orange. Zumpus is tumpus. Sam is zumpus. True or false: Sam is orange. Let us think step by step.",
        "response_6": "Sam is zumpus. Zumpus is tumpus. Sam is tumpus.",
        "noise_response_7": "Sam is zumpus. Zumpus is tumpus. Sam is tumpus. Tumpuses are",
        "noise_prompt_7": "Tumpuses are orange. Zumpus is tumpus. Sam is zumpus. True or false: Sam is angry. Let us think step by step.",
        "response_7": "Sam is zumpus. Zumpus is tumpus. Sam is tumpus. Tumpuses are",
        "noise_response_8": "Sam is zumpus. Zumpus is tumpus. Wren is tumpus. Tumpuses are orange.",
        "noise_prompt_8": "Tumpuses are orange. Zumpus is tumpus. Sam is zumpus. True or false: Sam is orange. Let us think step by step.",
        "response_8": "Sam is zumpus. Zumpus is tumpus. Sam is tumpus. Tumpuses are orange.",
        "noise_response_9": "Sam is zumpus. Zumpus is tumpus. Sam is tumpus. Tumpuses are muffled. Sam is",
        "noise_prompt_9": "Tumpuses are orange. Zumpus is tumpus. Sam is zumpus. True or false: Sam is orange. Let us think step by step.",
        "response_9": "Sam is zumpus. Zumpus is tumpus. Sam is tumpus. Tumpuses are orange. Sam is",
        "noise_prompt_10": "Tumpuses are orange. Zumpus is tumpus. Sam is zumpus. True or false: Sam is orange. Let us think step by step.",
        "response_10": "Sam is zumpus. Zumpus is tumpus. Sam is tumpus. Tumpuses are orange. Sam is orange.",
        "noise_response_10": "Sam is zumpus. Zumpus is tumpus. Sam is tumpus. Tumpuses are orange. Sam is sweet.",
        "answer_token_id_0": 22966,
        "answer_token_pos_0": 380,
        "answer_token_0": "Sam",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 3356,
        "answer_token_pos_1": 383,
        "answer_token_1": "zum",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 796,
        "answer_token_pos_2": 387,
        "answer_token_2": "Z",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 260,
        "answer_token_pos_3": 391,
        "answer_token_3": "t",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 323,
        "answer_token_pos_4": 395,
        "answer_token_4": "T",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 260,
        "answer_token_pos_5": 398,
        "answer_token_5": "t",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 323,
        "answer_token_pos_6": 402,
        "answer_token_6": "T",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 24841,
        "answer_token_pos_7": 406,
        "answer_token_7": "orange",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 3685,
        "answer_token_pos_8": 410,
        "answer_token_8": "Sam",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 24841,
        "answer_token_pos_9": 413,
        "answer_token_9": "orange",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Shumpus is bright. Zumpus is shumpus. Wren is zumpus.",
        "query": "True or false: Wren is bright.",
        "answer": "Wren is zumpus. Zumpus is shumpus. Wren is shumpus. Shumpus is bright. Wren is bright. True",
        "label": "True",
        "prompt": "Shumpus is bright. Zumpus is shumpus. Wren is zumpus. True or false: Wren is bright. Let us think step by step.",
        "generated": "Wren is zumpus. Zumpus is shumpus. Wren is shumpus. Shumpus is bright. Wren is bright. True",
        "noise_response_0": "",
        "noise_prompt_0": "Shumpus is bright. Zumpus is shumpus. Wren is zumpus. True or false: Sally is bright. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Wren is",
        "noise_prompt_1": "Shumpus is bright. Zumpus is shumpus. Wren is yumpus. True or false: Wren is bright. Let us think step by step.",
        "response_1": "Wren is",
        "noise_response_2": "Wren is zumpus.",
        "noise_prompt_2": "Shumpus is bright. Gorpus is shumpus. Wren is zumpus. True or false: Wren is bright. Let us think step by step.",
        "response_2": "Wren is zumpus.",
        "noise_response_3": "Wren is zumpus. Zumpus is",
        "noise_prompt_3": "Shumpus is bright. Zumpus is bitter. Wren is zumpus. True or false: Wren is bright. Let us think step by step.",
        "response_3": "Wren is zumpus. Zumpus is",
        "noise_response_4": "Rex is zumpus. Zumpus is shumpus.",
        "noise_prompt_4": "Shumpus is bright. Zumpus is shumpus. Wren is zumpus. True or false: Wren is bright. Let us think step by step.",
        "response_4": "Wren is zumpus. Zumpus is shumpus.",
        "noise_response_5": "Wren is zumpus. Zumpus is bright. Wren is",
        "noise_prompt_5": "Shumpus is bright. Zumpus is shumpus. Wren is zumpus. True or false: Wren is bright. Let us think step by step.",
        "response_5": "Wren is zumpus. Zumpus is shumpus. Wren is",
        "noise_response_6": "Wren is zumpus. Zumpus is shumpus. Wren is shumpus.",
        "noise_prompt_6": "Dumpus is bright. Zumpus is shumpus. Wren is zumpus. True or false: Wren is bright. Let us think step by step.",
        "response_6": "Wren is zumpus. Zumpus is shumpus. Wren is shumpus.",
        "noise_response_7": "Wren is zumpus. Zumpus is shumpus. Wren is shumpus. Shumpus is",
        "noise_prompt_7": "Shumpus is bright. Zumpus is shumpus. Wren is zumpus. True or false: Wren is overcast. Let us think step by step.",
        "response_7": "Wren is zumpus. Zumpus is shumpus. Wren is shumpus. Shumpus is",
        "noise_response_8": "Wren is zumpus. Zumpus is shumpus. Sam is shumpus. Shumpus is bright.",
        "noise_prompt_8": "Shumpus is bright. Zumpus is shumpus. Wren is zumpus. True or false: Wren is bright. Let us think step by step.",
        "response_8": "Wren is zumpus. Zumpus is shumpus. Wren is shumpus. Shumpus is bright.",
        "noise_response_9": "Wren is zumpus. Zumpus is shumpus. Wren is shumpus. Shumpus is muffled. Wren is",
        "noise_prompt_9": "Shumpus is bright. Zumpus is shumpus. Wren is zumpus. True or false: Wren is bright. Let us think step by step.",
        "response_9": "Wren is zumpus. Zumpus is shumpus. Wren is shumpus. Shumpus is bright. Wren is",
        "noise_prompt_10": "Shumpus is bright. Zumpus is shumpus. Wren is zumpus. True or false: Wren is bright. Let us think step by step.",
        "response_10": "Wren is zumpus. Zumpus is shumpus. Wren is shumpus. Shumpus is bright. Wren is bright.",
        "noise_response_10": "Wren is zumpus. Zumpus is shumpus. Wren is shumpus. Shumpus is bright. Wren is melodic.",
        "answer_token_id_0": 29956,
        "answer_token_pos_0": 380,
        "answer_token_0": "W",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 3356,
        "answer_token_pos_1": 383,
        "answer_token_1": "zum",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 796,
        "answer_token_pos_2": 387,
        "answer_token_2": "Z",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 528,
        "answer_token_pos_3": 391,
        "answer_token_3": "sh",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 399,
        "answer_token_pos_4": 395,
        "answer_token_4": "W",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 528,
        "answer_token_pos_5": 398,
        "answer_token_5": "sh",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 1383,
        "answer_token_pos_6": 402,
        "answer_token_6": "Sh",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 11785,
        "answer_token_pos_7": 406,
        "answer_token_7": "bright",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 399,
        "answer_token_pos_8": 410,
        "answer_token_8": "W",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 11785,
        "answer_token_pos_9": 413,
        "answer_token_9": "bright",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Grimpus is earthy. Yumpuses are grimpuses. Sally is yumpus.",
        "query": "True or false: Sally is earthy.",
        "answer": "Sally is yumpus. Yumpuses are grimpuses. Sally is grimpus. Grimpus is earthy. Sally is earthy. True",
        "label": "True",
        "prompt": "Grimpus is earthy. Yumpuses are grimpuses. Sally is yumpus. True or false: Sally is earthy. Let us think step by step.",
        "generated": "Sally is yumpus. Yumpuses are grimpuses. Sally is grimpus. Grimpus is earthy. Sally is earthy. True",
        "noise_response_0": "",
        "noise_prompt_0": "Grimpus is earthy. Yumpuses are grimpuses. Sally is yumpus. True or false: Alex is earthy. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Sally is",
        "noise_prompt_1": "Grimpus is earthy. Yumpuses are grimpuses. Sally is dumpus. True or false: Sally is earthy. Let us think step by step.",
        "response_1": "Sally is",
        "noise_response_2": "Sally is yumpus.",
        "noise_prompt_2": "Grimpus is earthy. yumpus are grimpuses. Sally is yumpus. True or false: Sally is earthy. Let us think step by step.",
        "response_2": "Sally is yumpus.",
        "noise_response_3": "Sally is yumpus. Yumpuses are",
        "noise_prompt_3": "Grimpus is earthy. Yumpuses are Numpus. Sally is yumpus. True or false: Sally is earthy. Let us think step by step.",
        "response_3": "Sally is yumpus. Yumpuses are",
        "noise_response_4": "Polly is yumpus. Yumpuses are grimpuses.",
        "noise_prompt_4": "Grimpus is earthy. Yumpuses are grimpuses. Sally is yumpus. True or false: Sally is earthy. Let us think step by step.",
        "response_4": "Sally is yumpus. Yumpuses are grimpuses.",
        "noise_response_5": "Sally is yumpus. Yumpuses are sterpus. Sally is",
        "noise_prompt_5": "Grimpus is earthy. Yumpuses are grimpuses. Sally is yumpus. True or false: Sally is earthy. Let us think step by step.",
        "response_5": "Sally is yumpus. Yumpuses are grimpuses. Sally is",
        "noise_response_6": "Sally is yumpus. Yumpuses are grimpuses. Sally is grimpus.",
        "noise_prompt_6": "Shumpus is earthy. Yumpuses are grimpuses. Sally is yumpus. True or false: Sally is earthy. Let us think step by step.",
        "response_6": "Sally is yumpus. Yumpuses are grimpuses. Sally is grimpus.",
        "noise_response_7": "Sally is yumpus. Yumpuses are grimpuses. Sally is grimpus. Grimpus is",
        "noise_prompt_7": "Grimpus is earthy. Yumpuses are grimpuses. Sally is yumpus. True or false: Sally is aggressive. Let us think step by step.",
        "response_7": "Sally is yumpus. Yumpuses are grimpuses. Sally is grimpus. Grimpus is",
        "noise_response_8": "Sally is yumpus. Yumpuses are grimpuses. Polly is grimpus. Grimpus is earthy.",
        "noise_prompt_8": "Grimpus is earthy. Yumpuses are grimpuses. Sally is yumpus. True or false: Sally is earthy. Let us think step by step.",
        "response_8": "Sally is yumpus. Yumpuses are grimpuses. Sally is grimpus. Grimpus is earthy.",
        "noise_response_9": "Sally is yumpus. Yumpuses are grimpuses. Sally is grimpus. Grimpus is transparent. Sally is",
        "noise_prompt_9": "Grimpus is earthy. Yumpuses are grimpuses. Sally is yumpus. True or false: Sally is earthy. Let us think step by step.",
        "response_9": "Sally is yumpus. Yumpuses are grimpuses. Sally is grimpus. Grimpus is earthy. Sally is",
        "noise_prompt_10": "Grimpus is earthy. Yumpuses are grimpuses. Sally is yumpus. True or false: Sally is earthy. Let us think step by step.",
        "response_10": "Sally is yumpus. Yumpuses are grimpuses. Sally is grimpus. Grimpus is earthy. Sally is earthy.",
        "noise_response_10": "Sally is yumpus. Yumpuses are grimpuses. Sally is grimpus. Grimpus is earthy. Sally is bright.",
        "answer_token_id_0": 29903,
        "answer_token_pos_0": 380,
        "answer_token_0": "S",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 343,
        "answer_token_pos_1": 383,
        "answer_token_1": "y",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 612,
        "answer_token_pos_2": 387,
        "answer_token_2": "Y",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 867,
        "answer_token_pos_3": 391,
        "answer_token_3": "gr",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 317,
        "answer_token_pos_4": 395,
        "answer_token_4": "S",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 867,
        "answer_token_pos_5": 398,
        "answer_token_5": "gr",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 1632,
        "answer_token_pos_6": 402,
        "answer_token_6": "Gr",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 8437,
        "answer_token_pos_7": 406,
        "answer_token_7": "earth",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 317,
        "answer_token_pos_8": 410,
        "answer_token_8": "S",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 8437,
        "answer_token_pos_9": 413,
        "answer_token_9": "earth",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Dumpus is sweet. Wumpus is dumpus. Sally is wumpus.",
        "query": "True or false: Sally is sweet.",
        "answer": "Sally is wumpus. Wumpus is dumpus. Sally is dumpus. Dumpus is sweet. Sally is sweet. True",
        "label": "True",
        "prompt": "Dumpus is sweet. Wumpus is dumpus. Sally is wumpus. True or false: Sally is sweet. Let us think step by step.",
        "generated": "Sally is wumpus. Wumpus is dumpus. Sally is dumpus. Dumpus is sweet. Sally is sweet. True",
        "noise_response_0": "",
        "noise_prompt_0": "Dumpus is sweet. Wumpus is dumpus. Sally is wumpus. True or false: Max is sweet. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Sally is",
        "noise_prompt_1": "Dumpus is sweet. Wumpus is dumpus. Sally is small. True or false: Sally is sweet. Let us think step by step.",
        "response_1": "Sally is",
        "noise_response_2": "Sally is wumpus.",
        "noise_prompt_2": "Dumpus is sweet. Rex is dumpus. Sally is wumpus. True or false: Sally is sweet. Let us think step by step.",
        "response_2": "Sally is wumpus.",
        "noise_response_3": "Sally is wumpus. Wumpus is",
        "noise_prompt_3": "Dumpus is sweet. Wumpus is lempus. Sally is wumpus. True or false: Sally is sweet. Let us think step by step.",
        "response_3": "Sally is wumpus. Wumpus is",
        "noise_response_4": "Alex is wumpus. Wumpus is dumpus.",
        "noise_prompt_4": "Dumpus is sweet. Wumpus is dumpus. Sally is wumpus. True or false: Sally is sweet. Let us think step by step.",
        "response_4": "Sally is wumpus. Wumpus is dumpus.",
        "noise_response_5": "Sally is wumpus. Wumpus is Lempus. Sally is",
        "noise_prompt_5": "Dumpus is sweet. Wumpus is dumpus. Sally is wumpus. True or false: Sally is sweet. Let us think step by step.",
        "response_5": "Sally is wumpus. Wumpus is dumpus. Sally is",
        "noise_response_6": "Sally is wumpus. Wumpus is dumpus. Sally is dumpus.",
        "noise_prompt_6": "vumpus is sweet. Wumpus is dumpus. Sally is wumpus. True or false: Sally is sweet. Let us think step by step.",
        "response_6": "Sally is wumpus. Wumpus is dumpus. Sally is dumpus.",
        "noise_response_7": "Sally is wumpus. Wumpus is dumpus. Sally is dumpus. Dumpus is",
        "noise_prompt_7": "Dumpus is sweet. Wumpus is dumpus. Sally is wumpus. True or false: Sally is liquid. Let us think step by step.",
        "response_7": "Sally is wumpus. Wumpus is dumpus. Sally is dumpus. Dumpus is",
        "noise_response_8": "Sally is wumpus. Wumpus is dumpus. Stella is dumpus. Dumpus is sweet.",
        "noise_prompt_8": "Dumpus is sweet. Wumpus is dumpus. Sally is wumpus. True or false: Sally is sweet. Let us think step by step.",
        "response_8": "Sally is wumpus. Wumpus is dumpus. Sally is dumpus. Dumpus is sweet.",
        "noise_response_9": "Sally is wumpus. Wumpus is dumpus. Sally is dumpus. Dumpus is rainy. Sally is",
        "noise_prompt_9": "Dumpus is sweet. Wumpus is dumpus. Sally is wumpus. True or false: Sally is sweet. Let us think step by step.",
        "response_9": "Sally is wumpus. Wumpus is dumpus. Sally is dumpus. Dumpus is sweet. Sally is",
        "noise_prompt_10": "Dumpus is sweet. Wumpus is dumpus. Sally is wumpus. True or false: Sally is sweet. Let us think step by step.",
        "response_10": "Sally is wumpus. Wumpus is dumpus. Sally is dumpus. Dumpus is sweet. Sally is sweet.",
        "noise_response_10": "Sally is wumpus. Wumpus is dumpus. Sally is dumpus. Dumpus is sweet. Sally is sunny.",
        "answer_token_id_0": 29903,
        "answer_token_pos_0": 380,
        "answer_token_0": "S",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 281,
        "answer_token_pos_1": 383,
        "answer_token_1": "w",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 399,
        "answer_token_pos_2": 387,
        "answer_token_2": "W",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 16766,
        "answer_token_pos_3": 391,
        "answer_token_3": "dump",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 317,
        "answer_token_pos_4": 395,
        "answer_token_4": "S",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 16766,
        "answer_token_pos_5": 398,
        "answer_token_5": "dump",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 360,
        "answer_token_pos_6": 402,
        "answer_token_6": "D",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 14225,
        "answer_token_pos_7": 406,
        "answer_token_7": "sweet",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 317,
        "answer_token_pos_8": 410,
        "answer_token_8": "S",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 14225,
        "answer_token_pos_9": 413,
        "answer_token_9": "sweet",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Tumpuses are liquid. Sterpuses are tumpuses. Stella is sterpus.",
        "query": "True or false: Stella is liquid.",
        "answer": "Stella is sterpus. Sterpuses are tumpuses. Stella is tumpus. Tumpuses are liquid. Stella is liquid. True",
        "label": "True",
        "prompt": "Tumpuses are liquid. Sterpuses are tumpuses. Stella is sterpus. True or false: Stella is liquid. Let us think step by step.",
        "generated": "Stella is sterpus. Sterpuses are tumpuses. Stella is tumpus. Tumpuses are liquid. Stella is liquid. True",
        "noise_response_0": "",
        "noise_prompt_0": "Tumpuses are liquid. Sterpuses are tumpuses. Stella is sterpus. True or false: Polly is liquid. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Stella is",
        "noise_prompt_1": "Tumpuses are liquid. Sterpuses are tumpuses. Stella is brimpus. True or false: Stella is liquid. Let us think step by step.",
        "response_1": "Stella is",
        "noise_response_2": "Stella is sterpus.",
        "noise_prompt_2": "Tumpuses are liquid. Tumpus are tumpuses. Stella is sterpus. True or false: Stella is liquid. Let us think step by step.",
        "response_2": "Stella is sterpus.",
        "noise_response_3": "Stella is sterpus. Sterpuses are",
        "noise_prompt_3": "Tumpuses are liquid. Sterpuses are muffled. Stella is sterpus. True or false: Stella is liquid. Let us think step by step.",
        "response_3": "Stella is sterpus. Sterpuses are",
        "noise_response_4": "Stella is sterpus. Rex are tumpuses.",
        "noise_prompt_4": "Tumpuses are liquid. Sterpuses are tumpuses. Stella is sterpus. True or false: Stella is liquid. Let us think step by step.",
        "response_4": "Stella is sterpus. Sterpuses are tumpuses.",
        "noise_response_5": "Stella is sterpus. Sterpuses are angry. Stella is",
        "noise_prompt_5": "Tumpuses are liquid. Sterpuses are tumpuses. Stella is sterpus. True or false: Stella is liquid. Let us think step by step.",
        "response_5": "Stella is sterpus. Sterpuses are tumpuses. Stella is",
        "noise_response_6": "Stella is sterpus. Sterpuses are tumpuses. Stella is tumpus.",
        "noise_prompt_6": "Gorpus are liquid. Sterpuses are tumpuses. Stella is sterpus. True or false: Stella is liquid. Let us think step by step.",
        "response_6": "Stella is sterpus. Sterpuses are tumpuses. Stella is tumpus.",
        "noise_response_7": "Stella is sterpus. Sterpuses are tumpuses. Stella is tumpus. Tumpuses are",
        "noise_prompt_7": "Tumpuses are liquid. Sterpuses are tumpuses. Stella is sterpus. True or false: Stella is sweet. Let us think step by step.",
        "response_7": "Stella is sterpus. Sterpuses are tumpuses. Stella is tumpus. Tumpuses are",
        "noise_response_8": "Stella is sterpus. Sterpuses are tumpuses. Fae is tumpus. Tumpuses are liquid.",
        "noise_prompt_8": "Tumpuses are liquid. Sterpuses are tumpuses. Stella is sterpus. True or false: Stella is liquid. Let us think step by step.",
        "response_8": "Stella is sterpus. Sterpuses are tumpuses. Stella is tumpus. Tumpuses are liquid.",
        "noise_response_9": "Stella is sterpus. Sterpuses are tumpuses. Stella is tumpus. Tumpuses are wooden. Stella is",
        "noise_prompt_9": "Tumpuses are liquid. Sterpuses are tumpuses. Stella is sterpus. True or false: Stella is liquid. Let us think step by step.",
        "response_9": "Stella is sterpus. Sterpuses are tumpuses. Stella is tumpus. Tumpuses are liquid. Stella is",
        "noise_prompt_10": "Tumpuses are liquid. Sterpuses are tumpuses. Stella is sterpus. True or false: Stella is liquid. Let us think step by step.",
        "response_10": "Stella is sterpus. Sterpuses are tumpuses. Stella is tumpus. Tumpuses are liquid. Stella is liquid.",
        "noise_response_10": "Stella is sterpus. Sterpuses are tumpuses. Stella is tumpus. Tumpuses are liquid. Stella is rainy.",
        "answer_token_id_0": 855,
        "answer_token_pos_0": 380,
        "answer_token_0": "St",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 16864,
        "answer_token_pos_1": 383,
        "answer_token_1": "ster",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 28588,
        "answer_token_pos_2": 387,
        "answer_token_2": "Ster",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 260,
        "answer_token_pos_3": 391,
        "answer_token_3": "t",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 624,
        "answer_token_pos_4": 395,
        "answer_token_4": "St",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 260,
        "answer_token_pos_5": 398,
        "answer_token_5": "t",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 323,
        "answer_token_pos_6": 402,
        "answer_token_6": "T",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 23904,
        "answer_token_pos_7": 406,
        "answer_token_7": "liquid",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 624,
        "answer_token_pos_8": 410,
        "answer_token_8": "St",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 23904,
        "answer_token_pos_9": 413,
        "answer_token_9": "liquid",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Lempuses are brown. Tumpuses are lempuses. Sally is tumpus.",
        "query": "True or false: Sally is brown.",
        "answer": "Sally is tumpus. Tumpuses are lempuses. Sally is lempus. Lempuses are brown. Sally is brown. True",
        "label": "True",
        "prompt": "Lempuses are brown. Tumpuses are lempuses. Sally is tumpus. True or false: Sally is brown. Let us think step by step.",
        "generated": "Sally is tumpus. Tumpuses are lempuses. Sally is lempus. Lempuses are brown. Sally is brown. True",
        "noise_response_0": "",
        "noise_prompt_0": "Lempuses are brown. Tumpuses are lempuses. Sally is tumpus. True or false: Polly is brown. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Sally is",
        "noise_prompt_1": "Lempuses are brown. Tumpuses are lempuses. Sally is slow. True or false: Sally is brown. Let us think step by step.",
        "response_1": "Sally is",
        "noise_response_2": "Sally is tumpus.",
        "noise_prompt_2": "Lempuses are brown. vumpus are lempuses. Sally is tumpus. True or false: Sally is brown. Let us think step by step.",
        "response_2": "Sally is tumpus.",
        "noise_response_3": "Sally is tumpus. Tumpuses are",
        "noise_prompt_3": "Lempuses are brown. Tumpuses are Sterpus. Sally is tumpus. True or false: Sally is brown. Let us think step by step.",
        "response_3": "Sally is tumpus. Tumpuses are",
        "noise_response_4": "Fae is tumpus. Tumpuses are lempuses.",
        "noise_prompt_4": "Lempuses are brown. Tumpuses are lempuses. Sally is tumpus. True or false: Sally is brown. Let us think step by step.",
        "response_4": "Sally is tumpus. Tumpuses are lempuses.",
        "noise_response_5": "Sally is tumpus. Tumpuses are wumpus. Sally is",
        "noise_prompt_5": "Lempuses are brown. Tumpuses are lempuses. Sally is tumpus. True or false: Sally is brown. Let us think step by step.",
        "response_5": "Sally is tumpus. Tumpuses are lempuses. Sally is",
        "noise_response_6": "Sally is tumpus. Tumpuses are lempuses. Sally is lempus.",
        "noise_prompt_6": "Rompus are brown. Tumpuses are lempuses. Sally is tumpus. True or false: Sally is brown. Let us think step by step.",
        "response_6": "Sally is tumpus. Tumpuses are lempuses. Sally is lempus.",
        "noise_response_7": "Sally is tumpus. Tumpuses are lempuses. Sally is lempus. Lempuses are",
        "noise_prompt_7": "Lempuses are brown. Tumpuses are lempuses. Sally is tumpus. True or false: Sally is temperate. Let us think step by step.",
        "response_7": "Sally is tumpus. Tumpuses are lempuses. Sally is lempus. Lempuses are",
        "noise_response_8": "Sally is tumpus. Tumpuses are lempuses. Polly is lempus. Lempuses are brown.",
        "noise_prompt_8": "Lempuses are brown. Tumpuses are lempuses. Sally is tumpus. True or false: Sally is brown. Let us think step by step.",
        "response_8": "Sally is tumpus. Tumpuses are lempuses. Sally is lempus. Lempuses are brown.",
        "noise_response_9": "Sally is tumpus. Tumpuses are lempuses. Sally is lempus. Lempuses are angry. Sally is",
        "noise_prompt_9": "Lempuses are brown. Tumpuses are lempuses. Sally is tumpus. True or false: Sally is brown. Let us think step by step.",
        "response_9": "Sally is tumpus. Tumpuses are lempuses. Sally is lempus. Lempuses are brown. Sally is",
        "noise_prompt_10": "Lempuses are brown. Tumpuses are lempuses. Sally is tumpus. True or false: Sally is brown. Let us think step by step.",
        "response_10": "Sally is tumpus. Tumpuses are lempuses. Sally is lempus. Lempuses are brown. Sally is brown.",
        "noise_response_10": "Sally is tumpus. Tumpuses are lempuses. Sally is lempus. Lempuses are brown. Sally is metallic.",
        "answer_token_id_0": 29903,
        "answer_token_pos_0": 380,
        "answer_token_0": "S",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 260,
        "answer_token_pos_1": 383,
        "answer_token_1": "t",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 323,
        "answer_token_pos_2": 387,
        "answer_token_2": "T",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 454,
        "answer_token_pos_3": 391,
        "answer_token_3": "le",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 317,
        "answer_token_pos_4": 395,
        "answer_token_4": "S",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 454,
        "answer_token_pos_5": 398,
        "answer_token_5": "le",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 365,
        "answer_token_pos_6": 402,
        "answer_token_6": "L",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 17354,
        "answer_token_pos_7": 406,
        "answer_token_7": "brown",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 317,
        "answer_token_pos_8": 410,
        "answer_token_8": "S",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 17354,
        "answer_token_pos_9": 413,
        "answer_token_9": "brown",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Shumpus is floral. Grimpuses are shumpuses. Polly is grimpus.",
        "query": "True or false: Polly is floral.",
        "answer": "Polly is grimpus. Grimpuses are shumpuses. Polly is shumpus. Shumpus is floral. Polly is floral. True",
        "label": "True",
        "prompt": "Shumpus is floral. Grimpuses are shumpuses. Polly is grimpus. True or false: Polly is floral. Let us think step by step.",
        "generated": "Polly is grimpus. Grimpuses are shumpuses. Polly is shumpus. Shumpus is floral. Polly is floral. True",
        "noise_response_0": "",
        "noise_prompt_0": "Shumpus is floral. Grimpuses are shumpuses. Polly is grimpus. True or false: Wren is floral. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Polly is",
        "noise_prompt_1": "Shumpus is floral. Grimpuses are shumpuses. Polly is Dumpus. True or false: Polly is floral. Let us think step by step.",
        "response_1": "Polly is",
        "noise_response_2": "Polly is grimpus.",
        "noise_prompt_2": "Shumpus is floral. Numpus are shumpuses. Polly is grimpus. True or false: Polly is floral. Let us think step by step.",
        "response_2": "Polly is grimpus.",
        "noise_response_3": "Polly is grimpus. Grimpuses are",
        "noise_prompt_3": "Shumpus is floral. Grimpuses are aggressive. Polly is grimpus. True or false: Polly is floral. Let us think step by step.",
        "response_3": "Polly is grimpus. Grimpuses are",
        "noise_response_4": "Sam is grimpus. Grimpuses are shumpuses.",
        "noise_prompt_4": "Shumpus is floral. Grimpuses are shumpuses. Polly is grimpus. True or false: Polly is floral. Let us think step by step.",
        "response_4": "Polly is grimpus. Grimpuses are shumpuses.",
        "noise_response_5": "Polly is grimpus. Grimpuses are hot. Polly is",
        "noise_prompt_5": "Shumpus is floral. Grimpuses are shumpuses. Polly is grimpus. True or false: Polly is floral. Let us think step by step.",
        "response_5": "Polly is grimpus. Grimpuses are shumpuses. Polly is",
        "noise_response_6": "Polly is grimpus. Grimpuses are shumpuses. Polly is shumpus.",
        "noise_prompt_6": "Grimpus is floral. Grimpuses are shumpuses. Polly is grimpus. True or false: Polly is floral. Let us think step by step.",
        "response_6": "Polly is grimpus. Grimpuses are shumpuses. Polly is shumpus.",
        "noise_response_7": "Polly is grimpus. Grimpuses are shumpuses. Polly is shumpus. Shumpus is",
        "noise_prompt_7": "Shumpus is floral. Grimpuses are shumpuses. Polly is grimpus. True or false: Polly is fast. Let us think step by step.",
        "response_7": "Polly is grimpus. Grimpuses are shumpuses. Polly is shumpus. Shumpus is",
        "noise_response_8": "Polly is grimpus. Grimpuses are shumpuses. Fae is shumpus. Shumpus is floral.",
        "noise_prompt_8": "Shumpus is floral. Grimpuses are shumpuses. Polly is grimpus. True or false: Polly is floral. Let us think step by step.",
        "response_8": "Polly is grimpus. Grimpuses are shumpuses. Polly is shumpus. Shumpus is floral.",
        "noise_response_9": "Polly is grimpus. Grimpuses are shumpuses. Polly is shumpus. Shumpus is orange. Polly is",
        "noise_prompt_9": "Shumpus is floral. Grimpuses are shumpuses. Polly is grimpus. True or false: Polly is floral. Let us think step by step.",
        "response_9": "Polly is grimpus. Grimpuses are shumpuses. Polly is shumpus. Shumpus is floral. Polly is",
        "noise_prompt_10": "Shumpus is floral. Grimpuses are shumpuses. Polly is grimpus. True or false: Polly is floral. Let us think step by step.",
        "response_10": "Polly is grimpus. Grimpuses are shumpuses. Polly is shumpus. Shumpus is floral. Polly is floral.",
        "noise_response_10": "Polly is grimpus. Grimpuses are shumpuses. Polly is shumpus. Shumpus is floral. Polly is small.",
        "answer_token_id_0": 7713,
        "answer_token_pos_0": 380,
        "answer_token_0": "Pol",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 867,
        "answer_token_pos_1": 383,
        "answer_token_1": "gr",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 1632,
        "answer_token_pos_2": 387,
        "answer_token_2": "Gr",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 528,
        "answer_token_pos_3": 391,
        "answer_token_3": "sh",
        "end_token_pos_3": 390,
        "end_token_id_3": 526,
        "answer_token_id_4": 2043,
        "answer_token_pos_4": 395,
        "answer_token_4": "Pol",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 528,
        "answer_token_pos_5": 398,
        "answer_token_5": "sh",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 1383,
        "answer_token_pos_6": 402,
        "answer_token_6": "Sh",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 1652,
        "answer_token_pos_7": 406,
        "answer_token_7": "fl",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 2043,
        "answer_token_pos_8": 410,
        "answer_token_8": "Pol",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 1652,
        "answer_token_pos_9": 413,
        "answer_token_9": "fl",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Impuses are loud. Vumpus is impus. Fae is vumpus.",
        "query": "True or false: Fae is loud.",
        "answer": "Fae is vumpus. Vumpus is impus. Fae is impus. Impuses are loud. Fae is loud. True",
        "label": "True",
        "prompt": "Impuses are loud. Vumpus is impus. Fae is vumpus. True or false: Fae is loud. Let us think step by step.",
        "generated": "Fae is vumpus. Vumpus is impus. Fae is impus. Impuses are loud. Fae is loud. True",
        "noise_response_0": "",
        "noise_prompt_0": "Impuses are loud. Vumpus is impus. Fae is vumpus. True or false: Rex is loud. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Fae is",
        "noise_prompt_1": "Impuses are loud. Vumpus is impus. Fae is Rompus. True or false: Fae is loud. Let us think step by step.",
        "response_1": "Fae is",
        "noise_response_2": "Fae is vumpus.",
        "noise_prompt_2": "Impuses are loud. lorpus is impus. Fae is vumpus. True or false: Fae is loud. Let us think step by step.",
        "response_2": "Fae is vumpus.",
        "noise_response_3": "Fae is vumpus. Vumpus is",
        "noise_prompt_3": "Impuses are loud. Vumpus is vumpus. Fae is vumpus. True or false: Fae is loud. Let us think step by step.",
        "response_3": "Fae is vumpus. Vumpus is",
        "noise_response_4": "Rex is vumpus. Vumpus is impus.",
        "noise_prompt_4": "Impuses are loud. Vumpus is impus. Fae is vumpus. True or false: Fae is loud. Let us think step by step.",
        "response_4": "Fae is vumpus. Vumpus is impus.",
        "noise_response_5": "Fae is vumpus. Vumpus is Grimpus. Fae is",
        "noise_prompt_5": "Impuses are loud. Vumpus is impus. Fae is vumpus. True or false: Fae is loud. Let us think step by step.",
        "response_5": "Fae is vumpus. Vumpus is impus. Fae is",
        "noise_response_6": "Fae is vumpus. Vumpus is impus. Fae is impus.",
        "noise_prompt_6": "Wumpus are loud. Vumpus is impus. Fae is vumpus. True or false: Fae is loud. Let us think step by step.",
        "response_6": "Fae is vumpus. Vumpus is impus. Fae is impus.",
        "noise_response_7": "Fae is vumpus. Vumpus is impus. Fae is impus. Impuses are",
        "noise_prompt_7": "Impuses are loud. Vumpus is impus. Fae is vumpus. True or false: Fae is luminous. Let us think step by step.",
        "response_7": "Fae is vumpus. Vumpus is impus. Fae is impus. Impuses are",
        "noise_response_8": "Fae is vumpus. Vumpus is impus. Sam is impus. Impuses are loud.",
        "noise_prompt_8": "Impuses are loud. Vumpus is impus. Fae is vumpus. True or false: Fae is loud. Let us think step by step.",
        "response_8": "Fae is vumpus. Vumpus is impus. Fae is impus. Impuses are loud.",
        "noise_response_9": "Fae is vumpus. Vumpus is impus. Fae is impus. Impuses are sweet. Fae is",
        "noise_prompt_9": "Impuses are loud. Vumpus is impus. Fae is vumpus. True or false: Fae is loud. Let us think step by step.",
        "response_9": "Fae is vumpus. Vumpus is impus. Fae is impus. Impuses are loud. Fae is",
        "noise_prompt_10": "Impuses are loud. Vumpus is impus. Fae is vumpus. True or false: Fae is loud. Let us think step by step.",
        "response_10": "Fae is vumpus. Vumpus is impus. Fae is impus. Impuses are loud. Fae is loud.",
        "noise_response_10": "Fae is vumpus. Vumpus is impus. Fae is impus. Impuses are loud. Fae is hot.",
        "answer_token_id_0": 29943,
        "answer_token_pos_0": 380,
        "answer_token_0": "F",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 325,
        "answer_token_pos_1": 383,
        "answer_token_1": "v",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 478,
        "answer_token_pos_2": 387,
        "answer_token_2": "V",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 2411,
        "answer_token_pos_3": 391,
        "answer_token_3": "imp",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 383,
        "answer_token_pos_4": 395,
        "answer_token_4": "F",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 2411,
        "answer_token_pos_5": 398,
        "answer_token_5": "imp",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 14305,
        "answer_token_pos_6": 402,
        "answer_token_6": "Imp",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 22526,
        "answer_token_pos_7": 406,
        "answer_token_7": "loud",
        "end_token_pos_7": 405,
        "end_token_id_7": 526,
        "answer_token_id_8": 383,
        "answer_token_pos_8": 410,
        "answer_token_8": "F",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 22526,
        "answer_token_pos_9": 413,
        "answer_token_9": "loud",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Wumpus is moderate. Dumpus is wumpus. Polly is dumpus.",
        "query": "True or false: Polly is moderate.",
        "answer": "Polly is dumpus. Dumpus is wumpus. Polly is wumpus. Wumpus is moderate. Polly is moderate. True",
        "label": "True",
        "prompt": "Wumpus is moderate. Dumpus is wumpus. Polly is dumpus. True or false: Polly is moderate. Let us think step by step.",
        "generated": "Polly is dumpus. Dumpus is wumpus. Polly is wumpus. Wumpus is moderate. Polly is moderate. True",
        "noise_response_0": "",
        "noise_prompt_0": "Wumpus is moderate. Dumpus is wumpus. Polly is dumpus. True or false: Sam is moderate. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Polly is",
        "noise_prompt_1": "Wumpus is moderate. Dumpus is wumpus. Polly is Shumpus. True or false: Polly is moderate. Let us think step by step.",
        "response_1": "Polly is",
        "noise_response_2": "Polly is dumpus.",
        "noise_prompt_2": "Wumpus is moderate. Grimpus is wumpus. Polly is dumpus. True or false: Polly is moderate. Let us think step by step.",
        "response_2": "Polly is dumpus.",
        "noise_response_3": "Polly is dumpus. Dumpus is",
        "noise_prompt_3": "Wumpus is moderate. Dumpus is overcast. Polly is dumpus. True or false: Polly is moderate. Let us think step by step.",
        "response_3": "Polly is dumpus. Dumpus is",
        "noise_response_4": "Fae is dumpus. Dumpus is wumpus.",
        "noise_prompt_4": "Wumpus is moderate. Dumpus is wumpus. Polly is dumpus. True or false: Polly is moderate. Let us think step by step.",
        "response_4": "Polly is dumpus. Dumpus is wumpus.",
        "noise_response_5": "Polly is dumpus. Dumpus is melodic. Polly is",
        "noise_prompt_5": "Wumpus is moderate. Dumpus is wumpus. Polly is dumpus. True or false: Polly is moderate. Let us think step by step.",
        "response_5": "Polly is dumpus. Dumpus is wumpus. Polly is",
        "noise_response_6": "Polly is dumpus. Dumpus is wumpus. Polly is wumpus.",
        "noise_prompt_6": "Rex is moderate. Dumpus is wumpus. Polly is dumpus. True or false: Polly is moderate. Let us think step by step.",
        "response_6": "Polly is dumpus. Dumpus is wumpus. Polly is wumpus.",
        "noise_response_7": "Polly is dumpus. Dumpus is wumpus. Polly is wumpus. Wumpus is",
        "noise_prompt_7": "Wumpus is moderate. Dumpus is wumpus. Polly is dumpus. True or false: Polly is discordant. Let us think step by step.",
        "response_7": "Polly is dumpus. Dumpus is wumpus. Polly is wumpus. Wumpus is",
        "noise_response_8": "Polly is dumpus. Dumpus is wumpus. Rex is wumpus. Wumpus is moderate.",
        "noise_prompt_8": "Wumpus is moderate. Dumpus is wumpus. Polly is dumpus. True or false: Polly is moderate. Let us think step by step.",
        "response_8": "Polly is dumpus. Dumpus is wumpus. Polly is wumpus. Wumpus is moderate.",
        "noise_response_9": "Polly is dumpus. Dumpus is wumpus. Polly is wumpus. Wumpus is bitter. Polly is",
        "noise_prompt_9": "Wumpus is moderate. Dumpus is wumpus. Polly is dumpus. True or false: Polly is moderate. Let us think step by step.",
        "response_9": "Polly is dumpus. Dumpus is wumpus. Polly is wumpus. Wumpus is moderate. Polly is",
        "noise_prompt_10": "Wumpus is moderate. Dumpus is wumpus. Polly is dumpus. True or false: Polly is moderate. Let us think step by step.",
        "response_10": "Polly is dumpus. Dumpus is wumpus. Polly is wumpus. Wumpus is moderate. Polly is moderate.",
        "noise_response_10": "Polly is dumpus. Dumpus is wumpus. Polly is wumpus. Wumpus is moderate. Polly is dull.",
        "answer_token_id_0": 7713,
        "answer_token_pos_0": 380,
        "answer_token_0": "Pol",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 16766,
        "answer_token_pos_1": 383,
        "answer_token_1": "dump",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 360,
        "answer_token_pos_2": 387,
        "answer_token_2": "D",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 281,
        "answer_token_pos_3": 391,
        "answer_token_3": "w",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 2043,
        "answer_token_pos_4": 395,
        "answer_token_4": "Pol",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 281,
        "answer_token_pos_5": 398,
        "answer_token_5": "w",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 399,
        "answer_token_pos_6": 402,
        "answer_token_6": "W",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 17768,
        "answer_token_pos_7": 406,
        "answer_token_7": "moder",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 2043,
        "answer_token_pos_8": 410,
        "answer_token_8": "Pol",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 17768,
        "answer_token_pos_9": 413,
        "answer_token_9": "moder",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    },
    {
        "question": "Gorpus is overcast. Grimpus is gorpus. Sally is grimpus.",
        "query": "True or false: Sally is moderate.",
        "answer": "Sally is grimpus. Grimpus is gorpus. Sally is gorpus. Gorpus is overcast. Sally is overcast. False",
        "label": "False",
        "prompt": "Gorpus is overcast. Grimpus is gorpus. Sally is grimpus. True or false: Sally is moderate. Let us think step by step.",
        "generated": "Sally is grimpus. Grimpus is gorpus. Sally is gorpus. Gorpus is overcast. Sally is overcast. False",
        "noise_response_0": "",
        "noise_prompt_0": "Gorpus is overcast. Grimpus is gorpus. Sally is grimpus. True or false: Alex is moderate. Let us think step by step.",
        "response_0": "",
        "noise_response_1": "Sally is",
        "noise_prompt_1": "Gorpus is overcast. Grimpus is gorpus. Sally is brimpus. True or false: Sally is moderate. Let us think step by step.",
        "response_1": "Sally is",
        "noise_response_2": "Sally is grimpus.",
        "noise_prompt_2": "Gorpus is overcast. Yumpus is gorpus. Sally is grimpus. True or false: Sally is moderate. Let us think step by step.",
        "response_2": "Sally is grimpus.",
        "noise_response_3": "Sally is lempus. Grimpus is",
        "noise_prompt_3": "Gorpus is overcast. Grimpus is gorpus. Sally is grimpus. True or false: Sally is moderate. Let us think step by step.",
        "response_3": "Sally is grimpus. Grimpus is",
        "noise_response_4": "Sam is grimpus. Grimpus is gorpus.",
        "noise_prompt_4": "Gorpus is overcast. Grimpus is gorpus. Sally is grimpus. True or false: Sally is moderate. Let us think step by step.",
        "response_4": "Sally is grimpus. Grimpus is gorpus.",
        "noise_response_5": "Sally is grimpus. Grimpus is lorpus. Sally is",
        "noise_prompt_5": "Gorpus is overcast. Grimpus is gorpus. Sally is grimpus. True or false: Sally is moderate. Let us think step by step.",
        "response_5": "Sally is grimpus. Grimpus is gorpus. Sally is",
        "noise_response_6": "Sally is grimpus. Grimpus is gorpus. Sally is gorpus.",
        "noise_prompt_6": "shumpus is overcast. Grimpus is gorpus. Sally is grimpus. True or false: Sally is moderate. Let us think step by step.",
        "response_6": "Sally is grimpus. Grimpus is gorpus. Sally is gorpus.",
        "noise_response_7": "Sally is grimpus. Grimpus is gorpus. Sally is gorpus. Gorpus is",
        "noise_prompt_7": "Gorpus is kind. Grimpus is gorpus. Sally is grimpus. True or false: Sally is moderate. Let us think step by step.",
        "response_7": "Sally is grimpus. Grimpus is gorpus. Sally is gorpus. Gorpus is",
        "noise_response_8": "Sally is grimpus. Grimpus is gorpus. Wren is gorpus. Gorpus is overcast.",
        "noise_prompt_8": "Gorpus is overcast. Grimpus is gorpus. Sally is grimpus. True or false: Sally is moderate. Let us think step by step.",
        "response_8": "Sally is grimpus. Grimpus is gorpus. Sally is gorpus. Gorpus is overcast.",
        "noise_response_9": "Sally is grimpus. Grimpus is gorpus. Sally is gorpus. Gorpus is aggressive. Sally is",
        "noise_prompt_9": "Gorpus is overcast. Grimpus is gorpus. Sally is grimpus. True or false: Sally is moderate. Let us think step by step.",
        "response_9": "Sally is grimpus. Grimpus is gorpus. Sally is gorpus. Gorpus is overcast. Sally is",
        "noise_prompt_10": "Gorpus is overcast. Grimpus is gorpus. Sally is grimpus. True or false: Sally is moderate. Let us think step by step.",
        "response_10": "Sally is grimpus. Grimpus is gorpus. Sally is gorpus. Gorpus is overcast. Sally is overcast.",
        "noise_response_10": "Sally is grimpus. Grimpus is gorpus. Sally is gorpus. Gorpus is overcast. Sally is fast.",
        "answer_token_id_0": 29903,
        "answer_token_pos_0": 380,
        "answer_token_0": "S",
        "end_token_pos_0": 379,
        "end_token_id_0": 13,
        "answer_token_id_1": 867,
        "answer_token_pos_1": 383,
        "answer_token_1": "gr",
        "end_token_pos_1": 382,
        "end_token_id_1": 338,
        "answer_token_id_2": 1632,
        "answer_token_pos_2": 387,
        "answer_token_2": "Gr",
        "end_token_pos_2": 386,
        "end_token_id_2": 29889,
        "answer_token_id_3": 330,
        "answer_token_pos_3": 391,
        "answer_token_3": "g",
        "end_token_pos_3": 390,
        "end_token_id_3": 338,
        "answer_token_id_4": 317,
        "answer_token_pos_4": 395,
        "answer_token_4": "S",
        "end_token_pos_4": 394,
        "end_token_id_4": 29889,
        "answer_token_id_5": 330,
        "answer_token_pos_5": 398,
        "answer_token_5": "g",
        "end_token_pos_5": 397,
        "end_token_id_5": 338,
        "answer_token_id_6": 18686,
        "answer_token_pos_6": 402,
        "answer_token_6": "Gor",
        "end_token_pos_6": 401,
        "end_token_id_6": 29889,
        "answer_token_id_7": 975,
        "answer_token_pos_7": 406,
        "answer_token_7": "over",
        "end_token_pos_7": 405,
        "end_token_id_7": 338,
        "answer_token_id_8": 317,
        "answer_token_pos_8": 410,
        "answer_token_8": "S",
        "end_token_pos_8": 409,
        "end_token_id_8": 29889,
        "answer_token_id_9": 975,
        "answer_token_pos_9": 413,
        "answer_token_9": "over",
        "end_token_pos_9": 412,
        "end_token_id_9": 338
    }
]