[
  {
    "index": 0,
    "uncertainty_score": 4.3164271801288123e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1,
    "uncertainty_score": 0.0031827010679990053,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2,
    "uncertainty_score": 1.4820241176494164e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 3,
    "uncertainty_score": 5.409021142099846e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 4,
    "uncertainty_score": 0.21925031251486268,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5,
    "uncertainty_score": 2.249309766222396e-11,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6,
    "uncertainty_score": 0.5000076881651694,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7,
    "uncertainty_score": 1.6767905952619344e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 8,
    "uncertainty_score": 0.4000000059604645,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 9,
    "uncertainty_score": 3.360102418525912e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 10,
    "uncertainty_score": 0.00032970556640066206,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 11,
    "uncertainty_score": 8.365626626982703e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 12,
    "uncertainty_score": 0.00017050451424438506,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 13,
    "uncertainty_score": 6.123630935661595e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 14,
    "uncertainty_score": 2.603827908842504e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 15,
    "uncertainty_score": 2.6958966259371664e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 16,
    "uncertainty_score": 0.20003094173616226,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 17,
    "uncertainty_score": 2.120275894412771e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 18,
    "uncertainty_score": 3.323607344896118e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 19,
    "uncertainty_score": 0.2000010758638382,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 20,
    "uncertainty_score": 8.768540027404015e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 21,
    "uncertainty_score": 0.09090951085090637,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 22,
    "uncertainty_score": 0.0034234714694321156,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 23,
    "uncertainty_score": 0.4000004003135288,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 24,
    "uncertainty_score": 0.0001249396154889837,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 25,
    "uncertainty_score": 2.070201389869908e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 26,
    "uncertainty_score": 2.6257653189531993e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 27,
    "uncertainty_score": 0.0003912372631020844,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 28,
    "uncertainty_score": 0.002220922615379095,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 29,
    "uncertainty_score": 1.6584424944454668e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 30,
    "uncertainty_score": 4.414206705405377e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 31,
    "uncertainty_score": 2.1362834559113253e-06,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 32,
    "uncertainty_score": 4.6168415757108505e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 33,
    "uncertainty_score": 3.605552478802565e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 34,
    "uncertainty_score": 8.299991011324892e-13,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 35,
    "uncertainty_score": 0.2000027447938919,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 36,
    "uncertainty_score": 9.443930082397856e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 37,
    "uncertainty_score": 3.953497014208551e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 38,
    "uncertainty_score": 0.0008849736186675727,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 39,
    "uncertainty_score": 4.825869109481573e-05,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 40,
    "uncertainty_score": 0.16717682778835297,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 41,
    "uncertainty_score": 7.737047114098061e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 42,
    "uncertainty_score": 0.16666807568250283,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 43,
    "uncertainty_score": 1.3112870647091768e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 44,
    "uncertainty_score": 1.1494923057853157e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 45,
    "uncertainty_score": 0.20000597834587097,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 46,
    "uncertainty_score": 0.7247803509235382,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 47,
    "uncertainty_score": 2.0349229998828378e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 48,
    "uncertainty_score": 0.00266313087195158,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 49,
    "uncertainty_score": 0.3994455635547638,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 50,
    "uncertainty_score": 1.660445718698611e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 51,
    "uncertainty_score": 0.5000000013861878,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 52,
    "uncertainty_score": 0.19952145218849182,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 53,
    "uncertainty_score": 0.2519257664680481,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 54,
    "uncertainty_score": 4.374239495064103e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 55,
    "uncertainty_score": 1.867760834883825e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 56,
    "uncertainty_score": 0.1670728474855423,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 57,
    "uncertainty_score": 3.0867477107676677e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 58,
    "uncertainty_score": 0.7326154708862305,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 59,
    "uncertainty_score": 1.0893744217810308e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 60,
    "uncertainty_score": 2.6116088065464282e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 61,
    "uncertainty_score": 0.3333335220813751,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 62,
    "uncertainty_score": 8.079432611916908e-23,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 63,
    "uncertainty_score": 5.93935624237929e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 64,
    "uncertainty_score": 0.16690172255039215,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 65,
    "uncertainty_score": 0.0002471897460054606,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 66,
    "uncertainty_score": 6.914092409715522e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 67,
    "uncertainty_score": 5.65141045072437e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 68,
    "uncertainty_score": 0.20003299415111542,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 69,
    "uncertainty_score": 1.6064442831531522e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 70,
    "uncertainty_score": 6.898802666910342e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 71,
    "uncertainty_score": 7.398961315630004e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 72,
    "uncertainty_score": 6.114630650699837e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 73,
    "uncertainty_score": 1.7560436162966653e-06,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 74,
    "uncertainty_score": 0.3848283886909485,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 75,
    "uncertainty_score": 1.9970673292846186e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 76,
    "uncertainty_score": 6.376968286758711e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 77,
    "uncertainty_score": 2.5909820955405394e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 78,
    "uncertainty_score": 0.0006593443104065955,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 79,
    "uncertainty_score": 0.6053518600250711,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 80,
    "uncertainty_score": 0.5,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 81,
    "uncertainty_score": 5.123269364304406e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 82,
    "uncertainty_score": 0.20000004768371582,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 83,
    "uncertainty_score": 0.19997426867485046,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 84,
    "uncertainty_score": 3.4678680549404817e-06,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 85,
    "uncertainty_score": 1.2948327965389694e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 86,
    "uncertainty_score": 2.593035342002281e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 87,
    "uncertainty_score": 0.20000568212284256,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 88,
    "uncertainty_score": 0.25,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 89,
    "uncertainty_score": 0.7269997596740723,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 90,
    "uncertainty_score": 0.03636302798986435,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 91,
    "uncertainty_score": 1.6772286337563003e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 92,
    "uncertainty_score": 0.0057443431578576565,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 93,
    "uncertainty_score": 4.316514090607626e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 94,
    "uncertainty_score": 3.1554925339349893e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 95,
    "uncertainty_score": 3.718408081443414e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 96,
    "uncertainty_score": 5.385454187489813e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 97,
    "uncertainty_score": 6.328988092718646e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 98,
    "uncertainty_score": 0.25,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 99,
    "uncertainty_score": 3.017576318598003e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 100,
    "uncertainty_score": 0.5000000000000018,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 101,
    "uncertainty_score": 2.399598297841976e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 102,
    "uncertainty_score": 2.409021590210614e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 103,
    "uncertainty_score": 2.4405049162123937e-11,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 104,
    "uncertainty_score": 3.629413569683493e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 105,
    "uncertainty_score": 4.1729570511961356e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 106,
    "uncertainty_score": 3.4379720545985037e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 107,
    "uncertainty_score": 1.11240888145403e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 108,
    "uncertainty_score": 1.8418586478219368e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 109,
    "uncertainty_score": 0.5000044703483582,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 110,
    "uncertainty_score": 2.2004171569278697e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 111,
    "uncertainty_score": 0.1999996304512024,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 112,
    "uncertainty_score": 9.784977272886408e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 113,
    "uncertainty_score": 8.989419256977271e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 114,
    "uncertainty_score": 0.001606970326974988,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 115,
    "uncertainty_score": 3.6968998529118835e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 116,
    "uncertainty_score": 0.4000004827976227,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 117,
    "uncertainty_score": 3.018782793184904e-11,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 118,
    "uncertainty_score": 0.25000518560409546,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 119,
    "uncertainty_score": 4.794532326712897e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 120,
    "uncertainty_score": 0.0003195347380824387,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 121,
    "uncertainty_score": 0.0231791865080595,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 122,
    "uncertainty_score": 0.2500057518482208,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 123,
    "uncertainty_score": 1.1638683794501503e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 124,
    "uncertainty_score": 0.600000000000001,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 125,
    "uncertainty_score": 2.4287441391379616e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 126,
    "uncertainty_score": 0.20090806484222412,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 127,
    "uncertainty_score": 0.2509966492652893,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 128,
    "uncertainty_score": 0.3114919066429138,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 129,
    "uncertainty_score": 2.68999850172591e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 130,
    "uncertainty_score": 6.593427581691458e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 131,
    "uncertainty_score": 5.124372364662122e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 132,
    "uncertainty_score": 0.00032969689345918596,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 133,
    "uncertainty_score": 1.1788652187760817e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 134,
    "uncertainty_score": 0.0001564755802974105,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 135,
    "uncertainty_score": 1.7555232267874032e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 136,
    "uncertainty_score": 3.434198561080848e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 137,
    "uncertainty_score": 2.0992020621779517e-11,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 138,
    "uncertainty_score": 0.00011729817924788222,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 139,
    "uncertainty_score": 6.723585829604417e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 140,
    "uncertainty_score": 0.20001054217366665,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 141,
    "uncertainty_score": 6.313699996846056e-12,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 142,
    "uncertainty_score": 1.7605125690600687e-11,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 143,
    "uncertainty_score": 0.0009810968767851591,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 144,
    "uncertainty_score": 5.310535566849239e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 145,
    "uncertainty_score": 2.500788411907706e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 146,
    "uncertainty_score": 0.2000000000632179,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 147,
    "uncertainty_score": 2.4523214570137952e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 148,
    "uncertainty_score": 2.9542861490483574e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 149,
    "uncertainty_score": 0.20000000082867658,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 150,
    "uncertainty_score": 0.19993191957473755,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 151,
    "uncertainty_score": 2.039860280689254e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 152,
    "uncertainty_score": 3.4905696111309226e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 153,
    "uncertainty_score": 0.25002118945121765,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 154,
    "uncertainty_score": 1.020054529732306e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 155,
    "uncertainty_score": 7.372108484560158e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 156,
    "uncertainty_score": 0.40004808619639576,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 157,
    "uncertainty_score": 0.00011134239321108907,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 158,
    "uncertainty_score": 1.3572748684964608e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 159,
    "uncertainty_score": 1.7901193860581088e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 160,
    "uncertainty_score": 0.00010985415428876877,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 161,
    "uncertainty_score": 3.054334592889063e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 162,
    "uncertainty_score": 0.22428162395954132,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 163,
    "uncertainty_score": 2.1167743113892357e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 164,
    "uncertainty_score": 0.24992601573467255,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 165,
    "uncertainty_score": 2.6735220703955065e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 166,
    "uncertainty_score": 0.6000000238418579,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 167,
    "uncertainty_score": 8.395336976718681e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 168,
    "uncertainty_score": 8.147061691943236e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 169,
    "uncertainty_score": 3.648351898366542e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 170,
    "uncertainty_score": 2.211870935298066e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 171,
    "uncertainty_score": 1.2871829824234737e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 172,
    "uncertainty_score": 0.004597897175699472,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 173,
    "uncertainty_score": 0.18332581222057343,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 174,
    "uncertainty_score": 0.16666690061668635,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 175,
    "uncertainty_score": 4.3912754335906357e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 176,
    "uncertainty_score": 0.33356383442878723,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 177,
    "uncertainty_score": 0.6666666865348816,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 178,
    "uncertainty_score": 4.2108339037838505e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 179,
    "uncertainty_score": 1.242289326963686e-10,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 180,
    "uncertainty_score": 6.821566057624295e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 181,
    "uncertainty_score": 7.474588947786742e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 182,
    "uncertainty_score": 2.1277504856698215e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 183,
    "uncertainty_score": 0.33334699273109436,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 184,
    "uncertainty_score": 0.0018624587683007121,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 185,
    "uncertainty_score": 0.1666666716337204,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 186,
    "uncertainty_score": 1.0362591496004825e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 187,
    "uncertainty_score": 0.15363098680973053,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 188,
    "uncertainty_score": 0.49457430839538574,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 189,
    "uncertainty_score": 6.360242110758918e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 190,
    "uncertainty_score": 5.121890353620984e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 191,
    "uncertainty_score": 0.8,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 192,
    "uncertainty_score": 1.1097537683723777e-13,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 193,
    "uncertainty_score": 2.9320770522645034e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 194,
    "uncertainty_score": 1.1889806916798307e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 195,
    "uncertainty_score": 3.643970236666405e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 196,
    "uncertainty_score": 0.20375263690948486,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 197,
    "uncertainty_score": 1.1616138095860151e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 198,
    "uncertainty_score": 5.521330237456823e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 199,
    "uncertainty_score": 0.00014921186084393412,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 200,
    "uncertainty_score": 9.317078024650982e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 201,
    "uncertainty_score": 4.702401929534972e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 202,
    "uncertainty_score": 3.562438399828949e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 203,
    "uncertainty_score": 0.32142873199503325,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 204,
    "uncertainty_score": 3.5100793382980555e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 205,
    "uncertainty_score": 0.002498111454769969,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 206,
    "uncertainty_score": 0.003107912838459015,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 207,
    "uncertainty_score": 5.521289328513923e-11,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 208,
    "uncertainty_score": 1.7123799600504697e-10,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 209,
    "uncertainty_score": 1.8985449656838682e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 210,
    "uncertainty_score": 0.4007570147514343,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 211,
    "uncertainty_score": 4.0731205075417165e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 212,
    "uncertainty_score": 8.589784265822242e-12,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 213,
    "uncertainty_score": 0.2000000774860382,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 214,
    "uncertainty_score": 4.1838382758285775e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 215,
    "uncertainty_score": 1.4598618314209943e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 216,
    "uncertainty_score": 0.00037141182110644877,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 217,
    "uncertainty_score": 1.5824107649220487e-11,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 218,
    "uncertainty_score": 7.290064107934313e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 219,
    "uncertainty_score": 0.13621777296066284,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 220,
    "uncertainty_score": 0.02642790600657463,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 221,
    "uncertainty_score": 0.2500000596046448,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 222,
    "uncertainty_score": 4.7530861024824844e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 223,
    "uncertainty_score": 0.33333733677864075,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 224,
    "uncertainty_score": 1.3349351846159152e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 225,
    "uncertainty_score": 4.019301195512526e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 226,
    "uncertainty_score": 1.3736439763434305e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 227,
    "uncertainty_score": 2.4442828316928455e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 228,
    "uncertainty_score": 3.58012471224356e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 229,
    "uncertainty_score": 0.20000000284900715,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 230,
    "uncertainty_score": 0.20000000298023224,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 231,
    "uncertainty_score": 1.7881957319332287e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 232,
    "uncertainty_score": 6.77031039231224e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 233,
    "uncertainty_score": 8.163695414120653e-11,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 234,
    "uncertainty_score": 9.424128144530641e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 235,
    "uncertainty_score": 0.4999178647994995,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 236,
    "uncertainty_score": 0.00042756422772072256,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 237,
    "uncertainty_score": 1.0321831167559026e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 238,
    "uncertainty_score": 0.1668676882982254,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 239,
    "uncertainty_score": 3.863471695342291e-11,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 240,
    "uncertainty_score": 8.824582037325612e-11,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 241,
    "uncertainty_score": 6.205090699040738e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 242,
    "uncertainty_score": 3.82816324417945e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 243,
    "uncertainty_score": 4.740944348213816e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 244,
    "uncertainty_score": 2.2602678062533244e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 245,
    "uncertainty_score": 3.937008705157119e-11,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 246,
    "uncertainty_score": 0.5003525896472507,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 247,
    "uncertainty_score": 0.20000047981739044,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 248,
    "uncertainty_score": 3.1269926648036517e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 249,
    "uncertainty_score": 7.938986357203248e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 250,
    "uncertainty_score": 1.4018876337562602e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 251,
    "uncertainty_score": 0.33542653918266296,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 252,
    "uncertainty_score": 6.598154748266305e-12,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 253,
    "uncertainty_score": 3.206779980446939e-11,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 254,
    "uncertainty_score": 5.532997393586925e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 255,
    "uncertainty_score": 4.236813566649289e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 256,
    "uncertainty_score": 7.783512955938932e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 257,
    "uncertainty_score": 8.588279456489545e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 258,
    "uncertainty_score": 1.0,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 259,
    "uncertainty_score": 0.00020113067876081914,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 260,
    "uncertainty_score": 1.003477677841147e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 261,
    "uncertainty_score": 0.20000861885210325,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 262,
    "uncertainty_score": 2.526400521674077e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 263,
    "uncertainty_score": 3.123974465779611e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 264,
    "uncertainty_score": 1.5394239483157435e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 265,
    "uncertainty_score": 0.0036685015074908733,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 266,
    "uncertainty_score": 5.04959540847949e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 267,
    "uncertainty_score": 0.7499765157699585,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 268,
    "uncertainty_score": 0.03328925743699074,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 269,
    "uncertainty_score": 8.680676546646282e-05,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 270,
    "uncertainty_score": 0.5603357489744667,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 271,
    "uncertainty_score": 2.0340557966846973e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 272,
    "uncertainty_score": 1.1577015041064342e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 273,
    "uncertainty_score": 9.726502412377158e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 274,
    "uncertainty_score": 0.25000670552253723,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 275,
    "uncertainty_score": 2.0890714949928224e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 276,
    "uncertainty_score": 1.7869218936539255e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 277,
    "uncertainty_score": 7.799543482178706e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 278,
    "uncertainty_score": 3.779110193136148e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 279,
    "uncertainty_score": 0.22025826573371887,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 280,
    "uncertainty_score": 0.03319079428911209,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 281,
    "uncertainty_score": 0.010021352209150791,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 282,
    "uncertainty_score": 1.1327017546136631e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 283,
    "uncertainty_score": 2.3340100597124547e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 284,
    "uncertainty_score": 0.20000000298023224,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 285,
    "uncertainty_score": 1.610225808690302e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 286,
    "uncertainty_score": 1.1492552465242056e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 287,
    "uncertainty_score": 5.9408903325675055e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 288,
    "uncertainty_score": 1.7211861631949432e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 289,
    "uncertainty_score": 0.25003698468208313,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 290,
    "uncertainty_score": 5.535662239708472e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 291,
    "uncertainty_score": 3.338403985253535e-05,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 292,
    "uncertainty_score": 4.4855347880456975e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 293,
    "uncertainty_score": 0.3994404375553131,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 294,
    "uncertainty_score": 9.49890277546217e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 295,
    "uncertainty_score": 3.2666173410689225e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 296,
    "uncertainty_score": 6.389631601599888e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 297,
    "uncertainty_score": 3.5436663381460676e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 298,
    "uncertainty_score": 2.3973431240165155e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 299,
    "uncertainty_score": 6.700933226966299e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 300,
    "uncertainty_score": 5.6849433605066224e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 301,
    "uncertainty_score": 0.00015260104555636644,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 302,
    "uncertainty_score": 7.076736778799386e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 303,
    "uncertainty_score": 3.7806309194365895e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 304,
    "uncertainty_score": 7.685475589269686e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 305,
    "uncertainty_score": 1.505015889691208e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 306,
    "uncertainty_score": 0.25,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 307,
    "uncertainty_score": 8.185977640096098e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 308,
    "uncertainty_score": 0.2000054121017456,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 309,
    "uncertainty_score": 0.2480524480342865,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 310,
    "uncertainty_score": 9.363394504191547e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 311,
    "uncertainty_score": 3.530688843511598e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 312,
    "uncertainty_score": 0.5000000006685725,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 313,
    "uncertainty_score": 0.1657719910144806,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 314,
    "uncertainty_score": 8.218083991096137e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 315,
    "uncertainty_score": 0.002529338002204895,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 316,
    "uncertainty_score": 5.1389040891081095e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 317,
    "uncertainty_score": 0.0004236731037963182,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 318,
    "uncertainty_score": 0.024303603917360306,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 319,
    "uncertainty_score": 1.7584472766785098e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 320,
    "uncertainty_score": 0.2000000000000952,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 321,
    "uncertainty_score": 4.023634971872525e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 322,
    "uncertainty_score": 1.3254004910828778e-18,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 323,
    "uncertainty_score": 0.33337788853239797,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 324,
    "uncertainty_score": 2.55677665705889e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 325,
    "uncertainty_score": 0.25,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 326,
    "uncertainty_score": 7.915118516166331e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 327,
    "uncertainty_score": 1.724620668497323e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 328,
    "uncertainty_score": 0.2000005692243576,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 329,
    "uncertainty_score": 3.520372274579131e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 330,
    "uncertainty_score": 0.33332931995391846,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 331,
    "uncertainty_score": 0.25009027123451233,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 332,
    "uncertainty_score": 1.1124400771223009e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 333,
    "uncertainty_score": 1.8152658043391057e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 334,
    "uncertainty_score": 0.1514679342508316,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 335,
    "uncertainty_score": 5.306310946195936e-11,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 336,
    "uncertainty_score": 9.261554190231891e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 337,
    "uncertainty_score": 0.19999898970127106,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 338,
    "uncertainty_score": 3.437746499912464e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 339,
    "uncertainty_score": 2.892044603797217e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 340,
    "uncertainty_score": 1.2113341654185206e-05,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 341,
    "uncertainty_score": 5.7328820730617736e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 342,
    "uncertainty_score": 1.1052446735604349e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 343,
    "uncertainty_score": 0.005625627469271421,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 344,
    "uncertainty_score": 1.4035936146683525e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 345,
    "uncertainty_score": 5.895054346183315e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 346,
    "uncertainty_score": 3.713384799652886e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 347,
    "uncertainty_score": 3.4594322073644435e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 348,
    "uncertainty_score": 3.6005670667194067e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 349,
    "uncertainty_score": 0.21430382523486072,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 350,
    "uncertainty_score": 0.19999131560325623,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 351,
    "uncertainty_score": 1.7443607021050411e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 352,
    "uncertainty_score": 0.49999547004699707,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 353,
    "uncertainty_score": 4.075471588294022e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 354,
    "uncertainty_score": 4.820411163564131e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 355,
    "uncertainty_score": 0.2000000000052568,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 356,
    "uncertainty_score": 0.7946724385867128,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 357,
    "uncertainty_score": 0.20002318408177358,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 358,
    "uncertainty_score": 1.2948315998073667e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 359,
    "uncertainty_score": 0.25000014901161194,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 360,
    "uncertainty_score": 0.2307991236448288,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 361,
    "uncertainty_score": 0.0001245384628418833,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 362,
    "uncertainty_score": 1.413755956747309e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 363,
    "uncertainty_score": 3.3485090256135663e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 364,
    "uncertainty_score": 1.4224227925296873e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 365,
    "uncertainty_score": 3.318877672686682e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 366,
    "uncertainty_score": 1.360685002171902e-12,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 367,
    "uncertainty_score": 0.002902788808569312,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 368,
    "uncertainty_score": 9.566103472025134e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 369,
    "uncertainty_score": 1.3437679058370122e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 370,
    "uncertainty_score": 1.5463701856788248e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 371,
    "uncertainty_score": 4.1057318656001485e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 372,
    "uncertainty_score": 1.572235008850953e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 373,
    "uncertainty_score": 0.200317603436471,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 374,
    "uncertainty_score": 0.04521939158439636,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 375,
    "uncertainty_score": 1.4501046197157308e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 376,
    "uncertainty_score": 3.085210698028362e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 377,
    "uncertainty_score": 2.4806320886305855e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 378,
    "uncertainty_score": 1.5309562645393626e-11,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 379,
    "uncertainty_score": 9.976186447602231e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 380,
    "uncertainty_score": 0.2000035047531128,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 381,
    "uncertainty_score": 0.17974284291267395,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 382,
    "uncertainty_score": 2.288781431047937e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 383,
    "uncertainty_score": 9.78730962941654e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 384,
    "uncertainty_score": 3.3347411498851898e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 385,
    "uncertainty_score": 0.3103095293045044,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 386,
    "uncertainty_score": 0.6000001107087201,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 387,
    "uncertainty_score": 6.079338845665916e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 388,
    "uncertainty_score": 0.4000003640064687,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 389,
    "uncertainty_score": 2.3706733998096752e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 390,
    "uncertainty_score": 2.2595376958367552e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 391,
    "uncertainty_score": 1.4110067070305377e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 392,
    "uncertainty_score": 2.1480705669069122e-12,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 393,
    "uncertainty_score": 2.613312790344935e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 394,
    "uncertainty_score": 0.20002159822459492,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 395,
    "uncertainty_score": 8.18383978185011e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 396,
    "uncertainty_score": 0.4000005750305736,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 397,
    "uncertainty_score": 1.941758455359377e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 398,
    "uncertainty_score": 0.10000000894069672,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 399,
    "uncertainty_score": 2.3902055890090423e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 400,
    "uncertainty_score": 0.00025552697479724884,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 401,
    "uncertainty_score": 0.25000005206796344,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 402,
    "uncertainty_score": 1.5297220670618117e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 403,
    "uncertainty_score": 1.8944352859762148e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 404,
    "uncertainty_score": 9.740526365931146e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 405,
    "uncertainty_score": 0.0001384223869536072,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 406,
    "uncertainty_score": 0.40015108175242686,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 407,
    "uncertainty_score": 0.5021666251122952,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 408,
    "uncertainty_score": 0.03176837041974068,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 409,
    "uncertainty_score": 2.6895643046032092e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 410,
    "uncertainty_score": 0.20000667870044708,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 411,
    "uncertainty_score": 5.8628618717193604e-05,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 412,
    "uncertainty_score": 0.00010652465425664559,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 413,
    "uncertainty_score": 0.00022690992045681924,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 414,
    "uncertainty_score": 0.20000037550926208,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 415,
    "uncertainty_score": 8.33209851407446e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 416,
    "uncertainty_score": 5.57452040084172e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 417,
    "uncertainty_score": 1.0060148027124516e-11,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 418,
    "uncertainty_score": 5.82023451656255e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 419,
    "uncertainty_score": 0.21517163664410838,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 420,
    "uncertainty_score": 3.326373132495064e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 421,
    "uncertainty_score": 0.011935403570532799,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 422,
    "uncertainty_score": 0.6557485262552897,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 423,
    "uncertainty_score": 1.2132257865005158e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 424,
    "uncertainty_score": 1.1815992628783079e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 425,
    "uncertainty_score": 4.667297215377175e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 426,
    "uncertainty_score": 2.1461386001675464e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 427,
    "uncertainty_score": 1.2387304515470987e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 428,
    "uncertainty_score": 0.0005336845642887056,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 429,
    "uncertainty_score": 0.49999985098838806,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 430,
    "uncertainty_score": 0.0022423742770535803,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 431,
    "uncertainty_score": 0.000873513393720762,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 432,
    "uncertainty_score": 3.68581393162304e-11,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 433,
    "uncertainty_score": 0.25007398936908454,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 434,
    "uncertainty_score": 0.4666745718664122,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 435,
    "uncertainty_score": 5.3338033141564535e-05,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 436,
    "uncertainty_score": 2.4709177605161703e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 437,
    "uncertainty_score": 0.20000000117366007,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 438,
    "uncertainty_score": 0.2000000252519619,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 439,
    "uncertainty_score": 8.708505787093132e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 440,
    "uncertainty_score": 1.782174622691016e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 441,
    "uncertainty_score": 0.2502207612281231,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 442,
    "uncertainty_score": 1.375084816414308e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 443,
    "uncertainty_score": 0.0010332648506438651,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 444,
    "uncertainty_score": 0.25154768985128834,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 445,
    "uncertainty_score": 3.203949723623699e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 446,
    "uncertainty_score": 0.20005069181217944,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 447,
    "uncertainty_score": 3.700458438209491e-11,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 448,
    "uncertainty_score": 3.5719708065942634e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 449,
    "uncertainty_score": 2.7818612176503385e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 450,
    "uncertainty_score": 7.528724615159429e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 451,
    "uncertainty_score": 0.0008649781041064405,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 452,
    "uncertainty_score": 8.77629782739131e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 453,
    "uncertainty_score": 1.0189734762030442e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 454,
    "uncertainty_score": 1.8864482902944476e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 455,
    "uncertainty_score": 0.4004018350286712,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 456,
    "uncertainty_score": 0.2521691088021354,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 457,
    "uncertainty_score": 4.932849469075889e-11,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 458,
    "uncertainty_score": 0.40002001327540143,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 459,
    "uncertainty_score": 3.7065172098146055e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 460,
    "uncertainty_score": 6.976891113472662e-11,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 461,
    "uncertainty_score": 0.200000202778912,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 462,
    "uncertainty_score": 8.522014231745185e-05,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 463,
    "uncertainty_score": 1.9384964814100364e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 464,
    "uncertainty_score": 4.735703519686765e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 465,
    "uncertainty_score": 1.1432903320073051e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 466,
    "uncertainty_score": 2.1942835546661936e-11,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 467,
    "uncertainty_score": 0.500059082987306,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 468,
    "uncertainty_score": 2.8140502114984925e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 469,
    "uncertainty_score": 0.2500000002016692,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 470,
    "uncertainty_score": 0.20000277065996058,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 471,
    "uncertainty_score": 7.000292592527121e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 472,
    "uncertainty_score": 0.20000032382776714,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 473,
    "uncertainty_score": 0.1821216947520267,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 474,
    "uncertainty_score": 1.2434432780821349e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 475,
    "uncertainty_score": 1.8278274234787772e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 476,
    "uncertainty_score": 0.3819909297883086,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 477,
    "uncertainty_score": 0.0002783900103834004,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 478,
    "uncertainty_score": 0.08635167298307334,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 479,
    "uncertainty_score": 0.0010497055828638205,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 480,
    "uncertainty_score": 0.20002442347123872,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 481,
    "uncertainty_score": 5.156094801066886e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 482,
    "uncertainty_score": 0.20000014066060406,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 483,
    "uncertainty_score": 1.2409836413457217e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 484,
    "uncertainty_score": 0.20000288636279598,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 485,
    "uncertainty_score": 1.4004564279606963e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 486,
    "uncertainty_score": 0.07703049347333576,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 487,
    "uncertainty_score": 0.5004124492435833,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 488,
    "uncertainty_score": 2.518780655522633e-12,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 489,
    "uncertainty_score": 1.2605409323593856e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 490,
    "uncertainty_score": 3.568645510718463e-12,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 491,
    "uncertainty_score": 4.366223292727274e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 492,
    "uncertainty_score": 5.069449073576966e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 493,
    "uncertainty_score": 1.1535115993113325e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 494,
    "uncertainty_score": 0.00035114301080092,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 495,
    "uncertainty_score": 3.6410386910882e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 496,
    "uncertainty_score": 0.24999999979372978,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 497,
    "uncertainty_score": 1.4725724499754339e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 498,
    "uncertainty_score": 7.831717831357895e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 499,
    "uncertainty_score": 5.053638553292045e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 500,
    "uncertainty_score": 0.99999999975,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 501,
    "uncertainty_score": 0.038008147397564446,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 502,
    "uncertainty_score": 1.1000230359800496e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 503,
    "uncertainty_score": 2.342081837790988e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 504,
    "uncertainty_score": 0.40015098297952967,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 505,
    "uncertainty_score": 0.39998724176079814,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 506,
    "uncertainty_score": 0.0003838661022301881,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 507,
    "uncertainty_score": 7.350858918476504e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 508,
    "uncertainty_score": 6.052088677529275e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 509,
    "uncertainty_score": 0.33333333333333487,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 510,
    "uncertainty_score": 2.5272234592987182e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 511,
    "uncertainty_score": 0.20000320729293702,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 512,
    "uncertainty_score": 0.3368990156180307,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 513,
    "uncertainty_score": 1.2241869488956178e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 514,
    "uncertainty_score": 0.20000002648786847,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 515,
    "uncertainty_score": 1.4295727223005632e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 516,
    "uncertainty_score": 7.411510171183044e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 517,
    "uncertainty_score": 0.0011055780401840946,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 518,
    "uncertainty_score": 1.0678760285447231e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 519,
    "uncertainty_score": 0.20000068029214782,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 520,
    "uncertainty_score": 0.2538190282099174,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 521,
    "uncertainty_score": 0.2677245989212622,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 522,
    "uncertainty_score": 3.706469455055106e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 523,
    "uncertainty_score": 0.5127153885849971,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 524,
    "uncertainty_score": 1.091814746470526e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 525,
    "uncertainty_score": 0.6000022786956083,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 526,
    "uncertainty_score": 4.758902614165913e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 527,
    "uncertainty_score": 3.8176405464399284e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 528,
    "uncertainty_score": 2.5560612571149646e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 529,
    "uncertainty_score": 0.33333333318070285,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 530,
    "uncertainty_score": 7.75446005849897e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 531,
    "uncertainty_score": 1.3782587445517245e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 532,
    "uncertainty_score": 0.3635768580629442,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 533,
    "uncertainty_score": 2.1480174575996936e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 534,
    "uncertainty_score": 0.00016096317006926056,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 535,
    "uncertainty_score": 2.042477324671078e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 536,
    "uncertainty_score": 2.246900488564946e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 537,
    "uncertainty_score": 1.701343595594833e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 538,
    "uncertainty_score": 0.20202349347442983,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 539,
    "uncertainty_score": 0.19999646372468657,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 540,
    "uncertainty_score": 0.40007234424004673,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 541,
    "uncertainty_score": 0.19999991704480985,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 542,
    "uncertainty_score": 0.20075700640567434,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 543,
    "uncertainty_score": 2.0232672141345613e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 544,
    "uncertainty_score": 0.3999999884049781,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 545,
    "uncertainty_score": 1.353029589895999e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 546,
    "uncertainty_score": 4.072785540277654e-12,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 547,
    "uncertainty_score": 0.008034600937224566,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 548,
    "uncertainty_score": 1.7360357996583732e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 549,
    "uncertainty_score": 0.2226334268384708,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 550,
    "uncertainty_score": 0.16666763809282625,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 551,
    "uncertainty_score": 5.434253697320507e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 552,
    "uncertainty_score": 2.611572251979261e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 553,
    "uncertainty_score": 9.118778969514541e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 554,
    "uncertainty_score": 1.2275462657893136e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 555,
    "uncertainty_score": 8.094253815245133e-10,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 556,
    "uncertainty_score": 0.0001427713476015703,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 557,
    "uncertainty_score": 6.222547800074203e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 558,
    "uncertainty_score": 0.06001888226969361,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 559,
    "uncertainty_score": 0.664231315809649,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 560,
    "uncertainty_score": 0.30796094615928254,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 561,
    "uncertainty_score": 0.16666217187013863,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 562,
    "uncertainty_score": 0.19999992854138166,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 563,
    "uncertainty_score": 1.390277144942165e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 564,
    "uncertainty_score": 0.00019603395158474882,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 565,
    "uncertainty_score": 2.4967590455569836e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 566,
    "uncertainty_score": 1.619121729061082e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 567,
    "uncertainty_score": 0.45149524279854425,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 568,
    "uncertainty_score": 0.20007289621241936,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 569,
    "uncertainty_score": 1.8007351012767016e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 570,
    "uncertainty_score": 3.425673270034015e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 571,
    "uncertainty_score": 8.479012477149658e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 572,
    "uncertainty_score": 2.236625321456205e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 573,
    "uncertainty_score": 0.212582071083542,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 574,
    "uncertainty_score": 1.009110961162822e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 575,
    "uncertainty_score": 0.0005883286415521228,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 576,
    "uncertainty_score": 0.006228784690334629,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 577,
    "uncertainty_score": 3.1114104644890605e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 578,
    "uncertainty_score": 0.10000180656046131,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 579,
    "uncertainty_score": 0.2523451855047333,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 580,
    "uncertainty_score": 6.020779906837278e-10,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 581,
    "uncertainty_score": 0.20000004021522183,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 582,
    "uncertainty_score": 1.815505546483655e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 583,
    "uncertainty_score": 7.952704617494218e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 584,
    "uncertainty_score": 0.20000003380782339,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 585,
    "uncertainty_score": 1.8637547204563557e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 586,
    "uncertainty_score": 0.26087244194318326,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 587,
    "uncertainty_score": 1.009087866122339e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 588,
    "uncertainty_score": 0.013784803559059504,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 589,
    "uncertainty_score": 0.24999999955114002,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 590,
    "uncertainty_score": 5.393667067933187e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 591,
    "uncertainty_score": 1.4223028002942017e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 592,
    "uncertainty_score": 4.9257267201887386e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 593,
    "uncertainty_score": 0.20000003113639542,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 594,
    "uncertainty_score": 1.1309307150584031e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 595,
    "uncertainty_score": 0.001920371312828486,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 596,
    "uncertainty_score": 0.9999999996666666,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 597,
    "uncertainty_score": 5.757702024994053e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 598,
    "uncertainty_score": 2.7449254027069275e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 599,
    "uncertainty_score": 0.1669017903858956,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 600,
    "uncertainty_score": 0.3608860373497009,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 601,
    "uncertainty_score": 8.259229411500257e-11,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 602,
    "uncertainty_score": 5.9101580518472474e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 603,
    "uncertainty_score": 3.22215285564198e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 604,
    "uncertainty_score": 5.267316396384558e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 605,
    "uncertainty_score": 0.001887895748950541,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 606,
    "uncertainty_score": 1.4386809198185802e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 607,
    "uncertainty_score": 1.3601222925707646e-10,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 608,
    "uncertainty_score": 1.7303004862245785e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 609,
    "uncertainty_score": 8.711882669258653e-13,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 610,
    "uncertainty_score": 0.0006416263058781624,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 611,
    "uncertainty_score": 1.278432693041509e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 612,
    "uncertainty_score": 0.25000908970832825,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 613,
    "uncertainty_score": 0.2000018060207367,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 614,
    "uncertainty_score": 0.5156218504423578,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 615,
    "uncertainty_score": 0.3333365023136139,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 616,
    "uncertainty_score": 3.651132374216104e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 617,
    "uncertainty_score": 0.060093820095062256,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 618,
    "uncertainty_score": 0.3382686756287214,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 619,
    "uncertainty_score": 4.978881662509593e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 620,
    "uncertainty_score": 2.1911915837335982e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 621,
    "uncertainty_score": 4.6045112611636796e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 622,
    "uncertainty_score": 0.20005920429833476,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 623,
    "uncertainty_score": 0.20000000298023224,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 624,
    "uncertainty_score": 0.00018606963567435741,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 625,
    "uncertainty_score": 0.200000000315604,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 626,
    "uncertainty_score": 0.5000666720152368,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 627,
    "uncertainty_score": 8.977331162896007e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 628,
    "uncertainty_score": 0.19999632239341736,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 629,
    "uncertainty_score": 0.600112795829773,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 630,
    "uncertainty_score": 1.7620355663439113e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 631,
    "uncertainty_score": 0.19825401902198792,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 632,
    "uncertainty_score": 0.005187890026718378,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 633,
    "uncertainty_score": 6.4511923483223654e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 634,
    "uncertainty_score": 0.0001965470873983577,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 635,
    "uncertainty_score": 4.653754785977071e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 636,
    "uncertainty_score": 0.29859605295994524,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 637,
    "uncertainty_score": 0.40029463171958923,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 638,
    "uncertainty_score": 5.08024525225359e-11,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 639,
    "uncertainty_score": 0.20000000001111404,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 640,
    "uncertainty_score": 0.00465782918035984,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 641,
    "uncertainty_score": 9.873517410596833e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 642,
    "uncertainty_score": 2.5145618565147743e-06,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 643,
    "uncertainty_score": 0.003542137099429965,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 644,
    "uncertainty_score": 0.00010587546421447769,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 645,
    "uncertainty_score": 1.9104831605609718e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 646,
    "uncertainty_score": 0.0008043070556595922,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 647,
    "uncertainty_score": 0.2500000298023224,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 648,
    "uncertainty_score": 0.1999247521162033,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 649,
    "uncertainty_score": 5.350201490728068e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 650,
    "uncertainty_score": 4.556328092597539e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 651,
    "uncertainty_score": 0.0003853520902339369,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 652,
    "uncertainty_score": 1.0438591147021725e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 653,
    "uncertainty_score": 0.25195807666752756,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 654,
    "uncertainty_score": 6.052028425074241e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 655,
    "uncertainty_score": 2.9214161756385693e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 656,
    "uncertainty_score": 0.0002828483993653208,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 657,
    "uncertainty_score": 3.2233260505165617e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 658,
    "uncertainty_score": 1.984096525120549e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 659,
    "uncertainty_score": 0.06778077781200409,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 660,
    "uncertainty_score": 0.0014369463315233588,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 661,
    "uncertainty_score": 3.957038188673323e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 662,
    "uncertainty_score": 0.25028637051582336,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 663,
    "uncertainty_score": 0.0006823731819167733,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 664,
    "uncertainty_score": 4.286656292151747e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 665,
    "uncertainty_score": 1.8457463966115029e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 666,
    "uncertainty_score": 1.3081660654279403e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 667,
    "uncertainty_score": 0.2000323777711288,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 668,
    "uncertainty_score": 2.201546855928882e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 669,
    "uncertainty_score": 0.24962858855724335,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 670,
    "uncertainty_score": 0.19999995827674866,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 671,
    "uncertainty_score": 0.20011885464191437,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 672,
    "uncertainty_score": 0.20010583102703094,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 673,
    "uncertainty_score": 4.1727020288817585e-05,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 674,
    "uncertainty_score": 4.966033140263448e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 675,
    "uncertainty_score": 0.24999986588954926,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 676,
    "uncertainty_score": 0.20153005623097023,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 677,
    "uncertainty_score": 3.233206007280387e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 678,
    "uncertainty_score": 2.8152530262559594e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 679,
    "uncertainty_score": 1.8850567773398552e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 680,
    "uncertainty_score": 0.75,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 681,
    "uncertainty_score": 0.00015769523452036083,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 682,
    "uncertainty_score": 1.3118360584485345e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 683,
    "uncertainty_score": 1.637115047969928e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 684,
    "uncertainty_score": 4.408502718433738e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 685,
    "uncertainty_score": 5.375596856538323e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 686,
    "uncertainty_score": 2.645595409411783e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 687,
    "uncertainty_score": 0.42214545607566833,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 688,
    "uncertainty_score": 6.078692237065919e-13,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 689,
    "uncertainty_score": 0.46972902510854964,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 690,
    "uncertainty_score": 0.4000018239021301,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 691,
    "uncertainty_score": 4.3566910790104885e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 692,
    "uncertainty_score": 1.916689695846685e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 693,
    "uncertainty_score": 0.0006031202501617372,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 694,
    "uncertainty_score": 5.773002301895369e-12,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 695,
    "uncertainty_score": 9.213240264216438e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 696,
    "uncertainty_score": 2.266169370213067e-11,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 697,
    "uncertainty_score": 4.1992672777269036e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 698,
    "uncertainty_score": 2.3911432435852475e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 699,
    "uncertainty_score": 6.585759715349582e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 700,
    "uncertainty_score": 4.74417172213748e-11,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 701,
    "uncertainty_score": 0.1666666716337204,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 702,
    "uncertainty_score": 0.2000030279159546,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 703,
    "uncertainty_score": 2.22860362555366e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 704,
    "uncertainty_score": 3.099889442359505e-11,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 705,
    "uncertainty_score": 1.5690395230194554e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 706,
    "uncertainty_score": 0.25000008940696716,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 707,
    "uncertainty_score": 6.668396054010373e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 708,
    "uncertainty_score": 0.0007570263696834445,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 709,
    "uncertainty_score": 0.24999947845935822,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 710,
    "uncertainty_score": 6.59392640045553e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 711,
    "uncertainty_score": 0.1024627760052681,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 712,
    "uncertainty_score": 0.5849084688845323,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 713,
    "uncertainty_score": 0.40000000001329106,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 714,
    "uncertainty_score": 0.25000011920928955,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 715,
    "uncertainty_score": 1.0373989445255916e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 716,
    "uncertainty_score": 0.00015955719572957605,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 717,
    "uncertainty_score": 0.20000000298023224,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 718,
    "uncertainty_score": 1.3950527844031058e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 719,
    "uncertainty_score": 0.20045046508312225,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 720,
    "uncertainty_score": 0.20000028610229492,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 721,
    "uncertainty_score": 0.500000002018475,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 722,
    "uncertainty_score": 3.145566307427572e-10,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 723,
    "uncertainty_score": 2.745496052725116e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 724,
    "uncertainty_score": 1.0788633062475128e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 725,
    "uncertainty_score": 0.25,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 726,
    "uncertainty_score": 1.0584647824884996e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 727,
    "uncertainty_score": 0.004029365256428719,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 728,
    "uncertainty_score": 0.030023762956261635,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 729,
    "uncertainty_score": 0.20017679035663605,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 730,
    "uncertainty_score": 5.4954099937276624e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 731,
    "uncertainty_score": 0.24999213218688965,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 732,
    "uncertainty_score": 0.40000023838241605,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 733,
    "uncertainty_score": 0.8501663208007812,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 734,
    "uncertainty_score": 0.25,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 735,
    "uncertainty_score": 0.20001069076059946,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 736,
    "uncertainty_score": 0.3333333432674408,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 737,
    "uncertainty_score": 8.86502693475677e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 738,
    "uncertainty_score": 0.40000000170321953,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 739,
    "uncertainty_score": 2.5179729894182865e-16,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 740,
    "uncertainty_score": 1.9316460111440392e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 741,
    "uncertainty_score": 0.0002402509853709489,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 742,
    "uncertainty_score": 1.8577497939986642e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 743,
    "uncertainty_score": 1.1117278209127335e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 744,
    "uncertainty_score": 1.1507843566960219e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 745,
    "uncertainty_score": 0.3889579155617692,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 746,
    "uncertainty_score": 8.143206997601737e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 747,
    "uncertainty_score": 3.365564715807068e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 748,
    "uncertainty_score": 4.94526530836481e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 749,
    "uncertainty_score": 0.20000021159648895,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 750,
    "uncertainty_score": 0.00019153532048221678,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 751,
    "uncertainty_score": 0.3160781240664732,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 752,
    "uncertainty_score": 0.25242453813552856,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 753,
    "uncertainty_score": 0.2000158280134201,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 754,
    "uncertainty_score": 5.052001039729248e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 755,
    "uncertainty_score": 0.20000021159648895,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 756,
    "uncertainty_score": 4.0253325672701123e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 757,
    "uncertainty_score": 0.20000010523276054,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 758,
    "uncertainty_score": 0.004621665924787521,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 759,
    "uncertainty_score": 5.142413647263311e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 760,
    "uncertainty_score": 0.20127107603360234,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 761,
    "uncertainty_score": 0.5100093039699569,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 762,
    "uncertainty_score": 5.313148321306471e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 763,
    "uncertainty_score": 2.8845970057034265e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 764,
    "uncertainty_score": 3.104238288642591e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 765,
    "uncertainty_score": 5.266344998977601e-11,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 766,
    "uncertainty_score": 3.3127198900695376e-11,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 767,
    "uncertainty_score": 0.0001384514180244878,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 768,
    "uncertainty_score": 3.4123706882382976e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 769,
    "uncertainty_score": 0.40007299935558366,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 770,
    "uncertainty_score": 6.692277287889681e-11,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 771,
    "uncertainty_score": 0.2000035436653675,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 772,
    "uncertainty_score": 2.450979081913829e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 773,
    "uncertainty_score": 6.342171400319785e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 774,
    "uncertainty_score": 8.022593873946438e-12,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 775,
    "uncertainty_score": 0.799498188495636,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 776,
    "uncertainty_score": 9.067310458021893e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 777,
    "uncertainty_score": 0.33319219946861267,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 778,
    "uncertainty_score": 0.20622873306274414,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 779,
    "uncertainty_score": 4.5068614440424426e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 780,
    "uncertainty_score": 0.4,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 781,
    "uncertainty_score": 1.6514530216227286e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 782,
    "uncertainty_score": 1.7290894902544096e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 783,
    "uncertainty_score": 0.20000055398676403,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 784,
    "uncertainty_score": 8.18314674688736e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 785,
    "uncertainty_score": 0.20000000298023224,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 786,
    "uncertainty_score": 1.4090511513131787e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 787,
    "uncertainty_score": 1.9903571057966474e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 788,
    "uncertainty_score": 0.2000039517879486,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 789,
    "uncertainty_score": 0.24989892542362213,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 790,
    "uncertainty_score": 2.4896491979120583e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 791,
    "uncertainty_score": 7.89579104321092e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 792,
    "uncertainty_score": 0.00013372115790843964,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 793,
    "uncertainty_score": 0.25000762939453125,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 794,
    "uncertainty_score": 6.248099371219951e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 795,
    "uncertainty_score": 0.5000000059589214,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 796,
    "uncertainty_score": 9.418897661817027e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 797,
    "uncertainty_score": 5.494777724379674e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 798,
    "uncertainty_score": 5.462337071548973e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 799,
    "uncertainty_score": 3.0081462682574056e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 800,
    "uncertainty_score": 0.25252944231033325,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 801,
    "uncertainty_score": 0.33333173394203186,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 802,
    "uncertainty_score": 2.1004347150466174e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 803,
    "uncertainty_score": 1.0921382909145905e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 804,
    "uncertainty_score": 0.2000691948205382,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 805,
    "uncertainty_score": 1.496966162140012e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 806,
    "uncertainty_score": 2.3372382202069275e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 807,
    "uncertainty_score": 1.5686582628404722e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 808,
    "uncertainty_score": 7.449613622156903e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 809,
    "uncertainty_score": 2.7390973426769628e-18,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 810,
    "uncertainty_score": 0.25000018284827064,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 811,
    "uncertainty_score": 0.0004753063549287617,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 812,
    "uncertainty_score": 0.00019894063007086515,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 813,
    "uncertainty_score": 0.3333510160446167,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 814,
    "uncertainty_score": 0.004017889034003019,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 815,
    "uncertainty_score": 0.0003769787435885519,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 816,
    "uncertainty_score": 0.14321637153625488,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 817,
    "uncertainty_score": 1.2941139271305246e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 818,
    "uncertainty_score": 4.0333407014259137e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 819,
    "uncertainty_score": 1.1419360568254433e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 820,
    "uncertainty_score": 1.3422517440631054e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 821,
    "uncertainty_score": 2.9982943211548374e-11,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 822,
    "uncertainty_score": 0.014469994232058525,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 823,
    "uncertainty_score": 6.887275389999559e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 824,
    "uncertainty_score": 1.607140198700563e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 825,
    "uncertainty_score": 1.9184035693342594e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 826,
    "uncertainty_score": 0.999988317489624,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 827,
    "uncertainty_score": 0.00023124281142372638,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 828,
    "uncertainty_score": 0.31470367312431335,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 829,
    "uncertainty_score": 0.20000001166766013,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 830,
    "uncertainty_score": 0.19991478323936462,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 831,
    "uncertainty_score": 8.371454214284313e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 832,
    "uncertainty_score": 8.21094581624493e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 833,
    "uncertainty_score": 8.820987273949754e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 834,
    "uncertainty_score": 4.396328949951567e-05,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 835,
    "uncertainty_score": 0.2500000298023224,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 836,
    "uncertainty_score": 0.24999988079071045,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 837,
    "uncertainty_score": 0.8000198305453523,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 838,
    "uncertainty_score": 0.21087472140789032,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 839,
    "uncertainty_score": 1.1870375793421317e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 840,
    "uncertainty_score": 0.16686777770519257,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 841,
    "uncertainty_score": 9.255080613002065e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 842,
    "uncertainty_score": 0.6644686460494995,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 843,
    "uncertainty_score": 7.744717089863684e-10,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 844,
    "uncertainty_score": 2.0394854693961406e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 845,
    "uncertainty_score": 1.23366305615491e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 846,
    "uncertainty_score": 0.2501126527786255,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 847,
    "uncertainty_score": 2.7395421042797352e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 848,
    "uncertainty_score": 0.1999998241662979,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 849,
    "uncertainty_score": 0.27946358919143677,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 850,
    "uncertainty_score": 4.011580789775593e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 851,
    "uncertainty_score": 1.8840753909898922e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 852,
    "uncertainty_score": 0.4999333322048187,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 853,
    "uncertainty_score": 7.717531058659688e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 854,
    "uncertainty_score": 6.715668993129142e-11,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 855,
    "uncertainty_score": 0.33333333370108537,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 856,
    "uncertainty_score": 0.006524630822241306,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 857,
    "uncertainty_score": 2.2103077701451923e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 858,
    "uncertainty_score": 9.96279195533134e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 859,
    "uncertainty_score": 4.446692614124004e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 860,
    "uncertainty_score": 0.25000004375767765,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 861,
    "uncertainty_score": 0.33311793208122253,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 862,
    "uncertainty_score": 0.25,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 863,
    "uncertainty_score": 4.5700699047301896e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 864,
    "uncertainty_score": 0.24999859929084778,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 865,
    "uncertainty_score": 1.139291860852154e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 866,
    "uncertainty_score": 1.6194707086469862e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 867,
    "uncertainty_score": 2.1442368961288594e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 868,
    "uncertainty_score": 0.16360034048557281,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 869,
    "uncertainty_score": 1.6190329632514988e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 870,
    "uncertainty_score": 3.95277356801671e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 871,
    "uncertainty_score": 3.259346340200864e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 872,
    "uncertainty_score": 2.0229260826454265e-06,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 873,
    "uncertainty_score": 0.19999995827674866,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 874,
    "uncertainty_score": 3.398831177037209e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 875,
    "uncertainty_score": 0.1987936943769455,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 876,
    "uncertainty_score": 3.168733383063227e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 877,
    "uncertainty_score": 0.19999182224273682,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 878,
    "uncertainty_score": 4.860413355345372e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 879,
    "uncertainty_score": 0.8000000000004265,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 880,
    "uncertainty_score": 0.00018425965390633792,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 881,
    "uncertainty_score": 1.7171436184071354e-06,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 882,
    "uncertainty_score": 5.562810201809043e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 883,
    "uncertainty_score": 5.2029021091470895e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 884,
    "uncertainty_score": 1.0063007493954501e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 885,
    "uncertainty_score": 0.0014333382714539766,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 886,
    "uncertainty_score": 0.20000486075878143,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 887,
    "uncertainty_score": 0.25,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 888,
    "uncertainty_score": 5.811190106896902e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 889,
    "uncertainty_score": 3.009210922755301e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 890,
    "uncertainty_score": 1.6577190535826958e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 891,
    "uncertainty_score": 0.20000001586073904,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 892,
    "uncertainty_score": 0.6000161170959473,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 893,
    "uncertainty_score": 0.2000000923871994,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 894,
    "uncertainty_score": 0.003738557221367955,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 895,
    "uncertainty_score": 0.20000021159648895,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 896,
    "uncertainty_score": 1.1834437430024991e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 897,
    "uncertainty_score": 8.484771912842248e-11,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 898,
    "uncertainty_score": 8.275708590632647e-11,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 899,
    "uncertainty_score": 0.013774094171822071,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 900,
    "uncertainty_score": 0.20000004768371582,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 901,
    "uncertainty_score": 0.00012271727609913796,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 902,
    "uncertainty_score": 0.7999984622001648,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 903,
    "uncertainty_score": 5.678681080922843e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 904,
    "uncertainty_score": 0.2000000923871994,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 905,
    "uncertainty_score": 7.605074209271478e-11,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 906,
    "uncertainty_score": 1.3631996864660323e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 907,
    "uncertainty_score": 7.774582968522736e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 908,
    "uncertainty_score": 0.00024135080457199365,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 909,
    "uncertainty_score": 0.2004503756761551,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 910,
    "uncertainty_score": 0.009060489945113659,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 911,
    "uncertainty_score": 0.250010651012758,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 912,
    "uncertainty_score": 2.91789439832435e-11,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 913,
    "uncertainty_score": 5.048946718488878e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 914,
    "uncertainty_score": 4.664605590676274e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 915,
    "uncertainty_score": 0.20000071823596954,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 916,
    "uncertainty_score": 5.625420726573793e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 917,
    "uncertainty_score": 0.20000001788139343,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 918,
    "uncertainty_score": 0.1666688770055771,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 919,
    "uncertainty_score": 3.850868512955685e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 920,
    "uncertainty_score": 7.379081239378138e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 921,
    "uncertainty_score": 3.0970661590856707e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 922,
    "uncertainty_score": 4.375134722067742e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 923,
    "uncertainty_score": 5.014194357499946e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 924,
    "uncertainty_score": 0.40000000000026653,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 925,
    "uncertainty_score": 0.19998472929000854,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 926,
    "uncertainty_score": 8.279268399746798e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 927,
    "uncertainty_score": 4.5444515706094535e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 928,
    "uncertainty_score": 1.162698097800785e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 929,
    "uncertainty_score": 0.2000334906038582,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 930,
    "uncertainty_score": 1.4454247320827562e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 931,
    "uncertainty_score": 0.24999912083148956,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 932,
    "uncertainty_score": 5.510268907826799e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 933,
    "uncertainty_score": 3.66791027772706e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 934,
    "uncertainty_score": 1.3992092817716184e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 935,
    "uncertainty_score": 0.0009835168020799756,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 936,
    "uncertainty_score": 0.25052523612976074,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 937,
    "uncertainty_score": 0.2000003159046173,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 938,
    "uncertainty_score": 0.24999983608722687,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 939,
    "uncertainty_score": 1.1680555189741426e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 940,
    "uncertainty_score": 1.0892202908507898e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 941,
    "uncertainty_score": 1.0559871033155588e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 942,
    "uncertainty_score": 0.00017667017527855933,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 943,
    "uncertainty_score": 1.8430920079026691e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 944,
    "uncertainty_score": 1.6682995263028744e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 945,
    "uncertainty_score": 0.03865945711731911,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 946,
    "uncertainty_score": 5.972697181277908e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 947,
    "uncertainty_score": 1.4548252238455461e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 948,
    "uncertainty_score": 0.2057614028453827,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 949,
    "uncertainty_score": 0.19999995827674866,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 950,
    "uncertainty_score": 0.20000119105936648,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 951,
    "uncertainty_score": 0.2500002533836883,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 952,
    "uncertainty_score": 0.24276474303931908,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 953,
    "uncertainty_score": 0.20000000298023224,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 954,
    "uncertainty_score": 0.33333336036986,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 955,
    "uncertainty_score": 5.727571306124446e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 956,
    "uncertainty_score": 2.6577194489618705e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 957,
    "uncertainty_score": 1.858051490444268e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 958,
    "uncertainty_score": 1.478933864262899e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 959,
    "uncertainty_score": 0.00017491279868409038,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 960,
    "uncertainty_score": 0.4000000000000636,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 961,
    "uncertainty_score": 7.971770514814125e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 962,
    "uncertainty_score": 5.049074047747126e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 963,
    "uncertainty_score": 3.2756025802882505e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 964,
    "uncertainty_score": 0.19859036803245544,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 965,
    "uncertainty_score": 0.014477227814495564,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 966,
    "uncertainty_score": 4.39353868841863e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 967,
    "uncertainty_score": 7.528298738179728e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 968,
    "uncertainty_score": 0.1446959227323532,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 969,
    "uncertainty_score": 6.305947863438632e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 970,
    "uncertainty_score": 0.00036583488690666854,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 971,
    "uncertainty_score": 4.22694768076326e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 972,
    "uncertainty_score": 0.001409689662978053,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 973,
    "uncertainty_score": 0.6000188243328012,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 974,
    "uncertainty_score": 1.5927714258623382e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 975,
    "uncertainty_score": 1.7005057084684694e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 976,
    "uncertainty_score": 6.1839418776799e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 977,
    "uncertainty_score": 0.3962474465370178,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 978,
    "uncertainty_score": 7.27159431335167e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 979,
    "uncertainty_score": 6.621983517085539e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 980,
    "uncertainty_score": 1.2062870147211413e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 981,
    "uncertainty_score": 1.8308815796785893e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 982,
    "uncertainty_score": 2.6507542827403086e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 983,
    "uncertainty_score": 7.65780896472279e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 984,
    "uncertainty_score": 1.0717261744730422e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 985,
    "uncertainty_score": 0.4870053231716156,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 986,
    "uncertainty_score": 3.121452607501851e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 987,
    "uncertainty_score": 1.1130359780509025e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 988,
    "uncertainty_score": 0.00020645097538363189,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 989,
    "uncertainty_score": 8.06783639895059e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 990,
    "uncertainty_score": 2.009900072152959e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 991,
    "uncertainty_score": 8.191184974748467e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 992,
    "uncertainty_score": 0.20841754542619725,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 993,
    "uncertainty_score": 0.3052041530609131,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 994,
    "uncertainty_score": 0.20516535639762878,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 995,
    "uncertainty_score": 0.400013247213362,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 996,
    "uncertainty_score": 3.3628522942308336e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 997,
    "uncertainty_score": 3.759068056830017e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 998,
    "uncertainty_score": 8.914243565527613e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 999,
    "uncertainty_score": 0.2508098163525574,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1000,
    "uncertainty_score": 1.7986313549656074e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1001,
    "uncertainty_score": 0.0005073951906524599,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1002,
    "uncertainty_score": 1.7962298315410408e-11,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1003,
    "uncertainty_score": 1.360790520266164e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1004,
    "uncertainty_score": 1.6962252630037256e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1005,
    "uncertainty_score": 0.40108823627233503,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1006,
    "uncertainty_score": 0.25,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1007,
    "uncertainty_score": 1.97980654093044e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1008,
    "uncertainty_score": 0.3858276903629303,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1009,
    "uncertainty_score": 0.4000731331749193,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1010,
    "uncertainty_score": 3.8336761543078524e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1011,
    "uncertainty_score": 0.25,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1012,
    "uncertainty_score": 1.0892465525103034e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1013,
    "uncertainty_score": 0.0004573393671307713,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1014,
    "uncertainty_score": 0.00018606972298584878,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1015,
    "uncertainty_score": 3.9696189146905435e-17,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1016,
    "uncertainty_score": 0.18428246676921844,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1017,
    "uncertainty_score": 0.25000006544759623,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1018,
    "uncertainty_score": 0.20000307261943817,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1019,
    "uncertainty_score": 0.7499999403953552,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1020,
    "uncertainty_score": 0.011330485343933105,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1021,
    "uncertainty_score": 0.4014935218896426,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1022,
    "uncertainty_score": 1.2594675302679548e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1023,
    "uncertainty_score": 0.0001227306347573176,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1024,
    "uncertainty_score": 1.7597757973053518e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1025,
    "uncertainty_score": 0.0018555531278252602,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1026,
    "uncertainty_score": 0.016976991668343544,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1027,
    "uncertainty_score": 5.95502172018314e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1028,
    "uncertainty_score": 2.6119625906595445e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1029,
    "uncertainty_score": 2.787484132404927e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1030,
    "uncertainty_score": 0.40017420053482056,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1031,
    "uncertainty_score": 9.69589336818899e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1032,
    "uncertainty_score": 0.20000003634952312,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1033,
    "uncertainty_score": 0.0009070960222743452,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1034,
    "uncertainty_score": 2.3525045023120583e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1035,
    "uncertainty_score": 0.2522775355054958,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1036,
    "uncertainty_score": 2.75181310030459e-12,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1037,
    "uncertainty_score": 0.20000000298023224,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1038,
    "uncertainty_score": 2.244742391965815e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1039,
    "uncertainty_score": 0.6000000238418579,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1040,
    "uncertainty_score": 0.0009462505113333464,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1041,
    "uncertainty_score": 6.435624477774127e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1042,
    "uncertainty_score": 0.0025293531361967325,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1043,
    "uncertainty_score": 7.492182703572325e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1044,
    "uncertainty_score": 0.2500000596046448,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1045,
    "uncertainty_score": 0.4020577073097229,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1046,
    "uncertainty_score": 2.5730818379088305e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1047,
    "uncertainty_score": 1.1431681157247908e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1048,
    "uncertainty_score": 7.116427447328988e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1049,
    "uncertainty_score": 0.20000000298023224,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1050,
    "uncertainty_score": 0.25,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1051,
    "uncertainty_score": 0.00011795383034041151,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1052,
    "uncertainty_score": 0.1666666716337204,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1053,
    "uncertainty_score": 1.2222029965869297e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1054,
    "uncertainty_score": 0.009634974412620068,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1055,
    "uncertainty_score": 5.935891222996759e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1056,
    "uncertainty_score": 3.463327971076069e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1057,
    "uncertainty_score": 1.384493474726467e-11,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1058,
    "uncertainty_score": 0.0005176120903342962,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1059,
    "uncertainty_score": 0.12800614535808563,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1060,
    "uncertainty_score": 4.400824593631114e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1061,
    "uncertainty_score": 3.0285123298057215e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1062,
    "uncertainty_score": 3.267737636036827e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1063,
    "uncertainty_score": 2.3115018166208756e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1064,
    "uncertainty_score": 0.25000159552965084,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1065,
    "uncertainty_score": 2.496542208518804e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1066,
    "uncertainty_score": 8.796119459475449e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1067,
    "uncertainty_score": 0.2000000029239985,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1068,
    "uncertainty_score": 0.0019539722707122564,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1069,
    "uncertainty_score": 0.19998566806316376,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1070,
    "uncertainty_score": 0.3333331048488617,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1071,
    "uncertainty_score": 1.366143180803192e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1072,
    "uncertainty_score": 8.807085727369213e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1073,
    "uncertainty_score": 2.2665777588137814e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1074,
    "uncertainty_score": 1.4965145965106785e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1075,
    "uncertainty_score": 1.0228654034882823e-10,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1076,
    "uncertainty_score": 7.016890776867513e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1077,
    "uncertainty_score": 1.0661162832548143e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1078,
    "uncertainty_score": 5.161480203241808e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1079,
    "uncertainty_score": 0.25200700759887695,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1080,
    "uncertainty_score": 1.5674104361096397e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1081,
    "uncertainty_score": 1.9544454943343226e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1082,
    "uncertainty_score": 0.40000362905452674,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1083,
    "uncertainty_score": 5.4752599680796266e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1084,
    "uncertainty_score": 2.3326271048063063e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1085,
    "uncertainty_score": 2.229534584330395e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1086,
    "uncertainty_score": 0.2003861743427288,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1087,
    "uncertainty_score": 1.0319216698917444e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1088,
    "uncertainty_score": 6.64226590396666e-11,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1089,
    "uncertainty_score": 0.20000000298023224,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1090,
    "uncertainty_score": 6.399818175850669e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1091,
    "uncertainty_score": 7.95539190079353e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1092,
    "uncertainty_score": 0.2500002980232239,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1093,
    "uncertainty_score": 0.00023347341630142182,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1094,
    "uncertainty_score": 1.6864863283672094e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1095,
    "uncertainty_score": 0.2500000992275711,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1096,
    "uncertainty_score": 0.0001976944477064535,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1097,
    "uncertainty_score": 0.3401767611503601,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1098,
    "uncertainty_score": 3.555892817530548e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1099,
    "uncertainty_score": 4.823990096269881e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1100,
    "uncertainty_score": 2.638659291065437e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1101,
    "uncertainty_score": 2.348009431329956e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1102,
    "uncertainty_score": 0.2000006139278412,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1103,
    "uncertainty_score": 0.06298553943634033,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1104,
    "uncertainty_score": 8.841271181836419e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1105,
    "uncertainty_score": 0.20001106844865718,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1106,
    "uncertainty_score": 0.36916007480844465,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1107,
    "uncertainty_score": 0.3079445497384129,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1108,
    "uncertainty_score": 3.354930752706658e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1109,
    "uncertainty_score": 0.00047439190032134363,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1110,
    "uncertainty_score": 5.655762833485629e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1111,
    "uncertainty_score": 0.19967030464677998,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1112,
    "uncertainty_score": 0.5999999550386776,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1113,
    "uncertainty_score": 0.2037947916396381,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1114,
    "uncertainty_score": 0.4018147392466103,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1115,
    "uncertainty_score": 0.34810019645470913,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1116,
    "uncertainty_score": 0.16667094202028976,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1117,
    "uncertainty_score": 2.6681749440249013e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1118,
    "uncertainty_score": 0.20000001076905258,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1119,
    "uncertainty_score": 0.08422903791604493,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1120,
    "uncertainty_score": 2.3746134570939792e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1121,
    "uncertainty_score": 0.4131209595729084,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1122,
    "uncertainty_score": 0.20000007732476982,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1123,
    "uncertainty_score": 3.3085548164866954e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1124,
    "uncertainty_score": 1.7165540853809685e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1125,
    "uncertainty_score": 1.976565246494473e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1126,
    "uncertainty_score": 0.004595491170660858,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1127,
    "uncertainty_score": 7.625705508651395e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1128,
    "uncertainty_score": 1.9830895311720644e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1129,
    "uncertainty_score": 9.079579356369249e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1130,
    "uncertainty_score": 7.280558347591351e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1131,
    "uncertainty_score": 0.39999999981021306,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1132,
    "uncertainty_score": 5.905228304369312e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1133,
    "uncertainty_score": 0.25000833148125867,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1134,
    "uncertainty_score": 0.00013819476063194525,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1135,
    "uncertainty_score": 5.480262126708581e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1136,
    "uncertainty_score": 0.1956597695445669,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1137,
    "uncertainty_score": 0.40002987421087044,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1138,
    "uncertainty_score": 7.304374661836579e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1139,
    "uncertainty_score": 0.0001927007003028937,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1140,
    "uncertainty_score": 1.3942081023816433e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1141,
    "uncertainty_score": 0.022965336789623272,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1142,
    "uncertainty_score": 2.3767451206544383e-11,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1143,
    "uncertainty_score": 6.585460053866845e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1144,
    "uncertainty_score": 0.004145778496629691,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1145,
    "uncertainty_score": 0.7491900158003362,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1146,
    "uncertainty_score": 7.02390379301778e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1147,
    "uncertainty_score": 0.041037837385323725,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1148,
    "uncertainty_score": 5.464282461517446e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1149,
    "uncertainty_score": 8.072530921551171e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1150,
    "uncertainty_score": 2.549178726396551e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1151,
    "uncertainty_score": 4.884800913940726e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1152,
    "uncertainty_score": 1.3601631051900653e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1153,
    "uncertainty_score": 7.289298193280667e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1154,
    "uncertainty_score": 1.425284678663591e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1155,
    "uncertainty_score": 4.969070688266443e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1156,
    "uncertainty_score": 8.720462343984525e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1157,
    "uncertainty_score": 0.5000000013767592,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1158,
    "uncertainty_score": 0.20019890425742334,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1159,
    "uncertainty_score": 3.329516139887908e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1160,
    "uncertainty_score": 0.0008404388648208689,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1161,
    "uncertainty_score": 0.0009468683149695124,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1162,
    "uncertainty_score": 0.13245295153745681,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1163,
    "uncertainty_score": 0.19998835363267156,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1164,
    "uncertainty_score": 1.9305891377014108e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1165,
    "uncertainty_score": 0.25,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1166,
    "uncertainty_score": 1.4468970447498235e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1167,
    "uncertainty_score": 7.218041979074729e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1168,
    "uncertainty_score": 2.0125820546727982e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1169,
    "uncertainty_score": 0.1242195319528649,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1170,
    "uncertainty_score": 1.4160981708362231e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1171,
    "uncertainty_score": 5.667563317901607e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1172,
    "uncertainty_score": 0.20000000238684876,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1173,
    "uncertainty_score": 0.2500000018353749,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1174,
    "uncertainty_score": 0.00010138737098282502,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1175,
    "uncertainty_score": 0.25056296335771444,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1176,
    "uncertainty_score": 0.24181145183996514,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1177,
    "uncertainty_score": 0.0,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1178,
    "uncertainty_score": 7.188075308123815e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1179,
    "uncertainty_score": 2.5084614834750317e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1180,
    "uncertainty_score": 6.446745729145506e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1181,
    "uncertainty_score": 6.167049654189658e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1182,
    "uncertainty_score": 0.00011860888392470725,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1183,
    "uncertainty_score": 1.6558114396830377e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1184,
    "uncertainty_score": 2.6407983946106846e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1185,
    "uncertainty_score": 0.25004878181757384,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1186,
    "uncertainty_score": 0.2500303211997333,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1187,
    "uncertainty_score": 4.865231221785934e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1188,
    "uncertainty_score": 0.25000079691922,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1189,
    "uncertainty_score": 0.25002555674863286,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1190,
    "uncertainty_score": 0.018214239703347117,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1191,
    "uncertainty_score": 0.25013041671127034,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1192,
    "uncertainty_score": 0.21380302157473646,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1193,
    "uncertainty_score": 3.4129510888461274e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1194,
    "uncertainty_score": 3.7090665267301065e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1195,
    "uncertainty_score": 0.20003528559504785,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1196,
    "uncertainty_score": 0.4000109780288478,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1197,
    "uncertainty_score": 0.20050038360928463,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1198,
    "uncertainty_score": 8.032064923873881e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1199,
    "uncertainty_score": 0.2540175584966465,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1200,
    "uncertainty_score": 0.041080690475880276,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1201,
    "uncertainty_score": 4.6679061892179555e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1202,
    "uncertainty_score": 1.3414034503652164e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1203,
    "uncertainty_score": 0.5999982444958475,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1204,
    "uncertainty_score": 2.2699328121124692e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1205,
    "uncertainty_score": 2.895052122788757e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1206,
    "uncertainty_score": 0.16667895836502358,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1207,
    "uncertainty_score": 0.1666912286395413,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1208,
    "uncertainty_score": 0.10000044275839366,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1209,
    "uncertainty_score": 0.2500000003621892,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1210,
    "uncertainty_score": 1.2382795621768175e-06,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1211,
    "uncertainty_score": 3.8017247129771777e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1212,
    "uncertainty_score": 7.146396336264908e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1213,
    "uncertainty_score": 1.1869524417652154e-11,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1214,
    "uncertainty_score": 2.179057880294271e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1215,
    "uncertainty_score": 1.9993614887266723e-10,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1216,
    "uncertainty_score": 1.907101298320635e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1217,
    "uncertainty_score": 0.4001960992029959,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1218,
    "uncertainty_score": 0.2000000002841719,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1219,
    "uncertainty_score": 0.20688902250096883,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1220,
    "uncertainty_score": 5.433447043049008e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1221,
    "uncertainty_score": 1.016306571235946e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1222,
    "uncertainty_score": 5.378516012783196e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1223,
    "uncertainty_score": 5.958897671631806e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1224,
    "uncertainty_score": 0.003742266100639695,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1225,
    "uncertainty_score": 0.002230951845664585,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1226,
    "uncertainty_score": 3.3764464658741027e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1227,
    "uncertainty_score": 5.246223136807153e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1228,
    "uncertainty_score": 0.24999392726405997,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1229,
    "uncertainty_score": 1.561988066408228e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1230,
    "uncertainty_score": 0.3999999998304905,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1231,
    "uncertainty_score": 0.2003297016889566,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1232,
    "uncertainty_score": 3.559014910030642e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1233,
    "uncertainty_score": 5.774826073180264e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1234,
    "uncertainty_score": 0.2746540474708915,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1235,
    "uncertainty_score": 1.9954250105507134e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1236,
    "uncertainty_score": 0.0039363483571586075,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1237,
    "uncertainty_score": 7.508053815796977e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1238,
    "uncertainty_score": 1.415924651103915e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1239,
    "uncertainty_score": 0.0019103170498894625,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1240,
    "uncertainty_score": 0.0013296901452436655,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1241,
    "uncertainty_score": 1.2669456916421397e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1242,
    "uncertainty_score": 0.16666666659589438,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1243,
    "uncertainty_score": 0.2500000092455957,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1244,
    "uncertainty_score": 8.984948441072094e-11,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1245,
    "uncertainty_score": 0.16666666685069162,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1246,
    "uncertainty_score": 2.774758854723483e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1247,
    "uncertainty_score": 0.6000024693981096,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1248,
    "uncertainty_score": 2.7225127543351384e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1249,
    "uncertainty_score": 4.265801585362986e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1250,
    "uncertainty_score": 0.3962406474047699,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1251,
    "uncertainty_score": 1.021055044724057e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1252,
    "uncertainty_score": 0.10872016994400936,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1253,
    "uncertainty_score": 3.4509386085291287e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1254,
    "uncertainty_score": 0.016794952345649337,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1255,
    "uncertainty_score": 0.25000000091907204,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1256,
    "uncertainty_score": 0.403747417219605,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1257,
    "uncertainty_score": 0.09703879121055572,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1258,
    "uncertainty_score": 0.20012852960415112,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1259,
    "uncertainty_score": 1.4287732072089318e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1260,
    "uncertainty_score": 2.5554059228211655e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1261,
    "uncertainty_score": 0.2500000142666601,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1262,
    "uncertainty_score": 0.0036194404040891734,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1263,
    "uncertainty_score": 2.469588190109228e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1264,
    "uncertainty_score": 3.3222789987474485e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1265,
    "uncertainty_score": 5.176231019820896e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1266,
    "uncertainty_score": 0.006575330488350466,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1267,
    "uncertainty_score": 1.7544573442870222e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1268,
    "uncertainty_score": 0.19999999985704417,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1269,
    "uncertainty_score": 0.20012770096077678,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1270,
    "uncertainty_score": 0.002317101856222343,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1271,
    "uncertainty_score": 8.18214145825317e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1272,
    "uncertainty_score": 0.19377123361876505,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1273,
    "uncertainty_score": 3.902553279521381e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1274,
    "uncertainty_score": 0.0025318407911483136,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1275,
    "uncertainty_score": 2.8637755971791686e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1276,
    "uncertainty_score": 0.1999791094198479,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1277,
    "uncertainty_score": 5.272865101049437e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1278,
    "uncertainty_score": 0.25000009425996866,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1279,
    "uncertainty_score": 0.24999997588039508,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1280,
    "uncertainty_score": 0.5133516319394894,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1281,
    "uncertainty_score": 1.7670582091051092e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1282,
    "uncertainty_score": 2.4912029984326702e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1283,
    "uncertainty_score": 4.043144273570691e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1284,
    "uncertainty_score": 8.963098014401251e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1285,
    "uncertainty_score": 1.5521113170125905e-11,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1286,
    "uncertainty_score": 8.089936174437079e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1287,
    "uncertainty_score": 0.40052633481668043,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1288,
    "uncertainty_score": 4.330819029764093e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1289,
    "uncertainty_score": 3.37526286789581e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1290,
    "uncertainty_score": 0.00024132918163653712,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1291,
    "uncertainty_score": 0.1026002647631572,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1292,
    "uncertainty_score": 0.20049968922509556,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1293,
    "uncertainty_score": 0.2000000381445764,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1294,
    "uncertainty_score": 3.290338672917012e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1295,
    "uncertainty_score": 2.9574201709267654e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1296,
    "uncertainty_score": 5.618875834403123e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1297,
    "uncertainty_score": 1.3369987584973632e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1298,
    "uncertainty_score": 1.0582209213132247e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1299,
    "uncertainty_score": 6.910047089035016e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1300,
    "uncertainty_score": 1.0683716838383279e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1301,
    "uncertainty_score": 2.385854441023424e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1302,
    "uncertainty_score": 6.878211747614166e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1303,
    "uncertainty_score": 0.25000017357481114,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1304,
    "uncertainty_score": 5.1927907631640716e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1305,
    "uncertainty_score": 0.20000259305982,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1306,
    "uncertainty_score": 0.5000082924581247,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1307,
    "uncertainty_score": 6.635970437527177e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1308,
    "uncertainty_score": 3.034738562510867e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1309,
    "uncertainty_score": 0.25948325545650675,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1310,
    "uncertainty_score": 6.8670641819822984e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1311,
    "uncertainty_score": 6.698774301349126e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1312,
    "uncertainty_score": 1.3422274834142491e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1313,
    "uncertainty_score": 0.1997328434258332,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1314,
    "uncertainty_score": 0.20000300742793162,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1315,
    "uncertainty_score": 0.399999763381892,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1316,
    "uncertainty_score": 0.0005415567121865212,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1317,
    "uncertainty_score": 2.725099340302239e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1318,
    "uncertainty_score": 0.49999999975000003,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1319,
    "uncertainty_score": 2.188223263419243e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1320,
    "uncertainty_score": 3.788509179145702e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1321,
    "uncertainty_score": 0.33338557673141195,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1322,
    "uncertainty_score": 0.5000000363343143,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1323,
    "uncertainty_score": 0.199473665206141,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1324,
    "uncertainty_score": 0.07703189111274239,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1325,
    "uncertainty_score": 1.1743941616565375e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1326,
    "uncertainty_score": 6.696412736486487e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1327,
    "uncertainty_score": 0.050189246198589485,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1328,
    "uncertainty_score": 8.782574729301611e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1329,
    "uncertainty_score": 1.1515773145897511e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1330,
    "uncertainty_score": 5.852138211403784e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1331,
    "uncertainty_score": 0.031778086787588936,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1332,
    "uncertainty_score": 1.8572681104960353e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1333,
    "uncertainty_score": 0.2500002066875336,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1334,
    "uncertainty_score": 3.677533825278247e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1335,
    "uncertainty_score": 5.580009808875258e-11,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1336,
    "uncertainty_score": 1.1714206127527394e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1337,
    "uncertainty_score": 0.74999999975,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1338,
    "uncertainty_score": 0.6000000020015501,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1339,
    "uncertainty_score": 3.159022887615813e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1340,
    "uncertainty_score": 5.5638648672253583e-11,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1341,
    "uncertainty_score": 0.19775686520775831,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1342,
    "uncertainty_score": 0.2000001042194422,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1343,
    "uncertainty_score": 5.110174760155993e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1344,
    "uncertainty_score": 8.286246223884451e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1345,
    "uncertainty_score": 3.9288977969197017e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1346,
    "uncertainty_score": 3.8095687650856706e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1347,
    "uncertainty_score": 1.1718453584645254e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1348,
    "uncertainty_score": 0.20000000004689475,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1349,
    "uncertainty_score": 0.19584970236960736,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1350,
    "uncertainty_score": 0.20000000077134464,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1351,
    "uncertainty_score": 0.002486330333641939,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1352,
    "uncertainty_score": 0.20000102008006815,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1353,
    "uncertainty_score": 2.672980835874848e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1354,
    "uncertainty_score": 0.33335074922811353,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1355,
    "uncertainty_score": 3.056670250959534e-11,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1356,
    "uncertainty_score": 0.006572852586184873,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1357,
    "uncertainty_score": 0.2000220075964454,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1358,
    "uncertainty_score": 0.20000010328645107,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1359,
    "uncertainty_score": 0.4000000000017052,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1360,
    "uncertainty_score": 0.6666666666666666,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1361,
    "uncertainty_score": 0.250000405277612,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1362,
    "uncertainty_score": 3.0259473174189694e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1363,
    "uncertainty_score": 1.8599393542721976e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1364,
    "uncertainty_score": 0.4440853841718863,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1365,
    "uncertainty_score": 1.4132445602380887e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1366,
    "uncertainty_score": 9.191142169475295e-12,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1367,
    "uncertainty_score": 3.7226956579488473e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1368,
    "uncertainty_score": 0.6000389783157983,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1369,
    "uncertainty_score": 0.5909091249860275,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1370,
    "uncertainty_score": 1.8949516138320874e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1371,
    "uncertainty_score": 0.20001786883743838,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1372,
    "uncertainty_score": 1.2961336237099466e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1373,
    "uncertainty_score": 0.0008091347574526238,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1374,
    "uncertainty_score": 0.24999999981081122,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1375,
    "uncertainty_score": 1.4609991615887346e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1376,
    "uncertainty_score": 4.566353479681603e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1377,
    "uncertainty_score": 0.20000104854413325,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1378,
    "uncertainty_score": 7.249402126311098e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1379,
    "uncertainty_score": 0.16667040664829402,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1380,
    "uncertainty_score": 3.1925405511898637e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1381,
    "uncertainty_score": 9.75934951788436e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1382,
    "uncertainty_score": 5.196967490520283e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1383,
    "uncertainty_score": 0.18750326815825982,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1384,
    "uncertainty_score": 2.0510979899323845e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1385,
    "uncertainty_score": 4.935243455566585e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1386,
    "uncertainty_score": 0.2499999997603654,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1387,
    "uncertainty_score": 6.216149052213126e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1388,
    "uncertainty_score": 0.0011275588455397089,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1389,
    "uncertainty_score": 0.40853806958601363,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1390,
    "uncertainty_score": 2.305187255642573e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1391,
    "uncertainty_score": 2.982047232250891e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1392,
    "uncertainty_score": 0.43196962830144925,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1393,
    "uncertainty_score": 0.24999999974999998,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1394,
    "uncertainty_score": 0.20000005483339406,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1395,
    "uncertainty_score": 0.11375875065337492,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1396,
    "uncertainty_score": 0.00011058476019511477,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1397,
    "uncertainty_score": 6.7501675978001e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1398,
    "uncertainty_score": 9.963469266819937e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1399,
    "uncertainty_score": 7.964899595932546e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1400,
    "uncertainty_score": 0.16729224384164484,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1401,
    "uncertainty_score": 1.8395929894494585e-11,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1402,
    "uncertainty_score": 0.35896216404598824,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1403,
    "uncertainty_score": 1.2387049566324599e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1404,
    "uncertainty_score": 0.25000020874840034,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1405,
    "uncertainty_score": 3.7877418877522017e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1406,
    "uncertainty_score": 0.20000000023176084,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1407,
    "uncertainty_score": 0.14511458925242451,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1408,
    "uncertainty_score": 0.40968642419543355,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1409,
    "uncertainty_score": 0.0006481641126533313,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1410,
    "uncertainty_score": 2.637237062812316e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1411,
    "uncertainty_score": 0.20502928351798025,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1412,
    "uncertainty_score": 0.2310354554064263,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1413,
    "uncertainty_score": 0.010522025042198967,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1414,
    "uncertainty_score": 2.957370269229129e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1415,
    "uncertainty_score": 0.4015631774703962,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1416,
    "uncertainty_score": 6.667553297962054e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1417,
    "uncertainty_score": 6.109156799716022e-11,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1418,
    "uncertainty_score": 0.3386576856801146,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1419,
    "uncertainty_score": 1.038953750796204e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1420,
    "uncertainty_score": 0.006889022391576097,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1421,
    "uncertainty_score": 0.20021908896383436,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1422,
    "uncertainty_score": 2.2621047100967335e-11,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1423,
    "uncertainty_score": 0.2008582932049597,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1424,
    "uncertainty_score": 6.0274956924590334e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1425,
    "uncertainty_score": 1.5206143776228386e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1426,
    "uncertainty_score": 9.599050962308648e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1427,
    "uncertainty_score": 4.613542069578395e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1428,
    "uncertainty_score": 4.17211469259407e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1429,
    "uncertainty_score": 0.0001866749507915333,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1430,
    "uncertainty_score": 0.0015086930084369406,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1431,
    "uncertainty_score": 0.3332904538441203,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1432,
    "uncertainty_score": 4.962632054389904e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1433,
    "uncertainty_score": 2.5992678427745907e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1434,
    "uncertainty_score": 3.529791356710363e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1435,
    "uncertainty_score": 3.241853850009424e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1436,
    "uncertainty_score": 4.682287769357805e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1437,
    "uncertainty_score": 3.862212891668501e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1438,
    "uncertainty_score": 0.0006883537985332381,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1439,
    "uncertainty_score": 6.107478483627537e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1440,
    "uncertainty_score": 1.2798238239601432e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1441,
    "uncertainty_score": 6.350688545553646e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1442,
    "uncertainty_score": 0.0002971284599518012,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1443,
    "uncertainty_score": 7.327307922510627e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1444,
    "uncertainty_score": 0.3333333343721094,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1445,
    "uncertainty_score": 1.9387872068861577e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1446,
    "uncertainty_score": 0.19999183689087335,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1447,
    "uncertainty_score": 0.25048168368735624,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1448,
    "uncertainty_score": 0.2500000664973709,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1449,
    "uncertainty_score": 0.28440646326081753,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1450,
    "uncertainty_score": 0.24999999981254326,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1451,
    "uncertainty_score": 5.3534407137706436e-11,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1452,
    "uncertainty_score": 0.2500600788639915,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1453,
    "uncertainty_score": 0.00016774939259756375,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1454,
    "uncertainty_score": 4.886798993906853e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1455,
    "uncertainty_score": 0.20005333762853,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1456,
    "uncertainty_score": 4.73425818561055e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1457,
    "uncertainty_score": 0.19995437700915586,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1458,
    "uncertainty_score": 1.0252898890063577e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1459,
    "uncertainty_score": 0.20000000677392796,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1460,
    "uncertainty_score": 0.1961760961723929,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1461,
    "uncertainty_score": 0.0012920220068634823,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1462,
    "uncertainty_score": 0.25010121531528373,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1463,
    "uncertainty_score": 1.442155706749509e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1464,
    "uncertainty_score": 0.00027942449635072475,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1465,
    "uncertainty_score": 0.2013385785267478,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1466,
    "uncertainty_score": 0.24999999976331735,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1467,
    "uncertainty_score": 1.1316232117690035e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1468,
    "uncertainty_score": 0.00045796512152224605,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1469,
    "uncertainty_score": 0.10668259744568868,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1470,
    "uncertainty_score": 3.1270019997341614e-11,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1471,
    "uncertainty_score": 0.25000004787759117,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1472,
    "uncertainty_score": 1.142188487618182e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1473,
    "uncertainty_score": 0.08134658993514558,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1474,
    "uncertainty_score": 2.6879786085380916e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1475,
    "uncertainty_score": 5.100745575739642e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1476,
    "uncertainty_score": 0.2000000736666859,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1477,
    "uncertainty_score": 6.01321360469203e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1478,
    "uncertainty_score": 2.1797664645677005e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1479,
    "uncertainty_score": 8.120614356033445e-11,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1480,
    "uncertainty_score": 0.2000000005651637,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1481,
    "uncertainty_score": 6.904376581717613e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1482,
    "uncertainty_score": 0.5980790146048602,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1483,
    "uncertainty_score": 0.24999991040198252,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1484,
    "uncertainty_score": 4.9452641932650794e-11,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1485,
    "uncertainty_score": 7.023519098186943e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1486,
    "uncertainty_score": 1.1402589655407396e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1487,
    "uncertainty_score": 0.3999965972708762,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1488,
    "uncertainty_score": 0.25000006889307835,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1489,
    "uncertainty_score": 7.120236970085373e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1490,
    "uncertainty_score": 0.2500003452439856,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1491,
    "uncertainty_score": 5.45799865087026e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1492,
    "uncertainty_score": 1.8755165772108985e-10,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1493,
    "uncertainty_score": 0.25000000124905297,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1494,
    "uncertainty_score": 1.2059426589680264e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1495,
    "uncertainty_score": 0.2500247883762052,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1496,
    "uncertainty_score": 3.484260875021334e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1497,
    "uncertainty_score": 4.0953231445179904e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1498,
    "uncertainty_score": 0.3999191482134598,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1499,
    "uncertainty_score": 0.0077859634741195,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1500,
    "uncertainty_score": 3.0851902337002435e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1501,
    "uncertainty_score": 0.38801486440374877,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1502,
    "uncertainty_score": 0.37500009111066585,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1503,
    "uncertainty_score": 0.29491311671622794,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1504,
    "uncertainty_score": 8.579686551147137e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1505,
    "uncertainty_score": 0.666666662874915,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1506,
    "uncertainty_score": 0.399614652679649,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1507,
    "uncertainty_score": 0.20000687302518272,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1508,
    "uncertainty_score": 1.8294144098282062e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1509,
    "uncertainty_score": 6.91985764940911e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1510,
    "uncertainty_score": 3.6641144807339574e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1511,
    "uncertainty_score": 0.2500513896678267,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1512,
    "uncertainty_score": 1.1951827444889502e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1513,
    "uncertainty_score": 0.2001803192068628,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1514,
    "uncertainty_score": 0.2500000062478914,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1515,
    "uncertainty_score": 2.4448575141621745e-06,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1516,
    "uncertainty_score": 0.3997935763384489,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1517,
    "uncertainty_score": 0.002605296382742765,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1518,
    "uncertainty_score": 0.005647031036093087,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1519,
    "uncertainty_score": 0.00012272818848607729,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1520,
    "uncertainty_score": 0.20000003466992738,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1521,
    "uncertainty_score": 6.820647051087121e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1522,
    "uncertainty_score": 0.3333339542806019,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1523,
    "uncertainty_score": 2.7622575306328056e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1524,
    "uncertainty_score": 7.039631884394165e-14,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1525,
    "uncertainty_score": 7.293161022158272e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1526,
    "uncertainty_score": 6.511042539338257e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1527,
    "uncertainty_score": 1.0679689332523424e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1528,
    "uncertainty_score": 0.0369092711416271,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1529,
    "uncertainty_score": 1.9283839292914564e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1530,
    "uncertainty_score": 4.0799395987014006e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1531,
    "uncertainty_score": 0.3994738134604791,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1532,
    "uncertainty_score": 0.0008397597849104349,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1533,
    "uncertainty_score": 6.329641646932423e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1534,
    "uncertainty_score": 2.3964779938864404e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1535,
    "uncertainty_score": 7.560846831724681e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1536,
    "uncertainty_score": 1.6110435381002477e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1537,
    "uncertainty_score": 3.704518458981075e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1538,
    "uncertainty_score": 9.281436922133442e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1539,
    "uncertainty_score": 3.3837245220131167e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1540,
    "uncertainty_score": 5.206365227274193e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1541,
    "uncertainty_score": 1.5719659161084287e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1542,
    "uncertainty_score": 4.374267977867731e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1543,
    "uncertainty_score": 0.09014088399262837,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1544,
    "uncertainty_score": 0.2024792414146853,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1545,
    "uncertainty_score": 0.34259717134912493,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1546,
    "uncertainty_score": 0.026608144087891056,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1547,
    "uncertainty_score": 0.20003444855357788,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1548,
    "uncertainty_score": 8.355894415768345e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1549,
    "uncertainty_score": 0.0008329837356292391,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1550,
    "uncertainty_score": 3.892968787398059e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1551,
    "uncertainty_score": 2.046893980015879e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1552,
    "uncertainty_score": 4.752287309762694e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1553,
    "uncertainty_score": 0.49221388517406445,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1554,
    "uncertainty_score": 1.7869411045678527e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1555,
    "uncertainty_score": 0.2000168216975935,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1556,
    "uncertainty_score": 0.41325557415987146,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1557,
    "uncertainty_score": 0.09014121858934253,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1558,
    "uncertainty_score": 3.0432827039621504e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1559,
    "uncertainty_score": 1.344101586482504e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1560,
    "uncertainty_score": 0.6000000000163337,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1561,
    "uncertainty_score": 2.114635708042958e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1562,
    "uncertainty_score": 0.40070505819186863,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1563,
    "uncertainty_score": 0.20000901776804936,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1564,
    "uncertainty_score": 4.3374522863780235e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1565,
    "uncertainty_score": 0.250000240526616,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1566,
    "uncertainty_score": 1.4135817743745864e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1567,
    "uncertainty_score": 1.339569476551595e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1568,
    "uncertainty_score": 2.9613123516418867e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1569,
    "uncertainty_score": 7.925785235868014e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1570,
    "uncertainty_score": 0.003624718187907193,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1571,
    "uncertainty_score": 0.1999999992990457,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1572,
    "uncertainty_score": 0.37827374792268653,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1573,
    "uncertainty_score": 1.8298091320945691e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1574,
    "uncertainty_score": 5.0102802709381914e-11,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1575,
    "uncertainty_score": 5.804639599706811e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1576,
    "uncertainty_score": 1.130647617034136e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1577,
    "uncertainty_score": 3.410654781398638e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1578,
    "uncertainty_score": 4.838330229692964e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1579,
    "uncertainty_score": 9.925900289951555e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1580,
    "uncertainty_score": 7.2155461157840555e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1581,
    "uncertainty_score": 2.6182887672798244e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1582,
    "uncertainty_score": 1.6612395941612412e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1583,
    "uncertainty_score": 3.843132202638152e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1584,
    "uncertainty_score": 0.28702999709187593,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1585,
    "uncertainty_score": 4.5632365051476196e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1586,
    "uncertainty_score": 1.940708519866768e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1587,
    "uncertainty_score": 0.07900374404621074,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1588,
    "uncertainty_score": 4.7872592940116426e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1589,
    "uncertainty_score": 7.708080939966497e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1590,
    "uncertainty_score": 4.496285988599801e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1591,
    "uncertainty_score": 0.25027439948919616,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1592,
    "uncertainty_score": 0.00460006034187335,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1593,
    "uncertainty_score": 8.210939942973666e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1594,
    "uncertainty_score": 2.4458307020938734e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1595,
    "uncertainty_score": 2.9443196594619047e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1596,
    "uncertainty_score": 0.20394282440475542,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1597,
    "uncertainty_score": 0.20000002010335166,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1598,
    "uncertainty_score": 1.960728781096738e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1599,
    "uncertainty_score": 0.14409940551381586,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1600,
    "uncertainty_score": 3.384635915242731e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1601,
    "uncertainty_score": 0.4999724867950287,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1602,
    "uncertainty_score": 0.2000835961608975,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1603,
    "uncertainty_score": 0.2500000209776298,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1604,
    "uncertainty_score": 0.025301191260045788,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1605,
    "uncertainty_score": 2.9623061287124136e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1606,
    "uncertainty_score": 6.667042998246223e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1607,
    "uncertainty_score": 4.93896195180689e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1608,
    "uncertainty_score": 6.169827730996128e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1609,
    "uncertainty_score": 1.6101539624043648e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1610,
    "uncertainty_score": 0.4203172914057999,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1611,
    "uncertainty_score": 6.758407175728212e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1612,
    "uncertainty_score": 7.771778871157171e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1613,
    "uncertainty_score": 1.2910177482266662e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1614,
    "uncertainty_score": 9.086948392103304e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1615,
    "uncertainty_score": 2.124110273194862e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1616,
    "uncertainty_score": 0.3999977990300099,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1617,
    "uncertainty_score": 5.239781632764848e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1618,
    "uncertainty_score": 0.015175899623772275,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1619,
    "uncertainty_score": 0.0004341178300001411,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1620,
    "uncertainty_score": 7.887987612096948e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1621,
    "uncertainty_score": 1.2027835357060867e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1622,
    "uncertainty_score": 5.614754671187523e-10,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1623,
    "uncertainty_score": 0.19999999940775823,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1624,
    "uncertainty_score": 0.23803028184691466,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1625,
    "uncertainty_score": 0.19999999980800656,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1626,
    "uncertainty_score": 1.0054698424716715e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1627,
    "uncertainty_score": 1.7530833863345676e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1628,
    "uncertainty_score": 1.1952808705686825e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1629,
    "uncertainty_score": 0.1999999998000031,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1630,
    "uncertainty_score": 6.0756639094685e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1631,
    "uncertainty_score": 9.085244863619712e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1632,
    "uncertainty_score": 0.0013729689855230566,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1633,
    "uncertainty_score": 0.00017019766328433186,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1634,
    "uncertainty_score": 0.2500000560177692,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1635,
    "uncertainty_score": 6.5440402137768215e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1636,
    "uncertainty_score": 5.696397790586361e-11,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1637,
    "uncertainty_score": 0.008332442152899529,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1638,
    "uncertainty_score": 9.585170967849016e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1639,
    "uncertainty_score": 0.2000000036784963,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1640,
    "uncertainty_score": 1.6364351348700945e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1641,
    "uncertainty_score": 6.3842753218845e-05,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1642,
    "uncertainty_score": 0.6666884559614625,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1643,
    "uncertainty_score": 0.0004988551833865956,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1644,
    "uncertainty_score": 0.00034929864144390705,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1645,
    "uncertainty_score": 0.0015635084740144294,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1646,
    "uncertainty_score": 7.515037242288259e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1647,
    "uncertainty_score": 7.79530976332471e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1648,
    "uncertainty_score": 0.20001423590586512,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1649,
    "uncertainty_score": 0.20000111189738257,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1650,
    "uncertainty_score": 1.0726632667076681e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1651,
    "uncertainty_score": 1.9125233583331687e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1652,
    "uncertainty_score": 0.4001252228487074,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1653,
    "uncertainty_score": 9.043817621957637e-11,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1654,
    "uncertainty_score": 4.8493294242454024e-12,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1655,
    "uncertainty_score": 3.655806089384067e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1656,
    "uncertainty_score": 0.20000004029857216,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1657,
    "uncertainty_score": 0.5000069859572382,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1658,
    "uncertainty_score": 0.0007506158397417416,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1659,
    "uncertainty_score": 0.2500000348893472,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1660,
    "uncertainty_score": 1.888482022597572e-12,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1661,
    "uncertainty_score": 0.4002366086580148,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1662,
    "uncertainty_score": 0.2500000126023357,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1663,
    "uncertainty_score": 0.6666666439674768,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1664,
    "uncertainty_score": 1.5561515690321005e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1665,
    "uncertainty_score": 2.729813599523922e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1666,
    "uncertainty_score": 7.894556006554802e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1667,
    "uncertainty_score": 1.5593366799215707e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1668,
    "uncertainty_score": 4.138465014616231e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1669,
    "uncertainty_score": 2.0467587258978658e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1670,
    "uncertainty_score": 1.2442846539467345e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1671,
    "uncertainty_score": 0.25000000687551094,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1672,
    "uncertainty_score": 9.457319214317831e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1673,
    "uncertainty_score": 2.0900790391540655e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1674,
    "uncertainty_score": 2.522314385858302e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1675,
    "uncertainty_score": 5.884636246321558e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1676,
    "uncertainty_score": 0.20048554397377227,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1677,
    "uncertainty_score": 0.4999996494853289,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1678,
    "uncertainty_score": 0.3333332155086312,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1679,
    "uncertainty_score": 0.3789286562264758,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1680,
    "uncertainty_score": 2.053905846679845e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1681,
    "uncertainty_score": 0.0006531658513391657,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1682,
    "uncertainty_score": 2.0760192548982958e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1683,
    "uncertainty_score": 8.114570718194554e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1684,
    "uncertainty_score": 0.3333333513075751,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1685,
    "uncertainty_score": 0.00012454510204940223,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1686,
    "uncertainty_score": 0.5001355448387877,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1687,
    "uncertainty_score": 3.171901564570524e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1688,
    "uncertainty_score": 7.443472168055517e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1689,
    "uncertainty_score": 1.3113993947134691e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1690,
    "uncertainty_score": 0.4017333001746392,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1691,
    "uncertainty_score": 5.761553697685332e-12,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1692,
    "uncertainty_score": 4.5087080295399157e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1693,
    "uncertainty_score": 7.22550541458196e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1694,
    "uncertainty_score": 1.4726299939856615e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1695,
    "uncertainty_score": 0.3333410221002297,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1696,
    "uncertainty_score": 0.20000106560105602,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1697,
    "uncertainty_score": 1.085359470329982e-06,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1698,
    "uncertainty_score": 0.20000417462880246,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1699,
    "uncertainty_score": 0.22215241080364384,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1700,
    "uncertainty_score": 4.529198283690419e-10,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1701,
    "uncertainty_score": 3.902212229731095e-11,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1702,
    "uncertainty_score": 0.4762417496671822,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1703,
    "uncertainty_score": 1.7668554379861024e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1704,
    "uncertainty_score": 0.003164000308416111,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1705,
    "uncertainty_score": 1.5961287842898564e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1706,
    "uncertainty_score": 1.0942141090976486e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1707,
    "uncertainty_score": 1.6342633897787262e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1708,
    "uncertainty_score": 5.639845504000873e-11,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1709,
    "uncertainty_score": 1.514618514026016e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1710,
    "uncertainty_score": 1.2412655742137557e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1711,
    "uncertainty_score": 3.737895658685866e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1712,
    "uncertainty_score": 1.32312139704439e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1713,
    "uncertainty_score": 2.0514781715740977e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1714,
    "uncertainty_score": 0.031643797039129326,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1715,
    "uncertainty_score": 7.76819921591838e-06,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1716,
    "uncertainty_score": 0.0020575841497759923,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1717,
    "uncertainty_score": 1.2616271707203638e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1718,
    "uncertainty_score": 0.00012704045348949094,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1719,
    "uncertainty_score": 0.00010652660667194749,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1720,
    "uncertainty_score": 0.00436733473995485,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1721,
    "uncertainty_score": 0.249999999753472,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1722,
    "uncertainty_score": 6.51938635473859e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1723,
    "uncertainty_score": 0.00015338373433745474,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1724,
    "uncertainty_score": 2.608826273979886e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1725,
    "uncertainty_score": 0.256122828752733,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1726,
    "uncertainty_score": 0.006294519633369191,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1727,
    "uncertainty_score": 1.1041983076823436e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1728,
    "uncertainty_score": 0.7499787939970167,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1729,
    "uncertainty_score": 5.615113119094364e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1730,
    "uncertainty_score": 1.6570369562214678e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1731,
    "uncertainty_score": 4.7041180944844395e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1732,
    "uncertainty_score": 9.48227974376849e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1733,
    "uncertainty_score": 0.2741303124496327,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1734,
    "uncertainty_score": 0.2001860466888447,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1735,
    "uncertainty_score": 4.405425132896177e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1736,
    "uncertainty_score": 0.200667812018383,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1737,
    "uncertainty_score": 2.5028535095477063e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1738,
    "uncertainty_score": 4.21248280052032e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1739,
    "uncertainty_score": 3.056993508292083e-11,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1740,
    "uncertainty_score": 2.1209255692629843e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1741,
    "uncertainty_score": 1.3528610019082578e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1742,
    "uncertainty_score": 2.6417041750565192e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1743,
    "uncertainty_score": 0.007049432026360427,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1744,
    "uncertainty_score": 3.601260378396833e-10,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1745,
    "uncertainty_score": 0.11350198197043908,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1746,
    "uncertainty_score": 3.087107373589875e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1747,
    "uncertainty_score": 0.19995525989147717,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1748,
    "uncertainty_score": 1.7134302423083845e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1749,
    "uncertainty_score": 0.25003385564683495,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1750,
    "uncertainty_score": 6.530472312127404e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1751,
    "uncertainty_score": 9.99111478798881e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1752,
    "uncertainty_score": 0.00012389336441599695,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1753,
    "uncertainty_score": 1.787362194202828e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1754,
    "uncertainty_score": 0.5128283840164504,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1755,
    "uncertainty_score": 6.453706390611274e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1756,
    "uncertainty_score": 0.35179981287240264,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1757,
    "uncertainty_score": 2.0683497336276472e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1758,
    "uncertainty_score": 0.25000000000085126,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1759,
    "uncertainty_score": 8.279852630244528e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1760,
    "uncertainty_score": 0.10881564674975723,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1761,
    "uncertainty_score": 0.23732829086227164,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1762,
    "uncertainty_score": 6.994109752737549e-11,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1763,
    "uncertainty_score": 0.005930688736336663,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1764,
    "uncertainty_score": 1.101222366744707e-10,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1765,
    "uncertainty_score": 0.8000808960984885,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1766,
    "uncertainty_score": 0.446402678670633,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1767,
    "uncertainty_score": 0.001014319613724051,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1768,
    "uncertainty_score": 0.0003266595239448756,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1769,
    "uncertainty_score": 2.06536380070729e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1770,
    "uncertainty_score": 0.1662012353723818,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1771,
    "uncertainty_score": 0.00023642771709283492,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1772,
    "uncertainty_score": 2.9059104239286204e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1773,
    "uncertainty_score": 0.4045219709353648,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1774,
    "uncertainty_score": 6.492033977358383e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1775,
    "uncertainty_score": 0.00014638370018750548,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1776,
    "uncertainty_score": 0.027127343766715623,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1777,
    "uncertainty_score": 0.25003262579550267,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1778,
    "uncertainty_score": 0.20055055887605727,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1779,
    "uncertainty_score": 0.16062999057907187,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1780,
    "uncertainty_score": 7.139969013414315e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1781,
    "uncertainty_score": 7.330444754158916e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1782,
    "uncertainty_score": 0.2026191383620906,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1783,
    "uncertainty_score": 0.28800821753074396,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1784,
    "uncertainty_score": 0.00010991436139338025,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1785,
    "uncertainty_score": 3.3051269495013476e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1786,
    "uncertainty_score": 0.49998430811386146,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1787,
    "uncertainty_score": 2.9577745810432707e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1788,
    "uncertainty_score": 0.0008862140480287851,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1789,
    "uncertainty_score": 0.35709406709872665,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1790,
    "uncertainty_score": 0.01028282943400958,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1791,
    "uncertainty_score": 6.645708408374619e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1792,
    "uncertainty_score": 7.085755235230666e-10,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1793,
    "uncertainty_score": 0.0053764924528122105,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1794,
    "uncertainty_score": 0.25002691254476106,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1795,
    "uncertainty_score": 0.20020879107431946,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1796,
    "uncertainty_score": 6.147503692526125e-05,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1797,
    "uncertainty_score": 0.33333333326905307,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1798,
    "uncertainty_score": 0.3960565155074889,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1799,
    "uncertainty_score": 0.003382985090267973,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1800,
    "uncertainty_score": 1.1532824530363982e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1801,
    "uncertainty_score": 0.40004564907743834,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1802,
    "uncertainty_score": 0.0003132416090032871,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1803,
    "uncertainty_score": 0.2500049780218677,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1804,
    "uncertainty_score": 0.23212910044133017,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1805,
    "uncertainty_score": 6.123643589227161e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1806,
    "uncertainty_score": 0.2999838674969818,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1807,
    "uncertainty_score": 0.05436277827099788,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1808,
    "uncertainty_score": 0.22216680600677985,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1809,
    "uncertainty_score": 1.004340622453767e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1810,
    "uncertainty_score": 0.2902881372981182,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1811,
    "uncertainty_score": 1.3464629180954548e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1812,
    "uncertainty_score": 0.4000033307996591,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1813,
    "uncertainty_score": 0.5630298290018605,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1814,
    "uncertainty_score": 0.20001528629625498,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1815,
    "uncertainty_score": 0.20035070712888517,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1816,
    "uncertainty_score": 4.5656193158067836e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1817,
    "uncertainty_score": 0.3999275433171954,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1818,
    "uncertainty_score": 2.5474573586535792e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1819,
    "uncertainty_score": 0.00015686534510567126,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1820,
    "uncertainty_score": 0.2500003120838539,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1821,
    "uncertainty_score": 0.20675733212733896,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1822,
    "uncertainty_score": 3.578596577028204e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1823,
    "uncertainty_score": 0.06390029325280426,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1824,
    "uncertainty_score": 1.0747823061292453e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1825,
    "uncertainty_score": 0.20000004483160666,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1826,
    "uncertainty_score": 0.006044251393641003,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1827,
    "uncertainty_score": 2.202987511448378e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1828,
    "uncertainty_score": 0.00034787758061534954,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1829,
    "uncertainty_score": 0.5002449734861341,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1830,
    "uncertainty_score": 0.24998552151099723,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1831,
    "uncertainty_score": 1.0560081025903031e-14,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1832,
    "uncertainty_score": 1.0577159367726932e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1833,
    "uncertainty_score": 0.4000456533346317,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1834,
    "uncertainty_score": 8.680106364517856e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1835,
    "uncertainty_score": 0.1024654022574153,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1836,
    "uncertainty_score": 0.16664536184639855,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1837,
    "uncertainty_score": 6.290262236408051e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1838,
    "uncertainty_score": 0.9987383372483684,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1839,
    "uncertainty_score": 1.6077378792246727e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1840,
    "uncertainty_score": 0.00027184371287153347,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1841,
    "uncertainty_score": 4.1654485418874284e-14,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1842,
    "uncertainty_score": 6.239938604118565e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1843,
    "uncertainty_score": 3.029752932526436e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1844,
    "uncertainty_score": 0.3333333505048878,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1845,
    "uncertainty_score": 0.00023685931770781846,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1846,
    "uncertainty_score": 2.128162926181598e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1847,
    "uncertainty_score": 7.465099471812705e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1848,
    "uncertainty_score": 4.419777788767324e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1849,
    "uncertainty_score": 0.20088445515052228,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1850,
    "uncertainty_score": 0.5000000499593633,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1851,
    "uncertainty_score": 0.0003472938534460351,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1852,
    "uncertainty_score": 1.0118785327920248e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1853,
    "uncertainty_score": 0.2500126896532715,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1854,
    "uncertainty_score": 0.33200450616160754,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1855,
    "uncertainty_score": 2.1584046784160464e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1856,
    "uncertainty_score": 0.0006998220820658036,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1857,
    "uncertainty_score": 0.19999578814552946,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1858,
    "uncertainty_score": 6.798897921912187e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1859,
    "uncertainty_score": 0.0002975433669985605,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1860,
    "uncertainty_score": 0.01675333229368323,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1861,
    "uncertainty_score": 7.918882707064024e-11,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1862,
    "uncertainty_score": 1.0356624385684338e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1863,
    "uncertainty_score": 0.00031812536618114465,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1864,
    "uncertainty_score": 1.5345371530330883e-10,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1865,
    "uncertainty_score": 0.20303208166000025,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1866,
    "uncertainty_score": 1.234846241156469e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1867,
    "uncertainty_score": 5.8623780897144654e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1868,
    "uncertainty_score": 2.7410219675254565e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1869,
    "uncertainty_score": 0.7499999992499514,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1870,
    "uncertainty_score": 0.6000000334640234,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1871,
    "uncertainty_score": 1.2236048089158316e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1872,
    "uncertainty_score": 0.20000234607873849,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1873,
    "uncertainty_score": 4.758832821354645e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1874,
    "uncertainty_score": 7.107965584257739e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1875,
    "uncertainty_score": 0.25000001346136724,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1876,
    "uncertainty_score": 9.909571930254825e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1877,
    "uncertainty_score": 0.035234042954254856,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1878,
    "uncertainty_score": 9.83525712042755e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1879,
    "uncertainty_score": 7.144585113838649e-10,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1880,
    "uncertainty_score": 3.25663764767917e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1881,
    "uncertainty_score": 0.39950041955942744,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1882,
    "uncertainty_score": 5.053184614661771e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1883,
    "uncertainty_score": 1.2892022178571083e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1884,
    "uncertainty_score": 0.0010399296866929735,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1885,
    "uncertainty_score": 2.889897552296006e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1886,
    "uncertainty_score": 5.992354427119586e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1887,
    "uncertainty_score": 0.4000023545421155,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1888,
    "uncertainty_score": 9.81230097505755e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1889,
    "uncertainty_score": 3.2875277493404275e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1890,
    "uncertainty_score": 0.20029443210584935,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1891,
    "uncertainty_score": 5.091271337800093e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1892,
    "uncertainty_score": 2.2831370162908472e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1893,
    "uncertainty_score": 3.53061154381621e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1894,
    "uncertainty_score": 2.1175426412950278e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1895,
    "uncertainty_score": 5.425756639563344e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1896,
    "uncertainty_score": 1.8344626255340914e-06,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1897,
    "uncertainty_score": 0.25002998321222775,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1898,
    "uncertainty_score": 0.16666667738582652,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1899,
    "uncertainty_score": 9.833172190714079e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1900,
    "uncertainty_score": 8.948836446818628e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1901,
    "uncertainty_score": 2.1764069363016617e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1902,
    "uncertainty_score": 3.5169937342735624e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1903,
    "uncertainty_score": 5.132710778324758e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1904,
    "uncertainty_score": 3.108194579501392e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1905,
    "uncertainty_score": 1.3767032127028598e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1906,
    "uncertainty_score": 1.9390299928939236e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1907,
    "uncertainty_score": 0.39996831337112526,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1908,
    "uncertainty_score": 4.3037134714410735e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1909,
    "uncertainty_score": 1.3160156766010763e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1910,
    "uncertainty_score": 2.931975375502362e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1911,
    "uncertainty_score": 0.2500000846223677,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1912,
    "uncertainty_score": 0.9998905205461736,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1913,
    "uncertainty_score": 0.0007002356182692832,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1914,
    "uncertainty_score": 0.2502245547974925,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1915,
    "uncertainty_score": 8.18302587401873e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1916,
    "uncertainty_score": 0.0005930665847167059,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1917,
    "uncertainty_score": 0.24183338865178738,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1918,
    "uncertainty_score": 3.4417558645505766e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1919,
    "uncertainty_score": 0.00024133956173621817,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1920,
    "uncertainty_score": 2.2360169469085304e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1921,
    "uncertainty_score": 7.972303366845916e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1922,
    "uncertainty_score": 4.0519643769095127e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1923,
    "uncertainty_score": 8.403600735362068e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1924,
    "uncertainty_score": 0.0005038577780475366,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1925,
    "uncertainty_score": 0.013724614116137582,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1926,
    "uncertainty_score": 0.2000037479898645,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1927,
    "uncertainty_score": 0.04636916082772489,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1928,
    "uncertainty_score": 0.2500007205458335,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1929,
    "uncertainty_score": 2.128385354295937e-10,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1930,
    "uncertainty_score": 2.125293473402894e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1931,
    "uncertainty_score": 6.10796812302342e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1932,
    "uncertainty_score": 1.4509232417219066e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1933,
    "uncertainty_score": 5.253149066625767e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1934,
    "uncertainty_score": 3.569126512996434e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1935,
    "uncertainty_score": 0.19988242885987162,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1936,
    "uncertainty_score": 0.0020450933588355116,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1937,
    "uncertainty_score": 0.5000000012883727,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1938,
    "uncertainty_score": 0.3748275080383557,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1939,
    "uncertainty_score": 5.12690456076152e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1940,
    "uncertainty_score": 1.9841465857893425e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1941,
    "uncertainty_score": 0.2500000027282033,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1942,
    "uncertainty_score": 0.20130732890109865,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1943,
    "uncertainty_score": 1.2857594027015517e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1944,
    "uncertainty_score": 1.7786288022874612e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1945,
    "uncertainty_score": 2.258054580310742e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1946,
    "uncertainty_score": 8.587025612924881e-06,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1947,
    "uncertainty_score": 2.8273461567085423e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1948,
    "uncertainty_score": 3.8998219961787767e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1949,
    "uncertainty_score": 0.14242693647076457,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1950,
    "uncertainty_score": 1.2092958803442103e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1951,
    "uncertainty_score": 3.078395404148036e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1952,
    "uncertainty_score": 6.011214907080276e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1953,
    "uncertainty_score": 0.3324540719044612,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1954,
    "uncertainty_score": 9.627101376224305e-10,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1955,
    "uncertainty_score": 0.00669771155456445,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1956,
    "uncertainty_score": 1.574671278828244e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1957,
    "uncertainty_score": 0.3495502502189268,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1958,
    "uncertainty_score": 2.3687773392085667e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1959,
    "uncertainty_score": 0.2006176198660215,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1960,
    "uncertainty_score": 0.16666669389412425,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1961,
    "uncertainty_score": 6.689646625970505e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1962,
    "uncertainty_score": 0.20001882413166946,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1963,
    "uncertainty_score": 4.4463491383023875e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1964,
    "uncertainty_score": 0.011276638409222833,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1965,
    "uncertainty_score": 0.25000274136259226,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1966,
    "uncertainty_score": 0.4304127541979007,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1967,
    "uncertainty_score": 1.2052140444811257e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1968,
    "uncertainty_score": 0.2500001513107385,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1969,
    "uncertainty_score": 0.23649983886126918,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1970,
    "uncertainty_score": 8.90983074739188e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1971,
    "uncertainty_score": 0.4999959945604229,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1972,
    "uncertainty_score": 0.0005101691945825174,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1973,
    "uncertainty_score": 0.5000029431568322,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 1974,
    "uncertainty_score": 1.7844875475320705e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1975,
    "uncertainty_score": 3.613907901413463e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1976,
    "uncertainty_score": 8.303602073560053e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1977,
    "uncertainty_score": 4.626300154502323e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 1978,
    "uncertainty_score": 3.50131357947251e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1979,
    "uncertainty_score": 5.223920855235968e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1980,
    "uncertainty_score": 0.49794100228934135,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1981,
    "uncertainty_score": 3.4157139563406873e-10,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1982,
    "uncertainty_score": 0.40000000666682445,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1983,
    "uncertainty_score": 0.012655891861280999,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1984,
    "uncertainty_score": 1.3237799149779593e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1985,
    "uncertainty_score": 0.20006440355160157,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1986,
    "uncertainty_score": 4.803306093194095e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1987,
    "uncertainty_score": 2.6628205729443987e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1988,
    "uncertainty_score": 0.2500000347708523,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1989,
    "uncertainty_score": 1.0693833005938998e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1990,
    "uncertainty_score": 0.2486003037082452,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 1991,
    "uncertainty_score": 0.3999343432447042,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 1992,
    "uncertainty_score": 2.6052512420502102e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1993,
    "uncertainty_score": 0.250081105514719,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1994,
    "uncertainty_score": 4.732111526804976e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 1995,
    "uncertainty_score": 1.0423194267403424e-12,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 1996,
    "uncertainty_score": 0.20003488320052054,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 1997,
    "uncertainty_score": 0.24999578290038704,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 1998,
    "uncertainty_score": 1.305723587152484e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 1999,
    "uncertainty_score": 0.4988355990550842,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2000,
    "uncertainty_score": 0.0003519057045039315,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2001,
    "uncertainty_score": 4.7630987594282526e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2002,
    "uncertainty_score": 0.2037809106773782,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2003,
    "uncertainty_score": 3.2893000295146985e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2004,
    "uncertainty_score": 0.2159185546246921,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2005,
    "uncertainty_score": 0.2037485483317223,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2006,
    "uncertainty_score": 6.869742891408586e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2007,
    "uncertainty_score": 3.168847414142046e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2008,
    "uncertainty_score": 0.9999628850240351,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2009,
    "uncertainty_score": 6.310429300060762e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2010,
    "uncertainty_score": 0.036640025050537976,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2011,
    "uncertainty_score": 0.20000001128210046,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2012,
    "uncertainty_score": 0.19146180370767363,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2013,
    "uncertainty_score": 0.2499999793759098,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2014,
    "uncertainty_score": 3.465012089842396e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2015,
    "uncertainty_score": 0.49999938530980415,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2016,
    "uncertainty_score": 0.01191615433898363,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2017,
    "uncertainty_score": 9.386933908770069e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2018,
    "uncertainty_score": 9.34912144519706e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2019,
    "uncertainty_score": 0.00042381092342149286,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2020,
    "uncertainty_score": 3.8968329869176745e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2021,
    "uncertainty_score": 7.569011676501036e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2022,
    "uncertainty_score": 0.3684978739517853,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2023,
    "uncertainty_score": 0.1668094215327442,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2024,
    "uncertainty_score": 1.3898346771568475e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2025,
    "uncertainty_score": 2.524221408650068e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2026,
    "uncertainty_score": 3.5991421170565163e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2027,
    "uncertainty_score": 1.3609385247018421e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2028,
    "uncertainty_score": 8.37252561688022e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2029,
    "uncertainty_score": 0.22648569546364214,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2030,
    "uncertainty_score": 0.33333333300001244,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2031,
    "uncertainty_score": 0.24943714808411965,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2032,
    "uncertainty_score": 1.6200088264517877e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2033,
    "uncertainty_score": 1.6423028927770696e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2034,
    "uncertainty_score": 0.0014326461958873561,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2035,
    "uncertainty_score": 0.20002938053326366,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2036,
    "uncertainty_score": 0.25000027193363533,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2037,
    "uncertainty_score": 0.36382475396612,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2038,
    "uncertainty_score": 1.1977390196357333e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2039,
    "uncertainty_score": 5.259537996296005e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2040,
    "uncertainty_score": 2.2624848739967716e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2041,
    "uncertainty_score": 0.24531569635820455,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2042,
    "uncertainty_score": 0.20000000510434418,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2043,
    "uncertainty_score": 4.265458083010081e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2044,
    "uncertainty_score": 1.2109723583549476e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2045,
    "uncertainty_score": 0.000680303342289897,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2046,
    "uncertainty_score": 0.40000051409322246,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2047,
    "uncertainty_score": 0.6000002240501594,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2048,
    "uncertainty_score": 0.19974765822402002,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2049,
    "uncertainty_score": 9.742913157895278e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2050,
    "uncertainty_score": 0.4000000192529658,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2051,
    "uncertainty_score": 0.0007153348065704179,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2052,
    "uncertainty_score": 0.2500050424402347,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2053,
    "uncertainty_score": 3.218498377711122e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2054,
    "uncertainty_score": 0.0007574131389877914,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2055,
    "uncertainty_score": 0.16684445306522924,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2056,
    "uncertainty_score": 5.943404339232623e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2057,
    "uncertainty_score": 0.333335121681459,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2058,
    "uncertainty_score": 0.20000292517500684,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2059,
    "uncertainty_score": 5.9904726604894686e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2060,
    "uncertainty_score": 0.16666673546287683,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2061,
    "uncertainty_score": 8.052514968474527e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 2062,
    "uncertainty_score": 1.086769175089747e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2063,
    "uncertainty_score": 0.20000527854391853,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2064,
    "uncertainty_score": 2.418608969977326e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2065,
    "uncertainty_score": 0.0013604282924653197,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2066,
    "uncertainty_score": 0.005351876269625533,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2067,
    "uncertainty_score": 0.042804329896500244,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2068,
    "uncertainty_score": 3.0901850207937997e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2069,
    "uncertainty_score": 0.6026175250378296,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2070,
    "uncertainty_score": 0.4033842702624007,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2071,
    "uncertainty_score": 0.0033848875354578747,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2072,
    "uncertainty_score": 0.2605219452697226,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2073,
    "uncertainty_score": 6.280728785440927e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2074,
    "uncertainty_score": 1.3268774795217289e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2075,
    "uncertainty_score": 0.9999999998,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2076,
    "uncertainty_score": 0.25000025858954805,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2077,
    "uncertainty_score": 0.0005073813690812711,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2078,
    "uncertainty_score": 3.240829245116587e-20,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2079,
    "uncertainty_score": 0.2542325295940763,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2080,
    "uncertainty_score": 0.5000023319790136,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2081,
    "uncertainty_score": 0.19999999988928255,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2082,
    "uncertainty_score": 0.7500000000422977,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2083,
    "uncertainty_score": 0.1674630117660972,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2084,
    "uncertainty_score": 0.0065508862842407435,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2085,
    "uncertainty_score": 1.1331828284829815e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2086,
    "uncertainty_score": 0.25019893977311036,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2087,
    "uncertainty_score": 0.40001467316151385,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2088,
    "uncertainty_score": 0.00048168369941307927,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2089,
    "uncertainty_score": 3.605642824148426e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2090,
    "uncertainty_score": 0.39957243571396434,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2091,
    "uncertainty_score": 0.3333333401032139,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2092,
    "uncertainty_score": 0.3892135668947378,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2093,
    "uncertainty_score": 0.5000000229462651,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2094,
    "uncertainty_score": 0.8000687925024316,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2095,
    "uncertainty_score": 0.7999999998,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2096,
    "uncertainty_score": 0.27768195056021344,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2097,
    "uncertainty_score": 0.4001049476829211,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2098,
    "uncertainty_score": 0.4435519898893713,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2099,
    "uncertainty_score": 4.004969788058588e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2100,
    "uncertainty_score": 0.2730412330113893,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2101,
    "uncertainty_score": 0.4,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2102,
    "uncertainty_score": 3.1031095811350436e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2103,
    "uncertainty_score": 0.6000002277887222,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2104,
    "uncertainty_score": 0.40000664283875587,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2105,
    "uncertainty_score": 0.00018885220006263192,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2106,
    "uncertainty_score": 0.20083993239157208,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2107,
    "uncertainty_score": 1.0099546148843004e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2108,
    "uncertainty_score": 0.16666695103060025,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2109,
    "uncertainty_score": 0.5,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2110,
    "uncertainty_score": 0.2500000224193731,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2111,
    "uncertainty_score": 0.40000022019244585,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2112,
    "uncertainty_score": 0.7500000000401632,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2113,
    "uncertainty_score": 0.3999999891147108,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2114,
    "uncertainty_score": 0.004164331437245932,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2115,
    "uncertainty_score": 0.5000000008158401,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2116,
    "uncertainty_score": 0.7999999992,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2117,
    "uncertainty_score": 0.6009315207055346,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2118,
    "uncertainty_score": 1.214922753484304e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2119,
    "uncertainty_score": 0.5424607812025858,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2120,
    "uncertainty_score": 0.5000053333942223,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2121,
    "uncertainty_score": 0.7499999997261493,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2122,
    "uncertainty_score": 0.20000001423240438,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2123,
    "uncertainty_score": 2.3107981084372326e-19,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2124,
    "uncertainty_score": 0.20035857783384148,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2125,
    "uncertainty_score": 0.9999999998,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2126,
    "uncertainty_score": 0.333335952572048,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2127,
    "uncertainty_score": 0.16666703640970792,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2128,
    "uncertainty_score": 0.0026223596376600145,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2129,
    "uncertainty_score": 0.6,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2130,
    "uncertainty_score": 0.24999999974999992,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2131,
    "uncertainty_score": 0.5000036492280578,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2132,
    "uncertainty_score": 0.000583952898589725,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2133,
    "uncertainty_score": 0.250271841264059,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2134,
    "uncertainty_score": 1.4719612125119281e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2135,
    "uncertainty_score": 0.19998303794587766,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2136,
    "uncertainty_score": 0.2000007075033769,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2137,
    "uncertainty_score": 0.2605820540359117,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2138,
    "uncertainty_score": 2.7035725977492644e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2139,
    "uncertainty_score": 0.4000000029832094,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2140,
    "uncertainty_score": 0.25048178761384804,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2141,
    "uncertainty_score": 0.20000002960396346,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2142,
    "uncertainty_score": 0.3333333331169858,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2143,
    "uncertainty_score": 0.600000307480699,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2144,
    "uncertainty_score": 0.4809356884399375,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2145,
    "uncertainty_score": 0.74999999975,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2146,
    "uncertainty_score": 0.4000000079358242,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2147,
    "uncertainty_score": 0.5433220518935813,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2148,
    "uncertainty_score": 0.4396873774857545,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2149,
    "uncertainty_score": 0.6,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2150,
    "uncertainty_score": 0.16667648868236798,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2151,
    "uncertainty_score": 0.35018323111206673,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2152,
    "uncertainty_score": 0.8039438253208067,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2153,
    "uncertainty_score": 0.34841377651111005,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2154,
    "uncertainty_score": 0.5871612830859213,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2155,
    "uncertainty_score": 0.20103326942597008,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2156,
    "uncertainty_score": 5.138903636122143e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2157,
    "uncertainty_score": 0.668352889560495,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2158,
    "uncertainty_score": 1.411291047881238e-12,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2159,
    "uncertainty_score": 0.800000354084737,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2160,
    "uncertainty_score": 0.04825016227218854,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2161,
    "uncertainty_score": 0.5394116400099218,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2162,
    "uncertainty_score": 0.0006929974047555996,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2163,
    "uncertainty_score": 1.2410147053065374e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2164,
    "uncertainty_score": 4.963528130972057e-10,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2165,
    "uncertainty_score": 2.5471838486806138e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2166,
    "uncertainty_score": 4.689431937362288e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2167,
    "uncertainty_score": 0.3333348743373949,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2168,
    "uncertainty_score": 1.0,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2169,
    "uncertainty_score": 0.75,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2170,
    "uncertainty_score": 0.5999995575200308,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2171,
    "uncertainty_score": 0.25,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2172,
    "uncertainty_score": 6.142894706887014e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2173,
    "uncertainty_score": 0.6000000000820624,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2174,
    "uncertainty_score": 0.5233253329993557,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2175,
    "uncertainty_score": 0.636363646701282,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2176,
    "uncertainty_score": 1.0287836682630371e-10,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2177,
    "uncertainty_score": 0.19671670113966452,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2178,
    "uncertainty_score": 7.625072494313042e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2179,
    "uncertainty_score": 1.6808595494006394e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2180,
    "uncertainty_score": 0.5875033456294383,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2181,
    "uncertainty_score": 0.4999999998333333,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2182,
    "uncertainty_score": 0.6568357964919016,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2183,
    "uncertainty_score": 0.39925074831994356,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2184,
    "uncertainty_score": 0.0,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2185,
    "uncertainty_score": 0.0463615236023918,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2186,
    "uncertainty_score": 0.2000302789097163,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2187,
    "uncertainty_score": 0.2500000000001879,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2188,
    "uncertainty_score": 0.25195837127546544,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2189,
    "uncertainty_score": 1.05316247923132e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2190,
    "uncertainty_score": 0.6000000157945304,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2191,
    "uncertainty_score": 0.19993764516870347,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2192,
    "uncertainty_score": 0.40004806218034494,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2193,
    "uncertainty_score": 0.2500040059535981,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2194,
    "uncertainty_score": 1.0,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2195,
    "uncertainty_score": 0.20000114843994857,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2196,
    "uncertainty_score": 5.58624663473791e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2197,
    "uncertainty_score": 6.177950398847241e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2198,
    "uncertainty_score": 5.13234529711523e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2199,
    "uncertainty_score": 7.13840011880276e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2200,
    "uncertainty_score": 1.3177231223313001e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2201,
    "uncertainty_score": 0.0004434476034470876,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2202,
    "uncertainty_score": 0.2500005552310428,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2203,
    "uncertainty_score": 0.24991740668552015,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2204,
    "uncertainty_score": 1.6434946812773042e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2205,
    "uncertainty_score": 0.2500126149060972,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2206,
    "uncertainty_score": 5.503071576149738e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2207,
    "uncertainty_score": 0.24988180292012385,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 2208,
    "uncertainty_score": 0.21715942941234487,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2209,
    "uncertainty_score": 7.933393933603318e-11,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2210,
    "uncertainty_score": 2.485468387049647e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2211,
    "uncertainty_score": 3.232745253970702e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2212,
    "uncertainty_score": 0.14286404227376312,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2213,
    "uncertainty_score": 1.0609911476041963e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2214,
    "uncertainty_score": 0.17030646993700946,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2215,
    "uncertainty_score": 1.3869910837059509e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2216,
    "uncertainty_score": 0.0004328330693462468,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2217,
    "uncertainty_score": 8.207681406003714e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 2218,
    "uncertainty_score": 0.021011055407252316,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2219,
    "uncertainty_score": 0.004029334659250581,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2220,
    "uncertainty_score": 2.6985600031837142e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2221,
    "uncertainty_score": 0.25000024173014707,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2222,
    "uncertainty_score": 7.272809737199931e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2223,
    "uncertainty_score": 9.60948395843395e-12,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2224,
    "uncertainty_score": 0.0006930966174964393,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2225,
    "uncertainty_score": 0.199900375095924,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2226,
    "uncertainty_score": 0.20304905978331061,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2227,
    "uncertainty_score": 4.1667419491855806e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2228,
    "uncertainty_score": 0.0003307539932519391,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2229,
    "uncertainty_score": 0.2097715612797723,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2230,
    "uncertainty_score": 4.228261030930833e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2231,
    "uncertainty_score": 0.1739220239560267,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2232,
    "uncertainty_score": 0.4000000015182712,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2233,
    "uncertainty_score": 0.19999999980219993,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2234,
    "uncertainty_score": 6.185227549847282e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2235,
    "uncertainty_score": 0.03801539421060441,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2236,
    "uncertainty_score": 0.35244098030707366,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2237,
    "uncertainty_score": 0.20000043966817643,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2238,
    "uncertainty_score": 0.042053967747502606,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2239,
    "uncertainty_score": 2.946489172344057e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2240,
    "uncertainty_score": 5.374250252431711e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2241,
    "uncertainty_score": 0.07573505195607556,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2242,
    "uncertainty_score": 3.4805403704605467e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2243,
    "uncertainty_score": 0.200022042223504,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2244,
    "uncertainty_score": 9.20069299078312e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2245,
    "uncertainty_score": 9.094385396266172e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2246,
    "uncertainty_score": 0.2499999997500002,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2247,
    "uncertainty_score": 0.0011055739867929743,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2248,
    "uncertainty_score": 3.326054946822132e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2249,
    "uncertainty_score": 7.058965580626504e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2250,
    "uncertainty_score": 5.5132993155622196e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2251,
    "uncertainty_score": 3.4150971778409335e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2252,
    "uncertainty_score": 0.6477774563691964,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2253,
    "uncertainty_score": 0.20290071590458805,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2254,
    "uncertainty_score": 1.5901522269464151e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2255,
    "uncertainty_score": 9.435335891943513e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2256,
    "uncertainty_score": 3.738518658227413e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2257,
    "uncertainty_score": 8.693150256654695e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2258,
    "uncertainty_score": 1.2332322161881939e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2259,
    "uncertainty_score": 3.806568124507187e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2260,
    "uncertainty_score": 0.001196699842148044,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2261,
    "uncertainty_score": 0.25041211895576043,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2262,
    "uncertainty_score": 3.7747674737322884e-11,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 2263,
    "uncertainty_score": 0.0003861519102147,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2264,
    "uncertainty_score": 0.2500089106364019,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2265,
    "uncertainty_score": 5.713749519706716e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2266,
    "uncertainty_score": 2.070058429670285e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2267,
    "uncertainty_score": 1.2114312952167214e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 2268,
    "uncertainty_score": 0.3333333345239919,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2269,
    "uncertainty_score": 0.33333631289072335,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2270,
    "uncertainty_score": 2.263269421579963e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2271,
    "uncertainty_score": 0.2500417261942193,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2272,
    "uncertainty_score": 0.0025319548786915816,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2273,
    "uncertainty_score": 0.021010289672844785,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2274,
    "uncertainty_score": 0.2500000001012321,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2275,
    "uncertainty_score": 0.3331424790726997,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2276,
    "uncertainty_score": 0.20000231334266189,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2277,
    "uncertainty_score": 1.9042618915565187e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2278,
    "uncertainty_score": 8.881615742229353e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2279,
    "uncertainty_score": 1.0342883880120247e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2280,
    "uncertainty_score": 0.2000244050299713,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2281,
    "uncertainty_score": 0.2000000003249907,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2282,
    "uncertainty_score": 0.2499998237810146,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2283,
    "uncertainty_score": 0.4021666215771741,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2284,
    "uncertainty_score": 3.128391852951803e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2285,
    "uncertainty_score": 0.595632740655933,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2286,
    "uncertainty_score": 0.0008098372875472898,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2287,
    "uncertainty_score": 0.4999367837421123,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2288,
    "uncertainty_score": 0.002996678540073394,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2289,
    "uncertainty_score": 1.6274014125035025e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2290,
    "uncertainty_score": 2.396176527022827e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2291,
    "uncertainty_score": 0.2776818280732995,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2292,
    "uncertainty_score": 0.0008423329576223132,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 2293,
    "uncertainty_score": 0.000691804980458497,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2294,
    "uncertainty_score": 0.20002045207727295,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2295,
    "uncertainty_score": 8.978259987181656e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2296,
    "uncertainty_score": 2.5582894330199387e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2297,
    "uncertainty_score": 0.16684796687673656,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2298,
    "uncertainty_score": 0.20003601658894715,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2299,
    "uncertainty_score": 0.0020461141687727284,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2300,
    "uncertainty_score": 0.12171042547679559,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2301,
    "uncertainty_score": 0.1746770731616251,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2302,
    "uncertainty_score": 0.5992918910130173,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2303,
    "uncertainty_score": 0.013174943696285482,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2304,
    "uncertainty_score": 4.831522526577414e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2305,
    "uncertainty_score": 3.7953204961868203e-13,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2306,
    "uncertainty_score": 0.00013822416203138063,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2307,
    "uncertainty_score": 0.3999999998,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2308,
    "uncertainty_score": 2.3221217500506037e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2309,
    "uncertainty_score": 0.3333333502241394,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2310,
    "uncertainty_score": 0.2500000000148388,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2311,
    "uncertainty_score": 0.2500039636285405,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2312,
    "uncertainty_score": 4.863855749749351e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2313,
    "uncertainty_score": 1.024982200633977e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2314,
    "uncertainty_score": 0.20000605112739467,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2315,
    "uncertainty_score": 0.24999799420970995,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2316,
    "uncertainty_score": 1.2016211069363428e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2317,
    "uncertainty_score": 0.20000681229368106,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2318,
    "uncertainty_score": 2.372891976485579e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2319,
    "uncertainty_score": 7.102436207864299e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2320,
    "uncertainty_score": 0.2557258432715468,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2321,
    "uncertainty_score": 0.0005843942172685233,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2322,
    "uncertainty_score": 0.0003484788186002009,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2323,
    "uncertainty_score": 4.892769068673992e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2324,
    "uncertainty_score": 0.007378341631012626,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2325,
    "uncertainty_score": 0.4037474163581666,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2326,
    "uncertainty_score": 0.006350855665951251,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2327,
    "uncertainty_score": 0.6666666705829676,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2328,
    "uncertainty_score": 0.2500000035451301,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2329,
    "uncertainty_score": 0.005514363352496501,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2330,
    "uncertainty_score": 0.1666725172821071,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2331,
    "uncertainty_score": 6.3059666435627235e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2332,
    "uncertainty_score": 0.0008864332375746456,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2333,
    "uncertainty_score": 1.4761302501056317e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2334,
    "uncertainty_score": 0.005142067132722385,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2335,
    "uncertainty_score": 0.3333333397934621,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2336,
    "uncertainty_score": 0.5129491318109425,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2337,
    "uncertainty_score": 1.5040373797400587e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2338,
    "uncertainty_score": 8.303587245446335e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2339,
    "uncertainty_score": 7.575512271113289e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2340,
    "uncertainty_score": 0.14288612196914158,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2341,
    "uncertainty_score": 2.812008508865927e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2342,
    "uncertainty_score": 0.399999817213868,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2343,
    "uncertainty_score": 5.746385758044191e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2344,
    "uncertainty_score": 3.076753431588256e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2345,
    "uncertainty_score": 0.0007191025491175963,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2346,
    "uncertainty_score": 0.16700363297105703,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2347,
    "uncertainty_score": 0.20059931632836842,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2348,
    "uncertainty_score": 2.233817978420044e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2349,
    "uncertainty_score": 2.6589027070666125e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2350,
    "uncertainty_score": 7.483457752450302e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2351,
    "uncertainty_score": 0.00012044996901240909,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2352,
    "uncertainty_score": 0.20169937591502807,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2353,
    "uncertainty_score": 3.2303122200973684e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2354,
    "uncertainty_score": 4.383523705931595e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2355,
    "uncertainty_score": 2.1747327997515783e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2356,
    "uncertainty_score": 3.676245226356108e-05,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 2357,
    "uncertainty_score": 0.02768617237917326,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2358,
    "uncertainty_score": 6.968645308208547e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2359,
    "uncertainty_score": 6.334234230796111e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2360,
    "uncertainty_score": 0.6615776400953183,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2361,
    "uncertainty_score": 0.16354406604349211,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2362,
    "uncertainty_score": 0.19999615200782533,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2363,
    "uncertainty_score": 0.25000014636117796,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2364,
    "uncertainty_score": 0.5029520515748233,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2365,
    "uncertainty_score": 0.20000235211755038,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2366,
    "uncertainty_score": 0.03177438694080996,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2367,
    "uncertainty_score": 0.24508423946735505,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2368,
    "uncertainty_score": 4.7596277064384263e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2369,
    "uncertainty_score": 4.567531231357099e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2370,
    "uncertainty_score": 1.6258097689707807e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 2371,
    "uncertainty_score": 0.5001311855958948,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2372,
    "uncertainty_score": 0.0015889154038271325,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2373,
    "uncertainty_score": 1.2408378580689306e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2374,
    "uncertainty_score": 1.676251761388819e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2375,
    "uncertainty_score": 9.832281353059183e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2376,
    "uncertainty_score": 0.3333575147279339,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2377,
    "uncertainty_score": 4.932595438068188e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2378,
    "uncertainty_score": 0.0016651179777907093,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2379,
    "uncertainty_score": 9.609311082029314e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2380,
    "uncertainty_score": 0.16666667027450977,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2381,
    "uncertainty_score": 0.0159242767047432,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2382,
    "uncertainty_score": 7.369060323719192e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2383,
    "uncertainty_score": 0.2652541735424089,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2384,
    "uncertainty_score": 0.24639032519816506,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2385,
    "uncertainty_score": 0.33333335755182714,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2386,
    "uncertainty_score": 0.19999891009969478,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2387,
    "uncertainty_score": 3.493679361590657e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2388,
    "uncertainty_score": 1.5751714988971497e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2389,
    "uncertainty_score": 7.483357918036699e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2390,
    "uncertainty_score": 0.004372210933499257,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2391,
    "uncertainty_score": 0.25000276593545656,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2392,
    "uncertainty_score": 0.05345379511772355,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2393,
    "uncertainty_score": 1.488896256622647e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 2394,
    "uncertainty_score": 2.2857597622252158e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 2395,
    "uncertainty_score": 1.2061837966658184e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2396,
    "uncertainty_score": 0.3333353180464762,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2397,
    "uncertainty_score": 9.143308275251311e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2398,
    "uncertainty_score": 0.26283398271045205,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2399,
    "uncertainty_score": 9.318190347360042e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2400,
    "uncertainty_score": 0.3895394579181337,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2401,
    "uncertainty_score": 0.1993849311336552,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2402,
    "uncertainty_score": 0.00248633203007298,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2403,
    "uncertainty_score": 7.952817915882273e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2404,
    "uncertainty_score": 1.0197887616492448e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2405,
    "uncertainty_score": 0.2500000689320344,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2406,
    "uncertainty_score": 0.5999977771666655,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2407,
    "uncertainty_score": 0.3333333127881589,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2408,
    "uncertainty_score": 0.30796205019740874,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2409,
    "uncertainty_score": 0.00028407737934348196,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2410,
    "uncertainty_score": 0.49999994390695657,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2411,
    "uncertainty_score": 0.200008587872736,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2412,
    "uncertainty_score": 0.19988951242342495,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2413,
    "uncertainty_score": 5.179122482170112e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2414,
    "uncertainty_score": 0.20000000005686033,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2415,
    "uncertainty_score": 0.24870854939818582,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2416,
    "uncertainty_score": 1.67941095176033e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2417,
    "uncertainty_score": 0.1666707639843985,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2418,
    "uncertainty_score": 0.13264055595014762,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2419,
    "uncertainty_score": 0.008058667908606596,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2420,
    "uncertainty_score": 0.0037131375252846114,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2421,
    "uncertainty_score": 2.529482255460203e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2422,
    "uncertainty_score": 1.999819154906309e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2423,
    "uncertainty_score": 2.024058134937107e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2424,
    "uncertainty_score": 9.378930246548348e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2425,
    "uncertainty_score": 0.2000000295606213,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2426,
    "uncertainty_score": 0.0005201852272630665,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2427,
    "uncertainty_score": 0.6000000009790265,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2428,
    "uncertainty_score": 4.53618983367326e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2429,
    "uncertainty_score": 0.004017560072969532,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2430,
    "uncertainty_score": 0.0006930056048865254,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2431,
    "uncertainty_score": 0.00020667901298198368,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2432,
    "uncertainty_score": 0.19999989235264537,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2433,
    "uncertainty_score": 9.878800265219644e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2434,
    "uncertainty_score": 9.19065909231284e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2435,
    "uncertainty_score": 0.3333334159682087,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2436,
    "uncertainty_score": 5.0415954238324455e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2437,
    "uncertainty_score": 0.25110834616103545,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2438,
    "uncertainty_score": 0.6586079380920573,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2439,
    "uncertainty_score": 0.9566436882244416,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2440,
    "uncertainty_score": 1.196301265383171e-10,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2441,
    "uncertainty_score": 0.24968226690086398,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2442,
    "uncertainty_score": 3.873324721437556e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2443,
    "uncertainty_score": 1.276428933657181e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2444,
    "uncertainty_score": 0.0002718404454679603,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2445,
    "uncertainty_score": 0.4009261189939033,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2446,
    "uncertainty_score": 0.20000499522525397,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2447,
    "uncertainty_score": 6.2775342728362254e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2448,
    "uncertainty_score": 0.2500030950779589,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2449,
    "uncertainty_score": 0.2500015689522795,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2450,
    "uncertainty_score": 0.1540582553241356,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2451,
    "uncertainty_score": 0.07128429901877108,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2452,
    "uncertainty_score": 0.2004743545783735,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2453,
    "uncertainty_score": 1.1205519260846185e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2454,
    "uncertainty_score": 0.0010751426850160524,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2455,
    "uncertainty_score": 3.7318843864177865e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2456,
    "uncertainty_score": 9.498354176232099e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2457,
    "uncertainty_score": 1.346046986545563e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2458,
    "uncertainty_score": 0.5028039179318786,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2459,
    "uncertainty_score": 0.33335628905236164,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2460,
    "uncertainty_score": 4.523588442643117e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2461,
    "uncertainty_score": 0.16698714130210657,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2462,
    "uncertainty_score": 0.06272839160944553,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2463,
    "uncertainty_score": 0.2500002083643616,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2464,
    "uncertainty_score": 0.000443842430883254,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2465,
    "uncertainty_score": 0.333333335953528,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2466,
    "uncertainty_score": 2.657384360218861e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2467,
    "uncertainty_score": 0.00033968816890466395,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2468,
    "uncertainty_score": 0.3342510615799587,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2469,
    "uncertainty_score": 0.1907277734282926,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2470,
    "uncertainty_score": 0.3333334349780614,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2471,
    "uncertainty_score": 3.388204494421919e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2472,
    "uncertainty_score": 4.3259443110927525e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2473,
    "uncertainty_score": 2.8932402992957642e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2474,
    "uncertainty_score": 1.0811683625406027e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2475,
    "uncertainty_score": 6.328934148399411e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2476,
    "uncertainty_score": 2.3482099416127016e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2477,
    "uncertainty_score": 1.957979184979707e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2478,
    "uncertainty_score": 2.186636379164898e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2479,
    "uncertainty_score": 0.0052081519600971566,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2480,
    "uncertainty_score": 0.5000000000228951,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2481,
    "uncertainty_score": 0.20026777622694292,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2482,
    "uncertainty_score": 0.2505667663160885,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 2483,
    "uncertainty_score": 1.174091941853221e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2484,
    "uncertainty_score": 1.6711337837052108e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2485,
    "uncertainty_score": 1.4511414964953396e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2486,
    "uncertainty_score": 2.9436921304740032e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2487,
    "uncertainty_score": 0.2066629053558428,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2488,
    "uncertainty_score": 0.49618851779017564,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2489,
    "uncertainty_score": 0.7999858042532313,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2490,
    "uncertainty_score": 5.613508286509252e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2491,
    "uncertainty_score": 0.4062287659275922,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2492,
    "uncertainty_score": 0.20007144859233256,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2493,
    "uncertainty_score": 0.04404985443503747,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2494,
    "uncertainty_score": 0.4999999739733628,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2495,
    "uncertainty_score": 8.370174507587145e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2496,
    "uncertainty_score": 9.509135255114919e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 2497,
    "uncertainty_score": 5.295301992696968e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2498,
    "uncertainty_score": 1.1193677262453573e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 2499,
    "uncertainty_score": 0.012108624685713573,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2500,
    "uncertainty_score": 0.00021769251915526808,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2501,
    "uncertainty_score": 0.0053528238769490555,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2502,
    "uncertainty_score": 0.24957230338485967,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 2503,
    "uncertainty_score": 0.20002442412644067,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2504,
    "uncertainty_score": 0.00021872960814411937,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2505,
    "uncertainty_score": 2.1536271822919396e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2506,
    "uncertainty_score": 0.4026588491205718,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2507,
    "uncertainty_score": 9.508755924194746e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2508,
    "uncertainty_score": 0.6000256806465474,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2509,
    "uncertainty_score": 1.5133723123617566e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2510,
    "uncertainty_score": 1.2133231484226516e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2511,
    "uncertainty_score": 0.3230251416651289,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2512,
    "uncertainty_score": 6.225370887427061e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2513,
    "uncertainty_score": 0.0006471779060227561,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2514,
    "uncertainty_score": 0.000112224120428591,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2515,
    "uncertainty_score": 0.46423315447633157,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2516,
    "uncertainty_score": 0.40028204735359124,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2517,
    "uncertainty_score": 0.16786628053774397,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2518,
    "uncertainty_score": 0.5768076217575685,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2519,
    "uncertainty_score": 0.13276879205069006,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2520,
    "uncertainty_score": 0.2000000045286189,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 2521,
    "uncertainty_score": 0.2000000537740302,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2522,
    "uncertainty_score": 1.4976614580561043e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2523,
    "uncertainty_score": 1.3460212724886573e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2524,
    "uncertainty_score": 0.3333522713262185,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2525,
    "uncertainty_score": 0.25000005097037836,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2526,
    "uncertainty_score": 1.2202225674609158e-12,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2527,
    "uncertainty_score": 0.2027799834070058,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2528,
    "uncertainty_score": 0.01831317152439248,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2529,
    "uncertainty_score": 0.00041212090962323945,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2530,
    "uncertainty_score": 5.070997762020388e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2531,
    "uncertainty_score": 3.9226454567163494e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2532,
    "uncertainty_score": 3.0723946300541028e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2533,
    "uncertainty_score": 0.0013317071655667625,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2534,
    "uncertainty_score": 6.0136109001497885e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2535,
    "uncertainty_score": 0.005666990545567267,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2536,
    "uncertainty_score": 0.40001241250506414,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2537,
    "uncertainty_score": 1.2355134966618808e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2538,
    "uncertainty_score": 0.2000039864053497,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2539,
    "uncertainty_score": 1.011160240221445e-11,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2540,
    "uncertainty_score": 0.040493505595042605,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2541,
    "uncertainty_score": 0.25000114732159456,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2542,
    "uncertainty_score": 4.768414619988031e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2543,
    "uncertainty_score": 0.000474399909601397,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2544,
    "uncertainty_score": 2.6989206136830904e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2545,
    "uncertainty_score": 0.20015108764241618,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2546,
    "uncertainty_score": 0.20001679665041827,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2547,
    "uncertainty_score": 1.629437133376014e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2548,
    "uncertainty_score": 8.418230595375027e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2549,
    "uncertainty_score": 5.458227775702887e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2550,
    "uncertainty_score": 0.25000000324599725,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2551,
    "uncertainty_score": 9.926206427495316e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2552,
    "uncertainty_score": 0.20000000043212202,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2553,
    "uncertainty_score": 3.423397007702245e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 2554,
    "uncertainty_score": 0.19995367568117775,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2555,
    "uncertainty_score": 0.001439264969726687,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2556,
    "uncertainty_score": 0.2500247215133141,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2557,
    "uncertainty_score": 0.5999999997980711,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2558,
    "uncertainty_score": 0.24999999688397145,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2559,
    "uncertainty_score": 0.2019254603263206,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2560,
    "uncertainty_score": 0.20683124296264674,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2561,
    "uncertainty_score": 0.4159772730648049,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2562,
    "uncertainty_score": 0.3517461552825598,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2563,
    "uncertainty_score": 0.167672257337784,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2564,
    "uncertainty_score": 4.706520442595288e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2565,
    "uncertainty_score": 8.334617657964103e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2566,
    "uncertainty_score": 0.3336127562307392,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2567,
    "uncertainty_score": 0.402139242588352,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2568,
    "uncertainty_score": 1.1312830932509245e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2569,
    "uncertainty_score": 0.25003125193574866,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2570,
    "uncertainty_score": 4.724485049856015e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 2571,
    "uncertainty_score": 0.42300607424383985,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2572,
    "uncertainty_score": 0.0024845588637563546,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2573,
    "uncertainty_score": 0.000692997368785636,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2574,
    "uncertainty_score": 3.014825879024903e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2575,
    "uncertainty_score": 0.5001676518917958,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2576,
    "uncertainty_score": 0.7499996146632089,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2577,
    "uncertainty_score": 0.2505876687687943,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2578,
    "uncertainty_score": 7.66753739812237e-15,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2579,
    "uncertainty_score": 3.229947316458643e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2580,
    "uncertainty_score": 0.15064547726980643,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2581,
    "uncertainty_score": 0.49996709030708114,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2582,
    "uncertainty_score": 0.19999999980047273,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2583,
    "uncertainty_score": 0.0001962709396825656,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2584,
    "uncertainty_score": 0.2500185289400335,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2585,
    "uncertainty_score": 2.2640673141496535e-13,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2586,
    "uncertainty_score": 0.2002214182227248,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2587,
    "uncertainty_score": 0.33430658057574797,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2588,
    "uncertainty_score": 0.00031424727596274677,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2589,
    "uncertainty_score": 0.5051652882437829,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2590,
    "uncertainty_score": 6.326968974184046e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2591,
    "uncertainty_score": 0.3999999720882505,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2592,
    "uncertainty_score": 4.4681339523462526e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2593,
    "uncertainty_score": 0.40032967887207976,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2594,
    "uncertainty_score": 0.33333333466570275,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2595,
    "uncertainty_score": 0.40038537229394067,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2596,
    "uncertainty_score": 0.24997388727777667,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2597,
    "uncertainty_score": 7.318315678071159e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2598,
    "uncertainty_score": 0.19562263519708542,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2599,
    "uncertainty_score": 0.25000004955670063,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2600,
    "uncertainty_score": 0.16666778487641762,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2601,
    "uncertainty_score": 9.119967124223482e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2602,
    "uncertainty_score": 1.9950107161041253e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2603,
    "uncertainty_score": 0.2000000013651765,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2604,
    "uncertainty_score": 5.315786930662012e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2605,
    "uncertainty_score": 0.0004187281092776688,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2606,
    "uncertainty_score": 1.5224691929134166e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2607,
    "uncertainty_score": 0.49996904821871335,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2608,
    "uncertainty_score": 0.0,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2609,
    "uncertainty_score": 0.0005495771191312886,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2610,
    "uncertainty_score": 0.33333333414324345,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2611,
    "uncertainty_score": 5.181081016676248e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2612,
    "uncertainty_score": 0.0012263523039958465,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2613,
    "uncertainty_score": 0.6000028863801379,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2614,
    "uncertainty_score": 2.4935049832645507e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2615,
    "uncertainty_score": 1.9433254635247666e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2616,
    "uncertainty_score": 3.41094225901027e-12,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2617,
    "uncertainty_score": 4.8249371917396284e-11,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2618,
    "uncertainty_score": 1.262985302929966e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2619,
    "uncertainty_score": 7.8163887986823e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2620,
    "uncertainty_score": 1.617573352869462e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2621,
    "uncertainty_score": 0.24999999977037116,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2622,
    "uncertainty_score": 0.2500068776034027,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2623,
    "uncertainty_score": 0.1669430008285886,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2624,
    "uncertainty_score": 6.344511012161392e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2625,
    "uncertainty_score": 0.015223814613685499,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2626,
    "uncertainty_score": 0.40000392561785514,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2627,
    "uncertainty_score": 0.25000020547835083,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2628,
    "uncertainty_score": 2.5374487131554957e-10,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 2629,
    "uncertainty_score": 0.3938893759691346,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2630,
    "uncertainty_score": 4.6752830315570545e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2631,
    "uncertainty_score": 1.207868616850681e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2632,
    "uncertainty_score": 2.461518887702247e-11,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2633,
    "uncertainty_score": 0.001228719028564067,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2634,
    "uncertainty_score": 0.25000000001857403,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2635,
    "uncertainty_score": 0.0001593438552246933,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2636,
    "uncertainty_score": 7.083020406653388e-10,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2637,
    "uncertainty_score": 0.00717907012440861,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2638,
    "uncertainty_score": 9.023766347550899e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2639,
    "uncertainty_score": 0.20000274680767943,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2640,
    "uncertainty_score": 0.49997388636805595,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2641,
    "uncertainty_score": 0.007044173753794764,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2642,
    "uncertainty_score": 1.17267771368343e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2643,
    "uncertainty_score": 1.280107374716372e-11,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2644,
    "uncertainty_score": 4.4713126749415844e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2645,
    "uncertainty_score": 0.17272847708858255,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2646,
    "uncertainty_score": 4.395795506094608e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2647,
    "uncertainty_score": 0.1835204951904147,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2648,
    "uncertainty_score": 0.333344404397206,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2649,
    "uncertainty_score": 5.9865398771735e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 2650,
    "uncertainty_score": 6.053900823506477e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2651,
    "uncertainty_score": 0.2000001031133011,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2652,
    "uncertainty_score": 0.24425731400476725,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2653,
    "uncertainty_score": 0.0004858021245791575,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2654,
    "uncertainty_score": 0.0007124017470757143,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2655,
    "uncertainty_score": 4.856462222044654e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2656,
    "uncertainty_score": 2.9678143673705994e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2657,
    "uncertainty_score": 0.2548134417622821,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2658,
    "uncertainty_score": 0.013407999074116208,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2659,
    "uncertainty_score": 6.804761366571993e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2660,
    "uncertainty_score": 0.33333333320003095,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2661,
    "uncertainty_score": 0.530351993660628,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2662,
    "uncertainty_score": 1.1388610283349111e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2663,
    "uncertainty_score": 0.2500038101049271,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2664,
    "uncertainty_score": 0.008919761461259489,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2665,
    "uncertainty_score": 1.1479829970433335e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2666,
    "uncertainty_score": 0.004604092847858623,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2667,
    "uncertainty_score": 0.1998727002317176,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2668,
    "uncertainty_score": 4.6330081076123947e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2669,
    "uncertainty_score": 0.4001164954687666,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2670,
    "uncertainty_score": 0.21669824204513968,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2671,
    "uncertainty_score": 0.1999999999068146,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2672,
    "uncertainty_score": 0.2000000327527835,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2673,
    "uncertainty_score": 0.19999997385277044,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2674,
    "uncertainty_score": 0.16668322925576798,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2675,
    "uncertainty_score": 0.003071328490369249,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2676,
    "uncertainty_score": 2.897544971298807e-10,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 2677,
    "uncertainty_score": 0.0005629675397151864,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2678,
    "uncertainty_score": 0.5000029951905339,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2679,
    "uncertainty_score": 0.2500063996215205,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2680,
    "uncertainty_score": 0.40008120357615395,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2681,
    "uncertainty_score": 0.4002951254573743,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2682,
    "uncertainty_score": 0.20000756641385423,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2683,
    "uncertainty_score": 0.6000284491946035,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2684,
    "uncertainty_score": 2.4788187855285303e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2685,
    "uncertainty_score": 0.002550366542344141,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2686,
    "uncertainty_score": 1.018716491910444e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2687,
    "uncertainty_score": 0.19999995264802078,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2688,
    "uncertainty_score": 1.9948669555242822e-15,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2689,
    "uncertainty_score": 0.8000000418890153,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2690,
    "uncertainty_score": 0.5000218241143263,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2691,
    "uncertainty_score": 4.2558220104909996e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2692,
    "uncertainty_score": 0.2365229470465582,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2693,
    "uncertainty_score": 4.910991396383421e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2694,
    "uncertainty_score": 8.15015193754735e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2695,
    "uncertainty_score": 0.25000710219126165,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2696,
    "uncertainty_score": 6.209312948258799e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2697,
    "uncertainty_score": 9.670768091367838e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2698,
    "uncertainty_score": 0.2001051987230483,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2699,
    "uncertainty_score": 2.4807208001337774e-11,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2700,
    "uncertainty_score": 0.19999999957362,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2701,
    "uncertainty_score": 1.9495671762560994e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2702,
    "uncertainty_score": 4.985106209951181e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2703,
    "uncertainty_score": 0.19709957578812037,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2704,
    "uncertainty_score": 0.49999999974999815,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2705,
    "uncertainty_score": 0.20164606708053548,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2706,
    "uncertainty_score": 0.39999999590861773,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2707,
    "uncertainty_score": 5.530706043820389e-11,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2708,
    "uncertainty_score": 2.0187141327696364e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2709,
    "uncertainty_score": 2.2034004182306228e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2710,
    "uncertainty_score": 0.25000000008876994,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2711,
    "uncertainty_score": 0.1666666667511761,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2712,
    "uncertainty_score": 3.339157926387444e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2713,
    "uncertainty_score": 2.6402400328958607e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2714,
    "uncertainty_score": 0.25000000010833384,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2715,
    "uncertainty_score": 0.20000000635110676,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2716,
    "uncertainty_score": 3.637071637345053e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2717,
    "uncertainty_score": 0.34932051843407386,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2718,
    "uncertainty_score": 9.682775399568748e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2719,
    "uncertainty_score": 3.130399577434793e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2720,
    "uncertainty_score": 0.2500000000004104,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2721,
    "uncertainty_score": 0.20003723747433216,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2722,
    "uncertainty_score": 3.849212727316941e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2723,
    "uncertainty_score": 0.1295499770886918,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2724,
    "uncertainty_score": 0.004684429509207338,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2725,
    "uncertainty_score": 0.20000063383489658,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2726,
    "uncertainty_score": 2.6002139096366652e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2727,
    "uncertainty_score": 0.19963417171863312,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2728,
    "uncertainty_score": 0.2500000084246994,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2729,
    "uncertainty_score": 8.18142558017658e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2730,
    "uncertainty_score": 0.1673671214596331,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2731,
    "uncertainty_score": 1.4586003539911931e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2732,
    "uncertainty_score": 0.0009693535411627954,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2733,
    "uncertainty_score": 0.25050738496934793,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2734,
    "uncertainty_score": 0.6000000034226011,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2735,
    "uncertainty_score": 0.400001972196714,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2736,
    "uncertainty_score": 1.2863359712173551e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2737,
    "uncertainty_score": 5.119887448360818e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2738,
    "uncertainty_score": 0.0005495522087659421,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2739,
    "uncertainty_score": 1.7405729129829664e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2740,
    "uncertainty_score": 0.25000250626498405,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2741,
    "uncertainty_score": 1.793654921009665e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2742,
    "uncertainty_score": 0.06062914801114548,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2743,
    "uncertainty_score": 2.2036241988791305e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2744,
    "uncertainty_score": 0.24999974228104752,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2745,
    "uncertainty_score": 0.14269343868040524,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2746,
    "uncertainty_score": 0.2500000088017806,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2747,
    "uncertainty_score": 1.133909857823111e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2748,
    "uncertainty_score": 5.307319245935448e-06,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 2749,
    "uncertainty_score": 0.3352610197648544,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2750,
    "uncertainty_score": 2.093216995655516e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2751,
    "uncertainty_score": 0.1999999888309657,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2752,
    "uncertainty_score": 0.005160795630264716,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2753,
    "uncertainty_score": 0.2048351613172517,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2754,
    "uncertainty_score": 0.16715986902800736,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2755,
    "uncertainty_score": 0.41517201681394783,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2756,
    "uncertainty_score": 1.740600229780665e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2757,
    "uncertainty_score": 0.3333333373622551,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2758,
    "uncertainty_score": 0.00037016736499078724,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2759,
    "uncertainty_score": 0.440703812877428,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2760,
    "uncertainty_score": 2.121228427643033e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2761,
    "uncertainty_score": 1.6593613753290285e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2762,
    "uncertainty_score": 0.20000009000664684,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2763,
    "uncertainty_score": 0.003542228240144009,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2764,
    "uncertainty_score": 0.0012073583456455532,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2765,
    "uncertainty_score": 0.2500040050218897,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2766,
    "uncertainty_score": 6.327544308929596e-12,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2767,
    "uncertainty_score": 0.0014844347010721129,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2768,
    "uncertainty_score": 4.945077303867692e-11,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2769,
    "uncertainty_score": 3.7950249703774945e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2770,
    "uncertainty_score": 0.2353683547804195,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2771,
    "uncertainty_score": 0.0005819507363992894,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2772,
    "uncertainty_score": 0.20000000000329288,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2773,
    "uncertainty_score": 1.0763899781272275e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2774,
    "uncertainty_score": 5.99915410564463e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2775,
    "uncertainty_score": 0.19491286341674768,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2776,
    "uncertainty_score": 0.25000002971678603,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2777,
    "uncertainty_score": 0.400000003005494,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2778,
    "uncertainty_score": 2.1698167989759935e-10,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2779,
    "uncertainty_score": 8.967964416639892e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2780,
    "uncertainty_score": 4.172687075029078e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2781,
    "uncertainty_score": 0.1999999998,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2782,
    "uncertainty_score": 0.016102658208603453,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2783,
    "uncertainty_score": 0.2500117008445065,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2784,
    "uncertainty_score": 2.6942761691920685e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2785,
    "uncertainty_score": 0.010299529400562493,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2786,
    "uncertainty_score": 2.2795478914413506e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2787,
    "uncertainty_score": 7.969938520961361e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2788,
    "uncertainty_score": 0.25000349954851225,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2789,
    "uncertainty_score": 1.1011848890720481e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2790,
    "uncertainty_score": 0.0007247244196642128,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2791,
    "uncertainty_score": 0.40164628080522097,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2792,
    "uncertainty_score": 0.5200500314094129,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2793,
    "uncertainty_score": 2.175093149877576e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2794,
    "uncertainty_score": 0.26161931363372726,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2795,
    "uncertainty_score": 0.20133862803408253,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2796,
    "uncertainty_score": 0.19990542966502792,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2797,
    "uncertainty_score": 2.916309502606706e-14,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2798,
    "uncertainty_score": 0.0038295649330323278,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2799,
    "uncertainty_score": 0.20000000256968925,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2800,
    "uncertainty_score": 0.6000035528110667,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2801,
    "uncertainty_score": 0.20001529783088903,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2802,
    "uncertainty_score": 0.00044635243015955615,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2803,
    "uncertainty_score": 0.20003159427654044,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2804,
    "uncertainty_score": 0.2408864152080032,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2805,
    "uncertainty_score": 0.7999834155213377,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2806,
    "uncertainty_score": 9.311582561920063e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2807,
    "uncertainty_score": 0.25000000125044775,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2808,
    "uncertainty_score": 0.0017021004621797866,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2809,
    "uncertainty_score": 0.0002823285986199227,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2810,
    "uncertainty_score": 0.20003007907259365,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2811,
    "uncertainty_score": 1.7257353356201603e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2812,
    "uncertainty_score": 0.19998344253748937,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2813,
    "uncertainty_score": 9.962488213955058e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2814,
    "uncertainty_score": 0.48778555456826206,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2815,
    "uncertainty_score": 0.2259369439772721,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2816,
    "uncertainty_score": 0.2000622336513322,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2817,
    "uncertainty_score": 0.3333333332126723,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2818,
    "uncertainty_score": 0.3303026354480146,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2819,
    "uncertainty_score": 0.33333333302855805,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2820,
    "uncertainty_score": 2.0238223579571313e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2821,
    "uncertainty_score": 4.0697402755388643e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2822,
    "uncertainty_score": 0.24999998675371565,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2823,
    "uncertainty_score": 0.006701625950509447,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2824,
    "uncertainty_score": 0.25000000078164325,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2825,
    "uncertainty_score": 2.1123148143377706e-12,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2826,
    "uncertainty_score": 0.015208232897820969,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2827,
    "uncertainty_score": 0.2500000537457136,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2828,
    "uncertainty_score": 0.6035606106683986,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2829,
    "uncertainty_score": 1.3332461375460005e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2830,
    "uncertainty_score": 0.44276288473112924,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2831,
    "uncertainty_score": 0.75,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2832,
    "uncertainty_score": 0.019250688453901075,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2833,
    "uncertainty_score": 0.2500002561562397,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2834,
    "uncertainty_score": 0.000482034290717007,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2835,
    "uncertainty_score": 0.03319060050119002,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2836,
    "uncertainty_score": 0.40120695366563686,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2837,
    "uncertainty_score": 0.2499925177114113,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2838,
    "uncertainty_score": 0.002093478087120049,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2839,
    "uncertainty_score": 0.20000107189915975,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2840,
    "uncertainty_score": 0.00015194295212779608,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2841,
    "uncertainty_score": 6.007803743153641e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2842,
    "uncertainty_score": 4.9562477746670125e-11,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2843,
    "uncertainty_score": 8.320507106051654e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2844,
    "uncertainty_score": 1.6815618076678086e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2845,
    "uncertainty_score": 0.000769644659648205,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2846,
    "uncertainty_score": 5.1781698676250204e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2847,
    "uncertainty_score": 0.2002413177560825,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2848,
    "uncertainty_score": 7.669103219600658e-11,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2849,
    "uncertainty_score": 0.2500072801504784,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2850,
    "uncertainty_score": 4.78241332865742e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2851,
    "uncertainty_score": 0.000282108507084795,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2852,
    "uncertainty_score": 0.20000304117937567,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2853,
    "uncertainty_score": 2.1445273202171067e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2854,
    "uncertainty_score": 1.331083330806445e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2855,
    "uncertainty_score": 2.3861821054478156e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2856,
    "uncertainty_score": 0.500007510266661,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2857,
    "uncertainty_score": 0.4999999997500035,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2858,
    "uncertainty_score": 6.287491511190451e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2859,
    "uncertainty_score": 0.2500666792477697,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2860,
    "uncertainty_score": 1.2547072948005228e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2861,
    "uncertainty_score": 2.0890664641553005e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2862,
    "uncertainty_score": 1.2456871629643434e-11,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2863,
    "uncertainty_score": 0.20000000040532706,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2864,
    "uncertainty_score": 1.1651286405308323e-12,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2865,
    "uncertainty_score": 3.735549016743232e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2866,
    "uncertainty_score": 1.7179148858971678e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2867,
    "uncertainty_score": 0.3337722155648601,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2868,
    "uncertainty_score": 0.20019598055459467,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2869,
    "uncertainty_score": 0.20482723612053405,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2870,
    "uncertainty_score": 0.08451792465408905,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2871,
    "uncertainty_score": 5.364273821734234e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2872,
    "uncertainty_score": 0.15953522765590414,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2873,
    "uncertainty_score": 1.2715719350950143e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2874,
    "uncertainty_score": 0.00079092734589554,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2875,
    "uncertainty_score": 0.004408445903186994,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2876,
    "uncertainty_score": 0.00041313967983792486,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2877,
    "uncertainty_score": 1.7799641730671299e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2878,
    "uncertainty_score": 0.20000002176998993,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2879,
    "uncertainty_score": 0.0019692070747365656,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2880,
    "uncertainty_score": 0.0,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2881,
    "uncertainty_score": 0.000321928383832395,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2882,
    "uncertainty_score": 0.3333333319309025,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2883,
    "uncertainty_score": 1.456710289450822e-11,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2884,
    "uncertainty_score": 0.00932578654186556,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2885,
    "uncertainty_score": 2.8955523677324843e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2886,
    "uncertainty_score": 1.0663473236833189e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2887,
    "uncertainty_score": 4.306739303660426e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2888,
    "uncertainty_score": 0.0013229273764106997,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2889,
    "uncertainty_score": 0.19999887011712264,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2890,
    "uncertainty_score": 0.4009397016442886,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2891,
    "uncertainty_score": 4.5173596898657775e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2892,
    "uncertainty_score": 1.4145741224312914e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2893,
    "uncertainty_score": 0.20000001121531716,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2894,
    "uncertainty_score": 2.0937575270329813e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2895,
    "uncertainty_score": 0.0004619984132330231,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2896,
    "uncertainty_score": 0.4999999995002314,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2897,
    "uncertainty_score": 1.4880656025526213e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2898,
    "uncertainty_score": 0.24999999985549098,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2899,
    "uncertainty_score": 1.87412178557562e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2900,
    "uncertainty_score": 7.066050384138371e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2901,
    "uncertainty_score": 3.95058158392499e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2902,
    "uncertainty_score": 0.1444571650160233,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2903,
    "uncertainty_score": 0.3711229309258492,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2904,
    "uncertainty_score": 0.04397702462581542,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2905,
    "uncertainty_score": 0.2000001644256447,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2906,
    "uncertainty_score": 0.2845777137426013,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2907,
    "uncertainty_score": 1.3050813502585283e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2908,
    "uncertainty_score": 0.015171667527382868,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2909,
    "uncertainty_score": 4.379600044018916e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2910,
    "uncertainty_score": 1.0076377411659758e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2911,
    "uncertainty_score": 9.671983476755537e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2912,
    "uncertainty_score": 0.19983910542013258,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2913,
    "uncertainty_score": 0.00035201352039335106,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2914,
    "uncertainty_score": 0.06738274546463732,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2915,
    "uncertainty_score": 5.53457212632781e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 2916,
    "uncertainty_score": 0.2000119853905405,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 2917,
    "uncertainty_score": 5.854412133981143e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2918,
    "uncertainty_score": 1.094104678738651e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2919,
    "uncertainty_score": 1.9644381382522242e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2920,
    "uncertainty_score": 0.19999222828785013,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2921,
    "uncertainty_score": 0.1666776425016274,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2922,
    "uncertainty_score": 0.17031410878810727,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 2923,
    "uncertainty_score": 0.49999721155315047,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2924,
    "uncertainty_score": 0.0,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2925,
    "uncertainty_score": 0.031771535056293515,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2926,
    "uncertainty_score": 0.8119002373449646,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2927,
    "uncertainty_score": 2.4526288266564477e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2928,
    "uncertainty_score": 0.5999994853507393,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2929,
    "uncertainty_score": 2.938418959745229e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2930,
    "uncertainty_score": 0.3999844014961917,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2931,
    "uncertainty_score": 0.17240455725047635,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2932,
    "uncertainty_score": 0.1307947388365582,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2933,
    "uncertainty_score": 0.5000000000020625,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2934,
    "uncertainty_score": 0.40040590816774363,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2935,
    "uncertainty_score": 0.16666667613014327,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2936,
    "uncertainty_score": 0.0003312678436553341,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2937,
    "uncertainty_score": 0.0006848375003174535,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2938,
    "uncertainty_score": 0.19999999942269295,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2939,
    "uncertainty_score": 1.0351919167386641e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2940,
    "uncertainty_score": 0.19999999980000033,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2941,
    "uncertainty_score": 1.8562494375343231e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2942,
    "uncertainty_score": 0.0046488380037821575,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2943,
    "uncertainty_score": 3.073633841355368e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2944,
    "uncertainty_score": 0.20000004667432184,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2945,
    "uncertainty_score": 5.176190514519337e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2946,
    "uncertainty_score": 5.033041915776359e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2947,
    "uncertainty_score": 0.20017668861085397,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2948,
    "uncertainty_score": 0.4000008147688258,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2949,
    "uncertainty_score": 0.40079730819821585,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2950,
    "uncertainty_score": 0.2000010732089294,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2951,
    "uncertainty_score": 0.00013618931534493977,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2952,
    "uncertainty_score": 0.24422830799500644,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2953,
    "uncertainty_score": 0.003894048263695304,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2954,
    "uncertainty_score": 0.00042756434830854543,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2955,
    "uncertainty_score": 0.6000051198903382,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2956,
    "uncertainty_score": 0.6000005172230899,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2957,
    "uncertainty_score": 0.14286208505997847,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2958,
    "uncertainty_score": 1.9905466756149453e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2959,
    "uncertainty_score": 1.6107729439608373e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2960,
    "uncertainty_score": 0.5725436522731585,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2961,
    "uncertainty_score": 0.4020314014192786,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2962,
    "uncertainty_score": 3.518979004528586e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 2963,
    "uncertainty_score": 0.20000288682616868,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2964,
    "uncertainty_score": 0.2858600804696953,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2965,
    "uncertainty_score": 9.039227784331337e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2966,
    "uncertainty_score": 0.214010638486774,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2967,
    "uncertainty_score": 0.20002421027286585,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2968,
    "uncertainty_score": 0.6000053936025171,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2969,
    "uncertainty_score": 0.20000139245651263,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2970,
    "uncertainty_score": 0.6,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2971,
    "uncertainty_score": 0.37354136734438875,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2972,
    "uncertainty_score": 5.923828681430325e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2973,
    "uncertainty_score": 0.25344440658110495,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2974,
    "uncertainty_score": 0.2500002283145697,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2975,
    "uncertainty_score": 0.0002174721009487643,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2976,
    "uncertainty_score": 0.2,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2977,
    "uncertainty_score": 0.20001308506509125,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 2978,
    "uncertainty_score": 0.5998950511327932,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2979,
    "uncertainty_score": 0.39955254488180136,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2980,
    "uncertainty_score": 0.20800743591639334,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2981,
    "uncertainty_score": 1.138177247236463e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2982,
    "uncertainty_score": 2.005329387936748e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2983,
    "uncertainty_score": 1.6728414536314966e-11,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2984,
    "uncertainty_score": 0.41249674202096864,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2985,
    "uncertainty_score": 9.230312309715642e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2986,
    "uncertainty_score": 0.4048351510054239,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2987,
    "uncertainty_score": 3.052922465006402e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 2988,
    "uncertainty_score": 0.25000000001298234,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2989,
    "uncertainty_score": 3.168724303941233e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2990,
    "uncertainty_score": 0.4000000004587119,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2991,
    "uncertainty_score": 0.799999999087888,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2992,
    "uncertainty_score": 0.2000095650009536,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2993,
    "uncertainty_score": 0.00028941136652984494,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2994,
    "uncertainty_score": 1.0342191072416561e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 2995,
    "uncertainty_score": 0.4004996903684045,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2996,
    "uncertainty_score": 0.2655656544472949,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2997,
    "uncertainty_score": 1.15555262562865e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2998,
    "uncertainty_score": 0.40005919207816437,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 2999,
    "uncertainty_score": 6.082557612198705e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3000,
    "uncertainty_score": 0.20676292086958617,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3001,
    "uncertainty_score": 0.20006236862198418,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3002,
    "uncertainty_score": 0.799999999207049,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3003,
    "uncertainty_score": 0.49999999986991966,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3004,
    "uncertainty_score": 0.49999999975,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3005,
    "uncertainty_score": 0.2000000022921545,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3006,
    "uncertainty_score": 0.39999999980575895,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3007,
    "uncertainty_score": 4.042819162699405e-14,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3008,
    "uncertainty_score": 0.40086572418634586,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3009,
    "uncertainty_score": 0.19999953338508153,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3010,
    "uncertainty_score": 0.99999999975,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3011,
    "uncertainty_score": 0.1660364548642533,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3012,
    "uncertainty_score": 0.00047440070184498066,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3013,
    "uncertainty_score": 6.503665618747357e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3014,
    "uncertainty_score": 0.0199290234457892,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3015,
    "uncertainty_score": 0.4999999998247443,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3016,
    "uncertainty_score": 0.8,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3017,
    "uncertainty_score": 0.25001049632676814,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3018,
    "uncertainty_score": 0.40002421786405246,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3019,
    "uncertainty_score": 0.2500020001795225,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3020,
    "uncertainty_score": 9.851485691635823e-23,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3021,
    "uncertainty_score": 3.6087935340942673e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3022,
    "uncertainty_score": 0.7142857146080751,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3023,
    "uncertainty_score": 0.0,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3024,
    "uncertainty_score": 0.507796637487678,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3025,
    "uncertainty_score": 7.2312638510043926e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3026,
    "uncertainty_score": 0.2000264509651374,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3027,
    "uncertainty_score": 5.611646707007662e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3028,
    "uncertainty_score": 0.20000000030177958,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3029,
    "uncertainty_score": 0.2499999997499296,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3030,
    "uncertainty_score": 1.3293976162827866e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3031,
    "uncertainty_score": 0.33358830573000303,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3032,
    "uncertainty_score": 0.5999999993999999,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3033,
    "uncertainty_score": 0.40000005472832,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3034,
    "uncertainty_score": 0.5104226108800524,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3035,
    "uncertainty_score": 0.2000198218696902,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3036,
    "uncertainty_score": 0.20114605067476723,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3037,
    "uncertainty_score": 0.33333759970899973,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3038,
    "uncertainty_score": 0.6000000001782989,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3039,
    "uncertainty_score": 0.5000000000000001,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3040,
    "uncertainty_score": 0.14285714288680634,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3041,
    "uncertainty_score": 0.20397237819903918,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3042,
    "uncertainty_score": 0.20002625215853237,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3043,
    "uncertainty_score": 0.16671629921834705,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3044,
    "uncertainty_score": 0.200000032888931,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3045,
    "uncertainty_score": 5.277558605182039e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3046,
    "uncertainty_score": 0.5999999998,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3047,
    "uncertainty_score": 0.0005613154314826601,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3048,
    "uncertainty_score": 0.4420383776760951,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3049,
    "uncertainty_score": 1.3562649041561276e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3050,
    "uncertainty_score": 1.5794531458499427e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3051,
    "uncertainty_score": 0.8000000709271766,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3052,
    "uncertainty_score": 5.540738921895134e-18,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3053,
    "uncertainty_score": 1.4890860371115038e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3054,
    "uncertainty_score": 0.3964727940855399,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3055,
    "uncertainty_score": 3.3752573436524793e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3056,
    "uncertainty_score": 0.20009962452176108,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3057,
    "uncertainty_score": 0.20042756402289105,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3058,
    "uncertainty_score": 0.4000188257060378,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3059,
    "uncertainty_score": 0.4054084839904485,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3060,
    "uncertainty_score": 0.41028093326505266,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3061,
    "uncertainty_score": 0.20202357745481353,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3062,
    "uncertainty_score": 0.20020644575376742,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3063,
    "uncertainty_score": 0.20120695437512787,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3064,
    "uncertainty_score": 6.920509320102112e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3065,
    "uncertainty_score": 2.41588578911652e-12,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3066,
    "uncertainty_score": 0.40003516505309467,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3067,
    "uncertainty_score": 0.4000000310332375,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3068,
    "uncertainty_score": 0.2500000029395805,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3069,
    "uncertainty_score": 0.25000000097917924,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3070,
    "uncertainty_score": 0.1999976557223613,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3071,
    "uncertainty_score": 0.5000321605309049,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3072,
    "uncertainty_score": 0.25000001591124094,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3073,
    "uncertainty_score": 0.6018555800837306,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3074,
    "uncertainty_score": 0.3333456198012444,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3075,
    "uncertainty_score": 5.31000471490377e-16,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3076,
    "uncertainty_score": 0.3333609337767504,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3077,
    "uncertainty_score": 3.652239061312398e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3078,
    "uncertainty_score": 0.6000000000223074,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3079,
    "uncertainty_score": 0.4006150814156163,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3080,
    "uncertainty_score": 0.20178588999983896,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3081,
    "uncertainty_score": 7.786052969689082e-11,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3082,
    "uncertainty_score": 0.400050635165422,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3083,
    "uncertainty_score": 0.0028669110999654814,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 3084,
    "uncertainty_score": 0.2000012711413711,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3085,
    "uncertainty_score": 0.04103808585860835,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3086,
    "uncertainty_score": 0.20000664283819755,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3087,
    "uncertainty_score": 1.0,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3088,
    "uncertainty_score": 0.39999999959499083,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3089,
    "uncertainty_score": 0.42857142828571415,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3090,
    "uncertainty_score": 0.001918185369875926,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3091,
    "uncertainty_score": 0.2495878988201259,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3092,
    "uncertainty_score": 0.2,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3093,
    "uncertainty_score": 0.2510652114746653,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3094,
    "uncertainty_score": 0.000206446210324958,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3095,
    "uncertainty_score": 0.20000000077707342,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3096,
    "uncertainty_score": 0.25023730063868876,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3097,
    "uncertainty_score": 0.4079523757384512,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3098,
    "uncertainty_score": 0.5999999989452991,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3099,
    "uncertainty_score": 0.49999999949999996,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3100,
    "uncertainty_score": 0.3999999998,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3101,
    "uncertainty_score": 0.5999999996015288,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3102,
    "uncertainty_score": 0.4000000894870352,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3103,
    "uncertainty_score": 0.3999999996036038,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3104,
    "uncertainty_score": 0.19999999979995434,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3105,
    "uncertainty_score": 0.20394382509081468,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3106,
    "uncertainty_score": 0.39999968381518913,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3107,
    "uncertainty_score": 0.3824872303065165,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3108,
    "uncertainty_score": 0.39999990119302514,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3109,
    "uncertainty_score": 0.375718541518016,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3110,
    "uncertainty_score": 0.00022691515361875355,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 3111,
    "uncertainty_score": 0.39998992211108764,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3112,
    "uncertainty_score": 1.5289041893097036e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3113,
    "uncertainty_score": 0.39993094070174273,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3114,
    "uncertainty_score": 0.3999999998,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3115,
    "uncertainty_score": 0.400104875933447,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3116,
    "uncertainty_score": 5.891437144159336e-15,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3117,
    "uncertainty_score": 5.563526273206883e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3118,
    "uncertainty_score": 0.3333333333333333,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3119,
    "uncertainty_score": 0.4999999943609082,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3120,
    "uncertainty_score": 1.1089502576919224e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3121,
    "uncertainty_score": 0.5018692644896342,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3122,
    "uncertainty_score": 0.3333077353653051,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3123,
    "uncertainty_score": 0.2500000038883917,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3124,
    "uncertainty_score": 0.1671308327884193,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3125,
    "uncertainty_score": 0.0919824172784434,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3126,
    "uncertainty_score": 0.749741940710114,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3127,
    "uncertainty_score": 0.33333079454520204,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3128,
    "uncertainty_score": 0.5997709039955585,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3129,
    "uncertainty_score": 3.882018241808953e-11,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3130,
    "uncertainty_score": 0.00020749390481471352,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3131,
    "uncertainty_score": 0.7046617455534893,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3132,
    "uncertainty_score": 4.869077920452938e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3133,
    "uncertainty_score": 0.19996661887153128,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3134,
    "uncertainty_score": 0.39999999959999977,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3135,
    "uncertainty_score": 0.2535146763362199,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3136,
    "uncertainty_score": 0.16666667566853435,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3137,
    "uncertainty_score": 0.8056668698949851,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3138,
    "uncertainty_score": 0.002617505501177003,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3139,
    "uncertainty_score": 0.5011502803920901,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3140,
    "uncertainty_score": 0.33326396601575964,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3141,
    "uncertainty_score": 0.5999993617935002,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3142,
    "uncertainty_score": 2.251629552977394e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3143,
    "uncertainty_score": 0.49999999801451106,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3144,
    "uncertainty_score": 0.6666666666666666,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3145,
    "uncertainty_score": 1.2173310561133766e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3146,
    "uncertainty_score": 0.004356437210201571,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3147,
    "uncertainty_score": 7.341923782548357e-16,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3148,
    "uncertainty_score": 0.0008962330248971967,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3149,
    "uncertainty_score": 0.4000000010680999,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3150,
    "uncertainty_score": 0.4999955431348854,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3151,
    "uncertainty_score": 0.6678645338461472,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3152,
    "uncertainty_score": 2.968852336171222e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3153,
    "uncertainty_score": 0.20000038812563808,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3154,
    "uncertainty_score": 0.0013385714469394748,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3155,
    "uncertainty_score": 0.01826958436483317,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3156,
    "uncertainty_score": 6.667507147724144e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3157,
    "uncertainty_score": 9.510540328599636e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3158,
    "uncertainty_score": 0.11111600040984985,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3159,
    "uncertainty_score": 1.7275589080274946e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3160,
    "uncertainty_score": 0.00064722616567398,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3161,
    "uncertainty_score": 3.4958765174930842e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 3162,
    "uncertainty_score": 0.002916112718732814,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3163,
    "uncertainty_score": 3.801784728629579e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3164,
    "uncertainty_score": 0.2000605837471145,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 3165,
    "uncertainty_score": 0.014029256860753821,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3166,
    "uncertainty_score": 0.20265908584317538,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3167,
    "uncertainty_score": 9.019475482118574e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3168,
    "uncertainty_score": 0.00035394946565174,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3169,
    "uncertainty_score": 0.42114505646429895,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3170,
    "uncertainty_score": 0.005087180120740328,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3171,
    "uncertainty_score": 0.0002481852113668153,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3172,
    "uncertainty_score": 2.797432024610326e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3173,
    "uncertainty_score": 0.00012970293146967015,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3174,
    "uncertainty_score": 0.06273607677190823,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3175,
    "uncertainty_score": 0.00020020087179649677,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3176,
    "uncertainty_score": 0.22029574204060545,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3177,
    "uncertainty_score": 0.009535443484457085,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3178,
    "uncertainty_score": 0.20005253452347382,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3179,
    "uncertainty_score": 1.2766695868275858e-11,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3180,
    "uncertainty_score": 1.126878579704021e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3181,
    "uncertainty_score": 0.012214479685547628,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3182,
    "uncertainty_score": 0.4000001204108221,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3183,
    "uncertainty_score": 0.40000287679350865,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3184,
    "uncertainty_score": 0.20000001389808472,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3185,
    "uncertainty_score": 0.3333333796960873,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3186,
    "uncertainty_score": 7.181232560645832e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3187,
    "uncertainty_score": 0.2000000096863337,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3188,
    "uncertainty_score": 0.00020606734958809745,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3189,
    "uncertainty_score": 0.6666666803366907,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3190,
    "uncertainty_score": 0.17964859824123275,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3191,
    "uncertainty_score": 0.20009963124319094,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3192,
    "uncertainty_score": 0.20182477423560066,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3193,
    "uncertainty_score": 0.003253431309503226,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 3194,
    "uncertainty_score": 1.101485897007555e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3195,
    "uncertainty_score": 0.3333333330156158,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3196,
    "uncertainty_score": 0.20068357762290567,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3197,
    "uncertainty_score": 8.3109129281619e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3198,
    "uncertainty_score": 2.7132307201859633e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 3199,
    "uncertainty_score": 8.809137450114667e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3200,
    "uncertainty_score": 0.00014088657766154997,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3201,
    "uncertainty_score": 2.770628848013815e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3202,
    "uncertainty_score": 0.00013482716324197863,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3203,
    "uncertainty_score": 0.3999956237214614,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3204,
    "uncertainty_score": 8.228651651268609e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3205,
    "uncertainty_score": 2.777718408642866e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3206,
    "uncertainty_score": 0.0014847232228177704,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3207,
    "uncertainty_score": 3.6132387342134914e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3208,
    "uncertainty_score": 0.2500305290425207,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3209,
    "uncertainty_score": 0.1669356090703268,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3210,
    "uncertainty_score": 3.2039514148347843e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3211,
    "uncertainty_score": 0.26845408716097224,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3212,
    "uncertainty_score": 0.2002441336172212,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3213,
    "uncertainty_score": 3.086064297132997e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3214,
    "uncertainty_score": 0.00015335696672485807,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 3215,
    "uncertainty_score": 0.02434858472735976,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3216,
    "uncertainty_score": 3.497013301427929e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3217,
    "uncertainty_score": 1.5358676664873421e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3218,
    "uncertainty_score": 1.947054356264935e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3219,
    "uncertainty_score": 2.919980535293511e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3220,
    "uncertainty_score": 5.239616053865151e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3221,
    "uncertainty_score": 3.3631792001199683e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3222,
    "uncertainty_score": 5.595230386865264e-12,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3223,
    "uncertainty_score": 5.260775880507166e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3224,
    "uncertainty_score": 0.1664940918022749,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3225,
    "uncertainty_score": 9.565261805282922e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3226,
    "uncertainty_score": 0.0008353740408350965,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3227,
    "uncertainty_score": 0.250996643813714,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3228,
    "uncertainty_score": 0.00014963213779961695,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3229,
    "uncertainty_score": 0.3950125020774837,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3230,
    "uncertainty_score": 0.20000497416030308,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3231,
    "uncertainty_score": 0.19998303835171896,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3232,
    "uncertainty_score": 1.7365624859421303e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3233,
    "uncertainty_score": 4.0776240029494406e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3234,
    "uncertainty_score": 0.20000000008577912,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3235,
    "uncertainty_score": 0.01962264943596035,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 3236,
    "uncertainty_score": 0.03977176460579968,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3237,
    "uncertainty_score": 0.0005703522405355213,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3238,
    "uncertainty_score": 6.946240451721349e-11,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3239,
    "uncertainty_score": 0.5004375242003504,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3240,
    "uncertainty_score": 7.102444666059723e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3241,
    "uncertainty_score": 8.107790408971983e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3242,
    "uncertainty_score": 0.19998471554016864,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3243,
    "uncertainty_score": 0.018072510171904275,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3244,
    "uncertainty_score": 0.2433101789653816,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3245,
    "uncertainty_score": 0.0022431388208768734,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 3246,
    "uncertainty_score": 0.20002442327236536,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3247,
    "uncertainty_score": 0.00030296241576915515,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3248,
    "uncertainty_score": 0.029782454274919268,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3249,
    "uncertainty_score": 0.20024131811845813,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3250,
    "uncertainty_score": 0.500000038034605,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3251,
    "uncertainty_score": 0.2029240205705801,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3252,
    "uncertainty_score": 2.135161517639181e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 3253,
    "uncertainty_score": 0.00027184552759697587,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3254,
    "uncertainty_score": 0.5002449732388947,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3255,
    "uncertainty_score": 0.1999999998198361,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 3256,
    "uncertainty_score": 6.235369216002205e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3257,
    "uncertainty_score": 0.009647707073188962,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3258,
    "uncertainty_score": 6.796038718491424e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 3259,
    "uncertainty_score": 0.41266867086121817,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3260,
    "uncertainty_score": 0.4000000014476196,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3261,
    "uncertainty_score": 5.547672891308313e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3262,
    "uncertainty_score": 0.4005786559843445,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3263,
    "uncertainty_score": 2.759138403984458e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 3264,
    "uncertainty_score": 0.046369031697327465,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3265,
    "uncertainty_score": 0.00011058537240260893,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 3266,
    "uncertainty_score": 5.1839375415724746e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 3267,
    "uncertainty_score": 0.16669753772713156,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3268,
    "uncertainty_score": 0.2107865277183581,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 3269,
    "uncertainty_score": 2.0105797649748352e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 3270,
    "uncertainty_score": 0.0012595322182040525,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3271,
    "uncertainty_score": 0.0001400356160598016,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3272,
    "uncertainty_score": 0.003382982859061015,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3273,
    "uncertainty_score": 0.539184508172412,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3274,
    "uncertainty_score": 0.4000000451727674,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3275,
    "uncertainty_score": 6.4035364001323376e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3276,
    "uncertainty_score": 5.764173854671112e-13,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 3277,
    "uncertainty_score": 1.0688351172143575e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 3278,
    "uncertainty_score": 0.2394780677497074,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3279,
    "uncertainty_score": 0.14344434641221016,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3280,
    "uncertainty_score": 0.251432541802446,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3281,
    "uncertainty_score": 0.6666051113755992,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3282,
    "uncertainty_score": 2.436116880977552e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3283,
    "uncertainty_score": 0.2014094801747969,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3284,
    "uncertainty_score": 0.5555555672557977,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3285,
    "uncertainty_score": 0.0,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3286,
    "uncertainty_score": 8.276477684975038e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3287,
    "uncertainty_score": 0.33459500368329526,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3288,
    "uncertainty_score": 1.7285044049454868e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3289,
    "uncertainty_score": 0.40000000003049185,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3290,
    "uncertainty_score": 0.23348849389566287,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3291,
    "uncertainty_score": 5.8616487678357925e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3292,
    "uncertainty_score": 1.508133388648868e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3293,
    "uncertainty_score": 0.0005945635350455673,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3294,
    "uncertainty_score": 0.08450789369015181,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3295,
    "uncertainty_score": 0.1669142751424747,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3296,
    "uncertainty_score": 0.21991722665180785,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3297,
    "uncertainty_score": 8.367407604118205e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3298,
    "uncertainty_score": 0.200001075080687,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3299,
    "uncertainty_score": 0.5899732393249262,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3300,
    "uncertainty_score": 9.810100187518702e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3301,
    "uncertainty_score": 3.2234416655497224e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3302,
    "uncertainty_score": 0.3333333349470693,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3303,
    "uncertainty_score": 0.0005167199015942782,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3304,
    "uncertainty_score": 0.20073113366088324,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 3305,
    "uncertainty_score": 3.204713215429372e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3306,
    "uncertainty_score": 0.6666649680982425,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3307,
    "uncertainty_score": 0.3333333671549419,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3308,
    "uncertainty_score": 0.4,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3309,
    "uncertainty_score": 0.6000002925529155,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3310,
    "uncertainty_score": 7.08662381005385e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3311,
    "uncertainty_score": 0.04490701849832273,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3312,
    "uncertainty_score": 1.7345895102114906e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3313,
    "uncertainty_score": 2.9788531611234427e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3314,
    "uncertainty_score": 0.5868790337743659,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3315,
    "uncertainty_score": 0.20000190315980046,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3316,
    "uncertainty_score": 0.0008610508166402977,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3317,
    "uncertainty_score": 0.26989890700888514,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3318,
    "uncertainty_score": 9.925427664909611e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3319,
    "uncertainty_score": 9.062613056633178e-11,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3320,
    "uncertainty_score": 5.216262141613782e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3321,
    "uncertainty_score": 8.36515390368021e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3322,
    "uncertainty_score": 0.2500000177739018,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3323,
    "uncertainty_score": 0.6000000195016097,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3324,
    "uncertainty_score": 0.25345994518161813,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3325,
    "uncertainty_score": 0.1666665968135456,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3326,
    "uncertainty_score": 0.04663000745816768,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3327,
    "uncertainty_score": 6.007823095205825e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3328,
    "uncertainty_score": 0.00037531344517158525,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3329,
    "uncertainty_score": 0.39999995199708777,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3330,
    "uncertainty_score": 0.3229616964906466,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3331,
    "uncertainty_score": 0.0021115271889718163,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3332,
    "uncertainty_score": 0.012496652885807518,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3333,
    "uncertainty_score": 2.7252757901934064e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3334,
    "uncertainty_score": 2.5450830273968052e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3335,
    "uncertainty_score": 0.010516812569201674,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3336,
    "uncertainty_score": 8.915567768780382e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 3337,
    "uncertainty_score": 0.5999767228624864,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3338,
    "uncertainty_score": 0.49999999981090437,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3339,
    "uncertainty_score": 6.445578040312549e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3340,
    "uncertainty_score": 2.4051983866748587e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3341,
    "uncertainty_score": 0.43760808368912735,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3342,
    "uncertainty_score": 0.0015543229741540466,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3343,
    "uncertainty_score": 4.932626732585582e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3344,
    "uncertainty_score": 2.3053672717192136e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3345,
    "uncertainty_score": 0.20000000058248307,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3346,
    "uncertainty_score": 0.40884769004089777,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3347,
    "uncertainty_score": 5.230006489380352e-11,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3348,
    "uncertainty_score": 0.00047602528930388205,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3349,
    "uncertainty_score": 0.20003519641734,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3350,
    "uncertainty_score": 0.0006931179384281881,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3351,
    "uncertainty_score": 0.25281140150362297,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3352,
    "uncertainty_score": 0.4000000546368484,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3353,
    "uncertainty_score": 0.20013528741547687,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3354,
    "uncertainty_score": 0.0009462478957010765,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3355,
    "uncertainty_score": 0.20000018244084133,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3356,
    "uncertainty_score": 0.00018296161326753288,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3357,
    "uncertainty_score": 2.0943502386037387e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3358,
    "uncertainty_score": 0.4559997802215633,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3359,
    "uncertainty_score": 1.4718341573810897e-11,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3360,
    "uncertainty_score": 4.319394255948599e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3361,
    "uncertainty_score": 0.19902483396669454,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3362,
    "uncertainty_score": 2.6201810973903627e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3363,
    "uncertainty_score": 3.802030450534838e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3364,
    "uncertainty_score": 1.4445456080250569e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3365,
    "uncertainty_score": 3.710711057526492e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3366,
    "uncertainty_score": 0.40513524431869863,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3367,
    "uncertainty_score": 4.966361867230446e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3368,
    "uncertainty_score": 9.6305482523767e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3369,
    "uncertainty_score": 0.6666666168192109,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3370,
    "uncertainty_score": 0.002552595223921524,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3371,
    "uncertainty_score": 0.05218916217605918,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 3372,
    "uncertainty_score": 0.2931844459419712,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 3373,
    "uncertainty_score": 4.459654447089321e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3374,
    "uncertainty_score": 0.046906471206493605,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3375,
    "uncertainty_score": 0.37782857952956306,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3376,
    "uncertainty_score": 0.11052555832814971,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3377,
    "uncertainty_score": 0.33288704152394044,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3378,
    "uncertainty_score": 5.7875488683231e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3379,
    "uncertainty_score": 5.422849761410896e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3380,
    "uncertainty_score": 0.3333333332184521,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3381,
    "uncertainty_score": 0.4000000510026306,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3382,
    "uncertainty_score": 0.2501517543891479,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3383,
    "uncertainty_score": 1.0393793336278475e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3384,
    "uncertainty_score": 6.535362754928222e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3385,
    "uncertainty_score": 0.6666666711468262,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3386,
    "uncertainty_score": 0.6475375232137593,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3387,
    "uncertainty_score": 0.0004976434449677604,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3388,
    "uncertainty_score": 8.366325047952283e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3389,
    "uncertainty_score": 1.4543657166562975e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3390,
    "uncertainty_score": 0.15210945504920978,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3391,
    "uncertainty_score": 0.25004706921005465,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3392,
    "uncertainty_score": 1.9830714088792056e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3393,
    "uncertainty_score": 0.4999933737357094,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3394,
    "uncertainty_score": 4.860439438881873e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3395,
    "uncertainty_score": 0.009298687421029477,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3396,
    "uncertainty_score": 0.037744396796043765,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3397,
    "uncertainty_score": 0.5000275094025364,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3398,
    "uncertainty_score": 0.0021678340921145556,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3399,
    "uncertainty_score": 6.568558436827061e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 3400,
    "uncertainty_score": 0.2500000000226404,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3401,
    "uncertainty_score": 0.2500000002485583,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3402,
    "uncertainty_score": 0.05230997571704847,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3403,
    "uncertainty_score": 0.5778545851172057,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3404,
    "uncertainty_score": 0.6004743916773727,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3405,
    "uncertainty_score": 0.25000001586949805,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3406,
    "uncertainty_score": 0.2056299453982021,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3407,
    "uncertainty_score": 0.16666886830687203,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3408,
    "uncertainty_score": 0.6666666666836885,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3409,
    "uncertainty_score": 0.00045450234038861917,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3410,
    "uncertainty_score": 0.25028635528248766,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3411,
    "uncertainty_score": 2.960130847788622e-12,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3412,
    "uncertainty_score": 0.12830428118176285,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3413,
    "uncertainty_score": 0.5000001954888665,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3414,
    "uncertainty_score": 0.6000028868126359,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3415,
    "uncertainty_score": 0.0003820545707850023,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3416,
    "uncertainty_score": 4.1909782549806224e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3417,
    "uncertainty_score": 1.1216746089496423e-10,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3418,
    "uncertainty_score": 0.4001589242796976,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3419,
    "uncertainty_score": 5.433243410739116e-11,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3420,
    "uncertainty_score": 0.25000000037176895,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3421,
    "uncertainty_score": 0.24598328105644396,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3422,
    "uncertainty_score": 0.6666668060395754,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3423,
    "uncertainty_score": 0.5000000015557038,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3424,
    "uncertainty_score": 0.6667020892407735,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3425,
    "uncertainty_score": 0.20024055004694402,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3426,
    "uncertainty_score": 0.0,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3427,
    "uncertainty_score": 0.20047422346120936,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3428,
    "uncertainty_score": 1.1918110413952619e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3429,
    "uncertainty_score": 8.121746473616293e-11,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3430,
    "uncertainty_score": 0.20000139653002957,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3431,
    "uncertainty_score": 7.289674870489494e-05,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 3432,
    "uncertainty_score": 8.10008443124672e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3433,
    "uncertainty_score": 0.4000257638057846,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3434,
    "uncertainty_score": 0.3333364052160089,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3435,
    "uncertainty_score": 1.7411696098220977e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3436,
    "uncertainty_score": 0.20002717965512132,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3437,
    "uncertainty_score": 3.630234072476436e-11,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3438,
    "uncertainty_score": 0.2500071025412346,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3439,
    "uncertainty_score": 0.40000072606360104,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3440,
    "uncertainty_score": 0.0005239040465932214,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3441,
    "uncertainty_score": 0.250000338686347,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3442,
    "uncertainty_score": 0.40000000000024016,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3443,
    "uncertainty_score": 0.2000000000060668,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3444,
    "uncertainty_score": 0.2770124093385123,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3445,
    "uncertainty_score": 0.7343931608266181,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3446,
    "uncertainty_score": 3.1515473652504215e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 3447,
    "uncertainty_score": 0.5999815836366638,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3448,
    "uncertainty_score": 0.20000000236504598,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3449,
    "uncertainty_score": 0.2622144507197325,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3450,
    "uncertainty_score": 0.25000000032806796,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3451,
    "uncertainty_score": 0.20772566309534302,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3452,
    "uncertainty_score": 1.283586960620568e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3453,
    "uncertainty_score": 1.1575366846551736e-11,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3454,
    "uncertainty_score": 0.2499999643578013,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3455,
    "uncertainty_score": 0.1981207386541193,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3456,
    "uncertainty_score": 2.246707237995419e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3457,
    "uncertainty_score": 9.988886549785329e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3458,
    "uncertainty_score": 3.990302534858221e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3459,
    "uncertainty_score": 0.7500321610312101,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3460,
    "uncertainty_score": 0.01841865558410318,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3461,
    "uncertainty_score": 0.25000000459285654,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3462,
    "uncertainty_score": 0.2160918045892115,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3463,
    "uncertainty_score": 0.6000257287286292,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3464,
    "uncertainty_score": 0.00025420649890503516,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3465,
    "uncertainty_score": 0.21529366789053608,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3466,
    "uncertainty_score": 0.21028301030354346,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3467,
    "uncertainty_score": 0.1666666666666672,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3468,
    "uncertainty_score": 6.243416241557784e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3469,
    "uncertainty_score": 0.00015237780723692692,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3470,
    "uncertainty_score": 3.789066093624262e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3471,
    "uncertainty_score": 0.2021271146521833,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3472,
    "uncertainty_score": 3.444262432806711e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3473,
    "uncertainty_score": 2.8092546891607023e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3474,
    "uncertainty_score": 4.8600715570965545e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3475,
    "uncertainty_score": 0.250371628313645,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3476,
    "uncertainty_score": 0.0092987488554826,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3477,
    "uncertainty_score": 0.24999999813082846,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3478,
    "uncertainty_score": 0.014876121132035762,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3479,
    "uncertainty_score": 0.20002457137504442,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3480,
    "uncertainty_score": 0.1999999998,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3481,
    "uncertainty_score": 0.3333333336319253,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3482,
    "uncertainty_score": 1.4750947516859033e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3483,
    "uncertainty_score": 9.844549247302882e-11,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3484,
    "uncertainty_score": 0.0016460706444738188,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3485,
    "uncertainty_score": 0.22987940259650405,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3486,
    "uncertainty_score": 0.0490348359990518,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3487,
    "uncertainty_score": 0.20000004459160156,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3488,
    "uncertainty_score": 0.8000000000004487,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3489,
    "uncertainty_score": 0.006051568303744103,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3490,
    "uncertainty_score": 1.0031412621399389e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3491,
    "uncertainty_score": 0.0023617386326043118,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3492,
    "uncertainty_score": 0.2500019877774498,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3493,
    "uncertainty_score": 0.0008342925896526453,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3494,
    "uncertainty_score": 0.75,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3495,
    "uncertainty_score": 0.7500021437056303,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3496,
    "uncertainty_score": 0.25000014287511246,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3497,
    "uncertainty_score": 1.6168525120462922e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3498,
    "uncertainty_score": 0.07301525628319566,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3499,
    "uncertainty_score": 1.7728704218341315e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3500,
    "uncertainty_score": 0.20001451803042541,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3501,
    "uncertainty_score": 0.16668014156677588,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3502,
    "uncertainty_score": 0.8,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3503,
    "uncertainty_score": 9.89619753475733e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3504,
    "uncertainty_score": 0.6000090795753936,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3505,
    "uncertainty_score": 0.3333333330124533,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3506,
    "uncertainty_score": 0.5000700832757717,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3507,
    "uncertainty_score": 3.853248235117964e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3508,
    "uncertainty_score": 0.2500000081448635,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3509,
    "uncertainty_score": 0.00025959749754759945,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3510,
    "uncertainty_score": 0.3382678468470332,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3511,
    "uncertainty_score": 0.20005895939548085,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3512,
    "uncertainty_score": 9.679342774336781e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3513,
    "uncertainty_score": 1.484324297561184e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3514,
    "uncertainty_score": 0.24673367793658044,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3515,
    "uncertainty_score": 0.21364016341401215,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3516,
    "uncertainty_score": 6.024096596706012e-11,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3517,
    "uncertainty_score": 0.5014245347092295,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3518,
    "uncertainty_score": 0.40006198941292814,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3519,
    "uncertainty_score": 0.20401147710537448,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3520,
    "uncertainty_score": 0.2000150116783644,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3521,
    "uncertainty_score": 0.5011644007648559,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3522,
    "uncertainty_score": 0.20108820087230939,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3523,
    "uncertainty_score": 3.989489183180594e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 3524,
    "uncertainty_score": 0.2001105902256617,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3525,
    "uncertainty_score": 0.29622479440679245,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3526,
    "uncertainty_score": 0.5000375988395616,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3527,
    "uncertainty_score": 9.42405712761725e-11,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3528,
    "uncertainty_score": 0.6033829931612027,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3529,
    "uncertainty_score": 0.33333457591418036,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3530,
    "uncertainty_score": 0.2500000018765191,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3531,
    "uncertainty_score": 3.504810226771999e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3532,
    "uncertainty_score": 0.33333443885295694,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3533,
    "uncertainty_score": 4.240421501371924e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3534,
    "uncertainty_score": 1.0919541261983735e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3535,
    "uncertainty_score": 0.9999999991999966,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3536,
    "uncertainty_score": 3.7045162546131715e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3537,
    "uncertainty_score": 0.49620137148736654,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3538,
    "uncertainty_score": 0.33792628918513595,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3539,
    "uncertainty_score": 1.523642597161989e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 3540,
    "uncertainty_score": 4.3848770833974264e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3541,
    "uncertainty_score": 0.333347897044259,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3542,
    "uncertainty_score": 0.6000095771381997,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3543,
    "uncertainty_score": 0.39999999958722243,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3544,
    "uncertainty_score": 0.19996484574403267,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3545,
    "uncertainty_score": 0.25000000000653233,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3546,
    "uncertainty_score": 0.16666666666667138,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3547,
    "uncertainty_score": 2.1197023002660985e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3548,
    "uncertainty_score": 0.3333331526451606,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3549,
    "uncertainty_score": 0.21445729637849373,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3550,
    "uncertainty_score": 0.5972456051114204,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3551,
    "uncertainty_score": 0.33378010315421464,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3552,
    "uncertainty_score": 1.546752568521884e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3553,
    "uncertainty_score": 2.75027990709595e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3554,
    "uncertainty_score": 0.001340686919783687,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3555,
    "uncertainty_score": 0.49781909529637,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3556,
    "uncertainty_score": 3.8295026478221985e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3557,
    "uncertainty_score": 9.757713920571874e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3558,
    "uncertainty_score": 0.20000006439534457,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3559,
    "uncertainty_score": 0.4000000233625688,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3560,
    "uncertainty_score": 8.956487504892443e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3561,
    "uncertainty_score": 3.6819591162409164e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3562,
    "uncertainty_score": 0.010009517614103094,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3563,
    "uncertainty_score": 0.10295232300771315,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3564,
    "uncertainty_score": 0.0001676723835981472,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3565,
    "uncertainty_score": 0.33444890476033956,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3566,
    "uncertainty_score": 0.6,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3567,
    "uncertainty_score": 6.2775099908536425e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3568,
    "uncertainty_score": 0.20514769674266348,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3569,
    "uncertainty_score": 0.40000004476590145,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3570,
    "uncertainty_score": 8.658493432392508e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3571,
    "uncertainty_score": 0.20000000014373098,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 3572,
    "uncertainty_score": 0.22593885986191653,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3573,
    "uncertainty_score": 0.06043143370795473,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3574,
    "uncertainty_score": 0.2017338745197101,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3575,
    "uncertainty_score": 3.0879750200227644e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3576,
    "uncertainty_score": 0.00018037327792643152,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3577,
    "uncertainty_score": 8.592395267862042e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3578,
    "uncertainty_score": 5.7026914513803146e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3579,
    "uncertainty_score": 2.4543630758612314e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3580,
    "uncertainty_score": 0.20000374667883256,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3581,
    "uncertainty_score": 0.40000119124189615,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3582,
    "uncertainty_score": 0.20035736081326264,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3583,
    "uncertainty_score": 0.8324992484673919,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3584,
    "uncertainty_score": 5.86202050122838e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3585,
    "uncertainty_score": 0.24999999659575914,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3586,
    "uncertainty_score": 0.16666666682088502,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3587,
    "uncertainty_score": 0.06257081483203102,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3588,
    "uncertainty_score": 0.40000004248885795,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3589,
    "uncertainty_score": 0.00024497349291756836,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3590,
    "uncertainty_score": 0.5,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3591,
    "uncertainty_score": 0.4741688412868135,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3592,
    "uncertainty_score": 0.33333333312318814,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3593,
    "uncertainty_score": 0.20000109608708758,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3594,
    "uncertainty_score": 4.615897485781705e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3595,
    "uncertainty_score": 0.19999881177542764,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3596,
    "uncertainty_score": 4.07612414058407e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3597,
    "uncertainty_score": 1.9176280578184457e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3598,
    "uncertainty_score": 2.271609132753512e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3599,
    "uncertainty_score": 0.666552343936361,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3600,
    "uncertainty_score": 0.2500008843791527,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3601,
    "uncertainty_score": 0.2500632890896985,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3602,
    "uncertainty_score": 0.4,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3603,
    "uncertainty_score": 0.25013821657328167,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3604,
    "uncertainty_score": 0.7500087472423421,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3605,
    "uncertainty_score": 0.0007989350728763278,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3606,
    "uncertainty_score": 0.2500000034144135,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3607,
    "uncertainty_score": 6.217117478367335e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3608,
    "uncertainty_score": 1.5970297827031294e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3609,
    "uncertainty_score": 0.0019927818555544098,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3610,
    "uncertainty_score": 0.3333332911752845,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3611,
    "uncertainty_score": 0.5000000002143147,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3612,
    "uncertainty_score": 4.4472726014378124e-11,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3613,
    "uncertainty_score": 1.4361151447203802e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3614,
    "uncertainty_score": 0.31622264539184064,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3615,
    "uncertainty_score": 0.00023403012125505318,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3616,
    "uncertainty_score": 0.1999271031085622,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3617,
    "uncertainty_score": 0.6000000793796201,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3618,
    "uncertainty_score": 0.1483226874703603,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3619,
    "uncertainty_score": 0.2500002327563454,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3620,
    "uncertainty_score": 0.20000003318225495,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3621,
    "uncertainty_score": 1.6794246706879937e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 3622,
    "uncertainty_score": 0.5180728685789328,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3623,
    "uncertainty_score": 0.2500200878727341,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3624,
    "uncertainty_score": 0.2500761718163618,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3625,
    "uncertainty_score": 0.166666687045099,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3626,
    "uncertainty_score": 0.20000004352699524,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3627,
    "uncertainty_score": 3.26180800488162e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3628,
    "uncertainty_score": 0.797242759367865,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3629,
    "uncertainty_score": 0.0003016517428602114,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3630,
    "uncertainty_score": 0.005124331082754019,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3631,
    "uncertainty_score": 0.8393652403220171,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3632,
    "uncertainty_score": 0.16666872520896456,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3633,
    "uncertainty_score": 0.20195858594166277,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3634,
    "uncertainty_score": 3.2485610197665435e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3635,
    "uncertainty_score": 0.39999663211615066,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3636,
    "uncertainty_score": 0.20000096218878238,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3637,
    "uncertainty_score": 0.25000000127923255,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3638,
    "uncertainty_score": 0.0006945685558441031,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3639,
    "uncertainty_score": 0.5000959902134892,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3640,
    "uncertainty_score": 0.40077760164243215,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3641,
    "uncertainty_score": 0.27550384393222693,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3642,
    "uncertainty_score": 0.0015086930882570486,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3643,
    "uncertainty_score": 1.178039064310693e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3644,
    "uncertainty_score": 0.49999999975000026,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3645,
    "uncertainty_score": 0.3415017656550124,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3646,
    "uncertainty_score": 0.2499999997609613,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3647,
    "uncertainty_score": 0.1999997227541008,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3648,
    "uncertainty_score": 0.7998995549715697,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3649,
    "uncertainty_score": 2.0452523014436321e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3650,
    "uncertainty_score": 0.33342417371420835,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3651,
    "uncertainty_score": 3.5924507684042325e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3652,
    "uncertainty_score": 0.2503701904551259,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3653,
    "uncertainty_score": 5.7037470075260905e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3654,
    "uncertainty_score": 0.2500000010212772,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3655,
    "uncertainty_score": 0.40002539404604986,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3656,
    "uncertainty_score": 0.20275552551323478,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3657,
    "uncertainty_score": 0.2533491397952689,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3658,
    "uncertainty_score": 1.4133012477820188e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3659,
    "uncertainty_score": 0.7500600774815533,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3660,
    "uncertainty_score": 0.0037791320635269035,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3661,
    "uncertainty_score": 0.3332139296106717,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3662,
    "uncertainty_score": 0.4009315205353169,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3663,
    "uncertainty_score": 1.2460311740291693e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3664,
    "uncertainty_score": 0.4000000002387081,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3665,
    "uncertainty_score": 0.37569116037577227,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3666,
    "uncertainty_score": 0.6666666194676215,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3667,
    "uncertainty_score": 0.6,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3668,
    "uncertainty_score": 0.33333334181842994,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3669,
    "uncertainty_score": 0.25035258985658987,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3670,
    "uncertainty_score": 0.8062287662572292,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3671,
    "uncertainty_score": 0.20000008809824657,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3672,
    "uncertainty_score": 0.25000001964079716,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3673,
    "uncertainty_score": 0.4000017147708766,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3674,
    "uncertainty_score": 0.999995994667356,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3675,
    "uncertainty_score": 4.379290226377104e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3676,
    "uncertainty_score": 0.16631755093589054,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3677,
    "uncertainty_score": 0.19831477954662463,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3678,
    "uncertainty_score": 4.052469868725923e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 3679,
    "uncertainty_score": 0.005629945862780135,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3680,
    "uncertainty_score": 0.20000320404051836,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3681,
    "uncertainty_score": 0.3333333333334367,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3682,
    "uncertainty_score": 6.4140587595313765e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3683,
    "uncertainty_score": 0.20000884621123896,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3684,
    "uncertainty_score": 0.4000320556571347,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3685,
    "uncertainty_score": 0.4000020089665287,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3686,
    "uncertainty_score": 0.00026777499601616394,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3687,
    "uncertainty_score": 9.112657768324554e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3688,
    "uncertainty_score": 0.3999958427668165,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3689,
    "uncertainty_score": 0.33333313237712686,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3690,
    "uncertainty_score": 0.39999999981813883,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3691,
    "uncertainty_score": 0.1666690606922513,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3692,
    "uncertainty_score": 7.697542725628381e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3693,
    "uncertainty_score": 0.33333333299999995,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3694,
    "uncertainty_score": 0.20000068319912997,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3695,
    "uncertainty_score": 7.130793749181201e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3696,
    "uncertainty_score": 0.2928257549897061,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3697,
    "uncertainty_score": 0.5000094582798076,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3698,
    "uncertainty_score": 0.13480073731171952,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 3699,
    "uncertainty_score": 0.20000214529449462,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3700,
    "uncertainty_score": 0.7496438251963338,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3701,
    "uncertainty_score": 2.4441780436268845e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3702,
    "uncertainty_score": 4.563097758017013e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3703,
    "uncertainty_score": 0.49861584905429035,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3704,
    "uncertainty_score": 0.5000000454286536,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3705,
    "uncertainty_score": 0.2500767706863661,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3706,
    "uncertainty_score": 0.59999949309643,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3707,
    "uncertainty_score": 0.3333333333333333,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3708,
    "uncertainty_score": 0.4000019154238627,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3709,
    "uncertainty_score": 0.2500027820472659,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3710,
    "uncertainty_score": 0.00012924485576216757,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3711,
    "uncertainty_score": 0.20004562488898792,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3712,
    "uncertainty_score": 9.828003299549871e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3713,
    "uncertainty_score": 0.00014052532021176047,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3714,
    "uncertainty_score": 6.41130428112405e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3715,
    "uncertainty_score": 0.00657520074370795,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3716,
    "uncertainty_score": 0.0032718792069462697,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3717,
    "uncertainty_score": 0.38744424061091653,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3718,
    "uncertainty_score": 2.3061547459733163e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3719,
    "uncertainty_score": 0.3333333388128787,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3720,
    "uncertainty_score": 0.2500000001137852,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3721,
    "uncertainty_score": 0.14285714272476563,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3722,
    "uncertainty_score": 0.7511055740874422,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3723,
    "uncertainty_score": 0.2526631276788437,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3724,
    "uncertainty_score": 2.2378911779993075e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3725,
    "uncertainty_score": 0.2500504583309755,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3726,
    "uncertainty_score": 3.704697714326449e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3727,
    "uncertainty_score": 0.2500000018639887,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3728,
    "uncertainty_score": 0.25056296373974807,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3729,
    "uncertainty_score": 7.565948915185495e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3730,
    "uncertainty_score": 0.25000006541391545,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3731,
    "uncertainty_score": 0.20002703844311925,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3732,
    "uncertainty_score": 0.012214445291897635,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3733,
    "uncertainty_score": 2.048342974660497e-12,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3734,
    "uncertainty_score": 4.7380970445332935e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3735,
    "uncertainty_score": 0.2000000000910278,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3736,
    "uncertainty_score": 0.00015579620664520457,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3737,
    "uncertainty_score": 0.2508981721333675,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3738,
    "uncertainty_score": 3.179030558669512e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3739,
    "uncertainty_score": 0.7153223528789979,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3740,
    "uncertainty_score": 1.9074808014546262e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3741,
    "uncertainty_score": 1.5778690074105535e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3742,
    "uncertainty_score": 0.6666667008216086,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3743,
    "uncertainty_score": 0.1666668062979385,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3744,
    "uncertainty_score": 0.8584114213656949,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3745,
    "uncertainty_score": 0.19746916551203514,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3746,
    "uncertainty_score": 0.3848292943992179,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 3747,
    "uncertainty_score": 0.16666833792550195,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3748,
    "uncertainty_score": 2.0068544753559397e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3749,
    "uncertainty_score": 0.2522804392122208,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3750,
    "uncertainty_score": 0.43990556581762835,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3751,
    "uncertainty_score": 0.39999664982709904,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3752,
    "uncertainty_score": 2.072110712774744e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3753,
    "uncertainty_score": 0.012836014805157735,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3754,
    "uncertainty_score": 0.4999770920170601,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3755,
    "uncertainty_score": 4.07095530945845e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3756,
    "uncertainty_score": 0.009444245476523744,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3757,
    "uncertainty_score": 0.03690902462696909,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3758,
    "uncertainty_score": 1.924166129359492e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3759,
    "uncertainty_score": 5.8894415154636473e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3760,
    "uncertainty_score": 0.5000049325722766,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3761,
    "uncertainty_score": 4.397576620169034e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3762,
    "uncertainty_score": 0.25000001874114636,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3763,
    "uncertainty_score": 0.2000000002848727,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3764,
    "uncertainty_score": 0.25703715161042695,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3765,
    "uncertainty_score": 0.004163362104308973,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3766,
    "uncertainty_score": 0.40000873548901666,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3767,
    "uncertainty_score": 0.4092455054127906,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3768,
    "uncertainty_score": 0.14295211739975697,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3769,
    "uncertainty_score": 2.456577333828327e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3770,
    "uncertainty_score": 6.804660859004357e-14,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3771,
    "uncertainty_score": 0.3333333340191029,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3772,
    "uncertainty_score": 1.2549829859913282e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3773,
    "uncertainty_score": 6.153419070709597e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3774,
    "uncertainty_score": 0.2500038984313174,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3775,
    "uncertainty_score": 0.25004064274423793,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3776,
    "uncertainty_score": 0.33365990299903414,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3777,
    "uncertainty_score": 2.7610965317013004e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3778,
    "uncertainty_score": 0.6000010732088754,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3779,
    "uncertainty_score": 0.0032719063675032915,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3780,
    "uncertainty_score": 0.5999791105668039,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3781,
    "uncertainty_score": 0.37969485751928617,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3782,
    "uncertainty_score": 0.02409559444560311,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3783,
    "uncertainty_score": 0.33333335259593017,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3784,
    "uncertainty_score": 1.0226722020713284e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3785,
    "uncertainty_score": 0.19995280888910466,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3786,
    "uncertainty_score": 0.2072488714916076,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3787,
    "uncertainty_score": 0.2000073740453392,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3788,
    "uncertainty_score": 0.39630013316371393,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3789,
    "uncertainty_score": 0.5527845155958717,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3790,
    "uncertainty_score": 0.04720209779490119,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3791,
    "uncertainty_score": 0.20000029231028899,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3792,
    "uncertainty_score": 4.382977415721395e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3793,
    "uncertainty_score": 1.860143518939881e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3794,
    "uncertainty_score": 0.600000000334705,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3795,
    "uncertainty_score": 0.40001696230805217,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3796,
    "uncertainty_score": 0.6001231239914974,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3797,
    "uncertainty_score": 2.648121878087894e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3798,
    "uncertainty_score": 0.40004806982010005,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3799,
    "uncertainty_score": 0.3695944682165964,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3800,
    "uncertainty_score": 0.3333336981638914,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3801,
    "uncertainty_score": 3.572352018749234e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3802,
    "uncertainty_score": 0.0006153342813801206,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3803,
    "uncertainty_score": 6.402322806443672e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3804,
    "uncertainty_score": 0.4056299038763491,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3805,
    "uncertainty_score": 7.880560425286379e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3806,
    "uncertainty_score": 0.2858816589125837,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3807,
    "uncertainty_score": 2.711534967716485e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3808,
    "uncertainty_score": 0.19983003347801473,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3809,
    "uncertainty_score": 0.33333407150885264,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 3810,
    "uncertainty_score": 0.6666141588720348,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3811,
    "uncertainty_score": 0.16669124399711702,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3812,
    "uncertainty_score": 3.216104154714625e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3813,
    "uncertainty_score": 2.2003274207905455e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3814,
    "uncertainty_score": 7.7971554782654e-11,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3815,
    "uncertainty_score": 0.2000022948926766,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3816,
    "uncertainty_score": 0.6666660147104658,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3817,
    "uncertainty_score": 1.7074372673268408e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3818,
    "uncertainty_score": 0.5004788189803315,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3819,
    "uncertainty_score": 0.19999644503944083,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3820,
    "uncertainty_score": 0.6669877837138168,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3821,
    "uncertainty_score": 1.1533375114429291e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3822,
    "uncertainty_score": 0.20003406077304103,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3823,
    "uncertainty_score": 0.25000005877521264,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3824,
    "uncertainty_score": 8.979300709398494e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3825,
    "uncertainty_score": 0.500004684373984,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3826,
    "uncertainty_score": 0.7500000651628947,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3827,
    "uncertainty_score": 0.4992225363115999,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3828,
    "uncertainty_score": 0.024115087216698868,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3829,
    "uncertainty_score": 0.2000000582066713,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3830,
    "uncertainty_score": 0.6000000000132512,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3831,
    "uncertainty_score": 0.0001888514176443646,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3832,
    "uncertainty_score": 0.5005347322976605,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3833,
    "uncertainty_score": 0.4000003385662074,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3834,
    "uncertainty_score": 0.395450503647877,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3835,
    "uncertainty_score": 0.00035263747301642095,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3836,
    "uncertainty_score": 0.001291582773515593,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3837,
    "uncertainty_score": 0.2041543021067239,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3838,
    "uncertainty_score": 7.947580429558177e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3839,
    "uncertainty_score": 0.33350824579875965,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3840,
    "uncertainty_score": 0.7499991819978,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3841,
    "uncertainty_score": 1.968434671388086e-10,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3842,
    "uncertainty_score": 0.500000000617451,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3843,
    "uncertainty_score": 0.250000417137926,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3844,
    "uncertainty_score": 0.5603180954951952,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3845,
    "uncertainty_score": 9.636017732147308e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3846,
    "uncertainty_score": 0.2500000000011596,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3847,
    "uncertainty_score": 3.946167515696549e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3848,
    "uncertainty_score": 0.00024047702276897278,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3849,
    "uncertainty_score": 1.3072434820204892e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3850,
    "uncertainty_score": 0.6000000611804468,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3851,
    "uncertainty_score": 0.749999999219858,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3852,
    "uncertainty_score": 0.0002380006058042916,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3853,
    "uncertainty_score": 2.9665129289589482e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3854,
    "uncertainty_score": 0.2505940745414682,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 3855,
    "uncertainty_score": 0.9006716382341543,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3856,
    "uncertainty_score": 1.5184514162880132e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3857,
    "uncertainty_score": 0.0004461489414801232,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3858,
    "uncertainty_score": 2.7692176325859597e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3859,
    "uncertainty_score": 0.25000937847056093,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3860,
    "uncertainty_score": 0.8000066428386046,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3861,
    "uncertainty_score": 6.13967683846332e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3862,
    "uncertainty_score": 0.12825463317161367,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3863,
    "uncertainty_score": 1.7041970244702578e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3864,
    "uncertainty_score": 0.2500002617105055,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3865,
    "uncertainty_score": 0.24999999974999493,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3866,
    "uncertainty_score": 0.1999374949042028,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3867,
    "uncertainty_score": 0.5999999998,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3868,
    "uncertainty_score": 0.2000385158792289,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3869,
    "uncertainty_score": 0.4000001378282828,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3870,
    "uncertainty_score": 0.60264750118325,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3871,
    "uncertainty_score": 8.357532933293909e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3872,
    "uncertainty_score": 0.05296424127440058,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3873,
    "uncertainty_score": 1.397854446725879e-14,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3874,
    "uncertainty_score": 0.00042756304199630503,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3875,
    "uncertainty_score": 0.4999999962548047,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3876,
    "uncertainty_score": 0.3333333327700497,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3877,
    "uncertainty_score": 0.250079693149252,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3878,
    "uncertainty_score": 0.33524341559835347,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3879,
    "uncertainty_score": 0.22212487960048058,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3880,
    "uncertainty_score": 0.39999999990926643,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3881,
    "uncertainty_score": 0.5000000000083958,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3882,
    "uncertainty_score": 3.110352678373312e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 3883,
    "uncertainty_score": 0.3333334070112289,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3884,
    "uncertainty_score": 0.3338743750651016,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3885,
    "uncertainty_score": 0.16666077742369007,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3886,
    "uncertainty_score": 0.26117105924199957,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3887,
    "uncertainty_score": 0.49999359988160896,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3888,
    "uncertainty_score": 0.16674998540685784,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3889,
    "uncertainty_score": 0.00010933045185986537,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3890,
    "uncertainty_score": 4.9673356927822985e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3891,
    "uncertainty_score": 0.500019272015848,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3892,
    "uncertainty_score": 0.07706631434112642,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3893,
    "uncertainty_score": 1.1024614406579719e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3894,
    "uncertainty_score": 0.7497343908757215,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3895,
    "uncertainty_score": 0.2003641240690696,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3896,
    "uncertainty_score": 0.5001483133407661,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3897,
    "uncertainty_score": 0.6666679752960296,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3898,
    "uncertainty_score": 0.250101123005674,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3899,
    "uncertainty_score": 0.00045893892842527805,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3900,
    "uncertainty_score": 0.40000000000747205,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3901,
    "uncertainty_score": 0.7999999768620272,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3902,
    "uncertainty_score": 6.79704640930955e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3903,
    "uncertainty_score": 0.6010882102669546,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3904,
    "uncertainty_score": 0.200000001997325,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 3905,
    "uncertainty_score": 0.20001473937556075,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3906,
    "uncertainty_score": 0.2500181357688884,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3907,
    "uncertainty_score": 0.8000043767154965,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3908,
    "uncertainty_score": 2.0778001810415726e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3909,
    "uncertainty_score": 0.20000000018603328,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3910,
    "uncertainty_score": 0.5714285714287107,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3911,
    "uncertainty_score": 0.3999995570727508,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3912,
    "uncertainty_score": 4.120698839679548e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3913,
    "uncertainty_score": 0.4670868899474611,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3914,
    "uncertainty_score": 2.775362982641712e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 3915,
    "uncertainty_score": 1.0,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3916,
    "uncertainty_score": 0.028990204435469007,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3917,
    "uncertainty_score": 5.719350289594789e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3918,
    "uncertainty_score": 0.25000677242034675,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3919,
    "uncertainty_score": 0.002543294089900703,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3920,
    "uncertainty_score": 0.40019597879251184,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3921,
    "uncertainty_score": 4.846075934092185e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3922,
    "uncertainty_score": 8.825930834200503e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3923,
    "uncertainty_score": 1.0,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3924,
    "uncertainty_score": 0.4000000144895319,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3925,
    "uncertainty_score": 0.20026783010369648,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3926,
    "uncertainty_score": 3.1598937054934084e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3927,
    "uncertainty_score": 0.20115401248684148,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3928,
    "uncertainty_score": 1.2835497528678109e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3929,
    "uncertainty_score": 3.2749591636517325e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3930,
    "uncertainty_score": 0.40000008364006645,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3931,
    "uncertainty_score": 0.39564271458551226,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3932,
    "uncertainty_score": 1.445934556597356e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3933,
    "uncertainty_score": 3.2912899690881163e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 3934,
    "uncertainty_score": 0.6000161048679088,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 3935,
    "uncertainty_score": 0.33926773003373883,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3936,
    "uncertainty_score": 0.3999999994440426,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3937,
    "uncertainty_score": 0.012047788043912362,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3938,
    "uncertainty_score": 0.6614706143728294,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3939,
    "uncertainty_score": 2.6493068721295365e-16,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3940,
    "uncertainty_score": 0.18540021561410042,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3941,
    "uncertainty_score": 0.4285714284420187,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3942,
    "uncertainty_score": 0.0,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3943,
    "uncertainty_score": 3.413689022755419e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3944,
    "uncertainty_score": 0.002374713981711001,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3945,
    "uncertainty_score": 0.20017726215360115,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3946,
    "uncertainty_score": 0.2500004731280506,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3947,
    "uncertainty_score": 3.090578022909909e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3948,
    "uncertainty_score": 0.4289016397926401,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3949,
    "uncertainty_score": 5.285839978842176e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3950,
    "uncertainty_score": 0.003943825574295007,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3951,
    "uncertainty_score": 5.197975343352316e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 3952,
    "uncertainty_score": 0.19999997830446845,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3953,
    "uncertainty_score": 2.9301837698668156e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3954,
    "uncertainty_score": 0.7499993496819124,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3955,
    "uncertainty_score": 1.842008145807487e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3956,
    "uncertainty_score": 0.16667610902514474,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3957,
    "uncertainty_score": 0.6310282413697457,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3958,
    "uncertainty_score": 1.663833397912832e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3959,
    "uncertainty_score": 2.5293885772441042e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3960,
    "uncertainty_score": 1.07041577371539e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3961,
    "uncertainty_score": 8.157685820641933e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3962,
    "uncertainty_score": 7.891860211956977e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3963,
    "uncertainty_score": 1.0,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3964,
    "uncertainty_score": 0.22428289914034769,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3965,
    "uncertainty_score": 0.1999856038868373,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3966,
    "uncertainty_score": 3.379257513569346e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3967,
    "uncertainty_score": 0.0008098102188715358,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3968,
    "uncertainty_score": 0.0009485593836302014,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3969,
    "uncertainty_score": 0.2504359682396324,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3970,
    "uncertainty_score": 0.018071745815459252,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3971,
    "uncertainty_score": 0.500000000000005,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3972,
    "uncertainty_score": 0.7501065239433049,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3973,
    "uncertainty_score": 3.4648339986134316e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3974,
    "uncertainty_score": 0.3572441604244772,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3975,
    "uncertainty_score": 0.2000000004122307,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3976,
    "uncertainty_score": 0.16666669157444566,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3977,
    "uncertainty_score": 0.38382336372135306,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3978,
    "uncertainty_score": 0.40224319856377877,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3979,
    "uncertainty_score": 0.2897173627400747,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3980,
    "uncertainty_score": 0.800003745616895,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3981,
    "uncertainty_score": 1.0355251525903741e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 3982,
    "uncertainty_score": 4.648872918454241e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3983,
    "uncertainty_score": 0.33333357905241545,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3984,
    "uncertainty_score": 2.897983744326131e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3985,
    "uncertainty_score": 0.36505372378674805,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3986,
    "uncertainty_score": 2.630242790038612e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3987,
    "uncertainty_score": 1.3036168711782622e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3988,
    "uncertainty_score": 0.3999999992232971,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3989,
    "uncertainty_score": 0.40000048305612373,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3990,
    "uncertainty_score": 2.3534306825399424e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 3991,
    "uncertainty_score": 0.16666631666748963,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3992,
    "uncertainty_score": 0.4739194733517028,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3993,
    "uncertainty_score": 9.742871344728015e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 3994,
    "uncertainty_score": 0.3333333375504517,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3995,
    "uncertainty_score": 0.7499997853792868,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3996,
    "uncertainty_score": 5.542095962711898e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3997,
    "uncertainty_score": 0.33333403379336546,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 3998,
    "uncertainty_score": 0.01078698172612099,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 3999,
    "uncertainty_score": 0.2500000023148977,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4000,
    "uncertainty_score": 0.25344868392175834,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4001,
    "uncertainty_score": 0.00591062223027178,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4002,
    "uncertainty_score": 1.2739017071969525e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4003,
    "uncertainty_score": 0.39983234999503103,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4004,
    "uncertainty_score": 0.05420159346312038,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4005,
    "uncertainty_score": 1.8686504804870591e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4006,
    "uncertainty_score": 8.647457416248791e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4007,
    "uncertainty_score": 1.7353906412670244e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4008,
    "uncertainty_score": 1.2232226112879633e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4009,
    "uncertainty_score": 0.0,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4010,
    "uncertainty_score": 0.2000013948143108,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4011,
    "uncertainty_score": 0.49999652999905475,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4012,
    "uncertainty_score": 5.454247539866857e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4013,
    "uncertainty_score": 0.25001022584469496,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4014,
    "uncertainty_score": 0.7499999544821512,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4015,
    "uncertainty_score": 0.21190023701703514,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4016,
    "uncertainty_score": 0.20202346717981762,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4017,
    "uncertainty_score": 0.3990522707584935,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4018,
    "uncertainty_score": 7.109434172242988e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4019,
    "uncertainty_score": 0.15522929717015313,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4020,
    "uncertainty_score": 0.45238157394374745,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4021,
    "uncertainty_score": 0.20001999045036994,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4022,
    "uncertainty_score": 0.24999999977632598,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4023,
    "uncertainty_score": 0.33333333300006135,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4024,
    "uncertainty_score": 0.33340939041462486,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4025,
    "uncertainty_score": 0.00014557911314217018,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4026,
    "uncertainty_score": 0.07211418905069192,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4027,
    "uncertainty_score": 0.33334621039445717,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4028,
    "uncertainty_score": 7.278573965933021e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4029,
    "uncertainty_score": 1.4719390333003113e-12,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4030,
    "uncertainty_score": 0.001790684733596776,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4031,
    "uncertainty_score": 1.2841114235692802e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4032,
    "uncertainty_score": 0.33324519152630877,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4033,
    "uncertainty_score": 1.0760810682487738e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4034,
    "uncertainty_score": 1.0,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4035,
    "uncertainty_score": 0.20000062181935446,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4036,
    "uncertainty_score": 0.5999820723613576,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4037,
    "uncertainty_score": 0.75,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4038,
    "uncertainty_score": 1.9941725305818394e-10,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 4039,
    "uncertainty_score": 9.399505854290609e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4040,
    "uncertainty_score": 0.25000000434271524,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4041,
    "uncertainty_score": 0.20000609599803393,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4042,
    "uncertainty_score": 0.20416630434681232,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4043,
    "uncertainty_score": 6.066018626472728e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4044,
    "uncertainty_score": 1.321197954155124e-10,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4045,
    "uncertainty_score": 0.5,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4046,
    "uncertainty_score": 2.2585530127373532e-10,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4047,
    "uncertainty_score": 0.3992590989526691,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4048,
    "uncertainty_score": 0.26508076322780794,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4049,
    "uncertainty_score": 0.199956774453353,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4050,
    "uncertainty_score": 8.713760766474232e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4051,
    "uncertainty_score": 0.626597342636344,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4052,
    "uncertainty_score": 0.16666678141411304,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4053,
    "uncertainty_score": 0.4000124101144588,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4054,
    "uncertainty_score": 0.22879768160879266,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4055,
    "uncertainty_score": 0.33333336748814496,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4056,
    "uncertainty_score": 1.552615638423083e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4057,
    "uncertainty_score": 0.05851636908822265,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4058,
    "uncertainty_score": 0.2092987503532091,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4059,
    "uncertainty_score": 2.568690272999615e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4060,
    "uncertainty_score": 0.20002710425832135,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4061,
    "uncertainty_score": 0.18003572915065624,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4062,
    "uncertainty_score": 3.3382885441497954e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4063,
    "uncertainty_score": 1.1349467477916889e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4064,
    "uncertainty_score": 0.19997473498118604,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4065,
    "uncertainty_score": 0.3333333333345952,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4066,
    "uncertainty_score": 0.2500337884111727,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4067,
    "uncertainty_score": 0.19999999642696456,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4068,
    "uncertainty_score": 0.7500000137113673,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4069,
    "uncertainty_score": 0.333333333,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4070,
    "uncertainty_score": 0.19992321921936546,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 4071,
    "uncertainty_score": 3.183633753977348e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4072,
    "uncertainty_score": 0.8565111050136743,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4073,
    "uncertainty_score": 0.6000000000119402,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4074,
    "uncertainty_score": 0.2500000007126855,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4075,
    "uncertainty_score": 0.36525288416507107,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4076,
    "uncertainty_score": 6.538152138746849e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4077,
    "uncertainty_score": 8.581276927402777e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4078,
    "uncertainty_score": 0.3333335530492891,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4079,
    "uncertainty_score": 0.2478537398655832,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4080,
    "uncertainty_score": 0.28850245488653375,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4081,
    "uncertainty_score": 6.870511546046358e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4082,
    "uncertainty_score": 2.80647874582056e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4083,
    "uncertainty_score": 2.9734385785583647e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4084,
    "uncertainty_score": 5.613934696349348e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4085,
    "uncertainty_score": 0.20000015623377893,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4086,
    "uncertainty_score": 0.20079186985496184,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4087,
    "uncertainty_score": 0.5018478057772301,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4088,
    "uncertainty_score": 0.1428944767775196,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4089,
    "uncertainty_score": 0.41026718342211277,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4090,
    "uncertainty_score": 0.5000016522326347,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4091,
    "uncertainty_score": 6.980353160598616e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4092,
    "uncertainty_score": 0.0033133453508365548,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4093,
    "uncertainty_score": 0.08962115063696399,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4094,
    "uncertainty_score": 0.28578895494688894,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4095,
    "uncertainty_score": 0.20326168631762825,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4096,
    "uncertainty_score": 0.7499999981841649,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4097,
    "uncertainty_score": 0.1302924075324408,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4098,
    "uncertainty_score": 0.3999999998,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4099,
    "uncertainty_score": 0.0011886235501043147,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4100,
    "uncertainty_score": 0.19998830189815345,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4101,
    "uncertainty_score": 0.3333333333333333,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4102,
    "uncertainty_score": 0.40001756912196385,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4103,
    "uncertainty_score": 0.1666666664904045,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4104,
    "uncertainty_score": 8.36649898426724e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4105,
    "uncertainty_score": 0.2000000009241481,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4106,
    "uncertainty_score": 4.632853085817758e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4107,
    "uncertainty_score": 0.11764764923857515,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4108,
    "uncertainty_score": 1.8873296222852306e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4109,
    "uncertainty_score": 2.4915322449288773e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4110,
    "uncertainty_score": 0.24999968808623918,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4111,
    "uncertainty_score": 0.20000020270282493,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4112,
    "uncertainty_score": 5.61885736944974e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4113,
    "uncertainty_score": 0.1781456760939071,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4114,
    "uncertainty_score": 0.2696452217612608,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4115,
    "uncertainty_score": 0.2000000003082083,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4116,
    "uncertainty_score": 0.2500139800252499,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4117,
    "uncertainty_score": 0.0002520773160399928,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4118,
    "uncertainty_score": 0.20038619828602866,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4119,
    "uncertainty_score": 0.5782544761329491,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4120,
    "uncertainty_score": 5.2076035754569925e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4121,
    "uncertainty_score": 0.0007384559102099262,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4122,
    "uncertainty_score": 3.8236264878769835e-11,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4123,
    "uncertainty_score": 0.24999975946347613,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4124,
    "uncertainty_score": 0.25000108897459,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4125,
    "uncertainty_score": 0.500000000000011,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4126,
    "uncertainty_score": 0.2500034259013273,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4127,
    "uncertainty_score": 0.0007357655882549045,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4128,
    "uncertainty_score": 0.23123369162913837,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4129,
    "uncertainty_score": 0.01669934736040104,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4130,
    "uncertainty_score": 0.003987102213438733,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4131,
    "uncertainty_score": 3.168725443361464e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4132,
    "uncertainty_score": 5.40370161949257e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4133,
    "uncertainty_score": 0.08333670798114871,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4134,
    "uncertainty_score": 0.24999939215956793,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4135,
    "uncertainty_score": 1.8174058279638358e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4136,
    "uncertainty_score": 0.600000006036556,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4137,
    "uncertainty_score": 7.03352792902352e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4138,
    "uncertainty_score": 0.02117257471441243,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4139,
    "uncertainty_score": 0.02918794897361573,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4140,
    "uncertainty_score": 2.33276029252246e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4141,
    "uncertainty_score": 0.20000002274282033,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4142,
    "uncertainty_score": 0.5983539324125948,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4143,
    "uncertainty_score": 0.47593694383156554,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4144,
    "uncertainty_score": 0.6794964330172587,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4145,
    "uncertainty_score": 0.49999994500556894,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4146,
    "uncertainty_score": 0.20000125470762836,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4147,
    "uncertainty_score": 2.0526077320757905e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4148,
    "uncertainty_score": 1.0086008394785577e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4149,
    "uncertainty_score": 0.2500000838821568,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4150,
    "uncertainty_score": 0.4050871452151572,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4151,
    "uncertainty_score": 1.4844811444334363e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4152,
    "uncertainty_score": 0.25000165198263546,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4153,
    "uncertainty_score": 2.3815899111093292e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4154,
    "uncertainty_score": 7.084580753530571e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4155,
    "uncertainty_score": 1.4510098202906558e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4156,
    "uncertainty_score": 0.20655088626431625,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4157,
    "uncertainty_score": 6.742148955563533e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4158,
    "uncertainty_score": 0.25000105800936323,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4159,
    "uncertainty_score": 0.00027261416397191863,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4160,
    "uncertainty_score": 0.21077971459659853,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4161,
    "uncertainty_score": 0.5558057607015251,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4162,
    "uncertainty_score": 1.1594470135138896e-10,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4163,
    "uncertainty_score": 1.5375012519066642e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4164,
    "uncertainty_score": 0.3333315049610393,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4165,
    "uncertainty_score": 0.08036880421512953,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4166,
    "uncertainty_score": 0.2500001428908033,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4167,
    "uncertainty_score": 0.39872886840634875,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4168,
    "uncertainty_score": 3.1687284357373026e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4169,
    "uncertainty_score": 0.20000017103805795,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4170,
    "uncertainty_score": 0.8000076900705226,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4171,
    "uncertainty_score": 0.2500049326099491,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4172,
    "uncertainty_score": 0.5000000001080103,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4173,
    "uncertainty_score": 6.92839988951339e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4174,
    "uncertainty_score": 0.20000026358736536,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4175,
    "uncertainty_score": 0.49999999983334487,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4176,
    "uncertainty_score": 1.0,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4177,
    "uncertainty_score": 0.24998527439321885,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4178,
    "uncertainty_score": 6.543345096640063e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4179,
    "uncertainty_score": 0.25004173210182257,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4180,
    "uncertainty_score": 0.25,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4181,
    "uncertainty_score": 2.6899130730354763e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4182,
    "uncertainty_score": 0.5070373798200046,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4183,
    "uncertainty_score": 0.5000000000065699,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4184,
    "uncertainty_score": 0.23010220967818162,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4185,
    "uncertainty_score": 0.714285714145117,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4186,
    "uncertainty_score": 0.5203617734723158,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4187,
    "uncertainty_score": 1.508285016699136e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4188,
    "uncertainty_score": 0.20000000232221712,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4189,
    "uncertainty_score": 0.6253096264934507,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4190,
    "uncertainty_score": 0.20000000048423933,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4191,
    "uncertainty_score": 2.452549152234974e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4192,
    "uncertainty_score": 0.0030418869786502383,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4193,
    "uncertainty_score": 0.6666666608612682,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4194,
    "uncertainty_score": 7.45007714377405e-11,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4195,
    "uncertainty_score": 0.38095172264188093,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4196,
    "uncertainty_score": 0.5999962508571385,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4197,
    "uncertainty_score": 0.06574254571496876,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4198,
    "uncertainty_score": 0.37598106760939,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4199,
    "uncertainty_score": 0.2499992516970936,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4200,
    "uncertainty_score": 1.719325140392619e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4201,
    "uncertainty_score": 0.7499997163045442,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4202,
    "uncertainty_score": 0.030622667113208612,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4203,
    "uncertainty_score": 0.40460546408662595,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4204,
    "uncertainty_score": 0.2006902005212689,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4205,
    "uncertainty_score": 0.3996522457455768,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4206,
    "uncertainty_score": 0.20002236020601322,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4207,
    "uncertainty_score": 0.24999251758544136,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4208,
    "uncertainty_score": 0.5003016487640174,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4209,
    "uncertainty_score": 0.20000030747986983,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4210,
    "uncertainty_score": 0.4000001030118606,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4211,
    "uncertainty_score": 1.5810516413546902e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4212,
    "uncertainty_score": 0.33333291413948046,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4213,
    "uncertainty_score": 0.6662996928163057,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4214,
    "uncertainty_score": 0.6666705055773233,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4215,
    "uncertainty_score": 0.2211635396357335,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4216,
    "uncertainty_score": 1.502203111242051e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4217,
    "uncertainty_score": 0.12500041297801204,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4218,
    "uncertainty_score": 0.25043411701578294,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4219,
    "uncertainty_score": 0.20000008370064223,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4220,
    "uncertainty_score": 4.655194143289546e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4221,
    "uncertainty_score": 0.002949496733220177,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4222,
    "uncertainty_score": 0.7500000000000044,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4223,
    "uncertainty_score": 0.19694663819898944,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 4224,
    "uncertainty_score": 0.07127139288682802,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4225,
    "uncertainty_score": 0.4142705786757559,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4226,
    "uncertainty_score": 0.002407148143907674,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4227,
    "uncertainty_score": 0.310117188907459,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4228,
    "uncertainty_score": 0.25205770490608226,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4229,
    "uncertainty_score": 0.20000591197547787,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4230,
    "uncertainty_score": 0.25000000001036543,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4231,
    "uncertainty_score": 0.00011821454876281448,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4232,
    "uncertainty_score": 0.25009043844809337,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4233,
    "uncertainty_score": 0.5000001123603377,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4234,
    "uncertainty_score": 1.8257521501815105e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4235,
    "uncertainty_score": 8.245909752894347e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4236,
    "uncertainty_score": 2.7509919960690675e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4237,
    "uncertainty_score": 4.139650594745557e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4238,
    "uncertainty_score": 0.20000015461651385,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4239,
    "uncertainty_score": 2.337245470063965e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4240,
    "uncertainty_score": 0.3391548298994325,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4241,
    "uncertainty_score": 0.20204133663822682,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4242,
    "uncertainty_score": 0.33769774113325496,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4243,
    "uncertainty_score": 0.16667423412412233,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4244,
    "uncertainty_score": 0.20002200744086687,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4245,
    "uncertainty_score": 0.02664081080766534,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4246,
    "uncertainty_score": 0.06044563982127607,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4247,
    "uncertainty_score": 1.3255000227901282e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4248,
    "uncertainty_score": 0.0003412827515382153,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4249,
    "uncertainty_score": 2.532513076070309e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4250,
    "uncertainty_score": 2.6339568372236608e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4251,
    "uncertainty_score": 0.0005675045088311048,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4252,
    "uncertainty_score": 0.0005263347839634008,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4253,
    "uncertainty_score": 7.05203867465325e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4254,
    "uncertainty_score": 0.4997010794536232,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4255,
    "uncertainty_score": 1.6888299615342164e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4256,
    "uncertainty_score": 0.2001368745962584,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4257,
    "uncertainty_score": 0.20005210597282636,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4258,
    "uncertainty_score": 7.490616831605704e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4259,
    "uncertainty_score": 2.258360243326806e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4260,
    "uncertainty_score": 0.49999999975,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4261,
    "uncertainty_score": 0.020828349807266493,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4262,
    "uncertainty_score": 0.3998232427486256,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4263,
    "uncertainty_score": 0.25002750939452834,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4264,
    "uncertainty_score": 0.24454002998037763,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4265,
    "uncertainty_score": 7.287963322113661e-10,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 4266,
    "uncertainty_score": 3.684054028926475e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4267,
    "uncertainty_score": 0.25000400510751436,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4268,
    "uncertainty_score": 0.2500051884495953,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4269,
    "uncertainty_score": 0.25003960905875694,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4270,
    "uncertainty_score": 0.3333401482220135,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4271,
    "uncertainty_score": 0.004835248273528697,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4272,
    "uncertainty_score": 0.017977416562151276,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4273,
    "uncertainty_score": 0.40017648212962503,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4274,
    "uncertainty_score": 1.3772077428546142e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4275,
    "uncertainty_score": 0.20022902335736242,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4276,
    "uncertainty_score": 0.9999999998,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4277,
    "uncertainty_score": 0.25001695445990374,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4278,
    "uncertainty_score": 0.3023080811089912,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4279,
    "uncertainty_score": 0.4999999581249389,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4280,
    "uncertainty_score": 1.5982457065659298e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4281,
    "uncertainty_score": 2.2028237053587578e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4282,
    "uncertainty_score": 0.6000039460611095,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4283,
    "uncertainty_score": 0.4994678041016706,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4284,
    "uncertainty_score": 4.252931766506086e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4285,
    "uncertainty_score": 0.25136572504383153,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4286,
    "uncertainty_score": 4.336790904762937e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4287,
    "uncertainty_score": 0.20000280583116492,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4288,
    "uncertainty_score": 0.800000000020652,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4289,
    "uncertainty_score": 2.0261557107360113e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4290,
    "uncertainty_score": 0.4448815813060455,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4291,
    "uncertainty_score": 0.007867624099569504,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4292,
    "uncertainty_score": 0.37028176969385174,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4293,
    "uncertainty_score": 0.16666872683794584,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4294,
    "uncertainty_score": 0.39998758475803375,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4295,
    "uncertainty_score": 2.6782186558648353e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4296,
    "uncertainty_score": 0.2002677888350101,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4297,
    "uncertainty_score": 0.3329096971997346,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4298,
    "uncertainty_score": 1.64224863074016e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4299,
    "uncertainty_score": 0.07573544975336106,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4300,
    "uncertainty_score": 0.3333333333815491,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4301,
    "uncertainty_score": 0.4000206683115211,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4302,
    "uncertainty_score": 0.20000119044514716,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4303,
    "uncertainty_score": 0.7999988675809762,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4304,
    "uncertainty_score": 1.0,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4305,
    "uncertainty_score": 0.1999999877698943,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4306,
    "uncertainty_score": 0.7974465336350521,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4307,
    "uncertainty_score": 7.640073047288617e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4308,
    "uncertainty_score": 5.436426031019938e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4309,
    "uncertainty_score": 6.375693863806674e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4310,
    "uncertainty_score": 1.1443881222688191e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4311,
    "uncertainty_score": 0.40007336653044784,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4312,
    "uncertainty_score": 3.5290825185258866e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4313,
    "uncertainty_score": 0.20005639107955614,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4314,
    "uncertainty_score": 0.33333344057382974,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4315,
    "uncertainty_score": 5.932113681830688e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4316,
    "uncertainty_score": 1.1916214868140833e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4317,
    "uncertainty_score": 0.250000000010639,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4318,
    "uncertainty_score": 2.8766550319573636e-11,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4319,
    "uncertainty_score": 0.399840957320498,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4320,
    "uncertainty_score": 0.4,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4321,
    "uncertainty_score": 0.5972468185918478,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4322,
    "uncertainty_score": 2.4580377572391147e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4323,
    "uncertainty_score": 0.2501245321114904,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4324,
    "uncertainty_score": 2.4344077459146846e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4325,
    "uncertainty_score": 0.20002089149907576,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4326,
    "uncertainty_score": 0.2633343253927107,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4327,
    "uncertainty_score": 0.24995587792314342,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4328,
    "uncertainty_score": 0.5,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4329,
    "uncertainty_score": 0.7418114181038099,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4330,
    "uncertainty_score": 2.707441057499067e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4331,
    "uncertainty_score": 9.39091245623222e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4332,
    "uncertainty_score": 0.0033757839681403607,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4333,
    "uncertainty_score": 0.49999773851279466,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4334,
    "uncertainty_score": 2.1913382507196965e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4335,
    "uncertainty_score": 0.200085219026869,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4336,
    "uncertainty_score": 5.58641233439024e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4337,
    "uncertainty_score": 0.01669817016034336,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4338,
    "uncertainty_score": 7.968968513198387e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4339,
    "uncertainty_score": 0.5000010500238421,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4340,
    "uncertainty_score": 1.1229986558678583e-11,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4341,
    "uncertainty_score": 0.40007384994008444,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4342,
    "uncertainty_score": 1.038376320837147e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4343,
    "uncertainty_score": 6.641689000810665e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4344,
    "uncertainty_score": 1.4556987994725744e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4345,
    "uncertainty_score": 1.7861684645642717e-13,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4346,
    "uncertainty_score": 1.062860315452119e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4347,
    "uncertainty_score": 3.8402736200366185e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4348,
    "uncertainty_score": 0.40000260143274985,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4349,
    "uncertainty_score": 8.842506329977824e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 4350,
    "uncertainty_score": 3.9488712541075974e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4351,
    "uncertainty_score": 0.4005125580639892,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4352,
    "uncertainty_score": 0.4566778961161122,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4353,
    "uncertainty_score": 1.1781224743191794e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4354,
    "uncertainty_score": 1.976218595135995e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4355,
    "uncertainty_score": 5.867570584706747e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4356,
    "uncertainty_score": 8.502874749176803e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4357,
    "uncertainty_score": 0.6923822189694108,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4358,
    "uncertainty_score": 0.20275552527753002,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4359,
    "uncertainty_score": 2.8568018875724965e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4360,
    "uncertainty_score": 1.1490334550609881e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4361,
    "uncertainty_score": 4.900481084018975e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4362,
    "uncertainty_score": 0.20655089557088258,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4363,
    "uncertainty_score": 0.2500004734153381,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4364,
    "uncertainty_score": 1.2954349314695396e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4365,
    "uncertainty_score": 0.24999999975259837,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4366,
    "uncertainty_score": 0.2500139819844288,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4367,
    "uncertainty_score": 0.5000000798462926,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4368,
    "uncertainty_score": 0.013774182423574241,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4369,
    "uncertainty_score": 6.101972945792345e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4370,
    "uncertainty_score": 0.014875772180407122,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4371,
    "uncertainty_score": 0.20120694528156685,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4372,
    "uncertainty_score": 0.3999466809875757,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4373,
    "uncertainty_score": 0.2501065241830268,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4374,
    "uncertainty_score": 0.2500181357113685,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4375,
    "uncertainty_score": 0.0011746862221605617,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4376,
    "uncertainty_score": 4.2923185030207295e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4377,
    "uncertainty_score": 0.00209290368966179,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4378,
    "uncertainty_score": 3.039215312169928e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4379,
    "uncertainty_score": 0.3353013603495758,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4380,
    "uncertainty_score": 0.7946481669496143,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4381,
    "uncertainty_score": 0.8000000011179302,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4382,
    "uncertainty_score": 2.9760157193436852e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4383,
    "uncertainty_score": 0.25000000293966146,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4384,
    "uncertainty_score": 0.5005346053873381,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4385,
    "uncertainty_score": 0.0004869786545254378,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4386,
    "uncertainty_score": 0.20000002659614285,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4387,
    "uncertainty_score": 0.24999999976596218,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4388,
    "uncertainty_score": 4.6351100379065844e-11,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4389,
    "uncertainty_score": 0.6664723796894748,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4390,
    "uncertainty_score": 3.3703086541593346e-13,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4391,
    "uncertainty_score": 0.16695608270868256,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4392,
    "uncertainty_score": 9.756235873226898e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4393,
    "uncertainty_score": 3.2603669273575433e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4394,
    "uncertainty_score": 0.8482503744490035,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4395,
    "uncertainty_score": 0.2500092461743132,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4396,
    "uncertainty_score": 0.337269416969723,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4397,
    "uncertainty_score": 0.6009562219316937,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4398,
    "uncertainty_score": 1.5124963326460105e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4399,
    "uncertainty_score": 0.7499999118912775,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4400,
    "uncertainty_score": 1.6633194880298756e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4401,
    "uncertainty_score": 4.914019991813718e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4402,
    "uncertainty_score": 0.005460818667337145,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4403,
    "uncertainty_score": 0.1666668121904057,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4404,
    "uncertainty_score": 0.2000000002720455,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4405,
    "uncertainty_score": 0.025461622198517397,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4406,
    "uncertainty_score": 0.5000000388795286,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4407,
    "uncertainty_score": 0.0056755522785750835,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4408,
    "uncertainty_score": 1.8759351678114617e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4409,
    "uncertainty_score": 0.5019545323069268,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4410,
    "uncertainty_score": 0.1700649398188776,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4411,
    "uncertainty_score": 0.40140963413665104,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4412,
    "uncertainty_score": 0.200009097687385,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4413,
    "uncertainty_score": 0.2,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4414,
    "uncertainty_score": 8.379393239487374e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4415,
    "uncertainty_score": 0.3256380059354615,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4416,
    "uncertainty_score": 1.3972288300740295e-12,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4417,
    "uncertainty_score": 3.236786881457862e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4418,
    "uncertainty_score": 0.00038185209174013205,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4419,
    "uncertainty_score": 0.2501346515506208,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4420,
    "uncertainty_score": 1.4346644329627009e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4421,
    "uncertainty_score": 0.20002707886701404,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4422,
    "uncertainty_score": 0.20000000038660098,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4423,
    "uncertainty_score": 0.00015348627966294202,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4424,
    "uncertainty_score": 5.992338892206717e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4425,
    "uncertainty_score": 1.665676688478562e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4426,
    "uncertainty_score": 2.5501284284482e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4427,
    "uncertainty_score": 5.50208258332059e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4428,
    "uncertainty_score": 0.0012073974330770697,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4429,
    "uncertainty_score": 0.40001882377852327,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4430,
    "uncertainty_score": 1.7646044328437687e-11,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4431,
    "uncertainty_score": 0.0019100822301127444,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4432,
    "uncertainty_score": 0.33333334969189016,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4433,
    "uncertainty_score": 3.960910617786241e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4434,
    "uncertainty_score": 2.771748235057872e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4435,
    "uncertainty_score": 0.24999999981780546,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4436,
    "uncertainty_score": 0.5000000011068909,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4437,
    "uncertainty_score": 0.19203172032631535,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4438,
    "uncertainty_score": 0.5996150024440349,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4439,
    "uncertainty_score": 1.5211157190233068e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4440,
    "uncertainty_score": 3.275276439899544e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4441,
    "uncertainty_score": 2.4694076126292677e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4442,
    "uncertainty_score": 7.196807115485695e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4443,
    "uncertainty_score": 0.2043839553018183,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4444,
    "uncertainty_score": 0.6445402481383371,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4445,
    "uncertainty_score": 3.000372576930354e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4446,
    "uncertainty_score": 0.24999999992260058,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4447,
    "uncertainty_score": 0.0014974031010103195,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4448,
    "uncertainty_score": 0.250001593156852,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4449,
    "uncertainty_score": 0.4000035569083213,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4450,
    "uncertainty_score": 3.063966824441026e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4451,
    "uncertainty_score": 1.4704297873575099e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4452,
    "uncertainty_score": 0.5582072665566306,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4453,
    "uncertainty_score": 0.3999998751100084,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4454,
    "uncertainty_score": 0.20000442511489966,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4455,
    "uncertainty_score": 0.7999999840655867,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4456,
    "uncertainty_score": 7.668067694863177e-13,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4457,
    "uncertainty_score": 0.24986361278017064,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4458,
    "uncertainty_score": 1.9026893435442247e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4459,
    "uncertainty_score": 0.42858176695788747,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4460,
    "uncertainty_score": 0.2535151251729288,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4461,
    "uncertainty_score": 1.8938785681404855e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4462,
    "uncertainty_score": 0.3333333336319251,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4463,
    "uncertainty_score": 1.8072196973416777e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4464,
    "uncertainty_score": 0.2501016884046819,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4465,
    "uncertainty_score": 9.103125254712954e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4466,
    "uncertainty_score": 6.398948261868734e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4467,
    "uncertainty_score": 0.6000176304143681,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4468,
    "uncertainty_score": 2.7955474062201305e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4469,
    "uncertainty_score": 0.20000001128547873,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4470,
    "uncertainty_score": 0.00027527091671186114,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4471,
    "uncertainty_score": 0.5000000000005188,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4472,
    "uncertainty_score": 4.157065673823624e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4473,
    "uncertainty_score": 6.203032144961711e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4474,
    "uncertainty_score": 0.005643610310320335,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4475,
    "uncertainty_score": 0.5031197342546458,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4476,
    "uncertainty_score": 0.00023910047255444342,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4477,
    "uncertainty_score": 8.135232070920467e-05,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 4478,
    "uncertainty_score": 0.0033218761953285473,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4479,
    "uncertainty_score": 0.13030496943778322,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4480,
    "uncertainty_score": 0.22537660561765419,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4481,
    "uncertainty_score": 0.0005073903674200667,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4482,
    "uncertainty_score": 0.40072560653138084,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4483,
    "uncertainty_score": 0.8321586380540918,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4484,
    "uncertainty_score": 2.194056956581524e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4485,
    "uncertainty_score": 0.20000000072525242,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4486,
    "uncertainty_score": 0.37740830957896004,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4487,
    "uncertainty_score": 0.2500002735472769,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4488,
    "uncertainty_score": 9.221050217175475e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4489,
    "uncertainty_score": 0.6666580561346844,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4490,
    "uncertainty_score": 0.20248633632509844,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4491,
    "uncertainty_score": 1.963563424625569e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4492,
    "uncertainty_score": 0.75,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4493,
    "uncertainty_score": 0.5,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4494,
    "uncertainty_score": 0.199807767421377,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4495,
    "uncertainty_score": 5.765400269823817e-10,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 4496,
    "uncertainty_score": 0.00012453104355386995,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4497,
    "uncertainty_score": 0.3333342422380184,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4498,
    "uncertainty_score": 0.639365241042244,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4499,
    "uncertainty_score": 2.612380547530345e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4500,
    "uncertainty_score": 0.5001916325614348,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4501,
    "uncertainty_score": 0.2500000111580768,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4502,
    "uncertainty_score": 0.33607675755695365,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4503,
    "uncertainty_score": 3.874641297981947e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4504,
    "uncertainty_score": 0.00013389750057267742,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4505,
    "uncertainty_score": 0.2000945818554977,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4506,
    "uncertainty_score": 1.4362976509894154e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4507,
    "uncertainty_score": 0.2499999996474715,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4508,
    "uncertainty_score": 1.2883838265602992e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4509,
    "uncertainty_score": 0.40003971838895486,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4510,
    "uncertainty_score": 0.5000000017985333,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4511,
    "uncertainty_score": 0.39931762667430654,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4512,
    "uncertainty_score": 1.4023039631657366e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4513,
    "uncertainty_score": 0.25000001003145084,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4514,
    "uncertainty_score": 0.2301790045996601,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4515,
    "uncertainty_score": 1.3788608770674134e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4516,
    "uncertainty_score": 0.2000007118303821,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4517,
    "uncertainty_score": 3.6343008832146435e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4518,
    "uncertainty_score": 0.6002290851170375,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4519,
    "uncertainty_score": 0.2045967618313554,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4520,
    "uncertainty_score": 0.5004816807071132,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4521,
    "uncertainty_score": 2.018001540107294e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4522,
    "uncertainty_score": 0.24999876399990748,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4523,
    "uncertainty_score": 0.0,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4524,
    "uncertainty_score": 7.598467555405272e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4525,
    "uncertainty_score": 0.25009599094716295,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4526,
    "uncertainty_score": 5.02225144636229e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4527,
    "uncertainty_score": 1.3197489802070697e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4528,
    "uncertainty_score": 5.322969818420768e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4529,
    "uncertainty_score": 0.333335654085461,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4530,
    "uncertainty_score": 0.003562104650705914,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4531,
    "uncertainty_score": 0.20462565008505657,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4532,
    "uncertainty_score": 0.026425359793047543,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4533,
    "uncertainty_score": 0.33336815056697217,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4534,
    "uncertainty_score": 0.40021747209828284,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4535,
    "uncertainty_score": 0.3359386293237178,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4536,
    "uncertainty_score": 3.804083076394666e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4537,
    "uncertainty_score": 0.2500000096962603,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4538,
    "uncertainty_score": 2.0003786351270965e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4539,
    "uncertainty_score": 0.2000107104459949,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4540,
    "uncertainty_score": 0.74999999975,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4541,
    "uncertainty_score": 0.1999999997988541,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4542,
    "uncertainty_score": 1.769154703439154e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4543,
    "uncertainty_score": 0.20156421060330415,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4544,
    "uncertainty_score": 0.20257421736535752,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4545,
    "uncertainty_score": 0.2000000050594201,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4546,
    "uncertainty_score": 6.23881614067848e-11,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4547,
    "uncertainty_score": 0.20000000000025303,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4548,
    "uncertainty_score": 0.2069047625108588,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4549,
    "uncertainty_score": 4.913508705058847e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4550,
    "uncertainty_score": 2.7547419189764607e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4551,
    "uncertainty_score": 0.24999988969236542,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4552,
    "uncertainty_score": 0.5000216282347324,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4553,
    "uncertainty_score": 0.2025380918617205,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4554,
    "uncertainty_score": 3.111406319744814e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4555,
    "uncertainty_score": 1.6348299733709962e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4556,
    "uncertainty_score": 0.20875162808065295,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4557,
    "uncertainty_score": 0.00027942331095916087,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4558,
    "uncertainty_score": 0.28576635481242596,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4559,
    "uncertainty_score": 0.5000042994645166,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4560,
    "uncertainty_score": 0.4000000000009801,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4561,
    "uncertainty_score": 5.641879998532324e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4562,
    "uncertainty_score": 0.021245366324836448,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4563,
    "uncertainty_score": 4.707818591788874e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4564,
    "uncertainty_score": 0.49999968768230346,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4565,
    "uncertainty_score": 0.20177421037921411,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4566,
    "uncertainty_score": 0.2001411955027593,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4567,
    "uncertainty_score": 0.0,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4568,
    "uncertainty_score": 4.053461724368019e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4569,
    "uncertainty_score": 0.005473196707628992,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4570,
    "uncertainty_score": 0.0002815133248401734,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4571,
    "uncertainty_score": 0.20198781832728746,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4572,
    "uncertainty_score": 0.200000545096153,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4573,
    "uncertainty_score": 0.5000000936347062,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4574,
    "uncertainty_score": 4.50095195853954e-11,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4575,
    "uncertainty_score": 0.3735524209854061,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4576,
    "uncertainty_score": 0.8000130735776747,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4577,
    "uncertainty_score": 0.5000000941893855,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4578,
    "uncertainty_score": 0.016186019901529663,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4579,
    "uncertainty_score": 0.7501533578943848,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4580,
    "uncertainty_score": 2.0806491335314167e-10,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4581,
    "uncertainty_score": 0.4000039459410706,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4582,
    "uncertainty_score": 0.20000200481375643,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4583,
    "uncertainty_score": 3.729000018582547e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4584,
    "uncertainty_score": 0.3999946226356653,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4585,
    "uncertainty_score": 0.5999999811339072,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4586,
    "uncertainty_score": 2.2644988199342392e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4587,
    "uncertainty_score": 0.1999999998118435,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4588,
    "uncertainty_score": 0.6000005744585185,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4589,
    "uncertainty_score": 1.2263988998625995e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4590,
    "uncertainty_score": 5.026938631590532e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4591,
    "uncertainty_score": 1.0784127035709277e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4592,
    "uncertainty_score": 0.16721005279294596,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4593,
    "uncertainty_score": 0.25000000060700345,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4594,
    "uncertainty_score": 0.20000090146690602,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4595,
    "uncertainty_score": 0.25136039758405593,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4596,
    "uncertainty_score": 0.6085591860135019,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4597,
    "uncertainty_score": 0.33333333299999995,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4598,
    "uncertainty_score": 0.0016702879326562017,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4599,
    "uncertainty_score": 0.4000304051816646,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4600,
    "uncertainty_score": 5.051576440091227e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4601,
    "uncertainty_score": 1.0,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4602,
    "uncertainty_score": 0.5000071024354199,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4603,
    "uncertainty_score": 0.20000000001549215,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4604,
    "uncertainty_score": 0.3386158612235874,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4605,
    "uncertainty_score": 0.2000071896929439,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4606,
    "uncertainty_score": 0.39999999980272805,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4607,
    "uncertainty_score": 0.21956482634098612,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4608,
    "uncertainty_score": 0.4000000077389501,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4609,
    "uncertainty_score": 0.20000003457445717,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4610,
    "uncertainty_score": 2.6211796453465006e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4611,
    "uncertainty_score": 0.499882232719498,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4612,
    "uncertainty_score": 0.25094718453449133,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4613,
    "uncertainty_score": 0.25669050230381973,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4614,
    "uncertainty_score": 0.0071893201225754835,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4615,
    "uncertainty_score": 0.21273990999064432,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4616,
    "uncertainty_score": 0.2000038720841712,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4617,
    "uncertainty_score": 0.5000000185231015,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4618,
    "uncertainty_score": 0.2010882012129636,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4619,
    "uncertainty_score": 0.999999990217666,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4620,
    "uncertainty_score": 0.7999830375917425,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4621,
    "uncertainty_score": 0.3333285212752885,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4622,
    "uncertainty_score": 1.311793441660364e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4623,
    "uncertainty_score": 4.607539097359409e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4624,
    "uncertainty_score": 0.005807774866771617,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4625,
    "uncertainty_score": 9.778947809986347e-11,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4626,
    "uncertainty_score": 0.11202589117760797,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4627,
    "uncertainty_score": 0.1205899057573554,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4628,
    "uncertainty_score": 4.004239428529238e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4629,
    "uncertainty_score": 2.772029078610502e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4630,
    "uncertainty_score": 0.5974258841332162,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4631,
    "uncertainty_score": 7.681175467068433e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4632,
    "uncertainty_score": 9.99635050015898e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4633,
    "uncertainty_score": 0.12542772249193002,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4634,
    "uncertainty_score": 0.8024863301664267,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4635,
    "uncertainty_score": 0.2496602692129977,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4636,
    "uncertainty_score": 3.596543204897091e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4637,
    "uncertainty_score": 0.24951913484132465,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4638,
    "uncertainty_score": 0.00013614602292041063,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4639,
    "uncertainty_score": 0.3332517563095949,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4640,
    "uncertainty_score": 0.0003472959754046459,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4641,
    "uncertainty_score": 0.40569225859263974,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4642,
    "uncertainty_score": 2.5228642687686096e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4643,
    "uncertainty_score": 1.0932203960137281e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4644,
    "uncertainty_score": 0.25252933322405896,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4645,
    "uncertainty_score": 0.0033724467230756565,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4646,
    "uncertainty_score": 0.2000009608779935,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4647,
    "uncertainty_score": 0.20000184208940414,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4648,
    "uncertainty_score": 0.2000000045533385,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4649,
    "uncertainty_score": 0.25000085830868096,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4650,
    "uncertainty_score": 0.5000043082984882,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4651,
    "uncertainty_score": 0.75,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4652,
    "uncertainty_score": 9.893737310171287e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4653,
    "uncertainty_score": 0.192502909556194,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4654,
    "uncertainty_score": 0.5000014834621318,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4655,
    "uncertainty_score": 8.076671376638194e-13,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4656,
    "uncertainty_score": 3.813225277889494e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4657,
    "uncertainty_score": 0.16666865994711222,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4658,
    "uncertainty_score": 0.2508896540119853,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4659,
    "uncertainty_score": 0.20156554042125224,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4660,
    "uncertainty_score": 0.3026370805423608,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4661,
    "uncertainty_score": 0.4000405347860691,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4662,
    "uncertainty_score": 0.0,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4663,
    "uncertainty_score": 7.804979922861325e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4664,
    "uncertainty_score": 6.841551786891686e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4665,
    "uncertainty_score": 5.755361698460787e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4666,
    "uncertainty_score": 3.431419528722759e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4667,
    "uncertainty_score": 0.6000000241638315,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4668,
    "uncertainty_score": 3.2918020478963205e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4669,
    "uncertainty_score": 0.7500007968913441,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4670,
    "uncertainty_score": 0.5000000062774975,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4671,
    "uncertainty_score": 0.400000182650966,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4672,
    "uncertainty_score": 0.11799767046383486,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4673,
    "uncertainty_score": 0.011924594649108326,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4674,
    "uncertainty_score": 3.5838786982890765e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4675,
    "uncertainty_score": 0.4000013218706213,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4676,
    "uncertainty_score": 0.0013602511010923793,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4677,
    "uncertainty_score": 9.349883246704537e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4678,
    "uncertainty_score": 0.20000532198924317,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4679,
    "uncertainty_score": 2.4700437222172877e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4680,
    "uncertainty_score": 0.00034729899671390575,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4681,
    "uncertainty_score": 0.3749882356645901,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4682,
    "uncertainty_score": 0.5000393540575854,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4683,
    "uncertainty_score": 0.16826896430509633,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4684,
    "uncertainty_score": 0.02541474857163009,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4685,
    "uncertainty_score": 0.33356901739646644,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4686,
    "uncertainty_score": 0.2000005258488037,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4687,
    "uncertainty_score": 1.4517338162752344e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4688,
    "uncertainty_score": 0.20617229354287342,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4689,
    "uncertainty_score": 0.281775482499481,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4690,
    "uncertainty_score": 0.00023255208250258294,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4691,
    "uncertainty_score": 0.0019231648608085392,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4692,
    "uncertainty_score": 0.1428573294029993,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4693,
    "uncertainty_score": 7.578243320560998e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4694,
    "uncertainty_score": 0.20000085855225577,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4695,
    "uncertainty_score": 0.33333335264894015,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4696,
    "uncertainty_score": 4.330862897277962e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4697,
    "uncertainty_score": 0.5327382722783892,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4698,
    "uncertainty_score": 0.22051282928651067,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4699,
    "uncertainty_score": 6.867060282222021e-12,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4700,
    "uncertainty_score": 0.24999999974718928,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4701,
    "uncertainty_score": 1.682750091644429e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4702,
    "uncertainty_score": 0.2499862048862309,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4703,
    "uncertainty_score": 4.444671010029445e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4704,
    "uncertainty_score": 0.19717430738945352,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4705,
    "uncertainty_score": 0.002375849137956722,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4706,
    "uncertainty_score": 0.24999999993183097,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4707,
    "uncertainty_score": 3.299795065362881e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4708,
    "uncertainty_score": 4.115383562838511e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4709,
    "uncertainty_score": 9.228858887549288e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4710,
    "uncertainty_score": 0.20032834232331137,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4711,
    "uncertainty_score": 0.36960106720390384,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4712,
    "uncertainty_score": 0.49999825891725624,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4713,
    "uncertainty_score": 0.2528039177928029,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4714,
    "uncertainty_score": 0.20181296014015188,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4715,
    "uncertainty_score": 3.1948472070339857e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4716,
    "uncertainty_score": 1.344193259913244e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4717,
    "uncertainty_score": 1.5312392803936078e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4718,
    "uncertainty_score": 0.4999999995001446,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4719,
    "uncertainty_score": 0.24999289759722437,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4720,
    "uncertainty_score": 9.817185473737993e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4721,
    "uncertainty_score": 1.8884019002921437e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4722,
    "uncertainty_score": 0.3322756302576313,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4723,
    "uncertainty_score": 0.3356627194073402,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4724,
    "uncertainty_score": 0.0007299357055017141,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4725,
    "uncertainty_score": 0.0012735998550059842,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4726,
    "uncertainty_score": 1.891980023466082e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4727,
    "uncertainty_score": 0.2909755062553134,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4728,
    "uncertainty_score": 4.637969180515785e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4729,
    "uncertainty_score": 0.019852528071335997,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4730,
    "uncertainty_score": 1.4872070976339194e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4731,
    "uncertainty_score": 0.2000000115832526,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4732,
    "uncertainty_score": 0.4999988449387195,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4733,
    "uncertainty_score": 4.350038463497172e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4734,
    "uncertainty_score": 0.25000806487636495,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4735,
    "uncertainty_score": 3.1206899675594146e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4736,
    "uncertainty_score": 0.00338830354659479,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4737,
    "uncertainty_score": 1.2943833085904672e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4738,
    "uncertainty_score": 8.564223222291752e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4739,
    "uncertainty_score": 1.9517880759043175e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4740,
    "uncertainty_score": 0.3333334962767535,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4741,
    "uncertainty_score": 0.03608170046334021,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4742,
    "uncertainty_score": 9.34236249518185e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4743,
    "uncertainty_score": 0.20000107457523134,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4744,
    "uncertainty_score": 0.0007299745985071364,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4745,
    "uncertainty_score": 3.0022220837410796e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4746,
    "uncertainty_score": 0.5763248600913133,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4747,
    "uncertainty_score": 0.00010547253957810713,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4748,
    "uncertainty_score": 0.25345380502129283,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4749,
    "uncertainty_score": 0.0004341138191166403,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4750,
    "uncertainty_score": 7.11427908290477e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4751,
    "uncertainty_score": 0.614448909525544,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4752,
    "uncertainty_score": 0.36696565339291665,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4753,
    "uncertainty_score": 0.09778382918444749,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4754,
    "uncertainty_score": 8.250127899162872e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4755,
    "uncertainty_score": 0.36363768913300604,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4756,
    "uncertainty_score": 5.532104490966449e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4757,
    "uncertainty_score": 0.2500119559106264,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4758,
    "uncertainty_score": 0.7496983520496736,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4759,
    "uncertainty_score": 8.693241716955616e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4760,
    "uncertainty_score": 0.2500008398367087,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4761,
    "uncertainty_score": 0.20000401480577326,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4762,
    "uncertainty_score": 1.4370303971913293e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4763,
    "uncertainty_score": 0.33333368890610343,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4764,
    "uncertainty_score": 4.844096964903462e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4765,
    "uncertainty_score": 2.3506344251530714e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4766,
    "uncertainty_score": 0.2000007279471348,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4767,
    "uncertainty_score": 0.25000002308325947,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4768,
    "uncertainty_score": 0.011900266356749786,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4769,
    "uncertainty_score": 1.1310380177715534e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4770,
    "uncertainty_score": 0.7500027814125301,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4771,
    "uncertainty_score": 0.001967893899748785,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4772,
    "uncertainty_score": 1.3066014529305664e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4773,
    "uncertainty_score": 0.6666761366171317,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4774,
    "uncertainty_score": 0.3999992557167598,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4775,
    "uncertainty_score": 1.4330680725666313e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4776,
    "uncertainty_score": 0.20001326977814715,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4777,
    "uncertainty_score": 0.00039055203555422,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4778,
    "uncertainty_score": 2.8369086074383026e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4779,
    "uncertainty_score": 0.39999770642959026,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4780,
    "uncertainty_score": 0.20000051756138984,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4781,
    "uncertainty_score": 5.845683428495964e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4782,
    "uncertainty_score": 0.00027542646310003147,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4783,
    "uncertainty_score": 0.00036245348928869576,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4784,
    "uncertainty_score": 1.446679504739579e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4785,
    "uncertainty_score": 0.3576714905343521,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4786,
    "uncertainty_score": 5.626038734707306e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4787,
    "uncertainty_score": 0.00031300012093911887,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4788,
    "uncertainty_score": 0.20009970669368887,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4789,
    "uncertainty_score": 0.001282133713408979,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4790,
    "uncertainty_score": 1.7326559228045097e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4791,
    "uncertainty_score": 0.33339527280856407,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4792,
    "uncertainty_score": 2.9214563344704956e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4793,
    "uncertainty_score": 0.0003329708503418655,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4794,
    "uncertainty_score": 4.3968404063035536e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4795,
    "uncertainty_score": 0.20000270901020376,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4796,
    "uncertainty_score": 0.03635983668269173,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4797,
    "uncertainty_score": 0.250000000043033,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4798,
    "uncertainty_score": 0.2916513979035954,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4799,
    "uncertainty_score": 0.5036258942997576,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4800,
    "uncertainty_score": 2.207756940148088e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4801,
    "uncertainty_score": 0.16666667885224837,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4802,
    "uncertainty_score": 0.37903082217335193,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4803,
    "uncertainty_score": 0.2000000002119892,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4804,
    "uncertainty_score": 0.001592839465422582,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4805,
    "uncertainty_score": 0.199999831966498,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4806,
    "uncertainty_score": 0.6000049052702373,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4807,
    "uncertainty_score": 6.93603258675218e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4808,
    "uncertainty_score": 0.5,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4809,
    "uncertainty_score": 0.33422843488921905,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4810,
    "uncertainty_score": 1.3884147614242208e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4811,
    "uncertainty_score": 0.02501385490978244,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4812,
    "uncertainty_score": 0.00014561887088261947,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4813,
    "uncertainty_score": 0.4000007764133736,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4814,
    "uncertainty_score": 0.25000073700891784,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4815,
    "uncertainty_score": 0.010848940559238721,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4816,
    "uncertainty_score": 0.8000040501877124,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4817,
    "uncertainty_score": 0.5000003104477233,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4818,
    "uncertainty_score": 7.023571659580688e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4819,
    "uncertainty_score": 0.28477114599735176,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4820,
    "uncertainty_score": 0.25068416515571507,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4821,
    "uncertainty_score": 1.5286073522677048e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4822,
    "uncertainty_score": 0.39999999906436123,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4823,
    "uncertainty_score": 0.16666729045113438,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4824,
    "uncertainty_score": 0.00012292292036779028,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4825,
    "uncertainty_score": 2.4351619708871894e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4826,
    "uncertainty_score": 2.4516260872222763e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4827,
    "uncertainty_score": 4.196658335149246e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4828,
    "uncertainty_score": 0.500004790716915,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4829,
    "uncertainty_score": 0.39999998535558473,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4830,
    "uncertainty_score": 0.7500017405348876,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4831,
    "uncertainty_score": 0.1657283137629244,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4832,
    "uncertainty_score": 0.25905816406242105,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4833,
    "uncertainty_score": 0.4999992445065805,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4834,
    "uncertainty_score": 4.871836536012596e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4835,
    "uncertainty_score": 0.2000393021656855,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4836,
    "uncertainty_score": 0.3999998052327741,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4837,
    "uncertainty_score": 2.2164225838153516e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4838,
    "uncertainty_score": 0.16688045016659284,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4839,
    "uncertainty_score": 1.29008849913056e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4840,
    "uncertainty_score": 2.9784603340915597e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4841,
    "uncertainty_score": 2.1503582616575763e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4842,
    "uncertainty_score": 0.5001424915550026,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4843,
    "uncertainty_score": 5.623465078695262e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4844,
    "uncertainty_score": 0.21383685675863834,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4845,
    "uncertainty_score": 0.22114053085196228,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4846,
    "uncertainty_score": 6.399901114599614e-11,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4847,
    "uncertainty_score": 0.20000638493554884,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4848,
    "uncertainty_score": 0.39995211247615936,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4849,
    "uncertainty_score": 0.25000013783992975,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4850,
    "uncertainty_score": 0.20001179017535367,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4851,
    "uncertainty_score": 0.9999999873750065,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4852,
    "uncertainty_score": 1.9049807632780997e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4853,
    "uncertainty_score": 0.0009315240267385091,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4854,
    "uncertainty_score": 0.5035930393188556,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4855,
    "uncertainty_score": 0.0584165400457808,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4856,
    "uncertainty_score": 0.19998419605938828,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4857,
    "uncertainty_score": 0.3333350309282115,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4858,
    "uncertainty_score": 0.3333333013452662,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4859,
    "uncertainty_score": 0.19999999983564717,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4860,
    "uncertainty_score": 0.3333333536221055,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4861,
    "uncertainty_score": 0.3333328255585463,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4862,
    "uncertainty_score": 5.536523042861821e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4863,
    "uncertainty_score": 0.28502052992228205,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4864,
    "uncertainty_score": 1.3073758556165005e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4865,
    "uncertainty_score": 8.646754555608647e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4866,
    "uncertainty_score": 0.001659140734121288,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4867,
    "uncertainty_score": 0.027826900984410673,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4868,
    "uncertainty_score": 4.076232949967742e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4869,
    "uncertainty_score": 0.1994248394349308,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4870,
    "uncertainty_score": 1.0032314995425415e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4871,
    "uncertainty_score": 6.530733914988383e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4872,
    "uncertainty_score": 5.7247004095882775e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4873,
    "uncertainty_score": 0.5000113494679344,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4874,
    "uncertainty_score": 0.1668830926713816,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4875,
    "uncertainty_score": 0.33333334192781844,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4876,
    "uncertainty_score": 0.2254188530407185,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4877,
    "uncertainty_score": 0.5000000707021308,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4878,
    "uncertainty_score": 0.22545403826786936,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4879,
    "uncertainty_score": 0.3333333333333333,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4880,
    "uncertainty_score": 1.569323035736201e-13,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4881,
    "uncertainty_score": 3.859674581093991e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4882,
    "uncertainty_score": 2.8106368033458977e-14,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4883,
    "uncertainty_score": 0.009772611618843203,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4884,
    "uncertainty_score": 0.0002809162319342951,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4885,
    "uncertainty_score": 0.6666666679470078,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4886,
    "uncertainty_score": 0.002130511245378398,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4887,
    "uncertainty_score": 0.0037906967232386774,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4888,
    "uncertainty_score": 0.20000316159203635,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4889,
    "uncertainty_score": 0.16666666902744662,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4890,
    "uncertainty_score": 8.412679596902852e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4891,
    "uncertainty_score": 0.2000000169946346,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4892,
    "uncertainty_score": 0.000239031437844814,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4893,
    "uncertainty_score": 6.401658966154429e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4894,
    "uncertainty_score": 8.652938634244363e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4895,
    "uncertainty_score": 0.0015635778481388539,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4896,
    "uncertainty_score": 0.06116559324882382,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4897,
    "uncertainty_score": 0.2000015603496756,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4898,
    "uncertainty_score": 0.20000484117830353,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4899,
    "uncertainty_score": 7.519747081015389e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4900,
    "uncertainty_score": 0.23610544940319733,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 4901,
    "uncertainty_score": 4.9682991941082525e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4902,
    "uncertainty_score": 0.16666678194427875,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4903,
    "uncertainty_score": 1.6296192276634475e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4904,
    "uncertainty_score": 1.4230109770624586e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4905,
    "uncertainty_score": 3.0475758580744344e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4906,
    "uncertainty_score": 5.975658338532453e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4907,
    "uncertainty_score": 0.4023345564523523,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4908,
    "uncertainty_score": 1.8336247944680336e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4909,
    "uncertainty_score": 8.867153096294954e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4910,
    "uncertainty_score": 0.00010605923511724033,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4911,
    "uncertainty_score": 7.59675224190541e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4912,
    "uncertainty_score": 0.33492443156123014,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4913,
    "uncertainty_score": 3.3282746520114515e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4914,
    "uncertainty_score": 0.19998693043215282,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4915,
    "uncertainty_score": 0.5000000006254977,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4916,
    "uncertainty_score": 1.4514104382494643e-13,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4917,
    "uncertainty_score": 9.581408372429815e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4918,
    "uncertainty_score": 0.25001813566476794,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4919,
    "uncertainty_score": 6.649092036141583e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4920,
    "uncertainty_score": 1.904561535505606e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4921,
    "uncertainty_score": 0.19999206243199816,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 4922,
    "uncertainty_score": 0.3336029136012992,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4923,
    "uncertainty_score": 0.2503715163316536,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4924,
    "uncertainty_score": 0.5000002288815246,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4925,
    "uncertainty_score": 0.003408714937156,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4926,
    "uncertainty_score": 1.0511629362091577e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4927,
    "uncertainty_score": 0.1999986073601258,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4928,
    "uncertainty_score": 0.2006842807760528,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4929,
    "uncertainty_score": 7.645979078011261e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4930,
    "uncertainty_score": 0.12738528424625817,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4931,
    "uncertainty_score": 0.0003095298419107142,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4932,
    "uncertainty_score": 8.882159715496153e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4933,
    "uncertainty_score": 0.00959116102434506,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 4934,
    "uncertainty_score": 0.0006573020333572754,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4935,
    "uncertainty_score": 0.333333420550678,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4936,
    "uncertainty_score": 0.23928344251529465,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4937,
    "uncertainty_score": 0.008703283874116298,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4938,
    "uncertainty_score": 0.4202322364862541,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4939,
    "uncertainty_score": 4.494099746457841e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4940,
    "uncertainty_score": 0.25000001412171496,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4941,
    "uncertainty_score": 0.166668338679222,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4942,
    "uncertainty_score": 8.608326598814918e-11,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4943,
    "uncertainty_score": 1.5500616395452647e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4944,
    "uncertainty_score": 0.3335699002079255,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4945,
    "uncertainty_score": 0.20002463964742376,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4946,
    "uncertainty_score": 0.4999929286436105,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4947,
    "uncertainty_score": 1.5051409613071036e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4948,
    "uncertainty_score": 0.0002609567106104445,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4949,
    "uncertainty_score": 0.35316117411254416,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4950,
    "uncertainty_score": 0.41026718352016545,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4951,
    "uncertainty_score": 0.5999558476575911,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4952,
    "uncertainty_score": 2.369611529117714e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4953,
    "uncertainty_score": 0.2500000429119407,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4954,
    "uncertainty_score": 0.30373263419503854,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4955,
    "uncertainty_score": 0.2000000003913119,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4956,
    "uncertainty_score": 1.3635502620126197e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4957,
    "uncertainty_score": 0.3224152718203713,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4958,
    "uncertainty_score": 0.0017620464525274558,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4959,
    "uncertainty_score": 0.00032663181587655596,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4960,
    "uncertainty_score": 8.855438182274344e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4961,
    "uncertainty_score": 3.276017174569973e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4962,
    "uncertainty_score": 0.0026175298601751446,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4963,
    "uncertainty_score": 1.8067114830503062e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4964,
    "uncertainty_score": 2.6703553346747233e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4965,
    "uncertainty_score": 0.310312630923203,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4966,
    "uncertainty_score": 0.19999515929158407,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4967,
    "uncertainty_score": 4.78571910976402e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4968,
    "uncertainty_score": 0.007026161781793578,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4969,
    "uncertainty_score": 0.5182868451342186,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4970,
    "uncertainty_score": 0.24993993181701754,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4971,
    "uncertainty_score": 0.20028309034066702,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4972,
    "uncertainty_score": 0.24999999182587831,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4973,
    "uncertainty_score": 0.33333335965755245,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4974,
    "uncertainty_score": 0.33330472436539804,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4975,
    "uncertainty_score": 3.562168319960236e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4976,
    "uncertainty_score": 0.2097718057412453,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4977,
    "uncertainty_score": 1.3158352835853022e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4978,
    "uncertainty_score": 0.24998605313899558,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4979,
    "uncertainty_score": 0.25605340602954707,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4980,
    "uncertainty_score": 0.2500000002699263,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4981,
    "uncertainty_score": 0.25000000338119177,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4982,
    "uncertainty_score": 5.250181319500697e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4983,
    "uncertainty_score": 0.00012924707500943457,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 4984,
    "uncertainty_score": 0.48437907218678783,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4985,
    "uncertainty_score": 7.907389870239697e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4986,
    "uncertainty_score": 0.00011357614723433819,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4987,
    "uncertainty_score": 0.2000145227565937,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4988,
    "uncertainty_score": 0.0,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4989,
    "uncertainty_score": 2.0231692844996537e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4990,
    "uncertainty_score": 0.0031078329829189186,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4991,
    "uncertainty_score": 0.6666666663349669,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4992,
    "uncertainty_score": 0.20000000005999857,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 4993,
    "uncertainty_score": 0.20000001604643072,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 4994,
    "uncertainty_score": 0.33309938273239337,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 4995,
    "uncertainty_score": 0.40000001766969484,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 4996,
    "uncertainty_score": 0.3333332505979624,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 4997,
    "uncertainty_score": 6.672780907519001e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 4998,
    "uncertainty_score": 2.3266708242921333e-11,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 4999,
    "uncertainty_score": 0.00035631385820128833,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5000,
    "uncertainty_score": 0.4996958286933228,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5001,
    "uncertainty_score": 5.7299682062163565e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5002,
    "uncertainty_score": 0.25029490580211267,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5003,
    "uncertainty_score": 0.600000011287525,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5004,
    "uncertainty_score": 0.2955005067674303,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5005,
    "uncertainty_score": 0.4993426063383719,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5006,
    "uncertainty_score": 1.2553981772991857e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5007,
    "uncertainty_score": 6.576049731116497e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5008,
    "uncertainty_score": 0.5180613932436122,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5009,
    "uncertainty_score": 0.02131919395139829,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5010,
    "uncertainty_score": 0.39997279379666484,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5011,
    "uncertainty_score": 0.20013688030997606,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5012,
    "uncertainty_score": 6.812820971035083e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5013,
    "uncertainty_score": 0.5342676197492213,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5014,
    "uncertainty_score": 0.2005732363827161,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5015,
    "uncertainty_score": 0.2500000843091961,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5016,
    "uncertainty_score": 2.6164306147622834e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5017,
    "uncertainty_score": 3.68979342279447e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5018,
    "uncertainty_score": 0.010757311715046312,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5019,
    "uncertainty_score": 0.3333333899145911,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5020,
    "uncertainty_score": 0.0001405564252153423,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5021,
    "uncertainty_score": 0.2000132378407664,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5022,
    "uncertainty_score": 1.4295266985492225e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5023,
    "uncertainty_score": 0.39984725862393866,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5024,
    "uncertainty_score": 7.874066739507515e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5025,
    "uncertainty_score": 1.7085974870877993e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5026,
    "uncertainty_score": 0.3334311236972692,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5027,
    "uncertainty_score": 6.090484255873899e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5028,
    "uncertainty_score": 4.742837111512322e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5029,
    "uncertainty_score": 0.0,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5030,
    "uncertainty_score": 0.25000577147232256,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5031,
    "uncertainty_score": 0.0303517972869882,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5032,
    "uncertainty_score": 0.2003473357572906,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5033,
    "uncertainty_score": 0.00038621830310278573,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5034,
    "uncertainty_score": 0.332602900298145,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5035,
    "uncertainty_score": 1.1717451461841227e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5036,
    "uncertainty_score": 0.034354505147601536,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5037,
    "uncertainty_score": 0.4000000055733475,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5038,
    "uncertainty_score": 4.493525647433964e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5039,
    "uncertainty_score": 0.14285615240518584,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5040,
    "uncertainty_score": 0.4998618398041479,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5041,
    "uncertainty_score": 0.31146505788884166,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5042,
    "uncertainty_score": 0.16666508807588035,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5043,
    "uncertainty_score": 1.135029107998529e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5044,
    "uncertainty_score": 0.0016839361085986388,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5045,
    "uncertainty_score": 3.9748268978441284e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5046,
    "uncertainty_score": 1.8505237166621504e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5047,
    "uncertainty_score": 0.0004021966478487817,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5048,
    "uncertainty_score": 0.5000016519762683,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5049,
    "uncertainty_score": 0.7500000368849437,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5050,
    "uncertainty_score": 0.0650755388542987,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5051,
    "uncertainty_score": 0.2500000051201563,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5052,
    "uncertainty_score": 0.009521379576086654,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5053,
    "uncertainty_score": 8.097301668907082e-12,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5054,
    "uncertainty_score": 0.2002889826106371,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5055,
    "uncertainty_score": 0.579638928690627,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5056,
    "uncertainty_score": 0.3333270901132866,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5057,
    "uncertainty_score": 0.3333333432929669,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5058,
    "uncertainty_score": 0.2500015630446896,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5059,
    "uncertainty_score": 0.0,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5060,
    "uncertainty_score": 0.40415027997281106,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5061,
    "uncertainty_score": 0.19311098023047008,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5062,
    "uncertainty_score": 3.0939054591821267e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5063,
    "uncertainty_score": 0.20068237772308972,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5064,
    "uncertainty_score": 7.219781819564954e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5065,
    "uncertainty_score": 0.3333319273907489,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5066,
    "uncertainty_score": 4.403384318831244e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5067,
    "uncertainty_score": 9.447245774762599e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5068,
    "uncertainty_score": 1.058347769043026e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5069,
    "uncertainty_score": 2.7803440916271133e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5070,
    "uncertainty_score": 5.878007775080816e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5071,
    "uncertainty_score": 0.06839918515055665,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5072,
    "uncertainty_score": 6.891042979641023e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5073,
    "uncertainty_score": 0.1666667243284544,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5074,
    "uncertainty_score": 2.2052349916365747e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5075,
    "uncertainty_score": 0.000624610801637736,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5076,
    "uncertainty_score": 0.25468427211794203,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5077,
    "uncertainty_score": 0.2500007564470918,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5078,
    "uncertainty_score": 9.41161855647325e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5079,
    "uncertainty_score": 1.2701658015748207e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5080,
    "uncertainty_score": 3.1550830053450103e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5081,
    "uncertainty_score": 5.120516799777448e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5082,
    "uncertainty_score": 5.3202695202334104e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5083,
    "uncertainty_score": 0.6666681095136971,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5084,
    "uncertainty_score": 0.2500600777754954,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5085,
    "uncertainty_score": 0.199603432569103,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5086,
    "uncertainty_score": 0.5985048335241927,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5087,
    "uncertainty_score": 2.3305645924317882e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5088,
    "uncertainty_score": 0.25000019528709627,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5089,
    "uncertainty_score": 4.21161262070668e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5090,
    "uncertainty_score": 0.24999252171247477,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5091,
    "uncertainty_score": 1.2536765796193145e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5092,
    "uncertainty_score": 1.8083505141111282e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5093,
    "uncertainty_score": 1.1279320677044894e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5094,
    "uncertainty_score": 6.684667736483443e-11,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5095,
    "uncertainty_score": 0.2673827428375175,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5096,
    "uncertainty_score": 1.587189029883434e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5097,
    "uncertainty_score": 0.7499346663395956,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5098,
    "uncertainty_score": 0.00034678437901873815,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5099,
    "uncertainty_score": 8.531714772190964e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5100,
    "uncertainty_score": 0.6666666666666666,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5101,
    "uncertainty_score": 0.33340110437202286,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5102,
    "uncertainty_score": 5.333741342422093e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5103,
    "uncertainty_score": 0.0012510566003741844,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5104,
    "uncertainty_score": 0.05273041277849588,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5105,
    "uncertainty_score": 0.19999999984690525,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5106,
    "uncertainty_score": 0.00019081946497681812,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5107,
    "uncertainty_score": 0.6666815968221188,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5108,
    "uncertainty_score": 0.2509595655674417,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5109,
    "uncertainty_score": 0.5000000016062343,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5110,
    "uncertainty_score": 0.14527209008990313,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5111,
    "uncertainty_score": 0.019969033521466215,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5112,
    "uncertainty_score": 5.355967355882176e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5113,
    "uncertainty_score": 0.5005605642126374,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5114,
    "uncertainty_score": 0.00010948421408003378,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5115,
    "uncertainty_score": 1.0108776391061966e-05,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5116,
    "uncertainty_score": 9.599192302508468e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5117,
    "uncertainty_score": 6.552709380339005e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5118,
    "uncertainty_score": 1.4864808084996104e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5119,
    "uncertainty_score": 0.3333279949292258,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5120,
    "uncertainty_score": 0.0036884433810225425,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5121,
    "uncertainty_score": 0.00016817630390142662,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5122,
    "uncertainty_score": 1.4961120844525656e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5123,
    "uncertainty_score": 0.16666944205604903,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5124,
    "uncertainty_score": 3.6831060199812852e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5125,
    "uncertainty_score": 1.9608527024592508e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5126,
    "uncertainty_score": 0.00024156760501405352,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5127,
    "uncertainty_score": 0.40483686442223554,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5128,
    "uncertainty_score": 7.407387738098184e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5129,
    "uncertainty_score": 2.511796281843433e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5130,
    "uncertainty_score": 0.2500000122382657,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5131,
    "uncertainty_score": 0.600017230559911,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5132,
    "uncertainty_score": 0.005727628643702047,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5133,
    "uncertainty_score": 6.253021791154401e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5134,
    "uncertainty_score": 0.14313788700068744,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5135,
    "uncertainty_score": 0.3641710944741864,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5136,
    "uncertainty_score": 0.4000940437839198,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5137,
    "uncertainty_score": 0.2500003462791153,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5138,
    "uncertainty_score": 2.821079507032639e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5139,
    "uncertainty_score": 0.395410583453407,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5140,
    "uncertainty_score": 1.382246715316062e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5141,
    "uncertainty_score": 0.16680845111136777,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5142,
    "uncertainty_score": 2.5274964460511785e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5143,
    "uncertainty_score": 0.023192162209868798,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5144,
    "uncertainty_score": 3.061007393849344e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5145,
    "uncertainty_score": 6.24634429729064e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5146,
    "uncertainty_score": 5.86093083145307e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5147,
    "uncertainty_score": 0.3333333335017025,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5148,
    "uncertainty_score": 2.984436403012666e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5149,
    "uncertainty_score": 1.8647881343328734e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5150,
    "uncertainty_score": 0.13474587067065413,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5151,
    "uncertainty_score": 0.20001040497747521,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5152,
    "uncertainty_score": 0.02281498695216266,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5153,
    "uncertainty_score": 0.0705083352099951,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5154,
    "uncertainty_score": 0.40000684050575225,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5155,
    "uncertainty_score": 0.04920764106840597,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5156,
    "uncertainty_score": 1.4510291725898113e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5157,
    "uncertainty_score": 0.2500000077315342,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5158,
    "uncertainty_score": 0.2520576033603447,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5159,
    "uncertainty_score": 1.1199367313401014e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5160,
    "uncertainty_score": 5.077705528716821e-11,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5161,
    "uncertainty_score": 5.948431388340024e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5162,
    "uncertainty_score": 6.498324886780542e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5163,
    "uncertainty_score": 0.0001646846715653743,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5164,
    "uncertainty_score": 0.00024132143460199286,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5165,
    "uncertainty_score": 0.24999983291393782,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5166,
    "uncertainty_score": 0.001523418279209023,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5167,
    "uncertainty_score": 1.5941996217430098e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5168,
    "uncertainty_score": 0.2000023305306023,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5169,
    "uncertainty_score": 0.20000000080813538,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5170,
    "uncertainty_score": 0.40000000537336844,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5171,
    "uncertainty_score": 1.277083258763458e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5172,
    "uncertainty_score": 0.19999330861709805,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5173,
    "uncertainty_score": 0.2000728515696169,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5174,
    "uncertainty_score": 0.0389854771083988,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5175,
    "uncertainty_score": 0.19999987307618552,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5176,
    "uncertainty_score": 1.3575409563175914e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5177,
    "uncertainty_score": 6.947818730800952e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5178,
    "uncertainty_score": 0.5000000000997049,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5179,
    "uncertainty_score": 9.413087774739376e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5180,
    "uncertainty_score": 0.3335821796867235,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5181,
    "uncertainty_score": 0.20000000597772102,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5182,
    "uncertainty_score": 0.39999999989589435,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5183,
    "uncertainty_score": 1.0778033969478589e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5184,
    "uncertainty_score": 7.938519200046298e-11,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5185,
    "uncertainty_score": 3.4708639283154183e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5186,
    "uncertainty_score": 0.25002611585976436,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5187,
    "uncertainty_score": 0.24992061213057765,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5188,
    "uncertainty_score": 0.16666678529248866,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5189,
    "uncertainty_score": 0.5316491298381992,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5190,
    "uncertainty_score": 5.140202626910761e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5191,
    "uncertainty_score": 2.6175409110186364e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5192,
    "uncertainty_score": 8.061091897672081e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5193,
    "uncertainty_score": 0.0001260992877857091,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5194,
    "uncertainty_score": 3.7085358834938765e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5195,
    "uncertainty_score": 2.9200629123198853e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5196,
    "uncertainty_score": 0.15363088492710616,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5197,
    "uncertainty_score": 0.0008099147340053813,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5198,
    "uncertainty_score": 1.6534489825878235e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5199,
    "uncertainty_score": 3.8515022641909284e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5200,
    "uncertainty_score": 0.00011221665715064863,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5201,
    "uncertainty_score": 0.25468403123096145,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5202,
    "uncertainty_score": 1.509622939325148e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5203,
    "uncertainty_score": 0.3346820275642798,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5204,
    "uncertainty_score": 0.00013410703350945921,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5205,
    "uncertainty_score": 7.861012685286552e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5206,
    "uncertainty_score": 5.203020208944867e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5207,
    "uncertainty_score": 0.40006539656715534,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5208,
    "uncertainty_score": 7.225245577681637e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5209,
    "uncertainty_score": 0.20000312905769607,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5210,
    "uncertainty_score": 2.8666841351795717e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5211,
    "uncertainty_score": 7.078702706468365e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5212,
    "uncertainty_score": 1.0383033472297332e-06,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5213,
    "uncertainty_score": 1.060646054314416e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5214,
    "uncertainty_score": 6.919832744911728e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5215,
    "uncertainty_score": 0.5816291097741065,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5216,
    "uncertainty_score": 0.25065791860312725,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5217,
    "uncertainty_score": 0.26875751705975603,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5218,
    "uncertainty_score": 0.333309151792868,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5219,
    "uncertainty_score": 1.89262217180941e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5220,
    "uncertainty_score": 1.807095552188461e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5221,
    "uncertainty_score": 1.3276780914957935e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5222,
    "uncertainty_score": 2.5063921538824856e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5223,
    "uncertainty_score": 0.005187869946002965,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5224,
    "uncertainty_score": 4.3609357587215355e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5225,
    "uncertainty_score": 0.4000007291673623,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5226,
    "uncertainty_score": 0.0006585569751408771,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5227,
    "uncertainty_score": 0.75,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5228,
    "uncertainty_score": 0.25001813594573813,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5229,
    "uncertainty_score": 0.4365606146750287,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5230,
    "uncertainty_score": 0.0006150739811320116,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5231,
    "uncertainty_score": 0.3333378376317519,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5232,
    "uncertainty_score": 0.3999831055265461,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5233,
    "uncertainty_score": 0.5019921619681117,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5234,
    "uncertainty_score": 6.42595382285776e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5235,
    "uncertainty_score": 0.49970337119475206,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5236,
    "uncertainty_score": 4.507234605261849e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5237,
    "uncertainty_score": 8.792568670793238e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5238,
    "uncertainty_score": 6.722127945159229e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5239,
    "uncertainty_score": 0.33333647298093466,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5240,
    "uncertainty_score": 0.19996305243672047,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5241,
    "uncertainty_score": 0.7987930398854625,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5242,
    "uncertainty_score": 0.5126432864737486,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5243,
    "uncertainty_score": 0.3333333356380048,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5244,
    "uncertainty_score": 0.0,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5245,
    "uncertainty_score": 0.6631281155840457,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5246,
    "uncertainty_score": 7.180229487307189e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5247,
    "uncertainty_score": 0.00031820421396144214,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5248,
    "uncertainty_score": 0.20000027614829047,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5249,
    "uncertainty_score": 3.2520727956365824e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5250,
    "uncertainty_score": 0.3154266470952933,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5251,
    "uncertainty_score": 0.500153390513323,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5252,
    "uncertainty_score": 0.20003706771017954,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5253,
    "uncertainty_score": 0.253107912799286,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5254,
    "uncertainty_score": 1.8937911288375625e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5255,
    "uncertainty_score": 0.40000007048191905,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5256,
    "uncertainty_score": 0.5325892054686789,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5257,
    "uncertainty_score": 0.00022908562706329508,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5258,
    "uncertainty_score": 0.0019539724256817255,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5259,
    "uncertainty_score": 0.25489383828441814,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5260,
    "uncertainty_score": 0.11303600765710038,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5261,
    "uncertainty_score": 0.005650836940459694,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5262,
    "uncertainty_score": 0.750000583020887,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5263,
    "uncertainty_score": 0.5001638907678216,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5264,
    "uncertainty_score": 0.4000160077635491,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5265,
    "uncertainty_score": 0.5999999993999999,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5266,
    "uncertainty_score": 0.11483027149636964,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5267,
    "uncertainty_score": 0.3334969716109078,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5268,
    "uncertainty_score": 0.75,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5269,
    "uncertainty_score": 7.684280614690469e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5270,
    "uncertainty_score": 3.0681609117945083e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5271,
    "uncertainty_score": 0.002411430564512927,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5272,
    "uncertainty_score": 0.6666666666666666,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5273,
    "uncertainty_score": 0.20123703392924602,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5274,
    "uncertainty_score": 0.33341824932813546,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5275,
    "uncertainty_score": 5.207605587462872e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5276,
    "uncertainty_score": 9.082348618489656e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5277,
    "uncertainty_score": 3.388883090864892e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5278,
    "uncertainty_score": 0.00011619492345844523,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5279,
    "uncertainty_score": 0.2863595993620197,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5280,
    "uncertainty_score": 0.3999999998125786,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5281,
    "uncertainty_score": 0.6666702566147165,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5282,
    "uncertainty_score": 0.4000000221886168,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5283,
    "uncertainty_score": 0.6,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5284,
    "uncertainty_score": 7.44047555313883e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5285,
    "uncertainty_score": 0.33333519638403325,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5286,
    "uncertainty_score": 3.760499529941095e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5287,
    "uncertainty_score": 0.6000001652257355,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5288,
    "uncertainty_score": 8.081946030650506e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5289,
    "uncertainty_score": 0.40000121745585204,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5290,
    "uncertainty_score": 1.8812852406889722e-10,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5291,
    "uncertainty_score": 0.33334280330713795,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5292,
    "uncertainty_score": 0.399999999600184,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5293,
    "uncertainty_score": 2.6711532465412815e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5294,
    "uncertainty_score": 0.7482057958003155,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5295,
    "uncertainty_score": 0.4016486611557372,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5296,
    "uncertainty_score": 0.2500000054548232,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5297,
    "uncertainty_score": 0.21725804869097104,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5298,
    "uncertainty_score": 0.16666690112442517,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5299,
    "uncertainty_score": 0.25000000000000017,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5300,
    "uncertainty_score": 0.012240879451931443,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5301,
    "uncertainty_score": 0.25004172650917567,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5302,
    "uncertainty_score": 0.7500000000000698,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5303,
    "uncertainty_score": 0.20000726964407808,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5304,
    "uncertainty_score": 0.6666666663333333,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5305,
    "uncertainty_score": 0.25000000007145984,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5306,
    "uncertainty_score": 2.443390795943718e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5307,
    "uncertainty_score": 0.5051906386339581,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5308,
    "uncertainty_score": 0.6000000000000152,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5309,
    "uncertainty_score": 0.7152303582467746,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5310,
    "uncertainty_score": 0.75,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5311,
    "uncertainty_score": 4.7498988384528784e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5312,
    "uncertainty_score": 0.5999882195081836,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5313,
    "uncertainty_score": 0.20000287617316714,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5314,
    "uncertainty_score": 0.4000591914245484,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5315,
    "uncertainty_score": 0.3333785065986208,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5316,
    "uncertainty_score": 0.34147781180534187,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5317,
    "uncertainty_score": 0.5000000015569206,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5318,
    "uncertainty_score": 0.4000000001988247,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5319,
    "uncertainty_score": 0.8003658251241138,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5320,
    "uncertainty_score": 0.6666666666666666,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5321,
    "uncertainty_score": 0.6537719594034987,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5322,
    "uncertainty_score": 0.25000000000195777,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5323,
    "uncertainty_score": 0.6885347169380834,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5324,
    "uncertainty_score": 0.5000000000054665,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5325,
    "uncertainty_score": 0.1999701856351504,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5326,
    "uncertainty_score": 0.1672656004315373,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5327,
    "uncertainty_score": 0.5000006886237262,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5328,
    "uncertainty_score": 0.1999999998,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5329,
    "uncertainty_score": 0.41669813526135674,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5330,
    "uncertainty_score": 0.24276281142714745,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5331,
    "uncertainty_score": 0.4,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5332,
    "uncertainty_score": 0.20000017503037842,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5333,
    "uncertainty_score": 0.19999999979944733,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5334,
    "uncertainty_score": 0.24999999974999998,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5335,
    "uncertainty_score": 0.20000154578625007,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5336,
    "uncertainty_score": 0.20036583750398398,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5337,
    "uncertainty_score": 0.4444444785553462,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5338,
    "uncertainty_score": 0.2736664391923907,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5339,
    "uncertainty_score": 0.5000460390726902,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5340,
    "uncertainty_score": 0.00023903233981042602,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5341,
    "uncertainty_score": 6.206093283978666e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5342,
    "uncertainty_score": 0.49996739303751314,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5343,
    "uncertainty_score": 0.249999999750001,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5344,
    "uncertainty_score": 0.4000003964748385,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5345,
    "uncertainty_score": 0.5561520025314967,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5346,
    "uncertainty_score": 0.0016873407987201617,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5347,
    "uncertainty_score": 6.316063950571853e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5348,
    "uncertainty_score": 0.3512977234163278,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5349,
    "uncertainty_score": 0.5134837704112849,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5350,
    "uncertainty_score": 1.551598858231942e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5351,
    "uncertainty_score": 0.33333104771607686,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5352,
    "uncertainty_score": 0.5000159415019824,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5353,
    "uncertainty_score": 0.33413782936399844,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5354,
    "uncertainty_score": 0.6667510521102185,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5355,
    "uncertainty_score": 0.20004688103226936,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5356,
    "uncertainty_score": 2.4423272752944782e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5357,
    "uncertainty_score": 0.00011653526204733447,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5358,
    "uncertainty_score": 0.6666666603345678,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5359,
    "uncertainty_score": 0.20764829279974975,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5360,
    "uncertainty_score": 0.7291271585899815,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5361,
    "uncertainty_score": 0.20487689779201532,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5362,
    "uncertainty_score": 8.315151434353951e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5363,
    "uncertainty_score": 0.6818206158553863,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5364,
    "uncertainty_score": 0.333333272484716,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5365,
    "uncertainty_score": 0.2499494016120153,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5366,
    "uncertainty_score": 5.490833867273993e-16,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5367,
    "uncertainty_score": 0.20000001278273233,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5368,
    "uncertainty_score": 0.25000001956649903,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5369,
    "uncertainty_score": 6.016597510381489e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5370,
    "uncertainty_score": 0.3333918952136383,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5371,
    "uncertainty_score": 0.5714489700138399,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5372,
    "uncertainty_score": 0.25000342564044137,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5373,
    "uncertainty_score": 0.2500000090909499,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5374,
    "uncertainty_score": 0.5840818704086601,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5375,
    "uncertainty_score": 0.16460771224899115,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5376,
    "uncertainty_score": 0.2000041570346455,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5377,
    "uncertainty_score": 0.7506629045832461,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5378,
    "uncertainty_score": 0.00010273133108967285,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5379,
    "uncertainty_score": 3.63068539384214e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5380,
    "uncertainty_score": 1.4145538167000373e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5381,
    "uncertainty_score": 0.2500017409422619,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5382,
    "uncertainty_score": 0.39999806805126525,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5383,
    "uncertainty_score": 0.2152291073582351,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5384,
    "uncertainty_score": 0.33333366584988355,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5385,
    "uncertainty_score": 1.9105682091635327e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5386,
    "uncertainty_score": 1.2073002365067216e-10,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5387,
    "uncertainty_score": 0.2500000007199923,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5388,
    "uncertainty_score": 0.25000059377342165,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5389,
    "uncertainty_score": 6.809828720051057e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5390,
    "uncertainty_score": 0.20003121008604102,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5391,
    "uncertainty_score": 0.25000000368691555,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5392,
    "uncertainty_score": 0.38570353335460256,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5393,
    "uncertainty_score": 0.33366719262088756,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5394,
    "uncertainty_score": 3.569141595665164e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5395,
    "uncertainty_score": 5.776790958665219e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5396,
    "uncertainty_score": 3.423704015426303e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5397,
    "uncertainty_score": 0.0004343023976718613,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5398,
    "uncertainty_score": 0.003924810446858032,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5399,
    "uncertainty_score": 7.973730776741845e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5400,
    "uncertainty_score": 5.002047224533624e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5401,
    "uncertainty_score": 5.302508666942675e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5402,
    "uncertainty_score": 0.4999950722502863,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5403,
    "uncertainty_score": 0.25009803175526557,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5404,
    "uncertainty_score": 0.0003177584671727892,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5405,
    "uncertainty_score": 6.15241209683189e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5406,
    "uncertainty_score": 0.5999995408179943,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5407,
    "uncertainty_score": 0.2000000003740884,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5408,
    "uncertainty_score": 0.2000300799330208,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5409,
    "uncertainty_score": 7.926017713960104e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5410,
    "uncertainty_score": 1.1921243011093722e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5411,
    "uncertainty_score": 0.004375479427241063,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5412,
    "uncertainty_score": 0.3076961018964593,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5413,
    "uncertainty_score": 8.977421275498149e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5414,
    "uncertainty_score": 0.39998951357959334,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5415,
    "uncertainty_score": 6.3207540410893935e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5416,
    "uncertainty_score": 0.6137740699213731,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5417,
    "uncertainty_score": 3.661656886194355e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5418,
    "uncertainty_score": 0.19999867891547252,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5419,
    "uncertainty_score": 0.4992678490582798,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5420,
    "uncertainty_score": 8.864639509177391e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5421,
    "uncertainty_score": 0.20000000166689436,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5422,
    "uncertainty_score": 0.24999975640392935,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5423,
    "uncertainty_score": 2.238602503178265e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5424,
    "uncertainty_score": 0.0048388206893453115,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5425,
    "uncertainty_score": 2.0350750924000956e-11,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5426,
    "uncertainty_score": 3.323255970595173e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5427,
    "uncertainty_score": 7.823419785585582e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5428,
    "uncertainty_score": 0.009125250514787644,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5429,
    "uncertainty_score": 0.0001472999400674082,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5430,
    "uncertainty_score": 0.3333333333333337,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5431,
    "uncertainty_score": 1.7809786456903485e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5432,
    "uncertainty_score": 0.00021764753238783793,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5433,
    "uncertainty_score": 0.0013387198341931778,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5434,
    "uncertainty_score": 2.3275371261285405e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5435,
    "uncertainty_score": 9.149476746268432e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5436,
    "uncertainty_score": 0.19982613368201024,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5437,
    "uncertainty_score": 0.41052192853377,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5438,
    "uncertainty_score": 7.447968522860692e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5439,
    "uncertainty_score": 3.250099411124103e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5440,
    "uncertainty_score": 0.00015761904291380156,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5441,
    "uncertainty_score": 0.03354350558284513,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5442,
    "uncertainty_score": 8.251420415033115e-19,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5443,
    "uncertainty_score": 0.25015335639820613,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5444,
    "uncertainty_score": 0.500809342960627,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5445,
    "uncertainty_score": 7.040014097214156e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5446,
    "uncertainty_score": 3.83314294517865e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5447,
    "uncertainty_score": 0.016064627267211647,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5448,
    "uncertainty_score": 0.30779547993936507,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5449,
    "uncertainty_score": 0.40000632227891614,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5450,
    "uncertainty_score": 5.063187369419487e-05,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5451,
    "uncertainty_score": 0.20000126255658895,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5452,
    "uncertainty_score": 5.274404254244099e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5453,
    "uncertainty_score": 2.967703088258008e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5454,
    "uncertainty_score": 0.605597940045475,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5455,
    "uncertainty_score": 0.4135464063002851,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5456,
    "uncertainty_score": 0.17044565834517025,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5457,
    "uncertainty_score": 9.907669450731863e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5458,
    "uncertainty_score": 0.49998192900741834,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5459,
    "uncertainty_score": 6.8420601182760545e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5460,
    "uncertainty_score": 0.003271906326894349,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5461,
    "uncertainty_score": 0.2499297646343435,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5462,
    "uncertainty_score": 6.672414121622682e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5463,
    "uncertainty_score": 3.757204192621511e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5464,
    "uncertainty_score": 0.5000029985694433,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5465,
    "uncertainty_score": 0.22429464774740385,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5466,
    "uncertainty_score": 0.000507753125720074,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5467,
    "uncertainty_score": 0.4999999424823756,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5468,
    "uncertainty_score": 0.333409373063042,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5469,
    "uncertainty_score": 0.0020610096493568664,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5470,
    "uncertainty_score": 0.0001274351864552722,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5471,
    "uncertainty_score": 0.49999999975000614,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5472,
    "uncertainty_score": 0.5011055587480837,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5473,
    "uncertainty_score": 1.9482247126148432e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5474,
    "uncertainty_score": 5.3092700704593455e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5475,
    "uncertainty_score": 0.40000054529408774,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5476,
    "uncertainty_score": 0.40536972554025735,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5477,
    "uncertainty_score": 0.25155919173060876,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5478,
    "uncertainty_score": 0.3328381214647877,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5479,
    "uncertainty_score": 0.4128963370944233,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5480,
    "uncertainty_score": 0.2500005830210031,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5481,
    "uncertainty_score": 2.2888618049430803e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5482,
    "uncertainty_score": 0.5015859964718241,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5483,
    "uncertainty_score": 0.21747526756043217,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5484,
    "uncertainty_score": 1.1411760488188072e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5485,
    "uncertainty_score": 2.6453650794188114e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5486,
    "uncertainty_score": 0.2000000017348768,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5487,
    "uncertainty_score": 0.33302216589264383,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5488,
    "uncertainty_score": 1.0496060404871303e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5489,
    "uncertainty_score": 4.169166122841695e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5490,
    "uncertainty_score": 8.75051995050163e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5491,
    "uncertainty_score": 0.2506246110519381,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5492,
    "uncertainty_score": 4.932590641360522e-06,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5493,
    "uncertainty_score": 0.2000001826509649,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5494,
    "uncertainty_score": 4.169164489643999e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5495,
    "uncertainty_score": 0.4000000003020432,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5496,
    "uncertainty_score": 0.19994837730779086,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5497,
    "uncertainty_score": 0.7999989805573496,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5498,
    "uncertainty_score": 2.260935820155333e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5499,
    "uncertainty_score": 1.1188520673128286e-11,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5500,
    "uncertainty_score": 0.25002178424648874,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5501,
    "uncertainty_score": 0.25001397791044694,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5502,
    "uncertainty_score": 1.0809313533321444e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5503,
    "uncertainty_score": 5.363370779976688e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5504,
    "uncertainty_score": 0.16669595551756644,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5505,
    "uncertainty_score": 0.2005655346487047,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5506,
    "uncertainty_score": 0.33333333380324426,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5507,
    "uncertainty_score": 0.3002112880904637,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5508,
    "uncertainty_score": 0.2500000431317269,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5509,
    "uncertainty_score": 6.0140094968327924e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5510,
    "uncertainty_score": 0.0010120623501173964,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5511,
    "uncertainty_score": 0.00028294592124024196,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5512,
    "uncertainty_score": 0.20039048550552266,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5513,
    "uncertainty_score": 0.2519553136115116,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5514,
    "uncertainty_score": 0.18252051870823843,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5515,
    "uncertainty_score": 1.6625610444359135e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5516,
    "uncertainty_score": 0.2759184400101855,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5517,
    "uncertainty_score": 0.025978018519752077,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5518,
    "uncertainty_score": 0.19999979649347127,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5519,
    "uncertainty_score": 0.19997572086050222,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5520,
    "uncertainty_score": 0.5000235302343965,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5521,
    "uncertainty_score": 8.896476785318798e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5522,
    "uncertainty_score": 0.004018470412085637,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5523,
    "uncertainty_score": 1.0388137921045276e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5524,
    "uncertainty_score": 0.24999993083997787,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5525,
    "uncertainty_score": 1.6978027561017192e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5526,
    "uncertainty_score": 0.3333333689809814,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5527,
    "uncertainty_score": 0.25000647608755533,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5528,
    "uncertainty_score": 0.20012268722170296,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5529,
    "uncertainty_score": 0.27552133977573945,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5530,
    "uncertainty_score": 0.19000808580188416,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5531,
    "uncertainty_score": 0.3987934241489123,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5532,
    "uncertainty_score": 0.00033787818073483905,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5533,
    "uncertainty_score": 1.414979288948793e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5534,
    "uncertainty_score": 0.00018756460940146533,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5535,
    "uncertainty_score": 2.0573984079587558e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5536,
    "uncertainty_score": 4.190507658258234e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5537,
    "uncertainty_score": 0.20000000212528263,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5538,
    "uncertainty_score": 8.123147125967528e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5539,
    "uncertainty_score": 0.19671669767810004,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5540,
    "uncertainty_score": 0.20087405885570137,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5541,
    "uncertainty_score": 5.688681030329374e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5542,
    "uncertainty_score": 8.04556768231329e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5543,
    "uncertainty_score": 0.014072939370187934,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5544,
    "uncertainty_score": 0.25000668539026316,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5545,
    "uncertainty_score": 1.3347933304358777e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5546,
    "uncertainty_score": 9.240884121237011e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5547,
    "uncertainty_score": 0.20140062616272644,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5548,
    "uncertainty_score": 0.12386646062155045,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5549,
    "uncertainty_score": 0.027662003474004365,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5550,
    "uncertainty_score": 1.2305659190119848e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5551,
    "uncertainty_score": 0.4000000123193076,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5552,
    "uncertainty_score": 1.0007677292357672e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5553,
    "uncertainty_score": 0.7499998273812194,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5554,
    "uncertainty_score": 1.2411208669568595e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5555,
    "uncertainty_score": 0.20394387083657883,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5556,
    "uncertainty_score": 0.20001001685745182,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5557,
    "uncertainty_score": 0.19996297340482383,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5558,
    "uncertainty_score": 0.1845574368532468,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5559,
    "uncertainty_score": 0.8127281933966776,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5560,
    "uncertainty_score": 2.410425350695353e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5561,
    "uncertainty_score": 0.20018729646720468,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5562,
    "uncertainty_score": 5.856145821816417e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5563,
    "uncertainty_score": 1.615751835569479e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5564,
    "uncertainty_score": 1.57287690847102e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5565,
    "uncertainty_score": 5.766897970215739e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5566,
    "uncertainty_score": 0.25004550929380587,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5567,
    "uncertainty_score": 0.25017927464568646,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5568,
    "uncertainty_score": 0.3371632968448541,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5569,
    "uncertainty_score": 1.586081742701714e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5570,
    "uncertainty_score": 1.5052428747635332e-10,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5571,
    "uncertainty_score": 3.0020329922144513e-11,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5572,
    "uncertainty_score": 8.382729846434358e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5573,
    "uncertainty_score": 5.119939947093953e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5574,
    "uncertainty_score": 3.685387248881058e-11,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5575,
    "uncertainty_score": 9.98312997988803e-12,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5576,
    "uncertainty_score": 7.618150968094955e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5577,
    "uncertainty_score": 0.5000576936790285,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5578,
    "uncertainty_score": 6.075081209454035e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5579,
    "uncertainty_score": 2.8335552445612556e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5580,
    "uncertainty_score": 0.00014962242565152151,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5581,
    "uncertainty_score": 0.2000626798269987,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5582,
    "uncertainty_score": 0.25000003048865954,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5583,
    "uncertainty_score": 0.00020274754614121166,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5584,
    "uncertainty_score": 8.821117516742181e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5585,
    "uncertainty_score": 0.2494078964933767,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5586,
    "uncertainty_score": 0.2500000739204923,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5587,
    "uncertainty_score": 1.0850797695992493e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5588,
    "uncertainty_score": 0.2515099547655272,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5589,
    "uncertainty_score": 0.2000027675355649,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5590,
    "uncertainty_score": 1.0647739760490046e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5591,
    "uncertainty_score": 7.981093052914544e-12,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5592,
    "uncertainty_score": 9.903825316724038e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5593,
    "uncertainty_score": 0.20000057430478524,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5594,
    "uncertainty_score": 0.00013527908983134373,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5595,
    "uncertainty_score": 1.0009591771998426e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5596,
    "uncertainty_score": 0.0003698199317099502,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5597,
    "uncertainty_score": 7.417663291099744e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5598,
    "uncertainty_score": 0.0002290937033122498,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5599,
    "uncertainty_score": 1.9367514550190198e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5600,
    "uncertainty_score": 0.5013512734472311,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5601,
    "uncertainty_score": 2.8979905875850455e-05,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5602,
    "uncertainty_score": 0.25000000000347605,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5603,
    "uncertainty_score": 0.24454002776011313,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5604,
    "uncertainty_score": 9.288628743390445e-12,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5605,
    "uncertainty_score": 0.5000000007659007,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5606,
    "uncertainty_score": 0.4000334949494893,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5607,
    "uncertainty_score": 4.818321793194466e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5608,
    "uncertainty_score": 4.867328444442936e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5609,
    "uncertainty_score": 0.03722052721724655,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5610,
    "uncertainty_score": 7.41942035191785e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5611,
    "uncertainty_score": 3.829873487138885e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5612,
    "uncertainty_score": 9.89977068455202e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5613,
    "uncertainty_score": 0.9987469258596081,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5614,
    "uncertainty_score": 3.0098627519292827e-05,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5615,
    "uncertainty_score": 1.773711915363719e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5616,
    "uncertainty_score": 0.19961469454413344,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5617,
    "uncertainty_score": 1.816452925590556e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5618,
    "uncertainty_score": 2.12824990360044e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5619,
    "uncertainty_score": 0.4004961837255011,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5620,
    "uncertainty_score": 3.4945940960534685e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5621,
    "uncertainty_score": 5.196266079879747e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5622,
    "uncertainty_score": 2.8713635856378415e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5623,
    "uncertainty_score": 2.027044277680183e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5624,
    "uncertainty_score": 0.6666666754642449,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5625,
    "uncertainty_score": 0.00033928392511590615,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5626,
    "uncertainty_score": 3.086785775892817e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5627,
    "uncertainty_score": 0.0003440981565588593,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5628,
    "uncertainty_score": 0.00030165595540948575,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5629,
    "uncertainty_score": 2.6116252857907998e-05,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5630,
    "uncertainty_score": 0.19817487345427734,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5631,
    "uncertainty_score": 0.08068227907599314,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5632,
    "uncertainty_score": 0.006365176846576112,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5633,
    "uncertainty_score": 0.4000000055913633,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5634,
    "uncertainty_score": 0.40000006861105675,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5635,
    "uncertainty_score": 0.25002750919381195,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5636,
    "uncertainty_score": 5.3517837311119287e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5637,
    "uncertainty_score": 0.19999207914955677,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5638,
    "uncertainty_score": 1.6536669465415587e-06,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5639,
    "uncertainty_score": 1.0716846674069693e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5640,
    "uncertainty_score": 2.5064894424256392e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5641,
    "uncertainty_score": 0.0897371893431419,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5642,
    "uncertainty_score": 1.8259869688738966e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5643,
    "uncertainty_score": 0.25041926234243245,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5644,
    "uncertainty_score": 0.5235942090407736,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5645,
    "uncertainty_score": 1.8447255693908864e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5646,
    "uncertainty_score": 1.0361681077250631e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5647,
    "uncertainty_score": 2.5816433601843065e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5648,
    "uncertainty_score": 0.20127162084284098,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5649,
    "uncertainty_score": 0.01672824952125779,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5650,
    "uncertainty_score": 1.21998928113565e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5651,
    "uncertainty_score": 3.524000839177844e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5652,
    "uncertainty_score": 3.621661650946753e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5653,
    "uncertainty_score": 2.2515225108472906e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5654,
    "uncertainty_score": 0.20000002057043975,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5655,
    "uncertainty_score": 0.3333345752148344,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5656,
    "uncertainty_score": 6.078910126815347e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5657,
    "uncertainty_score": 1.1342398984331076e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5658,
    "uncertainty_score": 7.186224290344164e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5659,
    "uncertainty_score": 8.906719267182532e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5660,
    "uncertainty_score": 0.1999999778798427,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5661,
    "uncertainty_score": 7.774879648713477e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5662,
    "uncertainty_score": 0.008105272894853448,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5663,
    "uncertainty_score": 9.155329608598704e-11,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5664,
    "uncertainty_score": 2.0525724007918712e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5665,
    "uncertainty_score": 8.560424822408358e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5666,
    "uncertainty_score": 0.16666666669171046,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5667,
    "uncertainty_score": 0.02189103130559087,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5668,
    "uncertainty_score": 4.4315337244003234e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5669,
    "uncertainty_score": 1.3484502541386564e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5670,
    "uncertainty_score": 0.1666683874633542,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5671,
    "uncertainty_score": 1.6471390532387795e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5672,
    "uncertainty_score": 0.0001412710637694468,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5673,
    "uncertainty_score": 6.81115122299066e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5674,
    "uncertainty_score": 1.1218750925656782e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5675,
    "uncertainty_score": 0.20000000144431113,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5676,
    "uncertainty_score": 0.25076174392689793,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5677,
    "uncertainty_score": 4.7271516363405646e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5678,
    "uncertainty_score": 0.20000008229146987,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5679,
    "uncertainty_score": 0.31858766952143885,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5680,
    "uncertainty_score": 8.037945101189314e-10,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5681,
    "uncertainty_score": 8.048133157849285e-11,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5682,
    "uncertainty_score": 8.089649873482219e-05,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5683,
    "uncertainty_score": 6.350640709980837e-12,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5684,
    "uncertainty_score": 0.16806557568605715,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5685,
    "uncertainty_score": 6.203376515923623e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5686,
    "uncertainty_score": 0.0014220830809483186,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5687,
    "uncertainty_score": 8.024942232119245e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5688,
    "uncertainty_score": 7.455326425116828e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5689,
    "uncertainty_score": 3.510244685724538e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5690,
    "uncertainty_score": 2.0341984412049555e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5691,
    "uncertainty_score": 2.5330683312695697e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5692,
    "uncertainty_score": 0.20014980516594633,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5693,
    "uncertainty_score": 1.1063415414644721e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5694,
    "uncertainty_score": 4.401712540634736e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5695,
    "uncertainty_score": 1.1912618413008505e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5696,
    "uncertainty_score": 0.39680501583603434,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5697,
    "uncertainty_score": 0.40461513384738573,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5698,
    "uncertainty_score": 4.084433785836756e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5699,
    "uncertainty_score": 0.0016734562757851025,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5700,
    "uncertainty_score": 0.20224311764942585,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5701,
    "uncertainty_score": 0.2500000003568023,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5702,
    "uncertainty_score": 2.9378997938305224e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5703,
    "uncertainty_score": 7.6924974434496e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5704,
    "uncertainty_score": 0.19999401413136061,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5705,
    "uncertainty_score": 4.3859841108819456e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5706,
    "uncertainty_score": 0.2000003008497863,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5707,
    "uncertainty_score": 9.64483655579503e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5708,
    "uncertainty_score": 0.2917337094725103,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5709,
    "uncertainty_score": 0.19997697215972418,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5710,
    "uncertainty_score": 1.7656371454131283e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5711,
    "uncertainty_score": 4.69730421215884e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5712,
    "uncertainty_score": 0.19999739885061002,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5713,
    "uncertainty_score": 0.0017221079223674405,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5714,
    "uncertainty_score": 0.3333331617277062,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5715,
    "uncertainty_score": 0.3333333330570984,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5716,
    "uncertainty_score": 4.0995199565622557e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5717,
    "uncertainty_score": 4.2807635906290033e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5718,
    "uncertainty_score": 0.1666674112738786,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5719,
    "uncertainty_score": 0.2764457540846685,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5720,
    "uncertainty_score": 0.21370488461615525,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5721,
    "uncertainty_score": 1.7881670877610762e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5722,
    "uncertainty_score": 0.16666667222618126,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5723,
    "uncertainty_score": 0.5258289443068714,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5724,
    "uncertainty_score": 3.33306855521407e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5725,
    "uncertainty_score": 0.00010592048035063706,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5726,
    "uncertainty_score": 2.2534938950889957e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5727,
    "uncertainty_score": 1.5760608498465528e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5728,
    "uncertainty_score": 4.986852312150523e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5729,
    "uncertainty_score": 6.44951093381675e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5730,
    "uncertainty_score": 1.3006714283930126e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5731,
    "uncertainty_score": 0.2000006116306532,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5732,
    "uncertainty_score": 7.157046508811218e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5733,
    "uncertainty_score": 0.664435715986341,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5734,
    "uncertainty_score": 4.856211103043136e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5735,
    "uncertainty_score": 1.608416203317468e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5736,
    "uncertainty_score": 0.27528136444322293,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5737,
    "uncertainty_score": 1.760887758888878e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5738,
    "uncertainty_score": 2.7896302803908765e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5739,
    "uncertainty_score": 6.070307928435361e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5740,
    "uncertainty_score": 0.0003351883537599593,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5741,
    "uncertainty_score": 1.1924422670605877e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5742,
    "uncertainty_score": 0.25000001113746145,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5743,
    "uncertainty_score": 0.40028207152848444,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5744,
    "uncertainty_score": 5.61881920869973e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5745,
    "uncertainty_score": 0.14285717651301416,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5746,
    "uncertainty_score": 1.20788166359731e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5747,
    "uncertainty_score": 0.3355642832855104,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5748,
    "uncertainty_score": 1.1261845401995965e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5749,
    "uncertainty_score": 7.638644659842815e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5750,
    "uncertainty_score": 3.746093959994721e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5751,
    "uncertainty_score": 0.1684646629946278,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5752,
    "uncertainty_score": 6.973326161385591e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5753,
    "uncertainty_score": 3.4940390518204806e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5754,
    "uncertainty_score": 0.4999421150332591,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5755,
    "uncertainty_score": 0.20083988041274559,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5756,
    "uncertainty_score": 4.7013944805839605e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5757,
    "uncertainty_score": 0.1999147822558955,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5758,
    "uncertainty_score": 0.242962568030992,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5759,
    "uncertainty_score": 0.3104225536829231,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5760,
    "uncertainty_score": 0.9971808473811355,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5761,
    "uncertainty_score": 7.477545592266419e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5762,
    "uncertainty_score": 1.8625848868096425e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5763,
    "uncertainty_score": 1.0594249040863029e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5764,
    "uncertainty_score": 0.19775499040817962,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5765,
    "uncertainty_score": 0.7999999955749547,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5766,
    "uncertainty_score": 6.91458169539302e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5767,
    "uncertainty_score": 1.2127499562961609e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5768,
    "uncertainty_score": 2.7130910600207304e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5769,
    "uncertainty_score": 1.484364010215748e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5770,
    "uncertainty_score": 7.561848857119311e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5771,
    "uncertainty_score": 3.585559156347235e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5772,
    "uncertainty_score": 0.0012069587075640928,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5773,
    "uncertainty_score": 4.5419376629651846e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5774,
    "uncertainty_score": 5.679774890437917e-10,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5775,
    "uncertainty_score": 0.20000283306520367,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5776,
    "uncertainty_score": 4.159899261416807e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5777,
    "uncertainty_score": 9.539729936929503e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5778,
    "uncertainty_score": 0.6665006241759278,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5779,
    "uncertainty_score": 0.19999872409362035,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5780,
    "uncertainty_score": 0.25000004520094704,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5781,
    "uncertainty_score": 4.864671229511207e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5782,
    "uncertainty_score": 0.20004544601903515,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5783,
    "uncertainty_score": 8.963501156176954e-12,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5784,
    "uncertainty_score": 1.0116812749892094e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5785,
    "uncertainty_score": 0.10260370686544536,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5786,
    "uncertainty_score": 0.3205376392648735,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5787,
    "uncertainty_score": 1.4951756246717367e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5788,
    "uncertainty_score": 1.97916282977269e-15,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5789,
    "uncertainty_score": 4.820413021107191e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5790,
    "uncertainty_score": 8.224859014009086e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5791,
    "uncertainty_score": 0.3999999916996,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5792,
    "uncertainty_score": 3.1682745001137356e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5793,
    "uncertainty_score": 0.177526610616546,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5794,
    "uncertainty_score": 7.517090557583973e-14,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5795,
    "uncertainty_score": 5.986473611129078e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5796,
    "uncertainty_score": 1.547107995907617e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5797,
    "uncertainty_score": 7.025689532026645e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5798,
    "uncertainty_score": 0.25005540555751066,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5799,
    "uncertainty_score": 3.4278475581324014e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5800,
    "uncertainty_score": 1.0376663983412896e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5801,
    "uncertainty_score": 0.4012087527619707,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5802,
    "uncertainty_score": 1.7563980210823061e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5803,
    "uncertainty_score": 0.20000000101627635,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5804,
    "uncertainty_score": 9.756507414093376e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5805,
    "uncertainty_score": 4.80599570956318e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5806,
    "uncertainty_score": 1.6935123273621328e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5807,
    "uncertainty_score": 1.2060955876361683e-12,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5808,
    "uncertainty_score": 1.6484408966251037e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5809,
    "uncertainty_score": 3.1271163497699883e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5810,
    "uncertainty_score": 0.22430461459371145,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5811,
    "uncertainty_score": 3.5696223215812396e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5812,
    "uncertainty_score": 2.522530866347079e-11,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5813,
    "uncertainty_score": 0.0004503811612262939,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5814,
    "uncertainty_score": 3.68390707534019e-11,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5815,
    "uncertainty_score": 2.7645261184351132e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5816,
    "uncertainty_score": 0.33333333299998774,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5817,
    "uncertainty_score": 0.00011400890093228559,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5818,
    "uncertainty_score": 1.2734264341099306e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5819,
    "uncertainty_score": 3.405857933122409e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5820,
    "uncertainty_score": 0.40000191081975167,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5821,
    "uncertainty_score": 1.54569291288231e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5822,
    "uncertainty_score": 0.19999664295511843,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5823,
    "uncertainty_score": 1.6705655110157366e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5824,
    "uncertainty_score": 3.0504680268690497e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5825,
    "uncertainty_score": 0.7499972298261406,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5826,
    "uncertainty_score": 4.841240933480393e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5827,
    "uncertainty_score": 4.722064668167704e-06,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5828,
    "uncertainty_score": 1.0827401466492856e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5829,
    "uncertainty_score": 0.20748958626200104,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5830,
    "uncertainty_score": 0.20509026327074847,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5831,
    "uncertainty_score": 0.0004059131955191626,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5832,
    "uncertainty_score": 0.16674152257054345,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5833,
    "uncertainty_score": 4.188001381738951e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5834,
    "uncertainty_score": 9.54879077632336e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5835,
    "uncertainty_score": 9.294110278656068e-12,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5836,
    "uncertainty_score": 0.04150820181865978,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5837,
    "uncertainty_score": 2.693815739036104e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5838,
    "uncertainty_score": 0.2501788699581041,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5839,
    "uncertainty_score": 0.18750033085082035,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5840,
    "uncertainty_score": 0.16666634963545798,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5841,
    "uncertainty_score": 0.2499999999266598,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5842,
    "uncertainty_score": 0.0017620426688652216,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5843,
    "uncertainty_score": 0.19999450918183825,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5844,
    "uncertainty_score": 0.0907195320098534,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5845,
    "uncertainty_score": 0.3578077413996477,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5846,
    "uncertainty_score": 0.500000056137028,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5847,
    "uncertainty_score": 1.6611413942877352e-10,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5848,
    "uncertainty_score": 0.2500250056729249,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5849,
    "uncertainty_score": 0.24999999977797213,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5850,
    "uncertainty_score": 3.377359616148919e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5851,
    "uncertainty_score": 6.464236021652454e-11,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5852,
    "uncertainty_score": 2.109531629387768e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5853,
    "uncertainty_score": 0.16667042360918552,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5854,
    "uncertainty_score": 1.4858204598247815e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5855,
    "uncertainty_score": 0.002665146957295892,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5856,
    "uncertainty_score": 0.0032719916403547342,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5857,
    "uncertainty_score": 1.4294845658054929e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5858,
    "uncertainty_score": 0.18248723122303695,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5859,
    "uncertainty_score": 1.6133878465924267e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5860,
    "uncertainty_score": 0.020697317694204652,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5861,
    "uncertainty_score": 5.321096663582714e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5862,
    "uncertainty_score": 1.6934823577985253e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5863,
    "uncertainty_score": 0.15340489691786804,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5864,
    "uncertainty_score": 6.776701932526406e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5865,
    "uncertainty_score": 8.394979015701516e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5866,
    "uncertainty_score": 7.647983148938613e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5867,
    "uncertainty_score": 3.882239683209212e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5868,
    "uncertainty_score": 6.521633896604954e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5869,
    "uncertainty_score": 0.0003910842995478349,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5870,
    "uncertainty_score": 0.4877855566732032,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5871,
    "uncertainty_score": 0.027681765422461164,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5872,
    "uncertainty_score": 0.0007688740544376084,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5873,
    "uncertainty_score": 4.972876777915393e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5874,
    "uncertainty_score": 0.2435681984519264,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5875,
    "uncertainty_score": 3.413571846416347e-12,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5876,
    "uncertainty_score": 0.25043454380100544,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5877,
    "uncertainty_score": 0.2500000032025866,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5878,
    "uncertainty_score": 0.0024181276560647515,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5879,
    "uncertainty_score": 2.707831379888179e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5880,
    "uncertainty_score": 0.010521968691818198,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5881,
    "uncertainty_score": 0.3333323270297222,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5882,
    "uncertainty_score": 0.5004572851413298,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5883,
    "uncertainty_score": 2.9979001904378194e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5884,
    "uncertainty_score": 1.5925602378169316e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5885,
    "uncertainty_score": 1.3336582619051864e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5886,
    "uncertainty_score": 0.18973289011869948,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5887,
    "uncertainty_score": 4.609500664170813e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5888,
    "uncertainty_score": 5.787427490126447e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5889,
    "uncertainty_score": 0.0005073853137537144,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5890,
    "uncertainty_score": 7.35147114947459e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5891,
    "uncertainty_score": 0.40000585761918933,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5892,
    "uncertainty_score": 0.00015108128053038154,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5893,
    "uncertainty_score": 0.4062287675826929,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5894,
    "uncertainty_score": 0.2500000000226491,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5895,
    "uncertainty_score": 1.1402119862561908e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5896,
    "uncertainty_score": 0.4000000032919127,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5897,
    "uncertainty_score": 4.8382734063719504e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5898,
    "uncertainty_score": 9.614183768829971e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5899,
    "uncertainty_score": 1.0229868519074818e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5900,
    "uncertainty_score": 0.006047253455558811,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5901,
    "uncertainty_score": 1.521662237366491e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5902,
    "uncertainty_score": 0.20000015567516752,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5903,
    "uncertainty_score": 0.499999999746528,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5904,
    "uncertainty_score": 2.9039381710678104e-06,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5905,
    "uncertainty_score": 0.19958306576210477,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5906,
    "uncertainty_score": 0.04671230048419415,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5907,
    "uncertainty_score": 0.6643172849107356,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5908,
    "uncertainty_score": 0.008738417397307501,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5909,
    "uncertainty_score": 5.625719839136208e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5910,
    "uncertainty_score": 3.486690471812714e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5911,
    "uncertainty_score": 7.797328535500052e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5912,
    "uncertainty_score": 1.6550641839681309e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5913,
    "uncertainty_score": 6.852368115305828e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5914,
    "uncertainty_score": 0.40061780834387994,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5915,
    "uncertainty_score": 7.627011408758151e-11,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5916,
    "uncertainty_score": 4.307297161816298e-10,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5917,
    "uncertainty_score": 5.978407987187108e-11,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5918,
    "uncertainty_score": 0.20000115861923784,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5919,
    "uncertainty_score": 1.2265256831466477e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5920,
    "uncertainty_score": 0.2600090995898786,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5921,
    "uncertainty_score": 0.00012077901572332353,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5922,
    "uncertainty_score": 0.0020236934133500677,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5923,
    "uncertainty_score": 4.992161562803302e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5924,
    "uncertainty_score": 0.20000119103284758,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5925,
    "uncertainty_score": 0.2000000005536225,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5926,
    "uncertainty_score": 0.00033825550748182754,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5927,
    "uncertainty_score": 0.14366788150538087,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5928,
    "uncertainty_score": 6.125973011817562e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5929,
    "uncertainty_score": 8.021287537012826e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5930,
    "uncertainty_score": 1.908024647674996e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5931,
    "uncertainty_score": 3.555885802808546e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5932,
    "uncertainty_score": 0.0002465546098961621,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5933,
    "uncertainty_score": 1.196635136482128e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5934,
    "uncertainty_score": 1.9139494115388108e-13,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5935,
    "uncertainty_score": 9.386187590648168e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5936,
    "uncertainty_score": 0.39999784531105026,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5937,
    "uncertainty_score": 0.20041816366710932,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5938,
    "uncertainty_score": 4.5340939143940967e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5939,
    "uncertainty_score": 7.466159409847982e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5940,
    "uncertainty_score": 2.020348638260469e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5941,
    "uncertainty_score": 0.4147131315068666,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5942,
    "uncertainty_score": 6.738498873550396e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5943,
    "uncertainty_score": 3.278883438005177e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5944,
    "uncertainty_score": 2.742970620815098e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5945,
    "uncertainty_score": 5.196292797912083e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5946,
    "uncertainty_score": 3.0127170218356226e-12,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5947,
    "uncertainty_score": 0.25000000112071635,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5948,
    "uncertainty_score": 0.00011229698886348399,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5949,
    "uncertainty_score": 0.00018611312112271883,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5950,
    "uncertainty_score": 8.805082148779376e-11,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5951,
    "uncertainty_score": 1.8624472046219502e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5952,
    "uncertainty_score": 1.3720021789414113e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5953,
    "uncertainty_score": 0.1667094945409102,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5954,
    "uncertainty_score": 0.20000630570794192,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5955,
    "uncertainty_score": 0.0032719103011538066,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5956,
    "uncertainty_score": 2.7732061385640272e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5957,
    "uncertainty_score": 5.342480764365027e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5958,
    "uncertainty_score": 0.20003694782740258,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5959,
    "uncertainty_score": 0.4000018065025694,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5960,
    "uncertainty_score": 2.475568901650696e-06,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5961,
    "uncertainty_score": 2.8828005075883707e-13,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5962,
    "uncertainty_score": 1.229529741051293e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5963,
    "uncertainty_score": 1.354914271563894e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5964,
    "uncertainty_score": 1.6053188414654132e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5965,
    "uncertainty_score": 3.948031153260222e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5966,
    "uncertainty_score": 1.1739328469559663e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5967,
    "uncertainty_score": 6.960344782481511e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5968,
    "uncertainty_score": 0.20000000123874231,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5969,
    "uncertainty_score": 2.4840212273465013e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5970,
    "uncertainty_score": 0.33333333398558457,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5971,
    "uncertainty_score": 3.342118501991189e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5972,
    "uncertainty_score": 1.200022627337935e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5973,
    "uncertainty_score": 0.04505590512402017,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5974,
    "uncertainty_score": 0.13027098828923123,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5975,
    "uncertainty_score": 0.000332661967840903,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5976,
    "uncertainty_score": 0.2500000082919964,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5977,
    "uncertainty_score": 5.7669760160901135e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5978,
    "uncertainty_score": 6.194576108728708e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5979,
    "uncertainty_score": 2.31511128090404e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5980,
    "uncertainty_score": 8.299231471239083e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5981,
    "uncertainty_score": 1.715853362252877e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5982,
    "uncertainty_score": 4.0611540662660574e-12,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 5983,
    "uncertainty_score": 4.396216461513529e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5984,
    "uncertainty_score": 0.24999926032688063,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5985,
    "uncertainty_score": 1.1903504058867644e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5986,
    "uncertainty_score": 0.13616588630584409,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 5987,
    "uncertainty_score": 1.5394115520213145e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 5988,
    "uncertainty_score": 0.6667067964601093,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 5989,
    "uncertainty_score": 0.14580123247845234,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5990,
    "uncertainty_score": 3.897577682818781e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5991,
    "uncertainty_score": 5.099244595702065e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 5992,
    "uncertainty_score": 3.175983049787053e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 5993,
    "uncertainty_score": 5.801380260858831e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5994,
    "uncertainty_score": 1.8613410713752175e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5995,
    "uncertainty_score": 8.982422476423668e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 5996,
    "uncertainty_score": 0.33340937306111407,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 5997,
    "uncertainty_score": 0.024283637800086556,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5998,
    "uncertainty_score": 0.0016266149958108888,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 5999,
    "uncertainty_score": 6.5824437583084525e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6000,
    "uncertainty_score": 8.564331630695512e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6001,
    "uncertainty_score": 0.00037612935610748037,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6002,
    "uncertainty_score": 0.20000075935861278,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6003,
    "uncertainty_score": 4.158089531610227e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6004,
    "uncertainty_score": 0.33531695061672484,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6005,
    "uncertainty_score": 3.215556319467994e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6006,
    "uncertainty_score": 0.00015342931326206208,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6007,
    "uncertainty_score": 1.6793963098756057e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6008,
    "uncertainty_score": 8.043726769170253e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6009,
    "uncertainty_score": 1.2666079899743954e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6010,
    "uncertainty_score": 5.2915269010711106e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6011,
    "uncertainty_score": 1.1877741078096898e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6012,
    "uncertainty_score": 2.3608293638479203e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6013,
    "uncertainty_score": 1.7234942310620103e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6014,
    "uncertainty_score": 1.5467370765722088e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6015,
    "uncertainty_score": 0.24969821631898748,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6016,
    "uncertainty_score": 6.882495345591467e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6017,
    "uncertainty_score": 1.4860412190712873e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6018,
    "uncertainty_score": 0.33356024331386097,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6019,
    "uncertainty_score": 6.790015586235114e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6020,
    "uncertainty_score": 0.20000000631993925,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6021,
    "uncertainty_score": 6.010913244280156e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6022,
    "uncertainty_score": 0.0001434230602992117,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6023,
    "uncertainty_score": 5.427293009057903e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6024,
    "uncertainty_score": 0.24999885229378696,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6025,
    "uncertainty_score": 0.2000000304453693,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6026,
    "uncertainty_score": 1.101181709288214e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6027,
    "uncertainty_score": 3.126626042769175e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6028,
    "uncertainty_score": 0.39939390494380433,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6029,
    "uncertainty_score": 0.0026155708426109777,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6030,
    "uncertainty_score": 7.32073777014616e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6031,
    "uncertainty_score": 0.20000000075722507,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6032,
    "uncertainty_score": 0.4000353903379639,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6033,
    "uncertainty_score": 8.890820309032193e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6034,
    "uncertainty_score": 1.4085121321407252e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6035,
    "uncertainty_score": 0.2498192316801961,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6036,
    "uncertainty_score": 0.00010497444585718947,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6037,
    "uncertainty_score": 0.4000046085518288,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6038,
    "uncertainty_score": 5.383918182483401e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6039,
    "uncertainty_score": 6.220119988234519e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6040,
    "uncertainty_score": 4.151198686576136e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6041,
    "uncertainty_score": 0.2500113730178336,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6042,
    "uncertainty_score": 0.00013819467663593937,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6043,
    "uncertainty_score": 4.739905170061344e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6044,
    "uncertainty_score": 0.36856736693265724,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6045,
    "uncertainty_score": 2.30205110322139e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6046,
    "uncertainty_score": 3.3480544026645427e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6047,
    "uncertainty_score": 0.0005470794669044333,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6048,
    "uncertainty_score": 4.030406705083217e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6049,
    "uncertainty_score": 0.001432561625284544,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6050,
    "uncertainty_score": 0.2000003416120928,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6051,
    "uncertainty_score": 0.004349138837827328,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6052,
    "uncertainty_score": 1.8081116215368938e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6053,
    "uncertainty_score": 0.40002773335276476,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6054,
    "uncertainty_score": 0.6666666674291499,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6055,
    "uncertainty_score": 7.624833010263958e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6056,
    "uncertainty_score": 2.5797056113042343e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6057,
    "uncertainty_score": 1.218437723873942e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6058,
    "uncertainty_score": 0.00017910660604463603,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6059,
    "uncertainty_score": 0.3892137438644414,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6060,
    "uncertainty_score": 1.2926760328145122e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6061,
    "uncertainty_score": 1.6293825337819777e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6062,
    "uncertainty_score": 1.5954518882333745e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6063,
    "uncertainty_score": 2.9631968588221375e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6064,
    "uncertainty_score": 4.967469604946879e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6065,
    "uncertainty_score": 0.33348295576103754,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6066,
    "uncertainty_score": 0.33359888978605495,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6067,
    "uncertainty_score": 0.16822637715725136,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6068,
    "uncertainty_score": 9.919979258686782e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6069,
    "uncertainty_score": 0.24426482098569716,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6070,
    "uncertainty_score": 1.2012041332590293e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6071,
    "uncertainty_score": 0.0010332663663490658,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6072,
    "uncertainty_score": 0.3333325148790213,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6073,
    "uncertainty_score": 6.73439902145248e-12,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6074,
    "uncertainty_score": 0.19999969232442305,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6075,
    "uncertainty_score": 9.505072138493696e-13,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6076,
    "uncertainty_score": 7.709989649660064e-05,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6077,
    "uncertainty_score": 5.585725006828584e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6078,
    "uncertainty_score": 0.5000163439048964,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6079,
    "uncertainty_score": 9.307080029514238e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6080,
    "uncertainty_score": 0.2500053010615291,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6081,
    "uncertainty_score": 0.2000001470909841,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6082,
    "uncertainty_score": 0.16498048389296252,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6083,
    "uncertainty_score": 0.1027491315160652,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6084,
    "uncertainty_score": 0.206974305567315,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6085,
    "uncertainty_score": 0.4994908283695749,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6086,
    "uncertainty_score": 0.008847625050571283,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6087,
    "uncertainty_score": 4.13933253391226e-05,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6088,
    "uncertainty_score": 0.14164860704595467,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6089,
    "uncertainty_score": 6.158437040506542e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6090,
    "uncertainty_score": 3.8024646028559104e-06,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6091,
    "uncertainty_score": 0.0034521632337849856,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6092,
    "uncertainty_score": 0.40000171149941205,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6093,
    "uncertainty_score": 6.091318787995711e-11,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6094,
    "uncertainty_score": 0.4000000013624934,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6095,
    "uncertainty_score": 0.27805342854266346,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6096,
    "uncertainty_score": 6.759124237690173e-11,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6097,
    "uncertainty_score": 3.556067830575015e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6098,
    "uncertainty_score": 3.142330684384184e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6099,
    "uncertainty_score": 1.59651764482016e-13,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6100,
    "uncertainty_score": 6.856070540187169e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6101,
    "uncertainty_score": 1.0107100226777583e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6102,
    "uncertainty_score": 2.6266515124466555e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6103,
    "uncertainty_score": 6.158824859814864e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6104,
    "uncertainty_score": 5.1730552911212936e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6105,
    "uncertainty_score": 0.1999999246211793,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6106,
    "uncertainty_score": 2.3168508488637176e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6107,
    "uncertainty_score": 0.20000000064542672,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6108,
    "uncertainty_score": 3.8076878810141416e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6109,
    "uncertainty_score": 0.2500102484224158,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6110,
    "uncertainty_score": 1.5575071282567278e-13,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6111,
    "uncertainty_score": 0.2500000042761731,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6112,
    "uncertainty_score": 4.741817796815146e-13,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6113,
    "uncertainty_score": 5.678781015114362e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6114,
    "uncertainty_score": 0.00013614543778492298,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6115,
    "uncertainty_score": 8.650006323560064e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6116,
    "uncertainty_score": 7.314206046197279e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6117,
    "uncertainty_score": 1.7161408482020766e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6118,
    "uncertainty_score": 0.20010152121070898,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6119,
    "uncertainty_score": 5.3271676516788597e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6120,
    "uncertainty_score": 1.0464543204993603e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6121,
    "uncertainty_score": 1.1595974552121905e-06,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6122,
    "uncertainty_score": 1.3486831417928742e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6123,
    "uncertainty_score": 1.3190188944356144e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6124,
    "uncertainty_score": 3.3265945917750225e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6125,
    "uncertainty_score": 9.26183425973636e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6126,
    "uncertainty_score": 0.00019410557209109108,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6127,
    "uncertainty_score": 5.667240991950293e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6128,
    "uncertainty_score": 0.23598213544087013,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6129,
    "uncertainty_score": 0.6003534933351226,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6130,
    "uncertainty_score": 7.376565127501455e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6131,
    "uncertainty_score": 0.3333349447550593,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6132,
    "uncertainty_score": 0.799917032352861,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6133,
    "uncertainty_score": 7.468391339057768e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6134,
    "uncertainty_score": 1.5818133331829603e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6135,
    "uncertainty_score": 0.20000001221802305,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6136,
    "uncertainty_score": 0.2499999827141602,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6137,
    "uncertainty_score": 7.496028051347911e-10,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6138,
    "uncertainty_score": 0.33333308474871093,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6139,
    "uncertainty_score": 1.85049574271232e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6140,
    "uncertainty_score": 0.25000047828897065,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6141,
    "uncertainty_score": 4.21651982650957e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6142,
    "uncertainty_score": 0.25000007285529685,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6143,
    "uncertainty_score": 1.1399696625407867e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6144,
    "uncertainty_score": 5.985791613187422e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6145,
    "uncertainty_score": 4.005000270210601e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6146,
    "uncertainty_score": 0.25000171038651003,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6147,
    "uncertainty_score": 0.20422320796334997,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6148,
    "uncertainty_score": 0.3077966425721362,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6149,
    "uncertainty_score": 1.9900131457568002e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6150,
    "uncertainty_score": 4.729043659701621e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6151,
    "uncertainty_score": 0.2500000315832692,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6152,
    "uncertainty_score": 0.0008610549970652005,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6153,
    "uncertainty_score": 1.2850610562329279e-11,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6154,
    "uncertainty_score": 0.6599585288145786,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6155,
    "uncertainty_score": 2.103481496068619e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6156,
    "uncertainty_score": 0.20000000598198603,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6157,
    "uncertainty_score": 0.00012590098754868638,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6158,
    "uncertainty_score": 2.8310100494858064e-12,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6159,
    "uncertainty_score": 1.1848504626500607e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6160,
    "uncertainty_score": 0.2500163417319986,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6161,
    "uncertainty_score": 6.401810832550134e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6162,
    "uncertainty_score": 9.990086379882611e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6163,
    "uncertainty_score": 2.9078423765194833e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6164,
    "uncertainty_score": 4.828137500378491e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6165,
    "uncertainty_score": 0.00494612385056018,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6166,
    "uncertainty_score": 2.6880822665638674e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6167,
    "uncertainty_score": 3.1533417102271717e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6168,
    "uncertainty_score": 3.678395817396786e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6169,
    "uncertainty_score": 2.4603586772461563e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6170,
    "uncertainty_score": 0.00022076696709271603,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6171,
    "uncertainty_score": 3.0529129761498786e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6172,
    "uncertainty_score": 1.4505736382406998e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6173,
    "uncertainty_score": 4.8903998380052815e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6174,
    "uncertainty_score": 2.405250230093752e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6175,
    "uncertainty_score": 1.683785661548352e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6176,
    "uncertainty_score": 0.2857175661440205,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6177,
    "uncertainty_score": 6.074560060842507e-12,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6178,
    "uncertainty_score": 7.685339054105389e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6179,
    "uncertainty_score": 7.757520973924765e-10,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6180,
    "uncertainty_score": 1.168132352454315e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6181,
    "uncertainty_score": 0.6667014838327484,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6182,
    "uncertainty_score": 0.2000000009884459,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6183,
    "uncertainty_score": 2.1442849181433532e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6184,
    "uncertainty_score": 1.2844079326895313e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6185,
    "uncertainty_score": 0.4998567796282387,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6186,
    "uncertainty_score": 6.892733354151468e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6187,
    "uncertainty_score": 4.445012686254511e-11,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6188,
    "uncertainty_score": 1.088443472510341e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6189,
    "uncertainty_score": 2.1825793571218044e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6190,
    "uncertainty_score": 0.20024661005943173,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6191,
    "uncertainty_score": 0.11111111116181914,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6192,
    "uncertainty_score": 0.1938114137072658,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6193,
    "uncertainty_score": 0.0004997372664231342,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6194,
    "uncertainty_score": 6.331165351149021e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6195,
    "uncertainty_score": 0.48627459122879135,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6196,
    "uncertainty_score": 7.852423485808785e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6197,
    "uncertainty_score": 2.865762596999488e-11,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6198,
    "uncertainty_score": 5.325135608801511e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6199,
    "uncertainty_score": 0.20000684424233342,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6200,
    "uncertainty_score": 5.353278440650838e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6201,
    "uncertainty_score": 0.5999366249144302,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6202,
    "uncertainty_score": 1.7416419217082135e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6203,
    "uncertainty_score": 5.534329471291786e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6204,
    "uncertainty_score": 7.882164388010452e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6205,
    "uncertainty_score": 0.250188851403594,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6206,
    "uncertainty_score": 0.2541987766823287,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6207,
    "uncertainty_score": 0.33394760970287535,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6208,
    "uncertainty_score": 1.9350399438917705e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6209,
    "uncertainty_score": 0.1666647148145816,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6210,
    "uncertainty_score": 4.485988517515334e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6211,
    "uncertainty_score": 3.536496864650781e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6212,
    "uncertainty_score": 2.7179590273421723e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6213,
    "uncertainty_score": 1.7760612085688855e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6214,
    "uncertainty_score": 1.1531250968928542e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6215,
    "uncertainty_score": 8.494019118002243e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6216,
    "uncertainty_score": 0.20058402466625042,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6217,
    "uncertainty_score": 1.048544692689272e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6218,
    "uncertainty_score": 2.8375311179271818e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6219,
    "uncertainty_score": 0.20000008741737557,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6220,
    "uncertainty_score": 0.019605053465534643,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6221,
    "uncertainty_score": 2.2256311726489598e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6222,
    "uncertainty_score": 0.20000001170691323,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6223,
    "uncertainty_score": 0.6666458906226055,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6224,
    "uncertainty_score": 1.118519696284808e-11,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6225,
    "uncertainty_score": 0.6519167751439574,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6226,
    "uncertainty_score": 2.848325614199986e-11,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6227,
    "uncertainty_score": 0.1162235792224589,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6228,
    "uncertainty_score": 1.216654027836845e-15,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6229,
    "uncertainty_score": 3.7016112781493927e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6230,
    "uncertainty_score": 0.33334769774610873,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6231,
    "uncertainty_score": 4.179317904559064e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6232,
    "uncertainty_score": 0.2500008269778102,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6233,
    "uncertainty_score": 0.00016160977326090025,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6234,
    "uncertainty_score": 2.240513483353742e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6235,
    "uncertainty_score": 1.8517912051585376e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6236,
    "uncertainty_score": 1.8318680169496444e-11,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6237,
    "uncertainty_score": 4.675227028670352e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6238,
    "uncertainty_score": 1.516997656329423e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6239,
    "uncertainty_score": 0.20000000000015977,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6240,
    "uncertainty_score": 0.3333332779467762,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6241,
    "uncertainty_score": 0.00148451115301436,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6242,
    "uncertainty_score": 2.875540519512947e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6243,
    "uncertainty_score": 0.24999999976235326,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6244,
    "uncertainty_score": 3.578988426300131e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6245,
    "uncertainty_score": 0.5999972198252506,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6246,
    "uncertainty_score": 2.5079017728642476e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6247,
    "uncertainty_score": 6.255174230485398e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6248,
    "uncertainty_score": 1.0250251575432625e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6249,
    "uncertainty_score": 0.20214805707657518,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6250,
    "uncertainty_score": 2.2663954927276093e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6251,
    "uncertainty_score": 7.803064092800942e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6252,
    "uncertainty_score": 7.444329545251823e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6253,
    "uncertainty_score": 0.24993671068068393,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6254,
    "uncertainty_score": 3.6143605542250503e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6255,
    "uncertainty_score": 4.805138552936129e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6256,
    "uncertainty_score": 4.3019676052516596e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6257,
    "uncertainty_score": 3.738841209857219e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6258,
    "uncertainty_score": 0.199999999799999,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6259,
    "uncertainty_score": 2.202481181659835e-10,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6260,
    "uncertainty_score": 0.18482837546197645,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6261,
    "uncertainty_score": 0.21675894476131963,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6262,
    "uncertainty_score": 3.6890920364499495e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6263,
    "uncertainty_score": 0.0,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6264,
    "uncertainty_score": 0.24999999814863036,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6265,
    "uncertainty_score": 4.124783836397612e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6266,
    "uncertainty_score": 4.535961856086878e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6267,
    "uncertainty_score": 0.33412398611484284,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6268,
    "uncertainty_score": 0.20000173787701722,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6269,
    "uncertainty_score": 1.51324727873284e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6270,
    "uncertainty_score": 0.014965728321173289,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6271,
    "uncertainty_score": 6.067079482379009e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6272,
    "uncertainty_score": 0.0005145887474858133,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6273,
    "uncertainty_score": 8.384348264066231e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6274,
    "uncertainty_score": 5.180804160476424e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6275,
    "uncertainty_score": 3.761275278578803e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6276,
    "uncertainty_score": 1.6929301525290132e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6277,
    "uncertainty_score": 0.2500002579667853,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6278,
    "uncertainty_score": 4.222666341762157e-11,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6279,
    "uncertainty_score": 1.908956923344828e-11,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6280,
    "uncertainty_score": 1.932903144931306e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6281,
    "uncertainty_score": 0.2500000000562838,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6282,
    "uncertainty_score": 2.71204763036726e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6283,
    "uncertainty_score": 1.8869793778336767e-06,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6284,
    "uncertainty_score": 3.168757918318087e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6285,
    "uncertainty_score": 0.27527668460528165,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6286,
    "uncertainty_score": 1.4933801608707135e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6287,
    "uncertainty_score": 6.71202580303726e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6288,
    "uncertainty_score": 0.20000673150338838,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6289,
    "uncertainty_score": 0.10247798885951341,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6290,
    "uncertainty_score": 0.0031224290698086,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6291,
    "uncertainty_score": 6.481140961553708e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6292,
    "uncertainty_score": 2.3227820049169844e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6293,
    "uncertainty_score": 0.11202612378096696,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6294,
    "uncertainty_score": 1.5147276474389582e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6295,
    "uncertainty_score": 0.25188475963569684,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6296,
    "uncertainty_score": 2.881443927640161e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6297,
    "uncertainty_score": 0.7498988673545257,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6298,
    "uncertainty_score": 0.00015387665686641933,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6299,
    "uncertainty_score": 1.910545023268283e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6300,
    "uncertainty_score": 4.265527077687462e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6301,
    "uncertainty_score": 1.4320964399705508e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6302,
    "uncertainty_score": 1.451094117352096e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6303,
    "uncertainty_score": 0.2373592328335163,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6304,
    "uncertainty_score": 0.00013186721489743947,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6305,
    "uncertainty_score": 6.235472019714771e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6306,
    "uncertainty_score": 3.9241749088287977e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6307,
    "uncertainty_score": 9.747900969592091e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6308,
    "uncertainty_score": 9.997207784275955e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6309,
    "uncertainty_score": 1.6711245125898159e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6310,
    "uncertainty_score": 6.198183318503094e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6311,
    "uncertainty_score": 0.3333333330000107,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6312,
    "uncertainty_score": 0.2500000019404734,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6313,
    "uncertainty_score": 0.19999922559144806,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6314,
    "uncertainty_score": 0.24734269702888925,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6315,
    "uncertainty_score": 1.6420291624138114e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6316,
    "uncertainty_score": 4.140204907909691e-11,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6317,
    "uncertainty_score": 0.6663042128361952,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6318,
    "uncertainty_score": 0.054421357393140565,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6319,
    "uncertainty_score": 0.25000001375743963,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6320,
    "uncertainty_score": 0.0670819534125387,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6321,
    "uncertainty_score": 0.2009810444388374,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6322,
    "uncertainty_score": 7.099750511897756e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6323,
    "uncertainty_score": 1.347323923830179e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6324,
    "uncertainty_score": 2.01278399995588e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6325,
    "uncertainty_score": 0.33333334049257113,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6326,
    "uncertainty_score": 0.4282283725752261,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6327,
    "uncertainty_score": 2.0617393642041913e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6328,
    "uncertainty_score": 5.016045901754373e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6329,
    "uncertainty_score": 3.093687903267791e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6330,
    "uncertainty_score": 5.815155755012524e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6331,
    "uncertainty_score": 0.005968814958325159,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6332,
    "uncertainty_score": 2.5728726980977033e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6333,
    "uncertainty_score": 0.00045733770794705833,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6334,
    "uncertainty_score": 0.00015125575140052472,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6335,
    "uncertainty_score": 0.0005788400323630789,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6336,
    "uncertainty_score": 9.662854726169304e-15,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6337,
    "uncertainty_score": 5.320488734317415e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6338,
    "uncertainty_score": 0.36923344809901115,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6339,
    "uncertainty_score": 0.2000001143000926,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6340,
    "uncertainty_score": 0.2500000368856762,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6341,
    "uncertainty_score": 0.2027334939893441,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6342,
    "uncertainty_score": 0.37458520280412405,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6343,
    "uncertainty_score": 5.888857337628287e-14,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6344,
    "uncertainty_score": 1.061642188105514e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6345,
    "uncertainty_score": 0.2505344510972525,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6346,
    "uncertainty_score": 0.19407800011858772,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6347,
    "uncertainty_score": 1.9749636072167566e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6348,
    "uncertainty_score": 1.0833713383184306e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6349,
    "uncertainty_score": 4.0150372207772575e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6350,
    "uncertainty_score": 8.100280611606167e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6351,
    "uncertainty_score": 0.33258271865317207,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6352,
    "uncertainty_score": 0.08708926648925955,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6353,
    "uncertainty_score": 0.16666666650000342,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6354,
    "uncertainty_score": 1.9203003596755534e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6355,
    "uncertainty_score": 0.0007189129335525375,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6356,
    "uncertainty_score": 0.2000000050245221,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6357,
    "uncertainty_score": 4.075109658628615e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6358,
    "uncertainty_score": 2.5784915380764125e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6359,
    "uncertainty_score": 3.1076856905620815e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6360,
    "uncertainty_score": 1.510095410641299e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6361,
    "uncertainty_score": 3.0251234877739056e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6362,
    "uncertainty_score": 0.2508098165955839,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6363,
    "uncertainty_score": 0.14348605987221222,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6364,
    "uncertainty_score": 0.00011747731233835632,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6365,
    "uncertainty_score": 3.109110695075454e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6366,
    "uncertainty_score": 0.018146250415568332,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6367,
    "uncertainty_score": 3.964746688135223e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6368,
    "uncertainty_score": 2.208744317563495e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6369,
    "uncertainty_score": 0.004991710999695345,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6370,
    "uncertainty_score": 1.423587277833219e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6371,
    "uncertainty_score": 7.232233389426424e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6372,
    "uncertainty_score": 0.13027097447502997,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6373,
    "uncertainty_score": 0.1999999988514646,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6374,
    "uncertainty_score": 0.2500001853899224,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6375,
    "uncertainty_score": 0.2011460492278892,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6376,
    "uncertainty_score": 1.330335932970414e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6377,
    "uncertainty_score": 0.2000000430888967,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6378,
    "uncertainty_score": 0.2501122169173684,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6379,
    "uncertainty_score": 0.25000140474231697,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6380,
    "uncertainty_score": 2.1026510197457038e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6381,
    "uncertainty_score": 4.838270587456256e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6382,
    "uncertainty_score": 0.20019652388476455,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6383,
    "uncertainty_score": 6.086375500407697e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6384,
    "uncertainty_score": 0.017382845738609057,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6385,
    "uncertainty_score": 4.064358953163583e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6386,
    "uncertainty_score": 4.0393165424473284e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6387,
    "uncertainty_score": 0.07728193087205561,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6388,
    "uncertainty_score": 0.16706199023496338,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6389,
    "uncertainty_score": 0.25013823536930824,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6390,
    "uncertainty_score": 0.40003894979485316,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6391,
    "uncertainty_score": 2.447231594090641e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6392,
    "uncertainty_score": 1.814426093004315e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6393,
    "uncertainty_score": 5.803041301891674e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6394,
    "uncertainty_score": 0.3318594718823032,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6395,
    "uncertainty_score": 0.6664397397267865,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6396,
    "uncertainty_score": 1.1801927562507552e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6397,
    "uncertainty_score": 0.39912940124019786,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6398,
    "uncertainty_score": 0.15175384814885162,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6399,
    "uncertainty_score": 1.9824411808078912e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6400,
    "uncertainty_score": 5.749032353176613e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6401,
    "uncertainty_score": 0.25013968344313353,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6402,
    "uncertainty_score": 2.8079513686355017e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6403,
    "uncertainty_score": 4.231898112344891e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6404,
    "uncertainty_score": 1.9033502332400844e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6405,
    "uncertainty_score": 0.2857144390023243,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6406,
    "uncertainty_score": 2.5294712005652755e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6407,
    "uncertainty_score": 0.3266602786090766,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6408,
    "uncertainty_score": 0.49996844811075036,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6409,
    "uncertainty_score": 0.0002535063634296447,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6410,
    "uncertainty_score": 1.6563823266655673e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6411,
    "uncertainty_score": 6.047088390782088e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6412,
    "uncertainty_score": 0.20000005010019492,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6413,
    "uncertainty_score": 5.253454071352047e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6414,
    "uncertainty_score": 7.406875989574703e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6415,
    "uncertainty_score": 8.059382041641356e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6416,
    "uncertainty_score": 3.4009304083073443e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6417,
    "uncertainty_score": 0.2500314761207003,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6418,
    "uncertainty_score": 6.382676764770519e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6419,
    "uncertainty_score": 0.24836139452775483,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6420,
    "uncertainty_score": 0.14285722436514622,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6421,
    "uncertainty_score": 5.843700820279199e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6422,
    "uncertainty_score": 8.100111670314389e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6423,
    "uncertainty_score": 1.7160302315916087e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6424,
    "uncertainty_score": 0.2014096350074619,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6425,
    "uncertainty_score": 1.808819003350546e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6426,
    "uncertainty_score": 5.7949906293655685e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6427,
    "uncertainty_score": 4.684267217680776e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6428,
    "uncertainty_score": 6.961383211718306e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6429,
    "uncertainty_score": 1.541216383763977e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6430,
    "uncertainty_score": 0.2500001709158677,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6431,
    "uncertainty_score": 1.4461104852752837e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6432,
    "uncertainty_score": 2.4972749331110275e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6433,
    "uncertainty_score": 1.2156569331292773e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6434,
    "uncertainty_score": 0.18543317885748287,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6435,
    "uncertainty_score": 0.20000018250298682,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6436,
    "uncertainty_score": 7.159264975982261e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6437,
    "uncertainty_score": 1.0746730952228957e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6438,
    "uncertainty_score": 0.40001350660524704,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6439,
    "uncertainty_score": 0.0013778668837909121,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6440,
    "uncertainty_score": 4.958501654934144e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6441,
    "uncertainty_score": 0.5000000998939614,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6442,
    "uncertainty_score": 2.6349833386047897e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6443,
    "uncertainty_score": 0.49913894583466706,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6444,
    "uncertainty_score": 0.24115723820053234,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6445,
    "uncertainty_score": 3.232425072247114e-05,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6446,
    "uncertainty_score": 2.430318890650079e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6447,
    "uncertainty_score": 0.2009009114329193,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6448,
    "uncertainty_score": 0.4999972253305438,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6449,
    "uncertainty_score": 0.5475056293172343,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6450,
    "uncertainty_score": 0.24989889540819404,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6451,
    "uncertainty_score": 5.517049736800355e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6452,
    "uncertainty_score": 0.3333326560351529,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6453,
    "uncertainty_score": 0.20183253057864325,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6454,
    "uncertainty_score": 2.117994938987485e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6455,
    "uncertainty_score": 6.229626285077959e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6456,
    "uncertainty_score": 1.0076503511766106e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6457,
    "uncertainty_score": 0.25000001661142984,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6458,
    "uncertainty_score": 6.8715797313568345e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6459,
    "uncertainty_score": 8.127718677855437e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6460,
    "uncertainty_score": 0.0032719082102586738,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6461,
    "uncertainty_score": 0.19999999867378732,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6462,
    "uncertainty_score": 0.00036582662745926264,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6463,
    "uncertainty_score": 5.739501189434076e-11,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6464,
    "uncertainty_score": 0.24995655452187648,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6465,
    "uncertainty_score": 0.00026855065044314297,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6466,
    "uncertainty_score": 1.3814253338970767e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6467,
    "uncertainty_score": 0.20012522213422052,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6468,
    "uncertainty_score": 0.20000547388509166,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6469,
    "uncertainty_score": 6.804132280298605e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6470,
    "uncertainty_score": 0.25000018758541337,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6471,
    "uncertainty_score": 0.24999999982907198,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6472,
    "uncertainty_score": 0.24999999979944326,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6473,
    "uncertainty_score": 3.867547552316219e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6474,
    "uncertainty_score": 0.08333600322112815,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6475,
    "uncertainty_score": 0.06269361630291542,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6476,
    "uncertainty_score": 1.1132772618121218e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6477,
    "uncertainty_score": 0.0002546958223327684,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6478,
    "uncertainty_score": 0.23894038617747293,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6479,
    "uncertainty_score": 1.4051590474348525e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6480,
    "uncertainty_score": 0.20022340994688675,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6481,
    "uncertainty_score": 0.2542032293056323,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6482,
    "uncertainty_score": 2.099574205992185e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6483,
    "uncertainty_score": 7.487874641113304e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6484,
    "uncertainty_score": 5.7018158322313313e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6485,
    "uncertainty_score": 5.694431530635459e-11,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6486,
    "uncertainty_score": 2.2925271048533532e-11,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6487,
    "uncertainty_score": 0.2500022583204315,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6488,
    "uncertainty_score": 0.6000017507173475,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6489,
    "uncertainty_score": 4.92404923218147e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6490,
    "uncertainty_score": 3.3861793879195667e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6491,
    "uncertainty_score": 2.0305028575435532e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6492,
    "uncertainty_score": 6.246050611240098e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6493,
    "uncertainty_score": 4.591968688276263e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6494,
    "uncertainty_score": 0.3333333333333339,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6495,
    "uncertainty_score": 0.0009000529192486602,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6496,
    "uncertainty_score": 0.006551143468206219,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6497,
    "uncertainty_score": 4.199943600367468e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6498,
    "uncertainty_score": 1.5193557953951684e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6499,
    "uncertainty_score": 6.0751133845133815e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6500,
    "uncertainty_score": 0.21142013850696512,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6501,
    "uncertainty_score": 1.2470632201345053e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6502,
    "uncertainty_score": 2.1920947265583204e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6503,
    "uncertainty_score": 0.0007873802791019206,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6504,
    "uncertainty_score": 1.471409297002911e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6505,
    "uncertainty_score": 6.793951602330954e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6506,
    "uncertainty_score": 3.6092503666465615e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6507,
    "uncertainty_score": 0.0001455993956988944,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6508,
    "uncertainty_score": 7.504973747799997e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6509,
    "uncertainty_score": 1.9451672095749728e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6510,
    "uncertainty_score": 0.33333333333333354,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6511,
    "uncertainty_score": 2.2204909134226771e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6512,
    "uncertainty_score": 2.8286890082871358e-06,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6513,
    "uncertainty_score": 0.08962886469750155,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6514,
    "uncertainty_score": 2.8871975906685665e-06,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6515,
    "uncertainty_score": 4.83211474250213e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6516,
    "uncertainty_score": 0.14285897207185433,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6517,
    "uncertainty_score": 0.20015915689104014,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6518,
    "uncertainty_score": 0.25266303816737035,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6519,
    "uncertainty_score": 0.00041536680807716656,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6520,
    "uncertainty_score": 4.7246470940305196e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6521,
    "uncertainty_score": 2.1613894872242193e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6522,
    "uncertainty_score": 1.753645207064078e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6523,
    "uncertainty_score": 0.00015771003071686938,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6524,
    "uncertainty_score": 0.6666672654687016,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6525,
    "uncertainty_score": 1.7724967272014914e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6526,
    "uncertainty_score": 4.0403033677214827e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6527,
    "uncertainty_score": 2.6038338559404285e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6528,
    "uncertainty_score": 0.3990029384253396,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6529,
    "uncertainty_score": 2.463972550841718e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6530,
    "uncertainty_score": 0.4113599266643284,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6531,
    "uncertainty_score": 0.24980816229321695,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6532,
    "uncertainty_score": 0.30414538495032467,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6533,
    "uncertainty_score": 2.4134049677893903e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6534,
    "uncertainty_score": 3.119049190180626e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6535,
    "uncertainty_score": 3.175221378189741e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6536,
    "uncertainty_score": 2.122890796168734e-13,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6537,
    "uncertainty_score": 0.18408203444183785,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6538,
    "uncertainty_score": 6.42803023337926e-11,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6539,
    "uncertainty_score": 0.25000633829166635,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6540,
    "uncertainty_score": 1.824670281707724e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6541,
    "uncertainty_score": 7.310880408418631e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6542,
    "uncertainty_score": 0.24999599633252592,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6543,
    "uncertainty_score": 0.24999251777380915,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6544,
    "uncertainty_score": 2.8036343872439687e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6545,
    "uncertainty_score": 7.769375528465213e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6546,
    "uncertainty_score": 2.3761050561783213e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6547,
    "uncertainty_score": 0.16666669380197494,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6548,
    "uncertainty_score": 6.303029281082315e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6549,
    "uncertainty_score": 4.485722586903131e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6550,
    "uncertainty_score": 7.252678672800877e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6551,
    "uncertainty_score": 0.49832687213717186,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6552,
    "uncertainty_score": 0.0007308258623621814,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6553,
    "uncertainty_score": 0.0638995628114927,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6554,
    "uncertainty_score": 3.215729831308301e-12,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6555,
    "uncertainty_score": 2.0829733206406894e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6556,
    "uncertainty_score": 1.8011580602013326e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6557,
    "uncertainty_score": 0.2221445464143204,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6558,
    "uncertainty_score": 8.677516218079013e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6559,
    "uncertainty_score": 1.4259523189786338e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6560,
    "uncertainty_score": 3.908941846593968e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6561,
    "uncertainty_score": 3.455795628234286e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6562,
    "uncertainty_score": 3.167583123746058e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6563,
    "uncertainty_score": 0.4999987504165576,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6564,
    "uncertainty_score": 7.072822312322027e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6565,
    "uncertainty_score": 0.00550547641797423,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6566,
    "uncertainty_score": 6.948685192869548e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6567,
    "uncertainty_score": 0.20002581328897467,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6568,
    "uncertainty_score": 1.3250086897601258e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6569,
    "uncertainty_score": 6.744263887782666e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6570,
    "uncertainty_score": 5.76756620435892e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6571,
    "uncertainty_score": 0.5554624317042285,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6572,
    "uncertainty_score": 6.004296159439531e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6573,
    "uncertainty_score": 2.6296729454731804e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6574,
    "uncertainty_score": 2.232232644686911e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6575,
    "uncertainty_score": 2.8271914940021753e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6576,
    "uncertainty_score": 0.00011646346934877447,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6577,
    "uncertainty_score": 5.929248467459555e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6578,
    "uncertainty_score": 6.205102703357923e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6579,
    "uncertainty_score": 0.16673006160433032,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6580,
    "uncertainty_score": 0.19999999981208288,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6581,
    "uncertainty_score": 4.1156665678940244e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6582,
    "uncertainty_score": 1.3524208933300617e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6583,
    "uncertainty_score": 7.46165237581865e-12,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6584,
    "uncertainty_score": 0.5999988982122557,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6585,
    "uncertainty_score": 4.4022262738485854e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6586,
    "uncertainty_score": 0.007037638441510319,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6587,
    "uncertainty_score": 0.250112216950953,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6588,
    "uncertainty_score": 2.912498932682976e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6589,
    "uncertainty_score": 0.8008495004454614,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6590,
    "uncertainty_score": 0.00019246024306684368,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6591,
    "uncertainty_score": 0.16697441838090946,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6592,
    "uncertainty_score": 0.00025631653168537523,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6593,
    "uncertainty_score": 0.013483061837962594,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6594,
    "uncertainty_score": 0.0010333822257239174,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6595,
    "uncertainty_score": 0.2000000152215899,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6596,
    "uncertainty_score": 0.2511051026125307,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6597,
    "uncertainty_score": 0.19091940393664433,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6598,
    "uncertainty_score": 3.798458921358108e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6599,
    "uncertainty_score": 0.2000248676386267,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6600,
    "uncertainty_score": 0.2500013240152273,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6601,
    "uncertainty_score": 0.2334082181949768,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6602,
    "uncertainty_score": 1.818483919548664e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6603,
    "uncertainty_score": 0.18785764209864392,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6604,
    "uncertainty_score": 5.333378276644881e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6605,
    "uncertainty_score": 0.3333324702983928,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6606,
    "uncertainty_score": 1.779005123886063e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6607,
    "uncertainty_score": 0.33333333300000234,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6608,
    "uncertainty_score": 2.9508133215707834e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6609,
    "uncertainty_score": 0.0006929967434592682,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6610,
    "uncertainty_score": 6.6151688476213214e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6611,
    "uncertainty_score": 1.3759373162395283e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6612,
    "uncertainty_score": 0.15723791082202193,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6613,
    "uncertainty_score": 3.2456711608329457e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6614,
    "uncertainty_score": 0.20000000160184173,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6615,
    "uncertainty_score": 3.037373736603087e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6616,
    "uncertainty_score": 3.5868684531270856e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6617,
    "uncertainty_score": 3.203150248077476e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6618,
    "uncertainty_score": 0.2500327163185812,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6619,
    "uncertainty_score": 6.939928787627255e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6620,
    "uncertainty_score": 1.517352247058141e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6621,
    "uncertainty_score": 3.9931019756807763e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6622,
    "uncertainty_score": 0.20000000867275408,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6623,
    "uncertainty_score": 2.690579145995798e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6624,
    "uncertainty_score": 2.796255656207428e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6625,
    "uncertainty_score": 2.1879262031942902e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6626,
    "uncertainty_score": 0.003290042403042379,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6627,
    "uncertainty_score": 0.1666959812243947,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6628,
    "uncertainty_score": 5.974909487477339e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6629,
    "uncertainty_score": 0.2605889694201949,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6630,
    "uncertainty_score": 0.20000005917186817,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6631,
    "uncertainty_score": 4.916367999897925e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6632,
    "uncertainty_score": 0.33527252740678165,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6633,
    "uncertainty_score": 0.3333302145075498,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6634,
    "uncertainty_score": 7.48117697267139e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6635,
    "uncertainty_score": 0.0014439119668770712,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6636,
    "uncertainty_score": 0.4999996874587608,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6637,
    "uncertainty_score": 1.5077534535588802e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6638,
    "uncertainty_score": 8.695713530014911e-11,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6639,
    "uncertainty_score": 9.097956457145183e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6640,
    "uncertainty_score": 4.179707005630216e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6641,
    "uncertainty_score": 0.3833032402071978,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6642,
    "uncertainty_score": 0.20152367637397614,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6643,
    "uncertainty_score": 2.575530372536179e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6644,
    "uncertainty_score": 0.20000070796123487,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6645,
    "uncertainty_score": 3.493478379385871e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6646,
    "uncertainty_score": 1.1440803633187989e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6647,
    "uncertainty_score": 9.533247987625343e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6648,
    "uncertainty_score": 3.8210238399064593e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6649,
    "uncertainty_score": 0.2500025057295267,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6650,
    "uncertainty_score": 1.4398478982808086e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6651,
    "uncertainty_score": 4.879073865852866e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6652,
    "uncertainty_score": 1.9392083065926937e-12,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6653,
    "uncertainty_score": 0.19996665911182934,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6654,
    "uncertainty_score": 1.3454271870861878e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6655,
    "uncertainty_score": 2.0891938429461584e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6656,
    "uncertainty_score": 0.16666681880438108,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6657,
    "uncertainty_score": 4.2426999205062483e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6658,
    "uncertainty_score": 7.135163771442324e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6659,
    "uncertainty_score": 0.6666666658032588,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6660,
    "uncertainty_score": 1.8128656832926436e-12,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6661,
    "uncertainty_score": 8.793220599514398e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6662,
    "uncertainty_score": 1.2247886676430725e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6663,
    "uncertainty_score": 1.906726947951547e-13,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6664,
    "uncertainty_score": 0.0003016536535793415,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6665,
    "uncertainty_score": 7.289645630208162e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6666,
    "uncertainty_score": 3.769545435114984e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6667,
    "uncertainty_score": 0.011904183130455041,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6668,
    "uncertainty_score": 0.00014994278522909943,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6669,
    "uncertainty_score": 9.569344536331118e-05,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6670,
    "uncertainty_score": 0.2525522858209346,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6671,
    "uncertainty_score": 2.5420319449231125e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6672,
    "uncertainty_score": 5.924346777243844e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6673,
    "uncertainty_score": 1.3889498307742968e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6674,
    "uncertainty_score": 9.100237046025823e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6675,
    "uncertainty_score": 1.2730021468267935e-07,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6676,
    "uncertainty_score": 0.25000000064431877,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6677,
    "uncertainty_score": 0.28196998132551754,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6678,
    "uncertainty_score": 1.3300210511132537e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6679,
    "uncertainty_score": 1.0247330630565823e-12,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6680,
    "uncertainty_score": 0.4000000109894666,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6681,
    "uncertainty_score": 0.0017070492714201797,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6682,
    "uncertainty_score": 5.171617040932649e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6683,
    "uncertainty_score": 8.160942580248175e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6684,
    "uncertainty_score": 0.17696460274530224,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6685,
    "uncertainty_score": 3.6443166034804735e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6686,
    "uncertainty_score": 0.19751935158038653,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6687,
    "uncertainty_score": 3.3823982479141846e-10,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6688,
    "uncertainty_score": 8.290513608758811e-10,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6689,
    "uncertainty_score": 1.6522362985765933e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6690,
    "uncertainty_score": 0.0011122313202752035,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6691,
    "uncertainty_score": 0.33345262527707753,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6692,
    "uncertainty_score": 0.20000005408415777,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6693,
    "uncertainty_score": 0.0002064464286396312,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6694,
    "uncertainty_score": 2.037021037506204e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6695,
    "uncertainty_score": 3.957273409815974e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6696,
    "uncertainty_score": 6.24407388854756e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6697,
    "uncertainty_score": 0.2856622442608424,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6698,
    "uncertainty_score": 2.0511866374004593e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6699,
    "uncertainty_score": 0.20003607310334312,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6700,
    "uncertainty_score": 0.29166995987167726,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6701,
    "uncertainty_score": 5.007122602747573e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6702,
    "uncertainty_score": 5.989270626930415e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6703,
    "uncertainty_score": 0.20000000001202842,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6704,
    "uncertainty_score": 8.827365774283454e-11,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6705,
    "uncertainty_score": 0.2003535966799745,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6706,
    "uncertainty_score": 1.5472944030583478e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6707,
    "uncertainty_score": 0.24999999974999998,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6708,
    "uncertainty_score": 0.5231581077648223,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6709,
    "uncertainty_score": 0.0008010077904353121,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6710,
    "uncertainty_score": 0.2000000208180047,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6711,
    "uncertainty_score": 7.757230786371815e-11,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6712,
    "uncertainty_score": 1.9771059811486074e-05,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6713,
    "uncertainty_score": 4.563262327354321e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6714,
    "uncertainty_score": 0.2101503018197406,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6715,
    "uncertainty_score": 5.507200571018005e-12,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6716,
    "uncertainty_score": 0.2002677875091167,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6717,
    "uncertainty_score": 0.0002624860543314018,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6718,
    "uncertainty_score": 2.7959792275993905e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6719,
    "uncertainty_score": 1.4726771099903425e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6720,
    "uncertainty_score": 0.04332412999440456,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6721,
    "uncertainty_score": 2.4333395119296977e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6722,
    "uncertainty_score": 0.25000023400842086,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6723,
    "uncertainty_score": 1.1563045161718859e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6724,
    "uncertainty_score": 1.5443445915246745e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6725,
    "uncertainty_score": 2.743044387194022e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6726,
    "uncertainty_score": 0.3855411579560621,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6727,
    "uncertainty_score": 0.24999999977352275,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6728,
    "uncertainty_score": 0.05796163164304143,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6729,
    "uncertainty_score": 3.416851547415793e-08,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6730,
    "uncertainty_score": 3.884178682538797e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6731,
    "uncertainty_score": 1.252194220755279e-11,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6732,
    "uncertainty_score": 2.149315653006039e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6733,
    "uncertainty_score": 9.584207105657083e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6734,
    "uncertainty_score": 0.33333339981100024,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6735,
    "uncertainty_score": 1.8837196024041362e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6736,
    "uncertainty_score": 3.626047238379622e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6737,
    "uncertainty_score": 4.572002627559423e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6738,
    "uncertainty_score": 7.54072661665864e-13,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6739,
    "uncertainty_score": 0.20000009801881066,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6740,
    "uncertainty_score": 3.7568955086077164e-05,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6741,
    "uncertainty_score": 0.3333305187620431,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6742,
    "uncertainty_score": 0.00015778980202713142,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6743,
    "uncertainty_score": 0.19985247563126007,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6744,
    "uncertainty_score": 6.919831180328756e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6745,
    "uncertainty_score": 4.937036816880355e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6746,
    "uncertainty_score": 0.14580189386966969,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6747,
    "uncertainty_score": 1.479126077027513e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6748,
    "uncertainty_score": 2.0151772490773673e-09,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6749,
    "uncertainty_score": 0.00018604374306693523,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6750,
    "uncertainty_score": 4.673552477183346e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6751,
    "uncertainty_score": 8.610570280228355e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6752,
    "uncertainty_score": 1.557884996781324e-08,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 6753,
    "uncertainty_score": 0.09091609539048927,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6754,
    "uncertainty_score": 0.4035547784610367,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6755,
    "uncertainty_score": 0.33289472065573994,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6756,
    "uncertainty_score": 0.2000042091854664,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6757,
    "uncertainty_score": 0.6666669230150656,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6758,
    "uncertainty_score": 0.8333333058826399,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6759,
    "uncertainty_score": 0.7911545333916725,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6760,
    "uncertainty_score": 0.3999746884713201,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6761,
    "uncertainty_score": 0.24553333493626353,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6762,
    "uncertainty_score": 5.239405447896628e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6763,
    "uncertainty_score": 0.20000000000673285,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6764,
    "uncertainty_score": 0.2500000295878087,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6765,
    "uncertainty_score": 0.9999999998,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6766,
    "uncertainty_score": 1.5383719265597662e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6767,
    "uncertainty_score": 0.20000007637777703,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6768,
    "uncertainty_score": 0.4999934302065925,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6769,
    "uncertainty_score": 0.3333333330770877,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6770,
    "uncertainty_score": 0.24998539908628023,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6771,
    "uncertainty_score": 1.9362354005553795e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6772,
    "uncertainty_score": 3.598159835370786e-11,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6773,
    "uncertainty_score": 0.00013646768383080587,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6774,
    "uncertainty_score": 0.16666679002288579,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6775,
    "uncertainty_score": 0.8000156875787781,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6776,
    "uncertainty_score": 0.3555528665444288,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6777,
    "uncertainty_score": 7.67927178288091e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6778,
    "uncertainty_score": 0.20000006310046406,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6779,
    "uncertainty_score": 0.42857559700716436,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6780,
    "uncertainty_score": 0.25027688845298174,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6781,
    "uncertainty_score": 2.5316613519172867e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6782,
    "uncertainty_score": 1.5549735437328822e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6783,
    "uncertainty_score": 0.2000277544325773,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6784,
    "uncertainty_score": 0.19999954057849686,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6785,
    "uncertainty_score": 0.39999999959068855,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6786,
    "uncertainty_score": 0.49999987085644637,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6787,
    "uncertainty_score": 0.49999999950003365,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6788,
    "uncertainty_score": 2.0128739789881655e-07,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6789,
    "uncertainty_score": 0.20000000109573052,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6790,
    "uncertainty_score": 0.20001168223623242,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6791,
    "uncertainty_score": 0.25000674573299936,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6792,
    "uncertainty_score": 0.0007433126517912852,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6793,
    "uncertainty_score": 0.6000000325149095,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6794,
    "uncertainty_score": 0.20000008983249443,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6795,
    "uncertainty_score": 0.24895054654983337,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6796,
    "uncertainty_score": 5.534396769975282e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6797,
    "uncertainty_score": 5.087579390452199e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6798,
    "uncertainty_score": 1.736766714460615e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6799,
    "uncertainty_score": 0.19808146380536845,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6800,
    "uncertainty_score": 0.33333334197764364,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6801,
    "uncertainty_score": 0.1999999998617294,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6802,
    "uncertainty_score": 0.49999999975002957,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6803,
    "uncertainty_score": 0.119837990635538,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6804,
    "uncertainty_score": 0.19999999907589544,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6805,
    "uncertainty_score": 0.20000162656791468,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6806,
    "uncertainty_score": 0.24425565718390066,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6807,
    "uncertainty_score": 0.25000006076759557,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6808,
    "uncertainty_score": 0.74999999975,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6809,
    "uncertainty_score": 0.499999999667573,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6810,
    "uncertainty_score": 0.20000000158196096,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6811,
    "uncertainty_score": 0.25000012851750514,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6812,
    "uncertainty_score": 7.400324541975314e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6813,
    "uncertainty_score": 0.20114608556058383,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6814,
    "uncertainty_score": 0.4000004451139113,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6815,
    "uncertainty_score": 0.25000000493463825,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6816,
    "uncertainty_score": 0.20000063807649257,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6817,
    "uncertainty_score": 1.0,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6818,
    "uncertainty_score": 0.5999999998,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6819,
    "uncertainty_score": 0.20562994225368217,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6820,
    "uncertainty_score": 0.00014557910565822683,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6821,
    "uncertainty_score": 0.4999999994999337,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6822,
    "uncertainty_score": 0.006044496127781837,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6823,
    "uncertainty_score": 0.3371614857505242,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6824,
    "uncertainty_score": 0.005171525853228287,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6825,
    "uncertainty_score": 0.6,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6826,
    "uncertainty_score": 0.008696924007205911,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6827,
    "uncertainty_score": 0.0,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6828,
    "uncertainty_score": 0.2000000401328414,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6829,
    "uncertainty_score": 3.0401281463505306e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6830,
    "uncertainty_score": 0.0018555479567349774,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6831,
    "uncertainty_score": 0.5884073261452041,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6832,
    "uncertainty_score": 7.867276706543004e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6833,
    "uncertainty_score": 0.7999999998,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6834,
    "uncertainty_score": 0.20000638344864802,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6835,
    "uncertainty_score": 0.6000982732594035,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6836,
    "uncertainty_score": 0.601339440519667,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6837,
    "uncertainty_score": 0.39996511085848707,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6838,
    "uncertainty_score": 0.20005124844639938,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6839,
    "uncertainty_score": 0.2954056951513518,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6840,
    "uncertainty_score": 0.2010510547642415,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6841,
    "uncertainty_score": 2.1607059900390545e-08,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6842,
    "uncertainty_score": 9.732715302291582e-11,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6843,
    "uncertainty_score": 0.20000107335961817,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6844,
    "uncertainty_score": 4.291101914294853e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6845,
    "uncertainty_score": 0.0011055713370808527,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6846,
    "uncertainty_score": 0.5215617367341252,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6847,
    "uncertainty_score": 1.546267976386063e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6848,
    "uncertainty_score": 0.2504816837772059,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6849,
    "uncertainty_score": 0.2500000001907633,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6850,
    "uncertainty_score": 0.25000059222305593,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6851,
    "uncertainty_score": 8.863494583514315e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6852,
    "uncertainty_score": 0.25000021387834354,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6853,
    "uncertainty_score": 0.20000000043439936,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6854,
    "uncertainty_score": 5.868112436331008e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6855,
    "uncertainty_score": 2.7509723324930026e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6856,
    "uncertainty_score": 1.5454504680191935e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6857,
    "uncertainty_score": 1.0,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6858,
    "uncertainty_score": 0.20017661523588837,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6859,
    "uncertainty_score": 0.0005303481675055377,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6860,
    "uncertainty_score": 2.6880923765087835e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6861,
    "uncertainty_score": 6.74760740730018e-12,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6862,
    "uncertainty_score": 0.5030990658565201,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6863,
    "uncertainty_score": 0.24999599475071602,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6864,
    "uncertainty_score": 0.19996761888808073,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6865,
    "uncertainty_score": 0.20225764331595766,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6866,
    "uncertainty_score": 0.4999999764251907,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6867,
    "uncertainty_score": 0.6666666025932146,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6868,
    "uncertainty_score": 0.5000000081448794,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6869,
    "uncertainty_score": 0.5000014965315417,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6870,
    "uncertainty_score": 8.001868703094338e-11,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6871,
    "uncertainty_score": 2.504682697001978e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6872,
    "uncertainty_score": 0.24987547913453645,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6873,
    "uncertainty_score": 1.6034657811480741e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6874,
    "uncertainty_score": 0.0005928220705714965,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6875,
    "uncertainty_score": 0.1999954094000635,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6876,
    "uncertainty_score": 0.3531668767735856,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6877,
    "uncertainty_score": 0.2502718428926909,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6878,
    "uncertainty_score": 0.22091743107773798,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6879,
    "uncertainty_score": 0.4000117045579967,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6880,
    "uncertainty_score": 0.20000000019271433,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6881,
    "uncertainty_score": 0.18363524135153245,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6882,
    "uncertainty_score": 4.097743959481236e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6883,
    "uncertainty_score": 0.19999996572617607,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6884,
    "uncertainty_score": 0.40000000567896504,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6885,
    "uncertainty_score": 0.5999999117044715,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6886,
    "uncertainty_score": 0.7997511252037619,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6887,
    "uncertainty_score": 0.07044812492029934,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6888,
    "uncertainty_score": 0.20070221368813962,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6889,
    "uncertainty_score": 9.688435426764473e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6890,
    "uncertainty_score": 0.5000001941391661,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6891,
    "uncertainty_score": 6.113599255897786e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6892,
    "uncertainty_score": 0.062109466195557926,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6893,
    "uncertainty_score": 0.2000000036709449,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6894,
    "uncertainty_score": 0.24999968040709963,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6895,
    "uncertainty_score": 5.6826431049437236e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6896,
    "uncertainty_score": 0.33484413706479305,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6897,
    "uncertainty_score": 0.2500002962306168,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6898,
    "uncertainty_score": 0.00018604301447468368,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6899,
    "uncertainty_score": 0.8000000068642577,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6900,
    "uncertainty_score": 1.3772360180514774e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6901,
    "uncertainty_score": 1.0736081160046149e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6902,
    "uncertainty_score": 0.2500005263928598,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6903,
    "uncertainty_score": 0.496722017840627,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6904,
    "uncertainty_score": 0.6003216003576839,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6905,
    "uncertainty_score": 0.051297670688077696,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6906,
    "uncertainty_score": 0.3333333333333333,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6907,
    "uncertainty_score": 0.00016906039637893953,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6908,
    "uncertainty_score": 1.2069827572551016e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6909,
    "uncertainty_score": 0.5000000000029697,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6910,
    "uncertainty_score": 7.250966442065812e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6911,
    "uncertainty_score": 0.0002064462937702239,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6912,
    "uncertainty_score": 0.0003525896402535613,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6913,
    "uncertainty_score": 0.20000000000199786,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 6914,
    "uncertainty_score": 0.7999150374862355,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6915,
    "uncertainty_score": 0.39999976320900354,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6916,
    "uncertainty_score": 0.6666639765905004,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6917,
    "uncertainty_score": 0.20000243558594621,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6918,
    "uncertainty_score": 3.2215677139786236e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6919,
    "uncertainty_score": 0.2000005084170445,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6920,
    "uncertainty_score": 0.7499999997094168,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6921,
    "uncertainty_score": 3.5858642380109616e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6922,
    "uncertainty_score": 4.9246048797914895e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6923,
    "uncertainty_score": 0.20000699672990402,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6924,
    "uncertainty_score": 0.20021576221454424,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6925,
    "uncertainty_score": 0.2500001585881107,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6926,
    "uncertainty_score": 0.142870314184616,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6927,
    "uncertainty_score": 0.4936229310732924,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6928,
    "uncertainty_score": 1.5421674050814565e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6929,
    "uncertainty_score": 0.02428163489662389,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6930,
    "uncertainty_score": 2.947588648369304e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6931,
    "uncertainty_score": 0.4999999997533889,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6932,
    "uncertainty_score": 2.006719379491519e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6933,
    "uncertainty_score": 0.39999828985008407,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6934,
    "uncertainty_score": 0.009930710954019567,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6935,
    "uncertainty_score": 2.7816817358705572e-11,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6936,
    "uncertainty_score": 0.20065780239174114,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6937,
    "uncertainty_score": 0.5031079124031819,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6938,
    "uncertainty_score": 0.4999916145334995,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6939,
    "uncertainty_score": 0.005845642028323684,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6940,
    "uncertainty_score": 0.2000024694230636,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6941,
    "uncertainty_score": 1.967132895751351e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6942,
    "uncertainty_score": 0.5022814075318103,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6943,
    "uncertainty_score": 0.25310792363838613,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6944,
    "uncertainty_score": 2.98924978359571e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6945,
    "uncertainty_score": 0.29523484486831947,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6946,
    "uncertainty_score": 0.5999998161369205,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6947,
    "uncertainty_score": 5.009981594739773e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6948,
    "uncertainty_score": 1.7193252425966573e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6949,
    "uncertainty_score": 0.18727182651196125,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6950,
    "uncertainty_score": 0.6,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6951,
    "uncertainty_score": 0.25000000050752047,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6952,
    "uncertainty_score": 0.5999999996,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6953,
    "uncertainty_score": 1.2326843171538472e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6954,
    "uncertainty_score": 0.3374772172419282,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6955,
    "uncertainty_score": 0.18554283756763465,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6956,
    "uncertainty_score": 0.197638368762914,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6957,
    "uncertainty_score": 0.24870842027541168,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6958,
    "uncertainty_score": 2.3184241420051383e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6959,
    "uncertainty_score": 5.475186347884403e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6960,
    "uncertainty_score": 0.0005535605615469287,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6961,
    "uncertainty_score": 2.992662186095444e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6962,
    "uncertainty_score": 0.5993288943524419,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6963,
    "uncertainty_score": 1.3428252442294737e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6964,
    "uncertainty_score": 0.5684787405318581,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6965,
    "uncertainty_score": 0.00042495763263951814,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6966,
    "uncertainty_score": 0.33316735560665184,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6967,
    "uncertainty_score": 0.2500000108438959,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6968,
    "uncertainty_score": 0.24968243027514767,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6969,
    "uncertainty_score": 0.3999999995950768,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6970,
    "uncertainty_score": 0.0005217570938642347,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6971,
    "uncertainty_score": 0.3333336463705254,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6972,
    "uncertainty_score": 0.2499999998954986,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6973,
    "uncertainty_score": 0.2500201265205836,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6974,
    "uncertainty_score": 2.7457808253551235e-12,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6975,
    "uncertainty_score": 0.18622581977571062,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6976,
    "uncertainty_score": 1.3937302351227916e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6977,
    "uncertainty_score": 2.8756579389598183e-11,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 6978,
    "uncertainty_score": 1.3591220676842431e-11,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6979,
    "uncertainty_score": 0.19998692626150333,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6980,
    "uncertainty_score": 0.4000000019054551,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6981,
    "uncertainty_score": 5.556120434682787e-12,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6982,
    "uncertainty_score": 0.25000000597877375,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6983,
    "uncertainty_score": 0.034810522273102114,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 6984,
    "uncertainty_score": 2.7439091171788845e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6985,
    "uncertainty_score": 0.20002313669739244,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 6986,
    "uncertainty_score": 0.33334367515862856,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6987,
    "uncertainty_score": 2.630819639743109e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6988,
    "uncertainty_score": 9.013650262921105e-11,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6989,
    "uncertainty_score": 0.16665518977811536,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 6990,
    "uncertainty_score": 7.731534310368176e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6991,
    "uncertainty_score": 0.6622067793470517,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6992,
    "uncertainty_score": 0.24999999997924957,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6993,
    "uncertainty_score": 0.2501615566231901,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6994,
    "uncertainty_score": 1.6685048452724283e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 6995,
    "uncertainty_score": 0.33333333300003837,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6996,
    "uncertainty_score": 0.0009870771002270322,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6997,
    "uncertainty_score": 0.4020234686929407,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 6998,
    "uncertainty_score": 2.012727043484346e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 6999,
    "uncertainty_score": 0.00045054213301335506,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 7000,
    "uncertainty_score": 0.20007279877992162,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7001,
    "uncertainty_score": 0.20001241046922985,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7002,
    "uncertainty_score": 4.4938092299098527e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7003,
    "uncertainty_score": 7.689106163933929e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 7004,
    "uncertainty_score": 3.6152336446548555e-15,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7005,
    "uncertainty_score": 9.494068560585024e-11,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7006,
    "uncertainty_score": 1.4018119151068406e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 7007,
    "uncertainty_score": 0.1818633783522581,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7008,
    "uncertainty_score": 8.13477679835529e-10,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7009,
    "uncertainty_score": 8.032758793241674e-10,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7010,
    "uncertainty_score": 0.4974706652074497,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7011,
    "uncertainty_score": 0.14286447160147,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7012,
    "uncertainty_score": 5.672984226406699e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7013,
    "uncertainty_score": 0.19988963665032863,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7014,
    "uncertainty_score": 2.4273443228151766e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 7015,
    "uncertainty_score": 0.49999999975,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7016,
    "uncertainty_score": 2.7566678932461127e-11,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7017,
    "uncertainty_score": 0.25000830383603695,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7018,
    "uncertainty_score": 4.295542881338837e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 7019,
    "uncertainty_score": 0.2000300961231523,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7020,
    "uncertainty_score": 0.005459168270832401,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7021,
    "uncertainty_score": 0.2958675945414736,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7022,
    "uncertainty_score": 4.806351706581006e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7023,
    "uncertainty_score": 2.4823924220760374e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7024,
    "uncertainty_score": 0.005744342900459631,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 7025,
    "uncertainty_score": 0.20003007911849027,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7026,
    "uncertainty_score": 1.4891296522730117e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7027,
    "uncertainty_score": 9.865237439470406e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7028,
    "uncertainty_score": 1.493702796163367e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 7029,
    "uncertainty_score": 0.6666667629779996,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7030,
    "uncertainty_score": 0.4782699898924175,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7031,
    "uncertainty_score": 0.3431647603811556,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7032,
    "uncertainty_score": 0.4999998324620011,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7033,
    "uncertainty_score": 2.0951650034514473e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7034,
    "uncertainty_score": 0.8,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7035,
    "uncertainty_score": 1.6940739251034564e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7036,
    "uncertainty_score": 4.241023719640715e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7037,
    "uncertainty_score": 0.2500000178370617,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7038,
    "uncertainty_score": 0.0008348094009963582,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7039,
    "uncertainty_score": 4.9949389331775095e-11,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7040,
    "uncertainty_score": 6.253146519819205e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7041,
    "uncertainty_score": 1.9077195400389765e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7042,
    "uncertainty_score": 0.4992311570052916,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7043,
    "uncertainty_score": 0.272303801421528,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7044,
    "uncertainty_score": 0.833367592685362,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7045,
    "uncertainty_score": 0.25000020411859825,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7046,
    "uncertainty_score": 0.5000001222075677,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7047,
    "uncertainty_score": 0.20006313526673264,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7048,
    "uncertainty_score": 3.401658437860782e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7049,
    "uncertainty_score": 0.3372708387281369,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7050,
    "uncertainty_score": 0.6666775533287909,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7051,
    "uncertainty_score": 0.5,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7052,
    "uncertainty_score": 9.917753635418814e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7053,
    "uncertainty_score": 2.3358722138351713e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7054,
    "uncertainty_score": 0.33333814471961015,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7055,
    "uncertainty_score": 0.200874239145852,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7056,
    "uncertainty_score": 1.9053364304173488e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7057,
    "uncertainty_score": 0.2000257299602061,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7058,
    "uncertainty_score": 0.4005231806870996,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7059,
    "uncertainty_score": 2.0349675549007503e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 7060,
    "uncertainty_score": 0.0871612834497113,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7061,
    "uncertainty_score": 0.0036259891731067555,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7062,
    "uncertainty_score": 0.19999999979291574,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7063,
    "uncertainty_score": 0.2008844596723533,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7064,
    "uncertainty_score": 7.021294849697262e-09,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 7065,
    "uncertainty_score": 0.20000016929350725,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7066,
    "uncertainty_score": 0.7301020815009214,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7067,
    "uncertainty_score": 0.6666666663333335,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7068,
    "uncertainty_score": 2.9123809777096707e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7069,
    "uncertainty_score": 2.7588174902470016e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7070,
    "uncertainty_score": 0.6000011387354169,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7071,
    "uncertainty_score": 0.5000000002548756,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7072,
    "uncertainty_score": 0.0006048435963679407,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7073,
    "uncertainty_score": 2.47931102977769e-10,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7074,
    "uncertainty_score": 3.5651059193971064e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7075,
    "uncertainty_score": 0.20022807901132592,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7076,
    "uncertainty_score": 5.543015307359078e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7077,
    "uncertainty_score": 0.002980505157789438,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7078,
    "uncertainty_score": 0.00021184955240271836,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7079,
    "uncertainty_score": 9.540875813313061e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7080,
    "uncertainty_score": 2.8001821222568594e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 7081,
    "uncertainty_score": 1.2514322145209413e-10,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 7082,
    "uncertainty_score": 0.333333363776128,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7083,
    "uncertainty_score": 2.706969334835879e-12,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7084,
    "uncertainty_score": 0.24999997790063663,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7085,
    "uncertainty_score": 8.380826453107652e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7086,
    "uncertainty_score": 0.18834093172505453,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7087,
    "uncertainty_score": 0.24999999976574128,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7088,
    "uncertainty_score": 8.446404805881421e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7089,
    "uncertainty_score": 6.0397572413588545e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7090,
    "uncertainty_score": 0.20002182570904922,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7091,
    "uncertainty_score": 0.20000014831003052,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7092,
    "uncertainty_score": 0.20000000323653686,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7093,
    "uncertainty_score": 3.425659843427612e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7094,
    "uncertainty_score": 0.9999969047472408,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7095,
    "uncertainty_score": 9.11339699167433e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7096,
    "uncertainty_score": 0.20003704535670766,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7097,
    "uncertainty_score": 0.25000183350393435,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7098,
    "uncertainty_score": 1.7564928615243073e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 7099,
    "uncertainty_score": 0.1666675855192564,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7100,
    "uncertainty_score": 0.420175723254223,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7101,
    "uncertainty_score": 6.353419990004281e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7102,
    "uncertainty_score": 0.001137288593684751,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7103,
    "uncertainty_score": 0.0,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7104,
    "uncertainty_score": 0.16662221889482723,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7105,
    "uncertainty_score": 0.3334101240019159,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7106,
    "uncertainty_score": 0.005919912802326656,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7107,
    "uncertainty_score": 5.204429714283385e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7108,
    "uncertainty_score": 0.20000000280500524,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7109,
    "uncertainty_score": 3.225501577906952e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7110,
    "uncertainty_score": 1.0500008154562011e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7111,
    "uncertainty_score": 1.6618696207255794e-12,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 7112,
    "uncertainty_score": 1.5637933745721727e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7113,
    "uncertainty_score": 0.500095990584976,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7114,
    "uncertainty_score": 0.2500020569891228,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7115,
    "uncertainty_score": 0.20000009262827131,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7116,
    "uncertainty_score": 7.883477228441033e-11,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7117,
    "uncertainty_score": 3.216017077470256e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7118,
    "uncertainty_score": 9.584515313382751e-12,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7119,
    "uncertainty_score": 0.800195980085617,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 7120,
    "uncertainty_score": 1.5679684126757281e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7121,
    "uncertainty_score": 0.20000000000347035,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7122,
    "uncertainty_score": 0.2507752423896424,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7123,
    "uncertainty_score": 0.40000000067700353,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7124,
    "uncertainty_score": 0.2500002103739814,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7125,
    "uncertainty_score": 6.660687425857456e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7126,
    "uncertainty_score": 1.3406084320180017e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7127,
    "uncertainty_score": 1.0430654367205998e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7128,
    "uncertainty_score": 0.25000003073057164,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7129,
    "uncertainty_score": 1.0,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7130,
    "uncertainty_score": 3.0572686978415905e-06,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 7131,
    "uncertainty_score": 8.2114133881558e-14,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7132,
    "uncertainty_score": 7.816439190607722e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7133,
    "uncertainty_score": 0.6001048065655247,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7134,
    "uncertainty_score": 0.20000000073353014,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7135,
    "uncertainty_score": 0.000737066405707484,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7136,
    "uncertainty_score": 0.0036258949946161123,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7137,
    "uncertainty_score": 5.766778630445752e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7138,
    "uncertainty_score": 1.9530379458681837e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7139,
    "uncertainty_score": 8.622145206402475e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7140,
    "uncertainty_score": 6.819697162797398e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 7141,
    "uncertainty_score": 0.0009169503802810706,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7142,
    "uncertainty_score": 0.20000000204227578,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7143,
    "uncertainty_score": 0.33333399791294743,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7144,
    "uncertainty_score": 0.001141052243563311,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7145,
    "uncertainty_score": 7.012631546438446e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7146,
    "uncertainty_score": 7.131074029371074e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7147,
    "uncertainty_score": 0.8333333214074711,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7148,
    "uncertainty_score": 0.0004009722702323199,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7149,
    "uncertainty_score": 0.5000003645940732,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7150,
    "uncertainty_score": 4.562383752523613e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7151,
    "uncertainty_score": 0.0007906533100902909,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7152,
    "uncertainty_score": 0.20000704775986416,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7153,
    "uncertainty_score": 0.19999999984577982,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7154,
    "uncertainty_score": 8.790941159854393e-12,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7155,
    "uncertainty_score": 0.250946541640436,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7156,
    "uncertainty_score": 2.120441336789421e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7157,
    "uncertainty_score": 0.19992322191910888,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7158,
    "uncertainty_score": 0.2536258985498511,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7159,
    "uncertainty_score": 0.39999999955439824,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7160,
    "uncertainty_score": 0.2000000403324364,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7161,
    "uncertainty_score": 0.19999988579505365,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7162,
    "uncertainty_score": 0.7999997860834325,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7163,
    "uncertainty_score": 0.20192238428016202,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7164,
    "uncertainty_score": 0.2521664008070451,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7165,
    "uncertainty_score": 0.7780696234997261,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7166,
    "uncertainty_score": 0.25,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7167,
    "uncertainty_score": 9.820476645902485e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7168,
    "uncertainty_score": 0.5000023290628123,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7169,
    "uncertainty_score": 1.6933405304333587e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7170,
    "uncertainty_score": 7.259449474569968e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7171,
    "uncertainty_score": 3.518365305342227e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7172,
    "uncertainty_score": 0.2500000002359171,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7173,
    "uncertainty_score": 0.5000044619428915,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7174,
    "uncertainty_score": 0.2500051320095263,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7175,
    "uncertainty_score": 0.3333332323208079,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7176,
    "uncertainty_score": 0.600000000010614,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7177,
    "uncertainty_score": 0.25000237924470936,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7178,
    "uncertainty_score": 0.5470012223258324,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7179,
    "uncertainty_score": 0.49479610542619323,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7180,
    "uncertainty_score": 0.25000029347663816,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7181,
    "uncertainty_score": 0.0027515414292590425,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7182,
    "uncertainty_score": 0.3999999918370524,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7183,
    "uncertainty_score": 5.069202705496877e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7184,
    "uncertainty_score": 0.008577369891787782,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7185,
    "uncertainty_score": 6.22509799317932e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7186,
    "uncertainty_score": 0.0003918989131522954,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7187,
    "uncertainty_score": 0.00037857278762578635,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 7188,
    "uncertainty_score": 0.04528880872012299,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7189,
    "uncertainty_score": 0.16811061456968754,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7190,
    "uncertainty_score": 0.403015608336217,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 7191,
    "uncertainty_score": 0.0,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7192,
    "uncertainty_score": 4.629332503043681e-12,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7193,
    "uncertainty_score": 0.25004660339501744,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7194,
    "uncertainty_score": 0.199999986546605,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7195,
    "uncertainty_score": 0.24999706966165333,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7196,
    "uncertainty_score": 1.4674848298154704e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7197,
    "uncertainty_score": 0.9999999989694915,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7198,
    "uncertainty_score": 0.9999999997402864,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7199,
    "uncertainty_score": 0.006510837968304167,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7200,
    "uncertainty_score": 0.20000000118888378,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 7201,
    "uncertainty_score": 0.49998852710183384,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7202,
    "uncertainty_score": 0.09014116695029128,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7203,
    "uncertainty_score": 1.2570200776999625e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7204,
    "uncertainty_score": 5.375791324173464e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7205,
    "uncertainty_score": 0.4000000000000001,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7206,
    "uncertainty_score": 1.244233565184131e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7207,
    "uncertainty_score": 0.20038534753679418,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7208,
    "uncertainty_score": 0.8571428561782597,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7209,
    "uncertainty_score": 0.7500070994026807,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7210,
    "uncertainty_score": 1.3449676108680931e-11,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7211,
    "uncertainty_score": 2.816072627572701e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7212,
    "uncertainty_score": 0.8,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7213,
    "uncertainty_score": 5.044948350954478e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7214,
    "uncertainty_score": 4.6177564243147283e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7215,
    "uncertainty_score": 2.740525106150706e-06,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 7216,
    "uncertainty_score": 0.00010741734373271841,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7217,
    "uncertainty_score": 0.16695014254905435,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7218,
    "uncertainty_score": 0.6179907438516068,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7219,
    "uncertainty_score": 0.25545744549059995,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7220,
    "uncertainty_score": 3.0528870902921736e-05,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 7221,
    "uncertainty_score": 0.39999999956295695,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7222,
    "uncertainty_score": 1.0,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7223,
    "uncertainty_score": 0.20000246814766243,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7224,
    "uncertainty_score": 0.4999999837197758,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7225,
    "uncertainty_score": 0.01632238428110037,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7226,
    "uncertainty_score": 3.216165275961002e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7227,
    "uncertainty_score": 1.9254317040969662e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7228,
    "uncertainty_score": 0.25000108921995196,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7229,
    "uncertainty_score": 0.333336963569848,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7230,
    "uncertainty_score": 0.2520575838772605,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7231,
    "uncertainty_score": 2.7255397295328112e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7232,
    "uncertainty_score": 1.4539249332458973e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7233,
    "uncertainty_score": 0.000593042154877991,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7234,
    "uncertainty_score": 5.850974827454223e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7235,
    "uncertainty_score": 0.5,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7236,
    "uncertainty_score": 5.1138083961209026e-23,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 7237,
    "uncertainty_score": 0.749999998664453,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7238,
    "uncertainty_score": 0.48921811688862316,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7239,
    "uncertainty_score": 1.283873560573869e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7240,
    "uncertainty_score": 0.8,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7241,
    "uncertainty_score": 1.5354397618696183e-06,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 7242,
    "uncertainty_score": 0.16063000211201972,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7243,
    "uncertainty_score": 0.20000001138246976,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 7244,
    "uncertainty_score": 0.4999981672506696,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7245,
    "uncertainty_score": 0.6540222426430607,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7246,
    "uncertainty_score": 0.2500000103484595,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7247,
    "uncertainty_score": 0.7291273230943841,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7248,
    "uncertainty_score": 0.21078774647502224,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7249,
    "uncertainty_score": 0.4000000000778602,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7250,
    "uncertainty_score": 0.2500132686504553,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7251,
    "uncertainty_score": 0.25000000434376335,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7252,
    "uncertainty_score": 4.80278747312526e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7253,
    "uncertainty_score": 0.7999999995845164,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7254,
    "uncertainty_score": 0.40000065064360407,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7255,
    "uncertainty_score": 1.0925782739030233e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7256,
    "uncertainty_score": 0.9999519370157135,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7257,
    "uncertainty_score": 0.9999995008178425,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7258,
    "uncertainty_score": 0.25000000044370224,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7259,
    "uncertainty_score": 0.20048816072081554,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7260,
    "uncertainty_score": 0.5021666422326932,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7261,
    "uncertainty_score": 1.6528216292679923e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7262,
    "uncertainty_score": 0.6666666660086487,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7263,
    "uncertainty_score": 0.0021012237071540664,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7264,
    "uncertainty_score": 0.20000000727310097,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7265,
    "uncertainty_score": 0.2516732126983813,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7266,
    "uncertainty_score": 0.3333333462598586,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7267,
    "uncertainty_score": 2.103820718216208e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7268,
    "uncertainty_score": 6.804061846792249e-11,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 7269,
    "uncertainty_score": 6.0122804693431155e-12,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7270,
    "uncertainty_score": 4.147043665006611e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7271,
    "uncertainty_score": 0.2,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7272,
    "uncertainty_score": 3.9054663614540616e-10,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 7273,
    "uncertainty_score": 0.2013349001666965,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7274,
    "uncertainty_score": 0.00012099592721330877,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7275,
    "uncertainty_score": 5.944011313609631e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 7276,
    "uncertainty_score": 2.116972193137179e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7277,
    "uncertainty_score": 0.36959356645864927,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7278,
    "uncertainty_score": 3.008546025137534e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7279,
    "uncertainty_score": 0.25002907863797447,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7280,
    "uncertainty_score": 0.20000000950210045,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7281,
    "uncertainty_score": 0.5714285713658331,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7282,
    "uncertainty_score": 0.24999999979015086,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7283,
    "uncertainty_score": 0.33688353997472603,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7284,
    "uncertainty_score": 0.3165729015890209,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7285,
    "uncertainty_score": 0.43866586409468983,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7286,
    "uncertainty_score": 0.06774847788193683,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7287,
    "uncertainty_score": 2.0988388007041928e-11,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7288,
    "uncertainty_score": 0.19980208701232144,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7289,
    "uncertainty_score": 0.25000378493648345,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7290,
    "uncertainty_score": 1.468792138848702e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7291,
    "uncertainty_score": 0.0001496301164294304,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7292,
    "uncertainty_score": 0.500000040242369,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7293,
    "uncertainty_score": 0.3333333328767108,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7294,
    "uncertainty_score": 0.600000000105746,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7295,
    "uncertainty_score": 0.2000390254250651,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7296,
    "uncertainty_score": 1.9160898300383958e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7297,
    "uncertainty_score": 5.076600721581542e-32,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7298,
    "uncertainty_score": 0.0027560637433465237,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 7299,
    "uncertainty_score": 1.9634118285554615e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7300,
    "uncertainty_score": 0.0015651296169028293,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7301,
    "uncertainty_score": 0.39999975015255257,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7302,
    "uncertainty_score": 2.184252065741894e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7303,
    "uncertainty_score": 1.321812838814394e-06,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7304,
    "uncertainty_score": 0.25000326156371194,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7305,
    "uncertainty_score": 1.1455783956761387e-11,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7306,
    "uncertainty_score": 0.40000055557678227,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7307,
    "uncertainty_score": 9.646712981835776e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7308,
    "uncertainty_score": 0.1666665627511976,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7309,
    "uncertainty_score": 0.20000005878340926,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7310,
    "uncertainty_score": 0.4000239880134059,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7311,
    "uncertainty_score": 0.2500006141907108,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7312,
    "uncertainty_score": 3.463430663861813e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 7313,
    "uncertainty_score": 0.20000001874157966,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7314,
    "uncertainty_score": 0.01378502866940618,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7315,
    "uncertainty_score": 0.8000001824509632,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7316,
    "uncertainty_score": 1.3469490755532288e-07,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 7317,
    "uncertainty_score": 4.249139484758005e-06,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7318,
    "uncertainty_score": 0.40001240674653704,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7319,
    "uncertainty_score": 0.0030534433171086933,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7320,
    "uncertainty_score": 6.041916490319866e-10,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7321,
    "uncertainty_score": 1.229541682257036e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7322,
    "uncertainty_score": 0.25062481653250773,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7323,
    "uncertainty_score": 0.004024667408106834,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7324,
    "uncertainty_score": 0.74999999975,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7325,
    "uncertainty_score": 0.2500004750142659,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7326,
    "uncertainty_score": 0.39999679582421105,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7327,
    "uncertainty_score": 7.856644277233598e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7328,
    "uncertainty_score": 1.5216700460360647e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7329,
    "uncertainty_score": 5.758134434754553e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7330,
    "uncertainty_score": 1.0432793908452967e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7331,
    "uncertainty_score": 0.25000000210487117,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7332,
    "uncertainty_score": 0.0002012286163361612,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 7333,
    "uncertainty_score": 0.496892093651521,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7334,
    "uncertainty_score": 0.5077855682713773,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7335,
    "uncertainty_score": 5.013212528017803e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7336,
    "uncertainty_score": 3.207888905825671e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7337,
    "uncertainty_score": 4.3426394190365034e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7338,
    "uncertainty_score": 0.5999999993999999,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7339,
    "uncertainty_score": 1.8459177608909248e-07,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 7340,
    "uncertainty_score": 8.056444515259197e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7341,
    "uncertainty_score": 5.952035562211423e-08,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7342,
    "uncertainty_score": 0.40000012041549005,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7343,
    "uncertainty_score": 7.120285967104753e-06,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 7344,
    "uncertainty_score": 0.9999999767323144,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7345,
    "uncertainty_score": 0.5000027168766441,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7346,
    "uncertainty_score": 0.8333331132520098,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7347,
    "uncertainty_score": 0.0008273889152889688,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7348,
    "uncertainty_score": 1.425172874329531e-09,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7349,
    "uncertainty_score": 9.494585459099596e-11,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7350,
    "uncertainty_score": 0.6666665955192363,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7351,
    "uncertainty_score": 0.24999998000217724,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7352,
    "uncertainty_score": 3.38114191734956e-09,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7353,
    "uncertainty_score": 0.24954278699762641,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7354,
    "uncertainty_score": 0.25,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7355,
    "uncertainty_score": 0.20000102729685346,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7356,
    "uncertainty_score": 2.5917119892478134e-10,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7357,
    "uncertainty_score": 2.322688479773271e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7358,
    "uncertainty_score": 0.6654920581740856,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7359,
    "uncertainty_score": 4.1111592001180214e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7360,
    "uncertainty_score": 0.33385123608696327,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7361,
    "uncertainty_score": 0.3333333330787459,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7362,
    "uncertainty_score": 0.04276973761822863,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7363,
    "uncertainty_score": 8.497695660698809e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7364,
    "uncertainty_score": 0.2857142862296339,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7365,
    "uncertainty_score": 0.16666742090507833,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7366,
    "uncertainty_score": 2.0847801077858438e-11,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7367,
    "uncertainty_score": 0.49999834727358683,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7368,
    "uncertainty_score": 4.734017799645486e-09,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7369,
    "uncertainty_score": 8.788360530545667e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7370,
    "uncertainty_score": 7.218151044440593e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7371,
    "uncertainty_score": 0.0,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7372,
    "uncertainty_score": 0.3333614276737933,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7373,
    "uncertainty_score": 0.20000047923902847,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7374,
    "uncertainty_score": 0.20000000008516663,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7375,
    "uncertainty_score": 0.5000000000000289,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7376,
    "uncertainty_score": 0.8,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7377,
    "uncertainty_score": 4.090052192486524e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7378,
    "uncertainty_score": 2.9165214038721696e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7379,
    "uncertainty_score": 0.6666660874827118,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7380,
    "uncertainty_score": 0.2503529183680257,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7381,
    "uncertainty_score": 0.0017398147753025961,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7382,
    "uncertainty_score": 0.33349143794357455,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7383,
    "uncertainty_score": 3.858676610423036e-08,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 7384,
    "uncertainty_score": 6.897469984086121e-08,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7385,
    "uncertainty_score": 0.33333264038330024,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7386,
    "uncertainty_score": 0.2488944964247863,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7387,
    "uncertainty_score": 5.400054108628729e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 7388,
    "uncertainty_score": 0.19199252195314276,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7389,
    "uncertainty_score": 0.7931109770068133,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7390,
    "uncertainty_score": 0.34034808561741126,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7391,
    "uncertainty_score": 0.200000004769687,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7392,
    "uncertainty_score": 0.2500011475964905,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 7393,
    "uncertainty_score": 0.40000910388574296,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7394,
    "uncertainty_score": 0.7500000016206176,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7395,
    "uncertainty_score": 0.4000000172431825,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7396,
    "uncertainty_score": 0.49999999747706425,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7397,
    "uncertainty_score": 0.5465823682394,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7398,
    "uncertainty_score": 0.002281417925175538,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7399,
    "uncertainty_score": 0.0973965956034691,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7400,
    "uncertainty_score": 3.767859035022117e-11,
    "reward_variance": 0.109375,
    "num_correct": 7
  },
  {
    "index": 7401,
    "uncertainty_score": 0.49999978419459296,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7402,
    "uncertainty_score": 0.42541493637351746,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7403,
    "uncertainty_score": 0.3297123234701404,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7404,
    "uncertainty_score": 0.00017927800882067377,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7405,
    "uncertainty_score": 0.400001045216399,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7406,
    "uncertainty_score": 0.3333333330013105,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7407,
    "uncertainty_score": 0.3333339982432679,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7408,
    "uncertainty_score": 8.745187343627977e-09,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 7409,
    "uncertainty_score": 0.19999999980333844,
    "reward_variance": 0.0,
    "num_correct": 8
  },
  {
    "index": 7410,
    "uncertainty_score": 0.16671016842750316,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7411,
    "uncertainty_score": 0.16822610926562795,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7412,
    "uncertainty_score": 0.39999998710442186,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7413,
    "uncertainty_score": 0.3333333330130041,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7414,
    "uncertainty_score": 0.38823774904611225,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7415,
    "uncertainty_score": 0.4,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7416,
    "uncertainty_score": 0.2500107733100681,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7417,
    "uncertainty_score": 2.0684220692987953e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7418,
    "uncertainty_score": 5.983948657556573e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7419,
    "uncertainty_score": 0.2048355670744722,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7420,
    "uncertainty_score": 9.86597423231769e-10,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7421,
    "uncertainty_score": 0.599999961412273,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7422,
    "uncertainty_score": 0.20394382589215967,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7423,
    "uncertainty_score": 9.30651147950518e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7424,
    "uncertainty_score": 0.34371899321267907,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7425,
    "uncertainty_score": 0.017977541712237397,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7426,
    "uncertainty_score": 2.1058227369839496e-09,
    "reward_variance": 0.1875,
    "num_correct": 6
  },
  {
    "index": 7427,
    "uncertainty_score": 1.1882095039949695e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7428,
    "uncertainty_score": 0.008007437255645993,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7429,
    "uncertainty_score": 1.2414855959911507e-08,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 7430,
    "uncertainty_score": 0.2973962933913049,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7431,
    "uncertainty_score": 0.19999939703719,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7432,
    "uncertainty_score": 0.13515162600641845,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7433,
    "uncertainty_score": 0.7490989453143845,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7434,
    "uncertainty_score": 3.0862071812146997e-13,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7435,
    "uncertainty_score": 1.0299431876466478e-07,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7436,
    "uncertainty_score": 0.0013923035246941851,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7437,
    "uncertainty_score": 0.1666667670326278,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7438,
    "uncertainty_score": 1.0468246994343748e-07,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7439,
    "uncertainty_score": 0.24965209233246866,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7440,
    "uncertainty_score": 0.002071527831081481,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7441,
    "uncertainty_score": 0.20006235498140706,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7442,
    "uncertainty_score": 0.24999996907583757,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7443,
    "uncertainty_score": 1.0015938819591004e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7444,
    "uncertainty_score": 0.33333333377669133,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7445,
    "uncertainty_score": 0.4983986490938878,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7446,
    "uncertainty_score": 0.7499999992499999,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7447,
    "uncertainty_score": 0.2500000000068333,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7448,
    "uncertainty_score": 2.803777826642197e-05,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7449,
    "uncertainty_score": 1.0076356165876068e-05,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7450,
    "uncertainty_score": 0.0074025033128559264,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7451,
    "uncertainty_score": 0.2000231838004667,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7452,
    "uncertainty_score": 3.749427098080453e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7453,
    "uncertainty_score": 2.579674110040293e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7454,
    "uncertainty_score": 4.394477283425135e-12,
    "reward_variance": 0.234375,
    "num_correct": 5
  },
  {
    "index": 7455,
    "uncertainty_score": 0.25000000000747424,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7456,
    "uncertainty_score": 1.6295845195314637e-07,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7457,
    "uncertainty_score": 9.564407469887781e-11,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7458,
    "uncertainty_score": 5.4196841848284575e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7459,
    "uncertainty_score": 0.4998755134160636,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7460,
    "uncertainty_score": 2.1353073597327058e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7461,
    "uncertainty_score": 3.659977123181141e-06,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7462,
    "uncertainty_score": 8.744624498023509e-09,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7463,
    "uncertainty_score": 0.2493753899522824,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7464,
    "uncertainty_score": 0.5000006174939038,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7465,
    "uncertainty_score": 0.7500001454251818,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7466,
    "uncertainty_score": 0.99999999975,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7467,
    "uncertainty_score": 0.0005350810875039682,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7468,
    "uncertainty_score": 4.893343696583268e-07,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7469,
    "uncertainty_score": 0.007486286041946744,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7470,
    "uncertainty_score": 9.914131778416222e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7471,
    "uncertainty_score": 4.684569142129142e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7472,
    "uncertainty_score": 0.2503733446353608,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7473,
    "uncertainty_score": 1.2289911726887122e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7474,
    "uncertainty_score": 9.736298144916014e-06,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7475,
    "uncertainty_score": 0.1999999998000032,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7476,
    "uncertainty_score": 1.8873296224128592e-10,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7477,
    "uncertainty_score": 0.4914400414373564,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7478,
    "uncertainty_score": 1.6903787340887654e-08,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7479,
    "uncertainty_score": 0.41415395394638993,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7480,
    "uncertainty_score": 0.333333333006735,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7481,
    "uncertainty_score": 0.49969624456942957,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7482,
    "uncertainty_score": 0.6666643296316316,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7483,
    "uncertainty_score": 9.542804682259585e-09,
    "reward_variance": 0.25,
    "num_correct": 4
  },
  {
    "index": 7484,
    "uncertainty_score": 3.7458265940483142e-06,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7485,
    "uncertainty_score": 0.00014473642072590617,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7486,
    "uncertainty_score": 6.593430423366258e-11,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7487,
    "uncertainty_score": 5.6029502855015174e-08,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7488,
    "uncertainty_score": 1.932503529386142e-05,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7489,
    "uncertainty_score": 0.25000000287404783,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7490,
    "uncertainty_score": 2.1342970527478038e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7491,
    "uncertainty_score": 0.19947368379984312,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7492,
    "uncertainty_score": 0.5,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7493,
    "uncertainty_score": 6.74096465143337e-11,
    "reward_variance": 0.0,
    "num_correct": 0
  },
  {
    "index": 7494,
    "uncertainty_score": 0.6561814967403514,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7495,
    "uncertainty_score": 3.745300503257303e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7496,
    "uncertainty_score": 9.814730120632886e-07,
    "reward_variance": 0.234375,
    "num_correct": 3
  },
  {
    "index": 7497,
    "uncertainty_score": 0.14285738551049013,
    "reward_variance": 0.109375,
    "num_correct": 1
  },
  {
    "index": 7498,
    "uncertainty_score": 0.1428527615687453,
    "reward_variance": 0.1875,
    "num_correct": 2
  },
  {
    "index": 7499,
    "uncertainty_score": 3.172897289749973e-05,
    "reward_variance": 0.109375,
    "num_correct": 1
  }
]