{
  "config": {
    "difficulty_levels": [
      1,
      2,
      3,
      4,
      5
    ],
    "staleness_levels": [
      0,
      2,
      4,
      6,
      8,
      10
    ],
    "samples_per_cell": 10
  },
  "grid_results": {
    "success_rate": [
      [
        0.8804464596978596,
        0.7733526477357429,
        0.59076740557346,
        0.5322068537875765,
        0.4680710361006577
      ],
      [
        0.8385467373980074,
        0.7281261299438234,
        0.57081948444406,
        0.4227039683823095,
        0.28006265542268965
      ],
      [
        0.8225286991265217,
        0.6809333550346633,
        0.471602276701982,
        0.3014532372950336,
        0.09176708195321084
      ],
      [
        0.7549081929799277,
        0.6021622878739643,
        0.39317606402231403,
        0.16089294196944823,
        0.058565142487844404
      ],
      [
        0.7169527546299558,
        0.5743607342310615,
        0.3478086868933405,
        0.02862214658531224,
        0.05818881144824904
      ],
      [
        0.6593661961198047,
        0.4631811246413166,
        0.25645308669068373,
        0.07659806692817467,
        0.05794728605485747
      ]
    ],
    "kl_divergence": [
      [
        0.0,
        0.0024222482625686666,
        0.0,
        0.0019514494827982674,
        0.01029484222826489
      ],
      [
        0.033120521294644684,
        0.040827376102545616,
        0.055680427287836634,
        0.07769297114591359,
        0.10776202716771814
      ],
      [
        0.051031512847607666,
        0.08217382069137401,
        0.11490939604266953,
        0.157396151055472,
        0.22757805276279047
      ],
      [
        0.08151743330370052,
        0.1183265418549392,
        0.16292162556826004,
        0.2508708293187266,
        0.3456174039007528
      ],
      [
        0.11896758957204896,
        0.14508099249731687,
        0.22794358658638286,
        0.3302048200348047,
        0.4576034487784334
      ],
      [
        0.1424146763238185,
        0.19631248779749727,
        0.2853757783963233,
        0.4004680791355904,
        0.5779117312516365
      ]
    ],
    "gradient_cosine_sim": [
      [
        0.9689052325322646,
        1.0,
        1.0,
        0.9854412370222224,
        1.0
      ],
      [
        0.9020647494521251,
        0.8869951855234005,
        0.8550494735602888,
        0.7569642952695889,
        0.7332594637896553
      ],
      [
        0.8054661666530509,
        0.7087999851280877,
        0.6988228351897603,
        0.5437497500639987,
        0.44260877469170806
      ],
      [
        0.6881085271358395,
        0.6268399185952224,
        0.4616388178810433,
        0.3749840208715645,
        0.14156465417398478
      ],
      [
        0.5745325104713785,
        0.4762481413345428,
        0.33384584176702276,
        0.12881688757164125,
        0.01858633047259524
      ],
      [
        0.4842719234749607,
        0.3457130961489736,
        0.1317528698877096,
        0.0,
        0.0035774426443059473
      ]
    ],
    "gradient_norm": [
      [
        0.5210419652134595,
        0.8011133199034355,
        1.067045112341852,
        1.0958508742764228,
        1.095922165057258
      ],
      [
        0.6415444263886583,
        0.8918338753474151,
        1.0799384024923102,
        1.076101293984628,
        0.9065102578411257
      ],
      [
        0.6839009529590145,
        0.9690524841436018,
        1.0967742772459568,
        0.942316732077511,
        0.43338353849201416
      ],
      [
        0.8400872526068317,
        1.058251467745429,
        1.054354586808941,
        0.6400256127754559,
        0.3205410662928916
      ],
      [
        0.9117260090338968,
        1.07788192481847,
        1.007351216859483,
        0.21121167724064455,
        0.31921149468195664
      ],
      [
        0.9984096621372157,
        1.0945774816692868,
        0.8627396040700175,
        0.38292321228416615,
        0.318357592374936
      ]
    ]
  },
  "all_results": [
    {
      "difficulty": 1,
      "staleness": 0,
      "success_rate": 0.8804464596978596,
      "kl_divergence": 0.0,
      "gradient_cosine_sim": 0.9689052325322646,
      "gradient_norm": 0.5210419652134595,
      "avg_reward": 0.8804464596978596
    },
    {
      "difficulty": 2,
      "staleness": 0,
      "success_rate": 0.7733526477357429,
      "kl_divergence": 0.0024222482625686666,
      "gradient_cosine_sim": 1.0,
      "gradient_norm": 0.8011133199034355,
      "avg_reward": 0.7733526477357429
    },
    {
      "difficulty": 3,
      "staleness": 0,
      "success_rate": 0.59076740557346,
      "kl_divergence": 0.0,
      "gradient_cosine_sim": 1.0,
      "gradient_norm": 1.067045112341852,
      "avg_reward": 0.59076740557346
    },
    {
      "difficulty": 4,
      "staleness": 0,
      "success_rate": 0.5322068537875765,
      "kl_divergence": 0.0019514494827982674,
      "gradient_cosine_sim": 0.9854412370222224,
      "gradient_norm": 1.0958508742764228,
      "avg_reward": 0.5322068537875765
    },
    {
      "difficulty": 5,
      "staleness": 0,
      "success_rate": 0.4680710361006577,
      "kl_divergence": 0.01029484222826489,
      "gradient_cosine_sim": 1.0,
      "gradient_norm": 1.095922165057258,
      "avg_reward": 0.4680710361006577
    },
    {
      "difficulty": 1,
      "staleness": 2,
      "success_rate": 0.8385467373980074,
      "kl_divergence": 0.033120521294644684,
      "gradient_cosine_sim": 0.9020647494521251,
      "gradient_norm": 0.6415444263886583,
      "avg_reward": 0.8385467373980074
    },
    {
      "difficulty": 2,
      "staleness": 2,
      "success_rate": 0.7281261299438234,
      "kl_divergence": 0.040827376102545616,
      "gradient_cosine_sim": 0.8869951855234005,
      "gradient_norm": 0.8918338753474151,
      "avg_reward": 0.7281261299438234
    },
    {
      "difficulty": 3,
      "staleness": 2,
      "success_rate": 0.57081948444406,
      "kl_divergence": 0.055680427287836634,
      "gradient_cosine_sim": 0.8550494735602888,
      "gradient_norm": 1.0799384024923102,
      "avg_reward": 0.57081948444406
    },
    {
      "difficulty": 4,
      "staleness": 2,
      "success_rate": 0.4227039683823095,
      "kl_divergence": 0.07769297114591359,
      "gradient_cosine_sim": 0.7569642952695889,
      "gradient_norm": 1.076101293984628,
      "avg_reward": 0.4227039683823095
    },
    {
      "difficulty": 5,
      "staleness": 2,
      "success_rate": 0.28006265542268965,
      "kl_divergence": 0.10776202716771814,
      "gradient_cosine_sim": 0.7332594637896553,
      "gradient_norm": 0.9065102578411257,
      "avg_reward": 0.28006265542268965
    },
    {
      "difficulty": 1,
      "staleness": 4,
      "success_rate": 0.8225286991265217,
      "kl_divergence": 0.051031512847607666,
      "gradient_cosine_sim": 0.8054661666530509,
      "gradient_norm": 0.6839009529590145,
      "avg_reward": 0.8225286991265217
    },
    {
      "difficulty": 2,
      "staleness": 4,
      "success_rate": 0.6809333550346633,
      "kl_divergence": 0.08217382069137401,
      "gradient_cosine_sim": 0.7087999851280877,
      "gradient_norm": 0.9690524841436018,
      "avg_reward": 0.6809333550346633
    },
    {
      "difficulty": 3,
      "staleness": 4,
      "success_rate": 0.471602276701982,
      "kl_divergence": 0.11490939604266953,
      "gradient_cosine_sim": 0.6988228351897603,
      "gradient_norm": 1.0967742772459568,
      "avg_reward": 0.471602276701982
    },
    {
      "difficulty": 4,
      "staleness": 4,
      "success_rate": 0.3014532372950336,
      "kl_divergence": 0.157396151055472,
      "gradient_cosine_sim": 0.5437497500639987,
      "gradient_norm": 0.942316732077511,
      "avg_reward": 0.3014532372950336
    },
    {
      "difficulty": 5,
      "staleness": 4,
      "success_rate": 0.09176708195321084,
      "kl_divergence": 0.22757805276279047,
      "gradient_cosine_sim": 0.44260877469170806,
      "gradient_norm": 0.43338353849201416,
      "avg_reward": 0.09176708195321084
    },
    {
      "difficulty": 1,
      "staleness": 6,
      "success_rate": 0.7549081929799277,
      "kl_divergence": 0.08151743330370052,
      "gradient_cosine_sim": 0.6881085271358395,
      "gradient_norm": 0.8400872526068317,
      "avg_reward": 0.7549081929799277
    },
    {
      "difficulty": 2,
      "staleness": 6,
      "success_rate": 0.6021622878739643,
      "kl_divergence": 0.1183265418549392,
      "gradient_cosine_sim": 0.6268399185952224,
      "gradient_norm": 1.058251467745429,
      "avg_reward": 0.6021622878739643
    },
    {
      "difficulty": 3,
      "staleness": 6,
      "success_rate": 0.39317606402231403,
      "kl_divergence": 0.16292162556826004,
      "gradient_cosine_sim": 0.4616388178810433,
      "gradient_norm": 1.054354586808941,
      "avg_reward": 0.39317606402231403
    },
    {
      "difficulty": 4,
      "staleness": 6,
      "success_rate": 0.16089294196944823,
      "kl_divergence": 0.2508708293187266,
      "gradient_cosine_sim": 0.3749840208715645,
      "gradient_norm": 0.6400256127754559,
      "avg_reward": 0.16089294196944823
    },
    {
      "difficulty": 5,
      "staleness": 6,
      "success_rate": 0.058565142487844404,
      "kl_divergence": 0.3456174039007528,
      "gradient_cosine_sim": 0.14156465417398478,
      "gradient_norm": 0.3205410662928916,
      "avg_reward": 0.058565142487844404
    },
    {
      "difficulty": 1,
      "staleness": 8,
      "success_rate": 0.7169527546299558,
      "kl_divergence": 0.11896758957204896,
      "gradient_cosine_sim": 0.5745325104713785,
      "gradient_norm": 0.9117260090338968,
      "avg_reward": 0.7169527546299558
    },
    {
      "difficulty": 2,
      "staleness": 8,
      "success_rate": 0.5743607342310615,
      "kl_divergence": 0.14508099249731687,
      "gradient_cosine_sim": 0.4762481413345428,
      "gradient_norm": 1.07788192481847,
      "avg_reward": 0.5743607342310615
    },
    {
      "difficulty": 3,
      "staleness": 8,
      "success_rate": 0.3478086868933405,
      "kl_divergence": 0.22794358658638286,
      "gradient_cosine_sim": 0.33384584176702276,
      "gradient_norm": 1.007351216859483,
      "avg_reward": 0.3478086868933405
    },
    {
      "difficulty": 4,
      "staleness": 8,
      "success_rate": 0.02862214658531224,
      "kl_divergence": 0.3302048200348047,
      "gradient_cosine_sim": 0.12881688757164125,
      "gradient_norm": 0.21121167724064455,
      "avg_reward": 0.02862214658531224
    },
    {
      "difficulty": 5,
      "staleness": 8,
      "success_rate": 0.05818881144824904,
      "kl_divergence": 0.4576034487784334,
      "gradient_cosine_sim": 0.01858633047259524,
      "gradient_norm": 0.31921149468195664,
      "avg_reward": 0.05818881144824904
    },
    {
      "difficulty": 1,
      "staleness": 10,
      "success_rate": 0.6593661961198047,
      "kl_divergence": 0.1424146763238185,
      "gradient_cosine_sim": 0.4842719234749607,
      "gradient_norm": 0.9984096621372157,
      "avg_reward": 0.6593661961198047
    },
    {
      "difficulty": 2,
      "staleness": 10,
      "success_rate": 0.4631811246413166,
      "kl_divergence": 0.19631248779749727,
      "gradient_cosine_sim": 0.3457130961489736,
      "gradient_norm": 1.0945774816692868,
      "avg_reward": 0.4631811246413166
    },
    {
      "difficulty": 3,
      "staleness": 10,
      "success_rate": 0.25645308669068373,
      "kl_divergence": 0.2853757783963233,
      "gradient_cosine_sim": 0.1317528698877096,
      "gradient_norm": 0.8627396040700175,
      "avg_reward": 0.25645308669068373
    },
    {
      "difficulty": 4,
      "staleness": 10,
      "success_rate": 0.07659806692817467,
      "kl_divergence": 0.4004680791355904,
      "gradient_cosine_sim": 0.0,
      "gradient_norm": 0.38292321228416615,
      "avg_reward": 0.07659806692817467
    },
    {
      "difficulty": 5,
      "staleness": 10,
      "success_rate": 0.05794728605485747,
      "kl_divergence": 0.5779117312516365,
      "gradient_cosine_sim": 0.0035774426443059473,
      "gradient_norm": 0.318357592374936,
      "avg_reward": 0.05794728605485747
    }
  ],
  "summary": {
    "mean_success_rate": 0.4554190517384617,
    "kl_range": [
      0.0,
      0.5779117312516365
    ],
    "safe_zone_threshold": {
      "threshold": 0.8,
      "safe_fraction": 0.3,
      "max_safe_staleness_by_difficulty": [
        2,
        1,
        1,
        0,
        0
      ]
    }
  }
}