{
  "aggregate": {
    "baselines": {
      "always_cma": {
        "confusion": {
          "accuracy": 0.5070093457943925,
          "n_non_ties": 428,
          "pred_cma_label_cma": 217,
          "pred_cma_label_berw": 211,
          "pred_berw_label_cma": 0,
          "pred_berw_label_berw": 0,
          "pred_berw_rate": 0.0
        },
        "regret": {
          "mean": 0.09639538561059312,
          "median": 0.0,
          "q90": 0.2563476080403629
        }
      },
      "always_berw": {
        "confusion": {
          "accuracy": 0.4929906542056075,
          "n_non_ties": 428,
          "pred_cma_label_cma": 0,
          "pred_cma_label_berw": 0,
          "pred_berw_label_cma": 217,
          "pred_berw_label_berw": 211,
          "pred_berw_rate": 1.0
        },
        "regret": {
          "mean": 0.8555507415870024,
          "median": 0.0006808337107824247,
          "q90": 1.7783138413164328
        }
      }
    },
    "cv": {
      "confusion": {
        "accuracy": 0.7476635514018691,
        "n_non_ties": 428,
        "pred_cma_label_cma": 139,
        "pred_cma_label_berw": 30,
        "pred_berw_label_cma": 78,
        "pred_berw_label_berw": 181,
        "pred_berw_rate": 0.6051401869158879
      },
      "regret": {
        "mean": 0.028393451224880482,
        "median": 0.0,
        "q90": 0.06459273732064308
      }
    },
    "fixed_threshold": {
      "confusion": {
        "accuracy": 0.7546728971962616,
        "n": 428,
        "pred_cma_label_cma": 139,
        "pred_cma_label_berw": 27,
        "pred_berw_label_cma": 78,
        "pred_berw_label_berw": 184,
        "pred_berw_rate": 0.6121495327102804
      },
      "regret": {
        "mean": 0.024393231462128802,
        "median": 0.0,
        "q90": 0.05002082048274214
      },
      "threshold": 0.12
    },
    "thresholds": {
      "max": 0.17777777777777776,
      "mean": 0.13511111111111113,
      "median": 0.12444444444444444,
      "min": 0.12444444444444444,
      "std": 0.021333333333333326
    }
  },
  "folds": [
    {
      "fold": 0,
      "test_groups": [
        1,
        6,
        11
      ],
      "train_groups": [
        2,
        3,
        4,
        5,
        7,
        8,
        9,
        10,
        12,
        13,
        14,
        15
      ]
    },
    {
      "fold": 1,
      "test_groups": [
        2,
        7,
        12
      ],
      "train_groups": [
        1,
        3,
        4,
        5,
        6,
        8,
        9,
        10,
        11,
        13,
        14,
        15
      ]
    },
    {
      "fold": 2,
      "test_groups": [
        3,
        8,
        13
      ],
      "train_groups": [
        1,
        2,
        4,
        5,
        6,
        7,
        9,
        10,
        11,
        12,
        14,
        15
      ]
    },
    {
      "fold": 3,
      "test_groups": [
        4,
        9,
        14
      ],
      "train_groups": [
        1,
        2,
        3,
        5,
        6,
        7,
        8,
        10,
        11,
        12,
        13,
        15
      ]
    },
    {
      "fold": 4,
      "test_groups": [
        5,
        10,
        15
      ],
      "train_groups": [
        1,
        2,
        3,
        4,
        6,
        7,
        8,
        9,
        11,
        12,
        13,
        14
      ]
    }
  ],
  "group_by": "instance",
  "input": "evidence/bbob_noisy_probe_decision_accuracy_noisefree_i1-15_B500/decision_points.csv",
  "k": 5,
  "loss": {
    "eps": 1e-12,
    "name": "log10"
  },
  "per_fold": [
    {
      "fold": 0,
      "group_by": "instance",
      "selected_threshold": 0.12444444444444444,
      "selection_criterion": "minimize train_regret_mean, tie-break by smaller threshold",
      "test_accuracy": 0.7558139534883721,
      "test_groups": [
        1,
        6,
        11
      ],
      "test_regret_mean": 0.01631958492560089,
      "test_regret_median": 0.0,
      "test_regret_q90": 0.056831370100081324,
      "train_accuracy": 0.7543859649122807,
      "train_groups": [
        2,
        3,
        4,
        5,
        7,
        8,
        9,
        10,
        12,
        13,
        14,
        15
      ],
      "train_label_berw_rate": 0.49122807017543857,
      "train_regret_mean": 0.026423446673068573
    },
    {
      "fold": 1,
      "group_by": "instance",
      "selected_threshold": 0.12444444444444444,
      "selection_criterion": "minimize train_regret_mean, tie-break by smaller threshold",
      "test_accuracy": 0.7647058823529411,
      "test_groups": [
        2,
        7,
        12
      ],
      "test_regret_mean": 0.02367761872112828,
      "test_regret_median": 0.0,
      "test_regret_q90": 0.044644806013915114,
      "train_accuracy": 0.7521865889212828,
      "train_groups": [
        1,
        3,
        4,
        5,
        6,
        8,
        9,
        10,
        11,
        13,
        14,
        15
      ],
      "train_label_berw_rate": 0.5043731778425656,
      "train_regret_mean": 0.02457056989648753
    },
    {
      "fold": 2,
      "group_by": "instance",
      "selected_threshold": 0.12444444444444444,
      "selection_criterion": "minimize train_regret_mean, tie-break by smaller threshold",
      "test_accuracy": 0.7647058823529411,
      "test_groups": [
        3,
        8,
        13
      ],
      "test_regret_mean": 0.033613443451571266,
      "test_regret_median": 0.0,
      "test_regret_q90": 0.10054145346537748,
      "train_accuracy": 0.7521865889212828,
      "train_groups": [
        1,
        2,
        4,
        5,
        6,
        7,
        9,
        10,
        11,
        12,
        14,
        15
      ],
      "train_label_berw_rate": 0.4868804664723032,
      "train_regret_mean": 0.02210833927815618
    },
    {
      "fold": 3,
      "group_by": "instance",
      "selected_threshold": 0.17777777777777776,
      "selection_criterion": "minimize train_regret_mean, tie-break by smaller threshold",
      "test_accuracy": 0.686046511627907,
      "test_groups": [
        4,
        9,
        14
      ],
      "test_regret_mean": 0.04878715133774088,
      "test_regret_median": 0.0,
      "test_regret_q90": 0.059188261556505695,
      "train_accuracy": 0.7807017543859649,
      "train_groups": [
        1,
        2,
        3,
        5,
        6,
        7,
        8,
        10,
        11,
        12,
        13,
        15
      ],
      "train_label_berw_rate": 0.49415204678362573,
      "train_regret_mean": 0.02219327254725107
    },
    {
      "fold": 4,
      "group_by": "instance",
      "selected_threshold": 0.12444444444444444,
      "selection_criterion": "minimize train_regret_mean, tie-break by smaller threshold",
      "test_accuracy": 0.7674418604651163,
      "test_groups": [
        5,
        10,
        15
      ],
      "test_regret_mean": 0.019575320010720865,
      "test_regret_median": 0.0,
      "test_regret_q90": 0.040490294688286466,
      "train_accuracy": 0.7514619883040936,
      "train_groups": [
        1,
        2,
        3,
        4,
        6,
        7,
        8,
        9,
        11,
        12,
        13,
        14
      ],
      "train_label_berw_rate": 0.48830409356725146,
      "train_regret_mean": 0.025604753055172902
    }
  ],
  "probe_key": "misranking_rd",
  "selection": "regret_mean_then_threshold"
}