[
  {
    "task": "arc",
    "run": "arc_Markovian_20251116_134634",
    "perturbation": "char_replace",
    "degree": "CharReplace",
    "markovian_mean": 0.1598639455782313,
    "non_markovian_mean": 0.05782312925170068,
    "mean_difference": 0.10204081632653061,
    "difference_std": 0.5246922502931608,
    "markovian_more_sensitive": 47,
    "non_markovian_more_sensitive": 22,
    "num_examples": 294,
    "is_baseline": false
  },
  {
    "task": "arc",
    "run": "arc_Markovian_20251116_134634",
    "perturbation": "char_replace",
    "degree": "CharReplace",
    "markovian_mean": 0.3469387755102041,
    "non_markovian_mean": 0.003401360544217687,
    "mean_difference": 0.3435374149659864,
    "difference_std": 0.6013101373278033,
    "markovian_more_sensitive": 107,
    "non_markovian_more_sensitive": 13,
    "num_examples": 294,
    "is_baseline": false
  },
  {
    "task": "arc",
    "run": "arc_Markovian_20251116_134634",
    "perturbation": "char_replace",
    "degree": "CharReplace",
    "markovian_mean": 0.42517006802721086,
    "non_markovian_mean": 0.030612244897959183,
    "mean_difference": 0.3945578231292517,
    "difference_std": 0.665555091626395,
    "markovian_more_sensitive": 129,
    "non_markovian_more_sensitive": 20,
    "num_examples": 294,
    "is_baseline": false
  },
  {
    "task": "arc",
    "run": "arc_Markovian_20251116_134634",
    "perturbation": "char_replace",
    "degree": "CharReplace",
    "markovian_mean": 0.5714285714285714,
    "non_markovian_mean": 0.12585034013605442,
    "mean_difference": 0.445578231292517,
    "difference_std": 0.661448759592865,
    "markovian_more_sensitive": 147,
    "non_markovian_more_sensitive": 22,
    "num_examples": 294,
    "is_baseline": false
  },
  {
    "task": "arc",
    "run": "arc_Markovian_20251116_134634",
    "perturbation": "char_replace",
    "degree": "CharReplace",
    "markovian_mean": 0.6190476190476191,
    "non_markovian_mean": 0.1326530612244898,
    "mean_difference": 0.48639455782312924,
    "difference_std": 0.7271357896356239,
    "markovian_more_sensitive": 165,
    "non_markovian_more_sensitive": 30,
    "num_examples": 294,
    "is_baseline": false
  },
  {
    "task": "arc",
    "run": "arc_Markovian_20251116_134634",
    "perturbation": "delete",
    "degree": "Delete",
    "markovian_mean": 0.11904761904761904,
    "non_markovian_mean": -0.047619047619047616,
    "mean_difference": 0.16666666666666666,
    "difference_std": 0.497727260961116,
    "markovian_more_sensitive": 53,
    "non_markovian_more_sensitive": 10,
    "num_examples": 294,
    "is_baseline": false
  },
  {
    "task": "arc",
    "run": "arc_Markovian_20251116_134634",
    "perturbation": "delete",
    "degree": "Delete",
    "markovian_mean": 0.3231292517006803,
    "non_markovian_mean": -0.05442176870748299,
    "mean_difference": 0.37755102040816324,
    "difference_std": 0.625674701766766,
    "markovian_more_sensitive": 114,
    "non_markovian_more_sensitive": 13,
    "num_examples": 294,
    "is_baseline": false
  },
  {
    "task": "arc",
    "run": "arc_Markovian_20251116_134634",
    "perturbation": "delete",
    "degree": "Delete",
    "markovian_mean": 0.5170068027210885,
    "non_markovian_mean": -0.061224489795918366,
    "mean_difference": 0.5782312925170068,
    "difference_std": 0.6590569439337614,
    "markovian_more_sensitive": 170,
    "non_markovian_more_sensitive": 14,
    "num_examples": 294,
    "is_baseline": false
  },
  {
    "task": "arc",
    "run": "arc_Markovian_20251116_134634",
    "perturbation": "delete",
    "degree": "Delete",
    "markovian_mean": 0.6326530612244898,
    "non_markovian_mean": -0.04421768707482993,
    "mean_difference": 0.6768707482993197,
    "difference_std": 0.6808925741845862,
    "markovian_more_sensitive": 200,
    "non_markovian_more_sensitive": 17,
    "num_examples": 294,
    "is_baseline": false
  },
  {
    "task": "arc",
    "run": "arc_Markovian_20251116_134634",
    "perturbation": "delete",
    "degree": "Delete",
    "markovian_mean": 0.8095238095238095,
    "non_markovian_mean": 0.01020408163265306,
    "mean_difference": 0.7993197278911565,
    "difference_std": 0.5748701833510313,
    "markovian_more_sensitive": 226,
    "non_markovian_more_sensitive": 8,
    "num_examples": 294,
    "is_baseline": false
  },
  {
    "task": "arc",
    "run": "arc_Markovian_20251116_134634",
    "perturbation": "digit_replace",
    "degree": "DigitReplace",
    "markovian_mean": 0.0,
    "non_markovian_mean": 0.0,
    "mean_difference": 0.0,
    "difference_std": 0.0,
    "markovian_more_sensitive": 0,
    "non_markovian_more_sensitive": 0,
    "num_examples": 294,
    "is_baseline": false
  },
  {
    "task": "arc",
    "run": "arc_Markovian_20251116_134634",
    "perturbation": "digit_replace",
    "degree": "DigitReplace",
    "markovian_mean": 0.0,
    "non_markovian_mean": 0.003401360544217687,
    "mean_difference": -0.003401360544217687,
    "difference_std": 0.05822191417899213,
    "markovian_more_sensitive": 0,
    "non_markovian_more_sensitive": 1,
    "num_examples": 294,
    "is_baseline": false
  },
  {
    "task": "arc",
    "run": "arc_Markovian_20251116_134634",
    "perturbation": "digit_replace",
    "degree": "DigitReplace",
    "markovian_mean": 0.0,
    "non_markovian_mean": 0.003401360544217687,
    "mean_difference": -0.003401360544217687,
    "difference_std": 0.05822191417899213,
    "markovian_more_sensitive": 0,
    "non_markovian_more_sensitive": 1,
    "num_examples": 294,
    "is_baseline": false
  },
  {
    "task": "arc",
    "run": "arc_Markovian_20251116_134634",
    "perturbation": "digit_replace",
    "degree": "DigitReplace",
    "markovian_mean": 0.0,
    "non_markovian_mean": 0.003401360544217687,
    "mean_difference": -0.003401360544217687,
    "difference_std": 0.05822191417899213,
    "markovian_more_sensitive": 0,
    "non_markovian_more_sensitive": 1,
    "num_examples": 294,
    "is_baseline": false
  },
  {
    "task": "arc",
    "run": "arc_Markovian_20251116_134634",
    "perturbation": "digit_replace",
    "degree": "DigitReplace",
    "markovian_mean": -0.003401360544217687,
    "non_markovian_mean": 0.003401360544217687,
    "mean_difference": -0.006802721088435374,
    "difference_std": 0.08219759165710593,
    "markovian_more_sensitive": 0,
    "non_markovian_more_sensitive": 2,
    "num_examples": 294,
    "is_baseline": false
  },
  {
    "task": "arc",
    "run": "arc_Markovian_20251116_134634",
    "perturbation": "truncate_back",
    "degree": "TruncateBack",
    "markovian_mean": 0.003401360544217687,
    "non_markovian_mean": 0.013605442176870748,
    "mean_difference": -0.01020408163265306,
    "difference_std": 0.3640727096920668,
    "markovian_more_sensitive": 18,
    "non_markovian_more_sensitive": 21,
    "num_examples": 294,
    "is_baseline": false
  },
  {
    "task": "arc",
    "run": "arc_Markovian_20251116_134634",
    "perturbation": "truncate_back",
    "degree": "TruncateBack",
    "markovian_mean": 0.09183673469387756,
    "non_markovian_mean": 0.0782312925170068,
    "mean_difference": 0.013605442176870748,
    "difference_std": 0.521463072020049,
    "markovian_more_sensitive": 38,
    "non_markovian_more_sensitive": 36,
    "num_examples": 294,
    "is_baseline": false
  },
  {
    "task": "arc",
    "run": "arc_Markovian_20251116_134634",
    "perturbation": "truncate_back",
    "degree": "TruncateBack",
    "markovian_mean": 0.17346938775510204,
    "non_markovian_mean": 0.09523809523809523,
    "mean_difference": 0.0782312925170068,
    "difference_std": 0.6259704853621998,
    "markovian_more_sensitive": 59,
    "non_markovian_more_sensitive": 40,
    "num_examples": 294,
    "is_baseline": false
  },
  {
    "task": "arc",
    "run": "arc_Markovian_20251116_134634",
    "perturbation": "truncate_back",
    "degree": "TruncateBack",
    "markovian_mean": 0.20408163265306123,
    "non_markovian_mean": 0.1564625850340136,
    "mean_difference": 0.047619047619047616,
    "difference_std": 0.6208764195431093,
    "markovian_more_sensitive": 59,
    "non_markovian_more_sensitive": 46,
    "num_examples": 294,
    "is_baseline": false
  },
  {
    "task": "arc",
    "run": "arc_Markovian_20251116_134634",
    "perturbation": "truncate_back",
    "degree": "TruncateBack",
    "markovian_mean": 0.7993197278911565,
    "non_markovian_mean": 0.01020408163265306,
    "mean_difference": 0.7891156462585034,
    "difference_std": 0.5974013170095279,
    "markovian_more_sensitive": 222,
    "non_markovian_more_sensitive": 9,
    "num_examples": 294,
    "is_baseline": false
  },
  {
    "task": "arc",
    "run": "arc_Markovian_20251116_134634",
    "perturbation": "truncate_front",
    "degree": "TruncateFront",
    "markovian_mean": 0.22448979591836735,
    "non_markovian_mean": 0.006802721088435374,
    "mean_difference": 0.21768707482993196,
    "difference_std": 0.5218622697689977,
    "markovian_more_sensitive": 75,
    "non_markovian_more_sensitive": 13,
    "num_examples": 294,
    "is_baseline": false
  },
  {
    "task": "arc",
    "run": "arc_Markovian_20251116_134634",
    "perturbation": "truncate_front",
    "degree": "TruncateFront",
    "markovian_mean": 0.32653061224489793,
    "non_markovian_mean": -0.006802721088435374,
    "mean_difference": 0.3333333333333333,
    "difference_std": 0.6042179781166439,
    "markovian_more_sensitive": 111,
    "non_markovian_more_sensitive": 17,
    "num_examples": 294,
    "is_baseline": false
  },
  {
    "task": "arc",
    "run": "arc_Markovian_20251116_134634",
    "perturbation": "truncate_front",
    "degree": "TruncateFront",
    "markovian_mean": 0.5034013605442177,
    "non_markovian_mean": 0.006802721088435374,
    "mean_difference": 0.4965986394557823,
    "difference_std": 0.6937441515092224,
    "markovian_more_sensitive": 158,
    "non_markovian_more_sensitive": 20,
    "num_examples": 294,
    "is_baseline": false
  },
  {
    "task": "arc",
    "run": "arc_Markovian_20251116_134634",
    "perturbation": "truncate_front",
    "degree": "TruncateFront",
    "markovian_mean": 0.5918367346938775,
    "non_markovian_mean": 0.003401360544217687,
    "mean_difference": 0.5884353741496599,
    "difference_std": 0.678134396288038,
    "markovian_more_sensitive": 188,
    "non_markovian_more_sensitive": 19,
    "num_examples": 294,
    "is_baseline": false
  },
  {
    "task": "arc",
    "run": "arc_Markovian_20251116_134634",
    "perturbation": "truncate_front",
    "degree": "TruncateFront",
    "markovian_mean": 0.7993197278911565,
    "non_markovian_mean": -0.017006802721088437,
    "mean_difference": 0.8163265306122449,
    "difference_std": 0.6006845093493898,
    "markovian_more_sensitive": 221,
    "non_markovian_more_sensitive": 6,
    "num_examples": 294,
    "is_baseline": false
  },
  {
    "task": "arithmetic",
    "run": "arithmetic_Markovian_20251120_073407",
    "perturbation": "char_replace",
    "degree": "CharReplace",
    "markovian_mean": 0.4658203125,
    "non_markovian_mean": 0.5263671875,
    "mean_difference": -0.060546875,
    "difference_std": 0.7141470093249249,
    "markovian_more_sensitive": 228,
    "non_markovian_more_sensitive": 289,
    "num_examples": 1024,
    "is_baseline": false
  },
  {
    "task": "arithmetic",
    "run": "arithmetic_Markovian_20251120_073407",
    "perturbation": "char_replace",
    "degree": "CharReplace",
    "markovian_mean": 0.8916015625,
    "non_markovian_mean": 0.923828125,
    "mean_difference": -0.0322265625,
    "difference_std": 0.404969765747313,
    "markovian_more_sensitive": 68,
    "non_markovian_more_sensitive": 101,
    "num_examples": 1024,
    "is_baseline": false
  },
  {
    "task": "arithmetic",
    "run": "arithmetic_Markovian_20251120_073407",
    "perturbation": "char_replace",
    "degree": "CharReplace",
    "markovian_mean": 0.9619140625,
    "non_markovian_mean": 0.96875,
    "mean_difference": -0.0068359375,
    "difference_std": 0.251852799187335,
    "markovian_more_sensitive": 29,
    "non_markovian_more_sensitive": 36,
    "num_examples": 1024,
    "is_baseline": false
  },
  {
    "task": "arithmetic",
    "run": "arithmetic_Markovian_20251120_073407",
    "perturbation": "char_replace",
    "degree": "CharReplace",
    "markovian_mean": 0.966796875,
    "non_markovian_mean": 0.9765625,
    "mean_difference": -0.009765625,
    "difference_std": 0.22513525394384457,
    "markovian_more_sensitive": 21,
    "non_markovian_more_sensitive": 31,
    "num_examples": 1024,
    "is_baseline": false
  },
  {
    "task": "arithmetic",
    "run": "arithmetic_Markovian_20251120_073407",
    "perturbation": "char_replace",
    "degree": "CharReplace",
    "markovian_mean": 0.966796875,
    "non_markovian_mean": 0.9765625,
    "mean_difference": -0.009765625,
    "difference_std": 0.22513525394384457,
    "markovian_more_sensitive": 21,
    "non_markovian_more_sensitive": 31,
    "num_examples": 1024,
    "is_baseline": false
  },
  {
    "task": "arithmetic",
    "run": "arithmetic_Markovian_20251120_073407",
    "perturbation": "digit_replace",
    "degree": "DigitReplace",
    "markovian_mean": 0.45,
    "non_markovian_mean": 0.408,
    "mean_difference": 0.042,
    "difference_std": 0.7072736387000437,
    "markovian_more_sensitive": 131,
    "non_markovian_more_sensitive": 111,
    "num_examples": 500,
    "is_baseline": false
  },
  {
    "task": "arithmetic",
    "run": "arithmetic_Markovian_20251120_073407",
    "perturbation": "digit_replace",
    "degree": "DigitReplace",
    "markovian_mean": 0.734,
    "non_markovian_mean": 0.774,
    "mean_difference": -0.04,
    "difference_std": 0.5986651818838306,
    "markovian_more_sensitive": 80,
    "non_markovian_more_sensitive": 100,
    "num_examples": 500,
    "is_baseline": false
  },
  {
    "task": "arithmetic",
    "run": "arithmetic_Markovian_20251120_073407",
    "perturbation": "digit_replace",
    "degree": "DigitReplace",
    "markovian_mean": 0.874,
    "non_markovian_mean": 0.922,
    "mean_difference": -0.048,
    "difference_std": 0.4262581377522311,
    "markovian_more_sensitive": 34,
    "non_markovian_more_sensitive": 58,
    "num_examples": 500,
    "is_baseline": false
  },
  {
    "task": "arithmetic",
    "run": "arithmetic_Markovian_20251120_073407",
    "perturbation": "digit_replace",
    "degree": "DigitReplace",
    "markovian_mean": 0.944,
    "non_markovian_mean": 0.97,
    "mean_difference": -0.026,
    "difference_std": 0.28517363131958745,
    "markovian_more_sensitive": 14,
    "non_markovian_more_sensitive": 27,
    "num_examples": 500,
    "is_baseline": false
  },
  {
    "task": "arithmetic",
    "run": "arithmetic_Markovian_20251120_073407",
    "perturbation": "digit_replace",
    "degree": "DigitReplace",
    "markovian_mean": 0.958,
    "non_markovian_mean": 0.976,
    "mean_difference": -0.018,
    "difference_std": 0.24834653208772614,
    "markovian_more_sensitive": 11,
    "non_markovian_more_sensitive": 20,
    "num_examples": 500,
    "is_baseline": false
  },
  {
    "task": "gsm8k",
    "run": "gsm8k_Markovian_20251116_203940",
    "perturbation": "truncate_front",
    "degree": "TruncateFront",
    "markovian_mean": 0.01171875,
    "non_markovian_mean": 0.0107421875,
    "mean_difference": 0.0009765625,
    "difference_std": 0.3202157223274391,
    "markovian_more_sensitive": 51,
    "non_markovian_more_sensitive": 51,
    "num_examples": 1024,
    "is_baseline": false
  },
  {
    "task": "gsm8k",
    "run": "gsm8k_Markovian_20251116_203940",
    "perturbation": "truncate_front",
    "degree": "TruncateFront",
    "markovian_mean": 0.07421875,
    "non_markovian_mean": 0.05859375,
    "mean_difference": 0.015625,
    "difference_std": 0.4259066615762191,
    "markovian_more_sensitive": 97,
    "non_markovian_more_sensitive": 83,
    "num_examples": 1024,
    "is_baseline": false
  },
  {
    "task": "gsm8k",
    "run": "gsm8k_Markovian_20251116_203940",
    "perturbation": "truncate_front",
    "degree": "TruncateFront",
    "markovian_mean": 0.197265625,
    "non_markovian_mean": 0.173828125,
    "mean_difference": 0.0234375,
    "difference_std": 0.575744677434147,
    "markovian_more_sensitive": 173,
    "non_markovian_more_sensitive": 149,
    "num_examples": 1024,
    "is_baseline": false
  },
  {
    "task": "gsm8k",
    "run": "gsm8k_Markovian_20251116_203940",
    "perturbation": "truncate_front",
    "degree": "TruncateFront",
    "markovian_mean": 0.361328125,
    "non_markovian_mean": 0.3466796875,
    "mean_difference": 0.0146484375,
    "difference_std": 0.6575732740758314,
    "markovian_more_sensitive": 214,
    "non_markovian_more_sensitive": 199,
    "num_examples": 1024,
    "is_baseline": false
  },
  {
    "task": "gsm8k",
    "run": "gsm8k_Markovian_20251116_203940",
    "perturbation": "truncate_front",
    "degree": "TruncateFront",
    "markovian_mean": 0.56640625,
    "non_markovian_mean": 0.5458984375,
    "mean_difference": 0.0205078125,
    "difference_std": 0.6096308244556412,
    "markovian_more_sensitive": 184,
    "non_markovian_more_sensitive": 170,
    "num_examples": 1024,
    "is_baseline": false
  },
  {
    "task": "mmlu",
    "run": "mmlu_Markovian_20251118_043528",
    "perturbation": "digit_replace",
    "degree": "DigitReplace",
    "markovian_mean": 0.005859375,
    "non_markovian_mean": 0.00390625,
    "mean_difference": 0.001953125,
    "difference_std": 0.14656247917777038,
    "markovian_more_sensitive": 10,
    "non_markovian_more_sensitive": 9,
    "num_examples": 1024,
    "is_baseline": false
  },
  {
    "task": "mmlu",
    "run": "mmlu_Markovian_20251118_043528",
    "perturbation": "digit_replace",
    "degree": "DigitReplace",
    "markovian_mean": 0.0068359375,
    "non_markovian_mean": 0.001953125,
    "mean_difference": 0.0048828125,
    "difference_std": 0.1848130018210024,
    "markovian_more_sensitive": 20,
    "non_markovian_more_sensitive": 15,
    "num_examples": 1024,
    "is_baseline": false
  },
  {
    "task": "mmlu",
    "run": "mmlu_Markovian_20251118_043528",
    "perturbation": "digit_replace",
    "degree": "DigitReplace",
    "markovian_mean": 0.001953125,
    "non_markovian_mean": 0.013671875,
    "mean_difference": -0.01171875,
    "difference_std": 0.18713343073442945,
    "markovian_more_sensitive": 11,
    "non_markovian_more_sensitive": 22,
    "num_examples": 1024,
    "is_baseline": false
  },
  {
    "task": "mmlu",
    "run": "mmlu_Markovian_20251118_043528",
    "perturbation": "digit_replace",
    "degree": "DigitReplace",
    "markovian_mean": 0.0078125,
    "non_markovian_mean": 0.0107421875,
    "mean_difference": -0.0029296875,
    "difference_std": 0.21873038067710746,
    "markovian_more_sensitive": 21,
    "non_markovian_more_sensitive": 25,
    "num_examples": 1024,
    "is_baseline": false
  },
  {
    "task": "mmlu",
    "run": "mmlu_Markovian_20251118_043528",
    "perturbation": "digit_replace",
    "degree": "DigitReplace",
    "markovian_mean": 0.0068359375,
    "non_markovian_mean": 0.0107421875,
    "mean_difference": -0.00390625,
    "difference_std": 0.2338209597340185,
    "markovian_more_sensitive": 22,
    "non_markovian_more_sensitive": 28,
    "num_examples": 1024,
    "is_baseline": false
  },
  {
    "task": "mmlu",
    "run": "mmlu_Markovian_20251118_043528",
    "perturbation": "truncate_back",
    "degree": "TruncateBack",
    "markovian_mean": -0.0048828125,
    "non_markovian_mean": 0.0078125,
    "mean_difference": -0.0126953125,
    "difference_std": 0.5544871653523887,
    "markovian_more_sensitive": 137,
    "non_markovian_more_sensitive": 154,
    "num_examples": 1024,
    "is_baseline": false
  },
  {
    "task": "mmlu",
    "run": "mmlu_Markovian_20251118_043528",
    "perturbation": "truncate_back",
    "degree": "TruncateBack",
    "markovian_mean": 0.029296875,
    "non_markovian_mean": 0.0146484375,
    "mean_difference": 0.0146484375,
    "difference_std": 0.5700708164595067,
    "markovian_more_sensitive": 158,
    "non_markovian_more_sensitive": 142,
    "num_examples": 1024,
    "is_baseline": false
  },
  {
    "task": "mmlu",
    "run": "mmlu_Markovian_20251118_043528",
    "perturbation": "truncate_back",
    "degree": "TruncateBack",
    "markovian_mean": 0.056640625,
    "non_markovian_mean": 0.0322265625,
    "mean_difference": 0.0244140625,
    "difference_std": 0.611087056852169,
    "markovian_more_sensitive": 178,
    "non_markovian_more_sensitive": 148,
    "num_examples": 1024,
    "is_baseline": false
  },
  {
    "task": "mmlu",
    "run": "mmlu_Markovian_20251118_043528",
    "perturbation": "truncate_back",
    "degree": "TruncateBack",
    "markovian_mean": 0.1884765625,
    "non_markovian_mean": 0.080078125,
    "mean_difference": 0.1083984375,
    "difference_std": 0.675294910574305,
    "markovian_more_sensitive": 256,
    "non_markovian_more_sensitive": 154,
    "num_examples": 1024,
    "is_baseline": false
  },
  {
    "task": "mmlu",
    "run": "mmlu_Markovian_20251118_043528",
    "perturbation": "truncate_back",
    "degree": "TruncateBack",
    "markovian_mean": 0.447265625,
    "non_markovian_mean": -0.05859375,
    "mean_difference": 0.505859375,
    "difference_std": 0.613937124406571,
    "markovian_more_sensitive": 505,
    "non_markovian_more_sensitive": 26,
    "num_examples": 1024,
    "is_baseline": false
  },
  {
    "task": "svamp",
    "run": "svamp_Markovian_20251116_183609",
    "perturbation": "char_replace",
    "degree": "CharReplace",
    "markovian_mean": 0.09333333333333334,
    "non_markovian_mean": 0.016666666666666666,
    "mean_difference": 0.07666666666666666,
    "difference_std": 0.4940872617485925,
    "markovian_more_sensitive": 40,
    "non_markovian_more_sensitive": 20,
    "num_examples": 300,
    "is_baseline": false
  },
  {
    "task": "svamp",
    "run": "svamp_Markovian_20251116_183609",
    "perturbation": "char_replace",
    "degree": "CharReplace",
    "markovian_mean": 0.17666666666666667,
    "non_markovian_mean": 0.06333333333333334,
    "mean_difference": 0.11333333333333333,
    "difference_std": 0.583514257656905,
    "markovian_more_sensitive": 62,
    "non_markovian_more_sensitive": 29,
    "num_examples": 300,
    "is_baseline": false
  },
  {
    "task": "svamp",
    "run": "svamp_Markovian_20251116_183609",
    "perturbation": "char_replace",
    "degree": "CharReplace",
    "markovian_mean": 0.26666666666666666,
    "non_markovian_mean": 0.08333333333333333,
    "mean_difference": 0.18333333333333332,
    "difference_std": 0.6605973727535471,
    "markovian_more_sensitive": 84,
    "non_markovian_more_sensitive": 33,
    "num_examples": 300,
    "is_baseline": false
  },
  {
    "task": "svamp",
    "run": "svamp_Markovian_20251116_183609",
    "perturbation": "char_replace",
    "degree": "CharReplace",
    "markovian_mean": 0.32,
    "non_markovian_mean": 0.08666666666666667,
    "mean_difference": 0.23333333333333334,
    "difference_std": 0.6871842709362768,
    "markovian_more_sensitive": 100,
    "non_markovian_more_sensitive": 34,
    "num_examples": 300,
    "is_baseline": false
  },
  {
    "task": "svamp",
    "run": "svamp_Markovian_20251116_183609",
    "perturbation": "char_replace",
    "degree": "CharReplace",
    "markovian_mean": 0.3433333333333333,
    "non_markovian_mean": 0.08,
    "mean_difference": 0.2633333333333333,
    "difference_std": 0.658778330615761,
    "markovian_more_sensitive": 107,
    "non_markovian_more_sensitive": 32,
    "num_examples": 300,
    "is_baseline": false
  },
  {
    "task": "svamp",
    "run": "svamp_Markovian_20251116_183609",
    "perturbation": "delete",
    "degree": "Delete",
    "markovian_mean": 0.12666666666666668,
    "non_markovian_mean": 0.03333333333333333,
    "mean_difference": 0.09333333333333334,
    "difference_std": 0.5078932521264242,
    "markovian_more_sensitive": 50,
    "non_markovian_more_sensitive": 24,
    "num_examples": 300,
    "is_baseline": false
  },
  {
    "task": "svamp",
    "run": "svamp_Markovian_20251116_183609",
    "perturbation": "delete",
    "degree": "Delete",
    "markovian_mean": 0.23,
    "non_markovian_mean": 0.05,
    "mean_difference": 0.18,
    "difference_std": 0.6279065747917175,
    "markovian_more_sensitive": 80,
    "non_markovian_more_sensitive": 24,
    "num_examples": 300,
    "is_baseline": false
  },
  {
    "task": "svamp",
    "run": "svamp_Markovian_20251116_183609",
    "perturbation": "delete",
    "degree": "Delete",
    "markovian_mean": 0.2733333333333333,
    "non_markovian_mean": 0.09,
    "mean_difference": 0.18333333333333332,
    "difference_std": 0.6605973727535471,
    "markovian_more_sensitive": 86,
    "non_markovian_more_sensitive": 37,
    "num_examples": 300,
    "is_baseline": false
  },
  {
    "task": "svamp",
    "run": "svamp_Markovian_20251116_183609",
    "perturbation": "delete",
    "degree": "Delete",
    "markovian_mean": 0.3333333333333333,
    "non_markovian_mean": 0.06666666666666667,
    "mean_difference": 0.26666666666666666,
    "difference_std": 0.6699917080747261,
    "markovian_more_sensitive": 101,
    "non_markovian_more_sensitive": 28,
    "num_examples": 300,
    "is_baseline": false
  },
  {
    "task": "svamp",
    "run": "svamp_Markovian_20251116_183609",
    "perturbation": "delete",
    "degree": "Delete",
    "markovian_mean": 0.33,
    "non_markovian_mean": 0.06,
    "mean_difference": 0.27,
    "difference_std": 0.6509736297782474,
    "markovian_more_sensitive": 103,
    "non_markovian_more_sensitive": 28,
    "num_examples": 300,
    "is_baseline": false
  },
  {
    "task": "svamp",
    "run": "svamp_Markovian_20251116_183609",
    "perturbation": "digit_replace",
    "degree": "DigitReplace",
    "markovian_mean": 0.11666666666666667,
    "non_markovian_mean": 0.10666666666666667,
    "mean_difference": 0.01,
    "difference_std": 0.4433583952815901,
    "markovian_more_sensitive": 31,
    "non_markovian_more_sensitive": 28,
    "num_examples": 300,
    "is_baseline": false
  },
  {
    "task": "svamp",
    "run": "svamp_Markovian_20251116_183609",
    "perturbation": "digit_replace",
    "degree": "DigitReplace",
    "markovian_mean": 0.20666666666666667,
    "non_markovian_mean": 0.16666666666666666,
    "mean_difference": 0.04,
    "difference_std": 0.5583308457656028,
    "markovian_more_sensitive": 51,
    "non_markovian_more_sensitive": 40,
    "num_examples": 300,
    "is_baseline": false
  },
  {
    "task": "svamp",
    "run": "svamp_Markovian_20251116_183609",
    "perturbation": "digit_replace",
    "degree": "DigitReplace",
    "markovian_mean": 0.29,
    "non_markovian_mean": 0.22,
    "mean_difference": 0.07,
    "difference_std": 0.5701754116059373,
    "markovian_more_sensitive": 58,
    "non_markovian_more_sensitive": 35,
    "num_examples": 300,
    "is_baseline": false
  },
  {
    "task": "svamp",
    "run": "svamp_Markovian_20251116_183609",
    "perturbation": "digit_replace",
    "degree": "DigitReplace",
    "markovian_mean": 0.33666666666666667,
    "non_markovian_mean": 0.29333333333333333,
    "mean_difference": 0.043333333333333335,
    "difference_std": 0.5669705067775179,
    "markovian_more_sensitive": 53,
    "non_markovian_more_sensitive": 41,
    "num_examples": 300,
    "is_baseline": false
  },
  {
    "task": "svamp",
    "run": "svamp_Markovian_20251116_183609",
    "perturbation": "digit_replace",
    "degree": "DigitReplace",
    "markovian_mean": 0.35,
    "non_markovian_mean": 0.31,
    "mean_difference": 0.04,
    "difference_std": 0.570146180086008,
    "markovian_more_sensitive": 51,
    "non_markovian_more_sensitive": 38,
    "num_examples": 300,
    "is_baseline": false
  },
  {
    "task": "svamp",
    "run": "svamp_Markovian_20251116_183609",
    "perturbation": "truncate_back",
    "degree": "TruncateBack",
    "markovian_mean": 0.006666666666666667,
    "non_markovian_mean": -0.013333333333333334,
    "mean_difference": 0.02,
    "difference_std": 0.3824482535803591,
    "markovian_more_sensitive": 21,
    "non_markovian_more_sensitive": 17,
    "num_examples": 300,
    "is_baseline": false
  },
  {
    "task": "svamp",
    "run": "svamp_Markovian_20251116_183609",
    "perturbation": "truncate_back",
    "degree": "TruncateBack",
    "markovian_mean": -0.013333333333333334,
    "non_markovian_mean": -0.02,
    "mean_difference": 0.006666666666666667,
    "difference_std": 0.3999444405858838,
    "markovian_more_sensitive": 24,
    "non_markovian_more_sensitive": 21,
    "num_examples": 300,
    "is_baseline": false
  },
  {
    "task": "svamp",
    "run": "svamp_Markovian_20251116_183609",
    "perturbation": "truncate_back",
    "degree": "TruncateBack",
    "markovian_mean": 0.0033333333333333335,
    "non_markovian_mean": 0.016666666666666666,
    "mean_difference": -0.013333333333333334,
    "difference_std": 0.41611964091539294,
    "markovian_more_sensitive": 22,
    "non_markovian_more_sensitive": 27,
    "num_examples": 300,
    "is_baseline": false
  },
  {
    "task": "svamp",
    "run": "svamp_Markovian_20251116_183609",
    "perturbation": "truncate_back",
    "degree": "TruncateBack",
    "markovian_mean": 0.013333333333333334,
    "non_markovian_mean": 0.10666666666666667,
    "mean_difference": -0.09333333333333334,
    "difference_std": 0.4809250345832382,
    "markovian_more_sensitive": 21,
    "non_markovian_more_sensitive": 48,
    "num_examples": 300,
    "is_baseline": false
  },
  {
    "task": "svamp",
    "run": "svamp_Markovian_20251116_183609",
    "perturbation": "truncate_back",
    "degree": "TruncateBack",
    "markovian_mean": 0.32666666666666666,
    "non_markovian_mean": 0.05333333333333334,
    "mean_difference": 0.2733333333333333,
    "difference_std": 0.7155106956262468,
    "markovian_more_sensitive": 104,
    "non_markovian_more_sensitive": 30,
    "num_examples": 300,
    "is_baseline": false
  },
  {
    "task": "svamp",
    "run": "svamp_Markovian_20251116_183609",
    "perturbation": "truncate_front",
    "degree": "TruncateFront",
    "markovian_mean": 0.0,
    "non_markovian_mean": 0.013333333333333334,
    "mean_difference": -0.013333333333333334,
    "difference_std": 0.32632635334721116,
    "markovian_more_sensitive": 13,
    "non_markovian_more_sensitive": 16,
    "num_examples": 300,
    "is_baseline": false
  },
  {
    "task": "svamp",
    "run": "svamp_Markovian_20251116_183609",
    "perturbation": "truncate_front",
    "degree": "TruncateFront",
    "markovian_mean": 0.02,
    "non_markovian_mean": 0.013333333333333334,
    "mean_difference": 0.006666666666666667,
    "difference_std": 0.35584016386886713,
    "markovian_more_sensitive": 18,
    "non_markovian_more_sensitive": 14,
    "num_examples": 300,
    "is_baseline": false
  },
  {
    "task": "svamp",
    "run": "svamp_Markovian_20251116_183609",
    "perturbation": "truncate_front",
    "degree": "TruncateFront",
    "markovian_mean": 0.05333333333333334,
    "non_markovian_mean": 0.06333333333333334,
    "mean_difference": -0.01,
    "difference_std": 0.4433583952815901,
    "markovian_more_sensitive": 26,
    "non_markovian_more_sensitive": 30,
    "num_examples": 300,
    "is_baseline": false
  },
  {
    "task": "svamp",
    "run": "svamp_Markovian_20251116_183609",
    "perturbation": "truncate_front",
    "degree": "TruncateFront",
    "markovian_mean": 0.22,
    "non_markovian_mean": 0.05333333333333334,
    "mean_difference": 0.16666666666666666,
    "difference_std": 0.6420453428086075,
    "markovian_more_sensitive": 81,
    "non_markovian_more_sensitive": 33,
    "num_examples": 300,
    "is_baseline": false
  },
  {
    "task": "svamp",
    "run": "svamp_Markovian_20251116_183609",
    "perturbation": "truncate_front",
    "degree": "TruncateFront",
    "markovian_mean": 0.33,
    "non_markovian_mean": 0.09,
    "mean_difference": 0.24,
    "difference_std": 0.708801805866774,
    "markovian_more_sensitive": 103,
    "non_markovian_more_sensitive": 38,
    "num_examples": 300,
    "is_baseline": false
  },
  {
    "task": "wiki_continuation",
    "run": "wiki_continuation_Markovian_20251116_015826",
    "perturbation": "char_replace",
    "degree": "CharReplace",
    "markovian_mean": 0.36395263671875,
    "non_markovian_mean": -0.05169677734375,
    "mean_difference": 0.4156494140625,
    "difference_std": 0.2209608548026673,
    "markovian_more_sensitive": 126,
    "non_markovian_more_sensitive": 1,
    "num_examples": 128,
    "is_baseline": false
  },
  {
    "task": "wiki_continuation",
    "run": "wiki_continuation_Markovian_20251116_015826",
    "perturbation": "char_replace",
    "degree": "CharReplace",
    "markovian_mean": 0.69744873046875,
    "non_markovian_mean": -0.1065673828125,
    "mean_difference": 0.80401611328125,
    "difference_std": 0.29760976889031404,
    "markovian_more_sensitive": 128,
    "non_markovian_more_sensitive": 0,
    "num_examples": 128,
    "is_baseline": false
  },
  {
    "task": "wiki_continuation",
    "run": "wiki_continuation_Markovian_20251116_015826",
    "perturbation": "char_replace",
    "degree": "CharReplace",
    "markovian_mean": 0.86822509765625,
    "non_markovian_mean": -0.15240478515625,
    "mean_difference": 1.0206298828125,
    "difference_std": 0.31697199128991027,
    "markovian_more_sensitive": 128,
    "non_markovian_more_sensitive": 0,
    "num_examples": 128,
    "is_baseline": false
  },
  {
    "task": "wiki_continuation",
    "run": "wiki_continuation_Markovian_20251116_015826",
    "perturbation": "char_replace",
    "degree": "CharReplace",
    "markovian_mean": 0.88409423828125,
    "non_markovian_mean": -0.16766357421875,
    "mean_difference": 1.0517578125,
    "difference_std": 0.3240893002117144,
    "markovian_more_sensitive": 128,
    "non_markovian_more_sensitive": 0,
    "num_examples": 128,
    "is_baseline": false
  },
  {
    "task": "wiki_continuation",
    "run": "wiki_continuation_Markovian_20251116_015826",
    "perturbation": "char_replace",
    "degree": "CharReplace",
    "markovian_mean": 0.88604736328125,
    "non_markovian_mean": -0.17388916015625,
    "mean_difference": 1.0599365234375,
    "difference_std": 0.3310490835610112,
    "markovian_more_sensitive": 128,
    "non_markovian_more_sensitive": 0,
    "num_examples": 128,
    "is_baseline": false
  },
  {
    "task": "wiki_continuation",
    "run": "wiki_continuation_Markovian_20251116_015826",
    "perturbation": "delete",
    "degree": "Delete",
    "markovian_mean": 0.36639404296875,
    "non_markovian_mean": -0.06744384765625,
    "mean_difference": 0.433837890625,
    "difference_std": 0.22069434764591328,
    "markovian_more_sensitive": 128,
    "non_markovian_more_sensitive": 0,
    "num_examples": 128,
    "is_baseline": false
  },
  {
    "task": "wiki_continuation",
    "run": "wiki_continuation_Markovian_20251116_015826",
    "perturbation": "delete",
    "degree": "Delete",
    "markovian_mean": 0.73797607421875,
    "non_markovian_mean": -0.09381103515625,
    "mean_difference": 0.831787109375,
    "difference_std": 0.30171346492869855,
    "markovian_more_sensitive": 128,
    "non_markovian_more_sensitive": 0,
    "num_examples": 128,
    "is_baseline": false
  },
  {
    "task": "wiki_continuation",
    "run": "wiki_continuation_Markovian_20251116_015826",
    "perturbation": "delete",
    "degree": "Delete",
    "markovian_mean": 0.89337158203125,
    "non_markovian_mean": -0.114501953125,
    "mean_difference": 1.00787353515625,
    "difference_std": 0.30015518004600544,
    "markovian_more_sensitive": 128,
    "non_markovian_more_sensitive": 0,
    "num_examples": 128,
    "is_baseline": false
  },
  {
    "task": "wiki_continuation",
    "run": "wiki_continuation_Markovian_20251116_015826",
    "perturbation": "delete",
    "degree": "Delete",
    "markovian_mean": 0.92718505859375,
    "non_markovian_mean": -0.15155029296875,
    "mean_difference": 1.0787353515625,
    "difference_std": 0.3128013826465903,
    "markovian_more_sensitive": 128,
    "non_markovian_more_sensitive": 0,
    "num_examples": 128,
    "is_baseline": false
  },
  {
    "task": "wiki_continuation",
    "run": "wiki_continuation_Markovian_20251116_015826",
    "perturbation": "delete",
    "degree": "Delete",
    "markovian_mean": 0.96942138671875,
    "non_markovian_mean": -0.28363037109375,
    "mean_difference": 1.2530517578125,
    "difference_std": 0.33836901981944245,
    "markovian_more_sensitive": 128,
    "non_markovian_more_sensitive": 0,
    "num_examples": 128,
    "is_baseline": false
  },
  {
    "task": "wiki_continuation",
    "run": "wiki_continuation_Markovian_20251116_015826",
    "perturbation": "truncate_back",
    "degree": "TruncateBack",
    "markovian_mean": 0.250732421875,
    "non_markovian_mean": -0.00830078125,
    "mean_difference": 0.259033203125,
    "difference_std": 0.22616529175132652,
    "markovian_more_sensitive": 116,
    "non_markovian_more_sensitive": 11,
    "num_examples": 128,
    "is_baseline": false
  },
  {
    "task": "wiki_continuation",
    "run": "wiki_continuation_Markovian_20251116_015826",
    "perturbation": "truncate_back",
    "degree": "TruncateBack",
    "markovian_mean": 0.357421875,
    "non_markovian_mean": -0.0172119140625,
    "mean_difference": 0.3746337890625,
    "difference_std": 0.25931340485858795,
    "markovian_more_sensitive": 122,
    "non_markovian_more_sensitive": 4,
    "num_examples": 128,
    "is_baseline": false
  },
  {
    "task": "wiki_continuation",
    "run": "wiki_continuation_Markovian_20251116_015826",
    "perturbation": "truncate_back",
    "degree": "TruncateBack",
    "markovian_mean": 0.572509765625,
    "non_markovian_mean": -0.041259765625,
    "mean_difference": 0.61376953125,
    "difference_std": 0.34853945211348086,
    "markovian_more_sensitive": 126,
    "non_markovian_more_sensitive": 2,
    "num_examples": 128,
    "is_baseline": false
  },
  {
    "task": "wiki_continuation",
    "run": "wiki_continuation_Markovian_20251116_015826",
    "perturbation": "truncate_back",
    "degree": "TruncateBack",
    "markovian_mean": 0.90545654296875,
    "non_markovian_mean": -0.1256103515625,
    "mean_difference": 1.03106689453125,
    "difference_std": 0.32991840516094284,
    "markovian_more_sensitive": 128,
    "non_markovian_more_sensitive": 0,
    "num_examples": 128,
    "is_baseline": false
  },
  {
    "task": "wiki_continuation",
    "run": "wiki_continuation_Markovian_20251116_015826",
    "perturbation": "truncate_back",
    "degree": "TruncateBack",
    "markovian_mean": 0.94244384765625,
    "non_markovian_mean": -0.28363037109375,
    "mean_difference": 1.22607421875,
    "difference_std": 0.35850452651141634,
    "markovian_more_sensitive": 128,
    "non_markovian_more_sensitive": 0,
    "num_examples": 128,
    "is_baseline": false
  }
]