[
  {
    "dataset": "227_cpu_small",
    "baseline": "linreg",
    "sample_size": 1638,
    "mse": 0.0110940892,
    "mse_std": 0.0033707146,
    "aug_mse": 0.0110661763,
    "aug_mse_std": 0.0032597523,
    "delta_mse": 0.0418146246,
    "delta_mse_std": 2.2314908157,
    "p_wilcoxon": 0.4613932292,
    "p_wilcoxon_std": 0.1352050066,
    "should_proceed": false
  },
  {
    "dataset": "227_cpu_small",
    "baseline": "linreg",
    "sample_size": 3276,
    "mse": 0.0109345848,
    "mse_std": 0.0022293482,
    "aug_mse": 0.0110119898,
    "aug_mse_std": 0.0023403267,
    "delta_mse": 0.5832619461,
    "delta_mse_std": 1.5757413848,
    "p_wilcoxon": 0.50625,
    "p_wilcoxon_std": 0.1459716722,
    "should_proceed": false
  },
  {
    "dataset": "227_cpu_small",
    "baseline": "linreg",
    "sample_size": 4914,
    "mse": 0.009789339,
    "mse_std": 0.0011423725,
    "aug_mse": 0.0097840051,
    "aug_mse_std": 0.0011449126,
    "delta_mse": -0.0471015939,
    "delta_mse_std": 0.8810020365,
    "p_wilcoxon": 0.451953125,
    "p_wilcoxon_std": 0.1464488672,
    "should_proceed": false
  },
  {
    "dataset": "227_cpu_small",
    "baseline": "linreg",
    "sample_size": 6552,
    "mse": 0.0098336584,
    "mse_std": 0.0013936254,
    "aug_mse": 0.0098869204,
    "aug_mse_std": 0.0013979864,
    "delta_mse": 0.5498973778,
    "delta_mse_std": 0.7083916493,
    "p_wilcoxon": 0.5147135417,
    "p_wilcoxon_std": 0.113610483,
    "should_proceed": false
  },
  {
    "dataset": "227_cpu_small",
    "baseline": "linreg",
    "sample_size": 8190,
    "mse": 0.0097047149,
    "mse_std": 0.0013432156,
    "aug_mse": 0.0097089273,
    "aug_mse_std": 0.0013404891,
    "delta_mse": 0.0491080425,
    "delta_mse_std": 0.3822691654,
    "p_wilcoxon": 0.4559244792,
    "p_wilcoxon_std": 0.156842491,
    "should_proceed": false
  },
  {
    "dataset": "294_satellite_image",
    "baseline": "linreg",
    "sample_size": 1287,
    "mse": 0.04211874,
    "mse_std": 0.0025309515,
    "aug_mse": 0.0421849001,
    "aug_mse_std": 0.0025468422,
    "delta_mse": 0.1566989153,
    "delta_mse_std": 0.5528973624,
    "p_wilcoxon": 0.2395833333,
    "p_wilcoxon_std": 0.142800762,
    "should_proceed": false
  },
  {
    "dataset": "294_satellite_image",
    "baseline": "linreg",
    "sample_size": 2574,
    "mse": 0.0411477281,
    "mse_std": 0.0019544091,
    "aug_mse": 0.0411306657,
    "aug_mse_std": 0.0019506307,
    "delta_mse": -0.0404409272,
    "delta_mse_std": 0.2571218653,
    "p_wilcoxon": 0.2641927083,
    "p_wilcoxon_std": 0.1250706113,
    "should_proceed": false
  },
  {
    "dataset": "294_satellite_image",
    "baseline": "linreg",
    "sample_size": 3861,
    "mse": 0.0406462461,
    "mse_std": 0.0015029149,
    "aug_mse": 0.0406658744,
    "aug_mse_std": 0.0015220436,
    "delta_mse": 0.0466463671,
    "delta_mse_std": 0.1918511997,
    "p_wilcoxon": 0.2745442708,
    "p_wilcoxon_std": 0.0958782588,
    "should_proceed": false
  },
  {
    "dataset": "294_satellite_image",
    "baseline": "linreg",
    "sample_size": 5148,
    "mse": 0.0401539033,
    "mse_std": 0.0011770541,
    "aug_mse": 0.0401830392,
    "aug_mse_std": 0.0011458256,
    "delta_mse": 0.07503431,
    "delta_mse_std": 0.1923073618,
    "p_wilcoxon": 0.3925130208,
    "p_wilcoxon_std": 0.1419154955,
    "should_proceed": false
  },
  {
    "dataset": "294_satellite_image",
    "baseline": "linreg",
    "sample_size": 6435,
    "mse": 0.0404922127,
    "mse_std": 0.0011260921,
    "aug_mse": 0.0405093189,
    "aug_mse_std": 0.0011169414,
    "delta_mse": 0.0430095425,
    "delta_mse_std": 0.1784654288,
    "p_wilcoxon": 0.3465494792,
    "p_wilcoxon_std": 0.1196894732,
    "should_proceed": false
  },
  {
    "dataset": "503_wind",
    "baseline": "linreg",
    "sample_size": 1314,
    "mse": 0.0073353233,
    "mse_std": 0.0010128642,
    "aug_mse": 0.0073391599,
    "aug_mse_std": 0.0010089606,
    "delta_mse": 0.0590924408,
    "delta_mse_std": 0.3996893594,
    "p_wilcoxon": 0.5007161458,
    "p_wilcoxon_std": 0.1643182479,
    "should_proceed": false
  },
  {
    "dataset": "503_wind",
    "baseline": "linreg",
    "sample_size": 2628,
    "mse": 0.0063628879,
    "mse_std": 0.0005024885,
    "aug_mse": 0.0063677735,
    "aug_mse_std": 0.0005036327,
    "delta_mse": 0.0756496513,
    "delta_mse_std": 0.2082405002,
    "p_wilcoxon": 0.4680989583,
    "p_wilcoxon_std": 0.1081983459,
    "should_proceed": false
  },
  {
    "dataset": "503_wind",
    "baseline": "linreg",
    "sample_size": 3942,
    "mse": 0.0065797273,
    "mse_std": 0.0003799669,
    "aug_mse": 0.0065825079,
    "aug_mse_std": 0.000380527,
    "delta_mse": 0.0419633805,
    "delta_mse_std": 0.1494521485,
    "p_wilcoxon": 0.4930989583,
    "p_wilcoxon_std": 0.1122191515,
    "should_proceed": false
  },
  {
    "dataset": "503_wind",
    "baseline": "linreg",
    "sample_size": 5256,
    "mse": 0.0065833743,
    "mse_std": 0.0003249035,
    "aug_mse": 0.0065835699,
    "aug_mse_std": 0.0003264795,
    "delta_mse": 0.0019145248,
    "delta_mse_std": 0.1168131618,
    "p_wilcoxon": 0.4977213542,
    "p_wilcoxon_std": 0.0950997847,
    "should_proceed": false
  },
  {
    "dataset": "503_wind",
    "baseline": "linreg",
    "sample_size": 6570,
    "mse": 0.006175107,
    "mse_std": 0.0001940659,
    "aug_mse": 0.0061749633,
    "aug_mse_std": 0.0001915566,
    "delta_mse": -0.001071816,
    "delta_mse_std": 0.0895109168,
    "p_wilcoxon": 0.5284505208,
    "p_wilcoxon_std": 0.1285218912,
    "should_proceed": false
  },
  {
    "dataset": "623_fri_c4_1000_10",
    "baseline": "linreg",
    "sample_size": 200,
    "mse": 0.0232648214,
    "mse_std": 0.0038290412,
    "aug_mse": 0.0233173472,
    "aug_mse_std": 0.0037901543,
    "delta_mse": 0.2855557809,
    "delta_mse_std": 2.3425349252,
    "p_wilcoxon": 0.3063802083,
    "p_wilcoxon_std": 0.112905417,
    "should_proceed": false
  },
  {
    "dataset": "623_fri_c4_1000_10",
    "baseline": "linreg",
    "sample_size": 400,
    "mse": 0.022073479,
    "mse_std": 0.0021368129,
    "aug_mse": 0.022100939,
    "aug_mse_std": 0.0021396551,
    "delta_mse": 0.1283039489,
    "delta_mse_std": 0.992691457,
    "p_wilcoxon": 0.3651041667,
    "p_wilcoxon_std": 0.1227141182,
    "should_proceed": false
  },
  {
    "dataset": "623_fri_c4_1000_10",
    "baseline": "linreg",
    "sample_size": 600,
    "mse": 0.0213318212,
    "mse_std": 0.0018714406,
    "aug_mse": 0.0213583809,
    "aug_mse_std": 0.0018964355,
    "delta_mse": 0.1183012738,
    "delta_mse_std": 0.6099247036,
    "p_wilcoxon": 0.3853515625,
    "p_wilcoxon_std": 0.1498034567,
    "should_proceed": false
  },
  {
    "dataset": "623_fri_c4_1000_10",
    "baseline": "linreg",
    "sample_size": 800,
    "mse": 0.015924298,
    "mse_std": 0.0014803468,
    "aug_mse": 0.0159445719,
    "aug_mse_std": 0.00149579,
    "delta_mse": 0.1192765592,
    "delta_mse_std": 0.3351513214,
    "p_wilcoxon": 0.3809895833,
    "p_wilcoxon_std": 0.1461157979,
    "should_proceed": false
  },
  {
    "dataset": "623_fri_c4_1000_10",
    "baseline": "linreg",
    "sample_size": 1000,
    "mse": 0.0159081236,
    "mse_std": 0.0014144838,
    "aug_mse": 0.0159111666,
    "aug_mse_std": 0.001397432,
    "delta_mse": 0.0297049133,
    "delta_mse_std": 0.4823153945,
    "p_wilcoxon": 0.419140625,
    "p_wilcoxon_std": 0.1215042605,
    "should_proceed": false
  },
  {
    "dataset": "ConcreteCompressiveStrength",
    "baseline": "linreg",
    "sample_size": 201,
    "mse": 0.0166212878,
    "mse_std": 0.0040543563,
    "aug_mse": 0.0165918077,
    "aug_mse_std": 0.0040407184,
    "delta_mse": -0.1536110229,
    "delta_mse_std": 1.0887229896,
    "p_wilcoxon": 0.3625,
    "p_wilcoxon_std": 0.1356684921,
    "should_proceed": false
  },
  {
    "dataset": "ConcreteCompressiveStrength",
    "baseline": "linreg",
    "sample_size": 402,
    "mse": 0.0174689259,
    "mse_std": 0.0033542669,
    "aug_mse": 0.0174305145,
    "aug_mse_std": 0.0034312966,
    "delta_mse": -0.3341100129,
    "delta_mse_std": 1.1875850778,
    "p_wilcoxon": 0.3518229167,
    "p_wilcoxon_std": 0.1188758941,
    "should_proceed": false
  },
  {
    "dataset": "ConcreteCompressiveStrength",
    "baseline": "linreg",
    "sample_size": 603,
    "mse": 0.0173229342,
    "mse_std": 0.0018281598,
    "aug_mse": 0.017335804,
    "aug_mse_std": 0.0018981089,
    "delta_mse": 0.0322626782,
    "delta_mse_std": 0.9781743839,
    "p_wilcoxon": 0.4055338542,
    "p_wilcoxon_std": 0.1096858183,
    "should_proceed": false
  },
  {
    "dataset": "ConcreteCompressiveStrength",
    "baseline": "linreg",
    "sample_size": 804,
    "mse": 0.0167109284,
    "mse_std": 0.0021350115,
    "aug_mse": 0.0167263092,
    "aug_mse_std": 0.0021787603,
    "delta_mse": 0.057400278,
    "delta_mse_std": 0.6147496132,
    "p_wilcoxon": 0.451953125,
    "p_wilcoxon_std": 0.107030062,
    "should_proceed": false
  },
  {
    "dataset": "ConcreteCompressiveStrength",
    "baseline": "linreg",
    "sample_size": 1005,
    "mse": 0.0157189589,
    "mse_std": 0.001338983,
    "aug_mse": 0.0157217693,
    "aug_mse_std": 0.0013467696,
    "delta_mse": 0.0149323815,
    "delta_mse_std": 0.3166038586,
    "p_wilcoxon": 0.4774739583,
    "p_wilcoxon_std": 0.0934092567,
    "should_proceed": false
  },
  {
    "dataset": "EnergyEfficiency",
    "baseline": "linreg",
    "sample_size": 153,
    "mse": 0.0036204533,
    "mse_std": 0.001223493,
    "aug_mse": 0.0036498733,
    "aug_mse_std": 0.0012198347,
    "delta_mse": 1.0197718886,
    "delta_mse_std": 3.5445260423,
    "p_wilcoxon": 0.4129557292,
    "p_wilcoxon_std": 0.1650353514,
    "should_proceed": false
  },
  {
    "dataset": "EnergyEfficiency",
    "baseline": "linreg",
    "sample_size": 306,
    "mse": 0.0029279248,
    "mse_std": 0.0004556871,
    "aug_mse": 0.0029264035,
    "aug_mse_std": 0.0004568618,
    "delta_mse": -0.0322637537,
    "delta_mse_std": 1.3702446943,
    "p_wilcoxon": 0.3983072917,
    "p_wilcoxon_std": 0.1467934529,
    "should_proceed": false
  },
  {
    "dataset": "EnergyEfficiency",
    "baseline": "linreg",
    "sample_size": 459,
    "mse": 0.0028719115,
    "mse_std": 0.0004630585,
    "aug_mse": 0.0028729598,
    "aug_mse_std": 0.0004620655,
    "delta_mse": 0.0444935469,
    "delta_mse_std": 0.8467760033,
    "p_wilcoxon": 0.4534505208,
    "p_wilcoxon_std": 0.1560980164,
    "should_proceed": false
  },
  {
    "dataset": "EnergyEfficiency",
    "baseline": "linreg",
    "sample_size": 612,
    "mse": 0.0026151876,
    "mse_std": 0.0003218235,
    "aug_mse": 0.0026214068,
    "aug_mse_std": 0.0003151192,
    "delta_mse": 0.2894717721,
    "delta_mse_std": 1.1472807976,
    "p_wilcoxon": 0.4524088542,
    "p_wilcoxon_std": 0.1336602019,
    "should_proceed": false
  },
  {
    "dataset": "EnergyEfficiency",
    "baseline": "linreg",
    "sample_size": 765,
    "mse": 0.002666708,
    "mse_std": 0.0002095431,
    "aug_mse": 0.0026730324,
    "aug_mse_std": 0.0002201503,
    "delta_mse": 0.2087240915,
    "delta_mse_std": 0.7439430708,
    "p_wilcoxon": 0.4357421875,
    "p_wilcoxon_std": 0.0955689695,
    "should_proceed": false
  },
  {
    "dataset": "HousePrice",
    "baseline": "linreg",
    "sample_size": 200,
    "mse": 0.0001029389,
    "mse_std": 2.37431e-05,
    "aug_mse": 0.0001034825,
    "aug_mse_std": 2.28713e-05,
    "delta_mse": 0.7670996977,
    "delta_mse_std": 2.0061238926,
    "p_wilcoxon": 0.3436197917,
    "p_wilcoxon_std": 0.1132255985,
    "should_proceed": false
  },
  {
    "dataset": "HousePrice",
    "baseline": "linreg",
    "sample_size": 400,
    "mse": 0.0001004547,
    "mse_std": 1.63567e-05,
    "aug_mse": 0.0001005442,
    "aug_mse_std": 1.63102e-05,
    "delta_mse": 0.0991641673,
    "delta_mse_std": 0.7148298493,
    "p_wilcoxon": 0.4625,
    "p_wilcoxon_std": 0.1443150128,
    "should_proceed": false
  },
  {
    "dataset": "HousePrice",
    "baseline": "linreg",
    "sample_size": 600,
    "mse": 9.95404e-05,
    "mse_std": 1.38376e-05,
    "aug_mse": 9.9615e-05,
    "aug_mse_std": 1.39024e-05,
    "delta_mse": 0.0682471911,
    "delta_mse_std": 0.4785322491,
    "p_wilcoxon": 0.5150390625,
    "p_wilcoxon_std": 0.0889825116,
    "should_proceed": false
  },
  {
    "dataset": "HousePrice",
    "baseline": "linreg",
    "sample_size": 800,
    "mse": 0.0001039586,
    "mse_std": 1.0463e-05,
    "aug_mse": 0.0001039791,
    "aug_mse_std": 1.03469e-05,
    "delta_mse": 0.0301946653,
    "delta_mse_std": 0.3439412996,
    "p_wilcoxon": 0.4761067708,
    "p_wilcoxon_std": 0.1766136493,
    "should_proceed": false
  },
  {
    "dataset": "HousePrice",
    "baseline": "linreg",
    "sample_size": 1000,
    "mse": 0.0001033912,
    "mse_std": 1.16005e-05,
    "aug_mse": 0.0001036025,
    "aug_mse_std": 1.14638e-05,
    "delta_mse": 0.2248147552,
    "delta_mse_std": 0.6322725084,
    "p_wilcoxon": 0.4452473958,
    "p_wilcoxon_std": 0.1555883888,
    "should_proceed": false
  },
  {
    "dataset": "ParkinsonsTelemonitoring",
    "baseline": "linreg",
    "sample_size": 1175,
    "mse": 0.0047502111,
    "mse_std": 0.000417576,
    "aug_mse": 0.0047541546,
    "aug_mse_std": 0.0004189657,
    "delta_mse": 0.0820232078,
    "delta_mse_std": 0.386085737,
    "p_wilcoxon": 0.4248697917,
    "p_wilcoxon_std": 0.1597907998,
    "should_proceed": false
  },
  {
    "dataset": "ParkinsonsTelemonitoring",
    "baseline": "linreg",
    "sample_size": 2350,
    "mse": 0.0046715522,
    "mse_std": 0.0003608821,
    "aug_mse": 0.0046805646,
    "aug_mse_std": 0.0003708292,
    "delta_mse": 0.1792967092,
    "delta_mse_std": 0.539395542,
    "p_wilcoxon": 0.3333984375,
    "p_wilcoxon_std": 0.0964652636,
    "should_proceed": false
  },
  {
    "dataset": "ParkinsonsTelemonitoring",
    "baseline": "linreg",
    "sample_size": 3525,
    "mse": 0.0046513566,
    "mse_std": 0.0003598472,
    "aug_mse": 0.0046503584,
    "aug_mse_std": 0.0003563438,
    "delta_mse": -0.0151504661,
    "delta_mse_std": 0.2395372597,
    "p_wilcoxon": 0.3552083333,
    "p_wilcoxon_std": 0.103094334,
    "should_proceed": false
  },
  {
    "dataset": "ParkinsonsTelemonitoring",
    "baseline": "linreg",
    "sample_size": 4700,
    "mse": 0.0046175526,
    "mse_std": 0.000286521,
    "aug_mse": 0.004619636,
    "aug_mse_std": 0.000285307,
    "delta_mse": 0.0468796616,
    "delta_mse_std": 0.1880499121,
    "p_wilcoxon": 0.4492838542,
    "p_wilcoxon_std": 0.1109479681,
    "should_proceed": false
  },
  {
    "dataset": "ParkinsonsTelemonitoring",
    "baseline": "linreg",
    "sample_size": 5875,
    "mse": 0.0046547053,
    "mse_std": 0.000203748,
    "aug_mse": 0.0046550561,
    "aug_mse_std": 0.000201277,
    "delta_mse": 0.0099633854,
    "delta_mse_std": 0.1045584754,
    "p_wilcoxon": 0.4291666667,
    "p_wilcoxon_std": 0.0887299813,
    "should_proceed": false
  },
  {
    "dataset": "WineQuality",
    "baseline": "linreg",
    "sample_size": 1063,
    "mse": 0.0215258403,
    "mse_std": 0.0024625573,
    "aug_mse": 0.0215443125,
    "aug_mse_std": 0.0025056744,
    "delta_mse": 0.0659327808,
    "delta_mse_std": 0.8995365152,
    "p_wilcoxon": 0.3926432292,
    "p_wilcoxon_std": 0.0958023685,
    "should_proceed": false
  },
  {
    "dataset": "WineQuality",
    "baseline": "linreg",
    "sample_size": 2126,
    "mse": 0.0151255207,
    "mse_std": 0.0012008827,
    "aug_mse": 0.0151308288,
    "aug_mse_std": 0.0011900705,
    "delta_mse": 0.040714915,
    "delta_mse_std": 0.1862562724,
    "p_wilcoxon": 0.4520833333,
    "p_wilcoxon_std": 0.1223626534,
    "should_proceed": false
  },
  {
    "dataset": "WineQuality",
    "baseline": "linreg",
    "sample_size": 3189,
    "mse": 0.0154476112,
    "mse_std": 0.0007695238,
    "aug_mse": 0.0154606846,
    "aug_mse_std": 0.0007635953,
    "delta_mse": 0.0869432566,
    "delta_mse_std": 0.1909212092,
    "p_wilcoxon": 0.4430338542,
    "p_wilcoxon_std": 0.1020861567,
    "should_proceed": false
  },
  {
    "dataset": "WineQuality",
    "baseline": "linreg",
    "sample_size": 4252,
    "mse": 0.0148303728,
    "mse_std": 0.0010113357,
    "aug_mse": 0.0148392816,
    "aug_mse_std": 0.0010059435,
    "delta_mse": 0.0628389203,
    "delta_mse_std": 0.1631058388,
    "p_wilcoxon": 0.487109375,
    "p_wilcoxon_std": 0.132451159,
    "should_proceed": false
  },
  {
    "dataset": "WineQuality",
    "baseline": "linreg",
    "sample_size": 5315,
    "mse": 0.0148936638,
    "mse_std": 0.0006281038,
    "aug_mse": 0.0148958235,
    "aug_mse_std": 0.0006357674,
    "delta_mse": 0.0122970919,
    "delta_mse_std": 0.1245891719,
    "p_wilcoxon": 0.505078125,
    "p_wilcoxon_std": 0.0913819023,
    "should_proceed": false
  }
]