import pandas as pd

# Integer task ids for the group reported as "A & B" further down in this script.
# NOTE(review): what A and B denote is not stated in this file — presumably two
# methods/runs being compared, with this set holding tasks in both; confirm.
a_and_b = {0, 2, 3, 5, 6, 8, 9, 10, 11, 13, 14, 15, 20, 21, 23, 25, 26, 27, 28, 29, 30, 31, 32, 34, 35, 36, 37, 38, 41, 42, 44, 46, 48, 49, 51, 52, 54, 56, 59, 62, 64, 66, 67, 69, 72, 74, 77, 80, 81, 82, 83, 86, 87, 89, 90, 93, 96, 97, 99, 101, 102, 104, 105, 107, 108, 110, 111, 112, 113, 115, 117, 119, 120, 124, 125, 128, 129, 134, 135, 138, 139, 140, 141, 143, 144, 146, 148, 149, 150, 151, 152, 154, 161, 163, 165, 166, 170, 171, 174, 175, 177, 178, 179, 180, 183, 184, 185, 187, 188, 192, 193, 198, 201, 202, 205, 206, 209, 210, 211, 213, 214, 215, 216, 219, 221, 222, 226, 228, 229, 230, 235, 238, 239, 240, 241, 245, 246, 247, 248, 249, 250, 251, 252, 253, 255, 256, 257, 258, 260, 261, 262, 265, 266, 268, 270, 271, 273, 275, 276, 279, 281, 286, 288, 289, 290, 291, 293, 295, 296, 299, 300, 302, 304, 306, 308, 309, 310, 311, 313, 314, 315, 316, 319, 321, 322, 325, 326, 328, 329, 330, 331, 332, 333, 336, 338, 342, 343, 345, 346, 349, 350, 352, 353, 354, 356, 358, 359, 362, 368, 370, 371, 372, 374, 379, 380, 383, 384, 385, 388, 390, 392, 394, 396, 398}
# Print how many task ids are in the "A & B" group.
print(len(a_and_b))
# Integer task ids for the group reported as "A - B" further down in this script.
# NOTE(review): presumably tasks in A but not in B; confirm against how the sets
# were produced.
a_not_b = {386, 131, 387, 389, 395, 12, 269, 142, 399, 272, 274, 19, 282, 155, 287, 160, 33, 294, 39, 169, 297, 298, 172, 301, 303, 305, 182, 312, 57, 58, 60, 61, 189, 317, 320, 65, 194, 68, 196, 324, 71, 199, 78, 334, 208, 335, 337, 84, 212, 341, 91, 92, 347, 94, 223, 348, 351, 232, 233, 377, 363, 236, 237, 364, 367, 114, 242, 116, 243, 373, 375, 376, 121, 122, 382, 127}
# Print how many task ids are in the "A - B" group.
print(len(a_not_b))

def count_c(s, d):
    """Print and return the mean of ``d``'s values over the task ids in ``s``.

    Args:
        s: Iterable of task ids.
        d: Mapping from task id to a value accepted by ``int()``. Each id is
            looked up by its string form first; if that key is absent the raw
            id is tried, so the mapping may be keyed by ``"12"`` or ``12``.

    Returns:
        The arithmetic mean as a float, or ``nan`` when ``s`` is empty.

    Raises:
        KeyError: If a task id is in ``d`` under neither form.
        ValueError: If a looked-up value cannot be converted with ``int()``.
    """
    values = []
    for task_id in s:
        key = str(task_id)
        if key not in d:
            # CSV loaders may infer an integer dtype for the id column, in
            # which case the mapping is keyed by the raw id, not its string.
            key = task_id
        values.append(int(d[key]))

    if not values:
        # An empty group has no meaningful average; report nan instead of
        # dividing by zero.
        avg = float("nan")
    else:
        avg = sum(values) / len(values)

    print(f"avg: {avg}")
    return avg

def _column_by_task(frame, column):
    """Map each row's "task" value to that row's value in ``column``."""
    return {row["task"]: row[column] for row in frame.to_dict("records")}


# Per-task control-flow counts; the column names are supplied here rather than
# taken from the file.
df = pd.read_csv("control_flow.csv", names=["task", "control_flow_num"])
dd_c = _column_by_task(df, "control_flow_num")

# Per-task hole counts; the "fun" column is read but not used below.
df = pd.read_csv("hole_num.csv", names=["task", "hole", "fun"])
dd_h = _column_by_task(df, "hole")

# One (heading, task-id group, per-task lookup) entry per report, in print order.
for _heading, _task_ids, _lookup in (
    ("A & B Control", a_and_b, dd_c),
    ("A - B Control", a_not_b, dd_c),
    ("A & B Hole", a_and_b, dd_h),
    ("A - B Hole", a_not_b, dd_h),
):
    print(_heading)
    count_c(_task_ids, _lookup)
