
"""
Pre-processes the SWE-V annotations for Experiment 3

The original annotations include a raw dataset with three annotations per instance,
and an ensembled dataset that takes the highest-severity score for each instance.

For Experiment 3, the raw annotations are re-ensembled by selecting instances where
all three annotators agree and all three have high confidence values (4 or 5).
This should make the final ground-truth labels more reliable.

There is no subsample provided for Experiment 3, so the list of sample IDs is
generated by this script alongside the processed annotations.

"""

import pandas as pd

print("\nPreprocessing for Experiment 3\n")

input_annotations = "inputs/swe-bench-annotation-results/samples_with_3_annotations_public.csv"
output_annotations = "inputs/annotations/experiment3_annotations.csv"
output_sample = "inputs/samples/experiment3_sample.txt"

print("Loading raw annotations")
cols = ["instance_id", "false_negative", "annotator_confidence"]  # false_negative = four-point test scores
df_raw = pd.read_csv(input_annotations, usecols=cols)  # start with all swe-v annotations (no subsample)

print("Selecting high-confidence annotations")
df_raw = df_raw[df_raw['annotator_confidence'].isin([4,5])]

print("Selecting instances where all three annotators agree (min == max)")
df_ensembled = df_raw.groupby("instance_id")['false_negative'].agg(min_score='min', max_score='max', count_score='count')
df_ensembled = df_ensembled[(df_ensembled.count_score == 3) & (df_ensembled.min_score == df_ensembled.max_score)]  # three annotators agree
df_ensembled = df_ensembled['min_score'].to_frame().rename(columns={'min_score':'false_negative'})  # rename for consistency

print("Converting ensembled scores to binary labels")
df_ensembled = df_ensembled.map(lambda score: True if score >= 2 else False)

print("Writing ensembled annotations and sample list")
df_ensembled.to_csv(output_annotations)
df_ensembled.reset_index(inplace=True)
df_ensembled['instance_id'].to_csv(output_sample, index=False)
