import json

# Reward table keyed by a pair of booleans.
# NOTE(review): judging by the per-entry comments, the key looks like
# (answer_is_correct, answer_was_accepted) -- confirm against the consumer.
mapping_fxn = {
    (True, True): 1.0,    # correctly accepting is worth full reward
    (False, False): 1.0,  # correct rejection is also worth full reward
    (True, False): -1.0,  # false rejection is WORSE than false acceptance
    (False, True): -0.5,  # false acceptance is penalized less than false rejection
}

# Destination of the generated config, relative to the current working directory.
OUTPUT_PATH = "trained_calibration/configs/dpo/mapping_fxn_false_accept_over_false_reject.json"


def render_mapping_json(mapping):
    """Return *mapping* serialized as an indented JSON object string.

    JSON object keys must be strings, and ``json`` raises ``TypeError`` when
    handed tuple keys, so every key is converted with ``str()`` first; the
    tuple ``(True, False)`` becomes the key ``"(True, False)"``. Values are
    passed through unchanged.

    NOTE(review): whatever reads this file has to turn the keys back into
    tuples (``ast.literal_eval`` would do it) -- confirm the key format
    against the loader.
    """
    string_keyed = {str(outcome): reward for outcome, reward in mapping.items()}
    return json.dumps(string_keyed, indent=4)


def main():
    """Write the reward table in ``mapping_fxn`` to ``OUTPUT_PATH`` as JSON."""
    # Serialize before opening the file so that a serialization error cannot
    # leave an empty or truncated config behind.
    payload = render_mapping_json(mapping_fxn)
    with open(OUTPUT_PATH, "w", encoding="utf-8") as f:
        f.write(payload)


if __name__ == "__main__":
    main()