# Run settings for reward scoring.
# NOTE(review): meanings marked "presumably" are inferred from key names only;
# confirm against the script that consumes this file.

# Debug switch, written as a canonical lowercase YAML boolean.
debug: true
# Reward model alias; refer to constants.py for the alias definitions.
reward_model: "mistral_weqweasdas"
# Presumably the Hub dataset name for the scored (post-reward) output;
# currently unset (null) — TODO confirm how the consumer treats null.
postreward_dataset_hfhub_name: null
# Presumably the GPU device indices to use — verify against the caller.
gpus: [0, 1, 2, 3, 4, 5, 6, 7]
# Presumably the bounds of the range of work to process — TODO confirm what
# is being indexed and whether `end` is inclusive.
start: 2
end: 50


# Presumably the Hub dataset holding prompts/responses before reward scoring
# — confirm against the consuming script.
prereward_dataset_hfhub_name: '{author}/personalization_prompt_response'
# Local Hugging Face cache directory.
cache_dir: '/shared/share_mala/{author}/huggingface/cache'
# Number of response columns to score rewards for,
# i.e. 8 responses = 8 columns.
columns: 8
# NOTE(review): presumably the scoring batch size — confirm.
batch_size: 1
