# Settings that appear to drive a reward-model scoring run over generated
# responses. NOTE(review): the exact meaning of each key is defined by the
# consuming code, which is not visible from this file -- confirm there.

# Debug switch. Written as a canonical lowercase YAML boolean.
debug: true

# Reward model alias; refer to constants.py for the available aliases.
reward_model: "mistral_weqweasdas"

# Presumably Hugging Face Hub dataset names: the dataset read before reward
# scoring and the dataset written after it -- TODO confirm against the
# consumer. `null` leaves the post-reward name unset.
prereward_dataset_hfhub_name: "{author}/personalization_prompt_response"
postreward_dataset_hfhub_name: null

# Presumably the GPU device indices to use -- TODO confirm.
gpus: [0, 1, 2, 3, 4, 5, 6, 7]

# Hugging Face local cache directory.
cache_dir: "/shared/share_mala/{author}/huggingface/cache"

# Number of columns of responses to score rewards with,
# i.e. 8 responses = 8 columns.
columns: 8

# NOTE(review): unit of the batch (rows vs. responses) is not shown here.
batch_size: 1
