#!/usr/bin/env bash
#
# Launch rlhf_model_pipeline.py with a fixed model name and reward function.
#
# Usage: run from the directory that contains src/ -- the script path below is
# relative to the current working directory, not to this file's location.
#
# Arguments forwarded to the Python script:
#   --model_name       'EleutherAI/pythia-70m'
#   --reward_function  'utility_reward'
# NOTE(review): the meaning of each flag is defined by the Python script, which
# is not visible from here -- confirm there before changing values.
#
# The exit status of this script is the exit status of the python3 command.
python3 src/rlhf_model_training/rlhf_model_pipeline.py \
  --model_name 'EleutherAI/pythia-70m' \
  --reward_function 'utility_reward'
