
# Tokenizer setting; left unset (null) in this file.
# NOTE(review): presumably the consumer falls back to a default tokenizer
# when this is null — confirm against the loader.
tokenizer: null

# Disabled here.
# NOTE(review): presumably toggles shared-memory use when loading data —
# confirm against the consumer.
use_shm: false





# Training data file (a parquet path in this config).
# The value is quoted so the leading `~` can never be mistaken for the YAML
# null indicator; the parsed string is unchanged.
# NOTE(review): YAML does not expand `~`; home-directory expansion is
# presumably done by the consumer — confirm.
train_files: '~/data/rlhf/gsm8k/train.parquet'

# Validation data file (a parquet path in this config); quoted for the same
# reason as the training path.
val_files: '~/data/rlhf/gsm8k/test.parquet'

# NOTE(review): presumably the dataset field that holds the prompt — confirm.
prompt_key: prompt

# NOTE(review): presumably the dataset field used to choose a reward function
# per example — confirm.
reward_fn_key: data_source




# Prompt length limit.
# NOTE(review): units are presumably tokens — confirm.
max_prompt_length: 512

# Response length limit.
# NOTE(review): units are presumably tokens — confirm.
max_response_length: 512

# Batch size used for training.
train_batch_size: 1024

# Batch size used for validation; unset (null) here.
# NOTE(review): the fallback applied when this is null is not visible in this
# file — confirm against the consumer.
val_batch_size: null




# The three flags below are all disabled in this config.
# NOTE(review): presumably each one asks the dataset to return an additional
# representation of the prompt — confirm the exact semantics with the
# dataset implementation.

# Return the raw input ids.
return_raw_input_ids: false

# Return the raw chat.
return_raw_chat: false

# Return the full prompt.
return_full_prompt: false


# Shuffling enabled.
# NOTE(review): presumably applies to the training data, since validation has
# its own `validation_shuffle` flag — confirm.
shuffle: true

# Number of dataloader workers.
dataloader_num_workers: 8

# Shuffling of the validation data; disabled.
validation_shuffle: false

# Filtering of over-long prompts; disabled.
# NOTE(review): "over-long" presumably means longer than max_prompt_length —
# confirm.
filter_overlong_prompts: false

# Number of workers used when filtering over-long prompts.
filter_overlong_prompts_workers: 1



# Truncation policy.
# NOTE(review): `error` presumably makes over-long input fail rather than be
# cut; the other accepted values are not visible in this file — confirm.
truncation: error

# NOTE(review): presumably the dataset field holding images — confirm.
image_key: images

# NOTE(review): presumably the dataset field holding videos — confirm.
video_key: videos

# Disabled.
# NOTE(review): presumably gates execution of custom code shipped with a
# remotely fetched tokenizer/model — confirm before enabling.
trust_remote_code: false


# Reference to a custom class; both fields are unset (null) here.
# NOTE(review): presumably selects a user-supplied dataset class in place of
# the built-in one — confirm.
custom_cls:
  # Where the class is defined.
  # NOTE(review): presumably a file or module path — confirm.
  path: null
  # Name of the class to load from `path`.
  name: null


# Enabled.
# NOTE(review): presumably makes the dataset return multi-modal inputs
# alongside the text — confirm.
return_multi_modal_inputs: true


# Data sampler settings; both fields are unset (null) here.
# NOTE(review): presumably a default sampler is used when these are null —
# confirm.
sampler:
  # Where the sampler class is defined.
  # NOTE(review): presumably a module or file path — confirm.
  class_path: null
  # Name of the sampler class to load from `class_path`.
  class_name: null


# Data generation settings; both fields are unset (null) here.
# NOTE(review): presumably data generation is skipped when these are null —
# confirm.
datagen:
  # Where the data generation class is defined.
  # NOTE(review): presumably a file or package path — confirm.
  path: null
  # Name of the data generation class to load from `path`.
  name: null