
# `name` has no default: `???` is OmegaConf's marker for a mandatory value, so
# reading it fails until an override or a composed config supplies one.
name: ???
# NOTE(review): the set of accepted values is defined by the consumer, not
# visible in this file.
mode: sync

# Default sampling parameters.
temperature: 1.0
# NOTE(review): -1 presumably disables top-k filtering (the vLLM convention);
# confirm for every backend that reads this value.
top_k: -1
# NOTE(review): written as an int here while val_kwargs.top_p is written as
# 1.0; numerically equal, so the value is left untouched.
top_p: 1



# Prompt/response length limits.
# Each value resolves the absolute key given to `oc.select` and falls back to
# the value after the comma (512) when that key is not present in the composed
# config. Quoting does not change the parsed string; it only keeps YAML from
# ever interpreting the `${...}` text itself.
prompt_length: '${oc.select:data.max_prompt_length,512}'
response_length: '${oc.select:data.max_response_length,512}'



# Inference-engine settings.
# NOTE(review): several key names mirror vLLM engine arguments (for example
# gpu_memory_utilization and enforce_eager); confirm how other backends
# interpret them.
dtype: bfloat16
gpu_memory_utilization: 0.5
# Booleans are written in canonical lowercase (`true`/`false`), consistent with
# `multi_stage_wake_up: false` in this file; the parsed values are unchanged.
ignore_eos: false
enforce_eager: true
free_cache_engine: true
tensor_model_parallel_size: 2
max_num_batched_tokens: 8192
# null = no value set here.
# NOTE(review): presumably the consumer derives a limit when this is null —
# confirm.
max_model_len: null
max_num_seqs: 512


# Batching settings for log-probability computation.
# Both micro-batch sizes are unset (null) by default.
log_prob_micro_batch_size: null
log_prob_micro_batch_size_per_gpu: null
# The next two values follow the actor section when it defines the referenced
# keys; otherwise `oc.select` yields the value after the comma
# (false and 16384 respectively).
log_prob_use_dynamic_bsz: '${oc.select:actor_rollout_ref.actor.use_dynamic_bsz,false}'
log_prob_max_token_len_per_gpu: '${oc.select:actor_rollout_ref.actor.ppo_max_token_len_per_gpu,16384}'


# Logging and default sampling switches.
# All booleans in this group use canonical lowercase so they read the same way
# as `multi_stage_wake_up`; the parsed values are unchanged.
disable_log_stats: true
do_sample: true
# NOTE(review): presumably the number of responses sampled per prompt —
# confirm.
n: 1
multi_stage_wake_up: false


# Extra keyword arguments, grouped by backend name.
# NOTE(review): presumably forwarded to the respective engine — confirm.
engine_kwargs:
  vllm:
    swap_space: null
    # Canonical lowercase boolean; parses to the same value as `False`.
    disable_mm_preprocessor_cache: false
  sglang:
    attention_backend: null


# Sampling overrides.
# NOTE(review): the `val_` prefix presumably means validation — confirm.
# Compared with the top-level sampling keys in this file, temperature is 0
# (instead of 1.0) and do_sample is disabled (instead of enabled).
val_kwargs:
  top_k: -1
  top_p: 1.0
  temperature: 0
  n: 1
  # Canonical lowercase boolean; parses to the same value as `False`.
  do_sample: false


# Multi-turn settings; `enable` defaults to false.
# Booleans in this mapping are written in canonical lowercase; the parsed
# values are unchanged.
multi_turn:
  enable: false
  # null = no limit configured here.
  # NOTE(review): confirm how the consumer treats null turn limits.
  max_assistant_turns: null
  tool_config_path: null
  max_user_turns: null
  max_parallel_calls: 1
  # NOTE(review): the unit (characters vs tokens) is not visible here —
  # confirm.
  max_tool_response_length: 256
  tool_response_truncate_side: middle
  interaction_config_path: null
  use_inference_chat_template: false
  tokenization_sanity_check_mode: strict
  format: hermes


# Canonical lowercase boolean; parses to the same value as `False`.
calculate_log_probs: false


# Agent settings.
agent:
  num_workers: 8
  # No config path is set by default.
  agent_loop_config_path: null
  # Both fields are unset by default.
  # NOTE(review): presumably a module path and a class name for a
  # user-supplied server implementation — confirm.
  custom_async_server:
    path: null
    name: null


# NOTE(review): per the key name, a bucket size in megabytes used when
# updating weights — confirm against the consumer.
update_weights_bucket_megabytes: 512

# Trace settings; no backend is selected by default.
trace:
  backend: null
  # Canonical lowercase boolean; parses to the same value as `False`.
  token2text: false




# Canonical lowercase boolean; parses to the same value as `False`.
skip_rollout: false
# NOTE(review): presumably only consulted when skip_rollout is true — confirm.
# The default lives under /tmp, which is commonly shared between users and
# cleared on reboot; override it for shared or long-running setups.
skip_dump_dir: /tmp/rollout_dump
