
# Hydra defaults list: entries are merged in order, so later entries override earlier ones.
defaults:

  # Base config named `critic`, composed first.
  - critic

  # This file's own keys, composed after `critic` so the values below take precedence.
  - _self_


# Dotted path of the config class this node is meant to be instantiated as.
_target_: verl.workers.config.McoreCriticConfig

# Backend strategy selector; this file holds the `megatron` variant.
strategy: megatron

# NCCL timeout; presumably in seconds (600 s = 10 min) — TODO confirm against the consumer.
nccl_timeout: 600


# Optimizer and LR-schedule settings for the critic.
# Only the keys listed here are set by this file; anything else (e.g. the base learning
# rate) is presumably supplied by the `critic` base config — verify there.
optim:

  # Dotted path of the config class this node is meant to be instantiated as.
  _target_: verl.workers.config.McoreOptimizerConfig

  # Name of the optimizer to use.
  optimizer: adam

  # Gradient clipping threshold (presumably a max gradient norm — confirm).
  clip_grad: 1.0

  # Learning rate at the start of warmup.
  lr_warmup_init: 0.0

  # Number of LR decay steps; null leaves it unset in this file.
  lr_decay_steps: null

  # Shape of the LR decay schedule.
  lr_decay_style: linear

  # Minimum learning rate (presumably the floor the schedule decays to — confirm).
  min_lr: 0.0

  # How weight decay changes over training; `constant` presumably keeps it fixed — confirm.
  weight_decay_incr_style: constant

  # Decay shape for the "wsd" LR schedule (presumably warmup-stable-decay — confirm).
  lr_wsd_decay_style: exponential

  # Number of steps for the "wsd" decay phase; null leaves it unset in this file.
  lr_wsd_decay_steps: null

  # NOTE(review): presumably restores scheduler values from a checkpoint instead of
  # using the values above when enabled — confirm against the optimizer config class.
  use_checkpoint_opt_param_scheduler: False


# Model settings for the critic.
model:

  # Dotted path of the config class this node is meant to be instantiated as.
  _target_: verl.trainer.config.BaseModelConfig

  # Overrides applied on top of the model's own configuration.
  override_config:

    # General model-config overrides; empty mapping means no overrides by default.
    model_config: {}

    # Mixture-of-experts specific overrides.
    moe_config:

      # Router freezing is off by default (presumably True stops router weight updates — confirm).
      freeze_moe_router: False


# Megatron engine settings: offloading, parallelism layout, checkpointing and overrides.
# The last four keys use OmegaConf's `oc.select` resolver to reuse the actor's value when
# that key is present in the composed config, falling back to the given default otherwise.
megatron:

  # Dotted path of the config class this node is meant to be instantiated as.
  _target_: verl.workers.config.McoreEngineConfig

  # Offload model parameters (presumably to CPU — confirm); disabled by default.
  param_offload: False

  # Offload gradients (presumably to CPU — confirm); disabled by default.
  grad_offload: False

  # Offload optimizer state (presumably to CPU — confirm); disabled by default.
  optimizer_offload: False

  # Tensor model parallel size.
  tensor_model_parallel_size: 1

  # Expert model parallel size.
  expert_model_parallel_size: 1

  # Expert tensor parallel size; null leaves it unset in this file.
  expert_tensor_parallel_size: null

  # Pipeline model parallel size.
  pipeline_model_parallel_size: 1

  # Virtual pipeline model parallel size; null leaves it unset in this file.
  virtual_pipeline_model_parallel_size: null

  # Context parallel size.
  context_parallel_size: 1

  # Sequence parallelism is enabled by default.
  sequence_parallel: True

  # The distributed optimizer is enabled by default.
  use_distributed_optimizer: True

  # Distributed checkpointing is disabled by default.
  use_dist_checkpointing: False

  # Path for distributed checkpointing; null while the feature above is disabled.
  dist_checkpointing_path: null

  # Reuse the actor's Megatron seed if defined; otherwise fall back to 42.
  seed: ${oc.select:actor_rollout_ref.actor.megatron.seed,42}

  # Reuse the actor's DDP config overrides if defined; otherwise an empty mapping.
  override_ddp_config: ${oc.select:actor_rollout_ref.actor.megatron.override_ddp_config,{}}

  # Reuse the actor's transformer config overrides if defined; otherwise an empty mapping.
  override_transformer_config: ${oc.select:actor_rollout_ref.actor.megatron.override_transformer_config,{}}

  # Reuse the actor's `use_mbridge` setting if defined; otherwise False.
  use_mbridge: ${oc.select:actor_rollout_ref.actor.megatron.use_mbridge,False}


# Weight loading is enabled by default (presumably loads initial model weights — confirm).
load_weight: True

# Reuse the actor's data loader seed if defined; otherwise null (no explicit seed set here).
data_loader_seed: ${oc.select:actor_rollout_ref.actor.data_loader_seed,null}
