






# Hydra defaults list: the configs composed to build this one, applied in order.
defaults:

  # Base config named `critic` (defined outside this file).
  - critic

  # This file's own keys. Listed last, so they override values from `critic`.
  - _self_


# Dotted class path for the object this config describes (Hydra-style `_target_`).
_target_: verl.workers.config.FSDPCriticConfig

# Training strategy name.
# NOTE(review): other accepted values are not visible here - confirm with the consumer.
strategy: fsdp


# Optimizer settings.
optim:

  # Dotted class path for the optimizer config object (Hydra-style `_target_`).
  _target_: verl.workers.config.FSDPOptimizerConfig

  # Left unset (null) here.
  # NOTE(review): presumably the LR floor as a fraction of the peak LR - confirm.
  min_lr_ratio: null

  # Warmup style name.
  # NOTE(review): accepted values are defined by the consumer - confirm.
  warmup_style: constant


# Critic model settings.
model:

  # Dotted class path for the model config object (Hydra-style `_target_`).
  _target_: verl.workers.config.FSDPCriticModelCfg

  # Shared-memory option, disabled here.
  # NOTE(review): presumably stages model files in shared memory - confirm.
  use_shm: false

  # Gradient checkpointing is enabled.
  enable_gradient_checkpointing: true

  # Activation offload is disabled.
  enable_activation_offload: false

  # Padding removal is disabled.
  # NOTE(review): presumably strips pad tokens before the forward pass - confirm.
  use_remove_padding: false

  # FSDP engine settings.
  fsdp_config:

    # Dotted class path for the engine config object (Hydra-style `_target_`).
    _target_: verl.workers.config.FSDPEngineConfig

    # Parameter offload is disabled.
    param_offload: false

    # Optimizer offload is disabled.
    optimizer_offload: false

    # Offload policy is disabled.
    # NOTE(review): relation to the two offload flags above is not visible here - confirm.
    offload_policy: false

    # Reshard-after-forward is enabled.
    reshard_after_forward: true

    # Module wrapping policy.
    wrap_policy:

      # Parameter-count threshold for wrapping, 0 here.
      # NOTE(review): presumably 0 means "no size-based threshold" - confirm.
      min_num_params: 0

    # FSDP group size, -1 here.
    # NOTE(review): presumably -1 means "auto / use all ranks" - confirm.
    fsdp_size: -1

    # Forward prefetch is disabled.
    forward_prefetch: false

  # LoRA rank, 0 here.
  # NOTE(review): presumably 0 turns LoRA off - confirm.
  lora_rank: 0

  # LoRA alpha value.
  lora_alpha: 16

  # Modules targeted, presumably by LoRA - confirm. `all-linear` here.
  target_modules: all-linear


# Takes the value of the sibling key `ppo_micro_batch_size` when that key
# exists, and falls back to null otherwise (OmegaConf `oc.select` resolver).
forward_micro_batch_size: ${oc.select:.ppo_micro_batch_size,null}

# Same pattern: mirrors the sibling key `ppo_micro_batch_size_per_gpu`,
# or null when that key is absent.
forward_micro_batch_size_per_gpu: ${oc.select:.ppo_micro_batch_size_per_gpu,null}

# Ulysses sequence-parallel size, 1 here.
# NOTE(review): presumably 1 means no sequence parallelism - confirm.
ulysses_sequence_parallel_size: 1

# Gradient clipping value.
# NOTE(review): presumably the max gradient norm - confirm.
grad_clip: 1.0
