LICENSE
README.md
pyproject.toml
setup.py
./verl/__init__.py
./verl/protocol.py
./verl/models/__init__.py
./verl/models/monkey_patch.py
./verl/models/transformers/__init__.py
./verl/models/transformers/flash_attention_utils.py
./verl/models/transformers/qwen2_vl.py
./verl/single_controller/__init__.py
./verl/single_controller/base/__init__.py
./verl/single_controller/base/decorator.py
./verl/single_controller/base/worker.py
./verl/single_controller/base/worker_group.py
./verl/single_controller/base/register_center/__init__.py
./verl/single_controller/base/register_center/ray.py
./verl/single_controller/ray/__init__.py
./verl/single_controller/ray/base.py
./verl/trainer/__init__.py
./verl/trainer/config.py
./verl/trainer/core_algos.py
./verl/trainer/main.py
./verl/trainer/metrics.py
./verl/trainer/ray_trainer.py
./verl/utils/__init__.py
./verl/utils/dataset.py
./verl/utils/flops_counter.py
./verl/utils/fsdp_utils.py
./verl/utils/model_utils.py
./verl/utils/py_functional.py
./verl/utils/rl_dataset_bak.py
./verl/utils/seqlen_balancing.py
./verl/utils/tokenizer.py
./verl/utils/torch_dtypes.py
./verl/utils/torch_functional.py
./verl/utils/tracking.py
./verl/utils/ulysses.py
./verl/utils/checkpoint/__init__.py
./verl/utils/checkpoint/checkpoint_manager.py
./verl/utils/checkpoint/fsdp_checkpoint_manager.py
./verl/utils/logger/__init__.py
./verl/utils/logger/aggregate_logger.py
./verl/utils/reward_score/__init__.py
./verl/utils/reward_score/math.py
./verl/utils/reward_score/multitask.py
./verl/utils/reward_score/r1v.py
./verl/workers/__init__.py
./verl/workers/config.py
./verl/workers/fsdp_workers.py
./verl/workers/actor/__init__.py
./verl/workers/actor/base.py
./verl/workers/actor/config.py
./verl/workers/actor/dp_actor.py
./verl/workers/critic/__init__.py
./verl/workers/critic/base.py
./verl/workers/critic/config.py
./verl/workers/critic/dp_critic.py
./verl/workers/reward/__init__.py
./verl/workers/reward/config.py
./verl/workers/reward/custom.py
./verl/workers/rollout/__init__.py
./verl/workers/rollout/base.py
./verl/workers/rollout/config.py
./verl/workers/rollout/vllm_rollout/__init__.py
./verl/workers/rollout/vllm_rollout/vllm_rollout_spmd.py
./verl/workers/sharding_manager/__init__.py
./verl/workers/sharding_manager/base.py
./verl/workers/sharding_manager/fsdp_ulysses.py
./verl/workers/sharding_manager/fsdp_vllm.py
verl/__init__.py
verl/protocol.py
verl.egg-info/PKG-INFO
verl.egg-info/SOURCES.txt
verl.egg-info/dependency_links.txt
verl.egg-info/requires.txt
verl.egg-info/top_level.txt
verl/models/__init__.py
verl/models/monkey_patch.py
verl/models/transformers/__init__.py
verl/models/transformers/flash_attention_utils.py
verl/models/transformers/qwen2_vl.py
verl/single_controller/__init__.py
verl/single_controller/base/__init__.py
verl/single_controller/base/decorator.py
verl/single_controller/base/worker.py
verl/single_controller/base/worker_group.py
verl/single_controller/base/register_center/__init__.py
verl/single_controller/base/register_center/ray.py
verl/single_controller/ray/__init__.py
verl/single_controller/ray/base.py
verl/trainer/__init__.py
verl/trainer/config.py
verl/trainer/core_algos.py
verl/trainer/main.py
verl/trainer/metrics.py
verl/trainer/ray_trainer.py
verl/utils/__init__.py
verl/utils/dataset.py
verl/utils/flops_counter.py
verl/utils/fsdp_utils.py
verl/utils/model_utils.py
verl/utils/py_functional.py
verl/utils/rl_dataset_bak.py
verl/utils/seqlen_balancing.py
verl/utils/tokenizer.py
verl/utils/torch_dtypes.py
verl/utils/torch_functional.py
verl/utils/tracking.py
verl/utils/ulysses.py
verl/utils/checkpoint/__init__.py
verl/utils/checkpoint/checkpoint_manager.py
verl/utils/checkpoint/fsdp_checkpoint_manager.py
verl/utils/logger/__init__.py
verl/utils/logger/aggregate_logger.py
verl/utils/reward_score/__init__.py
verl/utils/reward_score/math.py
verl/utils/reward_score/multitask.py
verl/utils/reward_score/r1v.py
verl/workers/__init__.py
verl/workers/config.py
verl/workers/fsdp_workers.py
verl/workers/actor/__init__.py
verl/workers/actor/base.py
verl/workers/actor/config.py
verl/workers/actor/dp_actor.py
verl/workers/critic/__init__.py
verl/workers/critic/base.py
verl/workers/critic/config.py
verl/workers/critic/dp_critic.py
verl/workers/reward/__init__.py
verl/workers/reward/config.py
verl/workers/reward/custom.py
verl/workers/rollout/__init__.py
verl/workers/rollout/base.py
verl/workers/rollout/config.py
verl/workers/rollout/vllm_rollout/__init__.py
verl/workers/rollout/vllm_rollout/vllm_rollout_spmd.py
verl/workers/sharding_manager/__init__.py
verl/workers/sharding_manager/base.py
verl/workers/sharding_manager/fsdp_ulysses.py
verl/workers/sharding_manager/fsdp_vllm.py