# Python dependency list in pip requirements-file format: one requirement
# specifier per line. Entries with no version constraint resolve to whatever
# version the installer selects at install time.
accelerate
codetiming
datasets
# Exact pin to the post-release build 2.7.4.post1.
# NOTE(review): presumably needs a compatible torch/CUDA toolchain present at
# install time -- confirm against the project's setup instructions.
flash-attn==2.7.4.post1
# Exact pin; the optional [decord] extra is requested as well.
qwen-vl-utils[decord]==0.0.8
thefuzz
liger-kernel
mathruler
numpy
omegaconf
pandas
peft
pillow
# Lower bound only: any release from 15.0.0 onward is accepted.
pyarrow>=15.0.0
pylatexenc
# The optional [default] extra is requested; no version constraint.
ray[default]
tensordict
tensorboard
torchdata
# Exact pins.
# NOTE(review): torch is not among the entries visible here; presumably it is
# pulled in transitively -- confirm, and re-check these two pins together
# whenever either one is bumped.
transformers==4.51.3
vllm==0.8.3
wandb