[project]
name = "puzzle-rl-verl"
version = "0.1.0"
description = "VERL training environment for puzzle-to-math RL transfer experiments"
requires-python = ">=3.12,<3.13"
dependencies = [
    # PyTorch with CUDA 12.8 (from working verl-latest venv)
    "torch==2.7.1",
    "torchvision==0.22.1",
    "torchaudio==2.7.1",
    
    # Core ML libraries
    "transformers==4.56.1",
    "accelerate==1.10.1",
    "peft==0.17.1",
    "safetensors==0.6.2",
    "huggingface-hub==0.34.4",
    "hf-transfer>=0.1.8",  # Fast parallel downloads (required when HF_HUB_ENABLE_HF_TRANSFER=1)
    "qwen-vl-utils>=0.0.10",  # Required by transformers for Qwen models
    
    # vLLM for fast inference
    "vllm==0.10.1",
    
    # Flash Attention (use >= to allow pre-built wheels with build metadata like +cu.12.8.torch.2.7)
    "flash-attn>=2.8.3",
    
    # Ray for distributed training
    "ray==2.49.1",
    
    # Data processing
    "numpy==1.26.4",
    "pandas==2.3.2",
    "pyarrow==21.0.0",
    "datasets==3.6.0",
    
    # Logging
    "tensorboard==2.20.0",
    "wandb==0.24.0",
    
    # Hydra config
    "hydra-core==1.3.2",
    "omegaconf==2.3.0",
    
    # VERL-specific
    "codetiming==1.4.0",
    "dill==0.3.8",
    
    # VERL - installed from PyPI
    "verl==0.7.0",
    
    # FlashInfer for attention kernels
    "flashinfer-python>=0.6.2",
]

[tool.uv]
dev-dependencies = []
package = false

# PyTorch index for CUDA 12.8 wheels
[[tool.uv.index]]
name = "pytorch-cu128"
url = "https://download.pytorch.org/whl/cu128"
explicit = true

# Astral CUDA 12.8 index (pre-built wheels for flash-attn, vllm, flashinfer, etc.)
# Mark as explicit so it's only used for packages we specify
[[tool.uv.index]]
name = "astral-cu128"
url = "https://api.pyx.dev/simple/astral-sh/cu128"
explicit = true

# Pin packages to specific indexes
[tool.uv.sources]
torch = { index = "pytorch-cu128" }
torchvision = { index = "pytorch-cu128" }
torchaudio = { index = "pytorch-cu128" }
# Use astral index for CUDA packages that need pre-built wheels
flash-attn = { index = "astral-cu128" }
vllm = { index = "astral-cu128" }
flashinfer-python = { index = "astral-cu128" }
xformers = { index = "astral-cu128" }

# Note: verl==0.7.0 is available from PyPI, so no local path dependency needed.
# This pyproject.toml mirrors the legacy `verl-latest` venv. For B200/SM100a
# devpods, prefer the `verl-vllm012` venv built by scripts/setup_vllm012_venv.sh
# (vLLM 0.12.0, PyTorch 2.9.0+cu129, FA2 2.8.3, with the PDL patch applied).
