[build-system]
requires = [
    "setuptools>=49.4.0",
    "setuptools-scm",

    # Build dependencies. (Especially for flash-attn)
    "cmake>=3.21",
    "ninja",
    "packaging",
    "torch==2.5.1",
    "wheel",
]
build-backend = "setuptools.build_meta"

[project]
name = "hip-attn"  # Name of package when installed using pip
version = "1.2.4"
description = "HiP Attention"
authors = [
    { name="Authors", email="authors@authors.com" },
]
license = "LicenseRef-FSL-1.1-MIT"
license-files = ["LICENSE.md"]
readme = "README.md"
requires-python = ">=3.9, <3.13"
classifiers = [
    "Topic :: Scientific/Engineering :: Artificial Intelligence",
    "Environment :: GPU",
    "Environment :: GPU :: NVIDIA CUDA :: 12",
]
dependencies = [
    # Required
    "torch",
    "triton",
    "setuptools",  # Required by triton amd backend
    "numba",
    "performer_pytorch",
    "peft",
    "seaborn",
    "sympy",
    "bitsandbytes",
    # CUDA 12
    "cupy-cuda12x",
    "nvtx",
]

[project.optional-dependencies]
sglang = [
    "sgl-kernel",
    # Needs adding `--find-links https://flashinfer.ai/whl/cu124/torch2.5/flashinfer-python`
    # For uv, see tool.uv.sources and tool.uv.index sections
    "flashinfer-python",
    # See tool.uv.sources section
    "flash-attn",
    # See tool.uv.sources section
    "sglang[all]",
]

[tool.uv.sources]
hip-attn = { workspace = true }
flashinfer-python = [
  { index = "flashinfer_cu124_torch25" },
]
flash-attn = [
    # pip format: "flash-attn @ https://github.com/Dao-AILab/flash-attention/releases/download/v2.7.4.post1/flash_attn-2.7.4.post1+cu12torch2.5cxx11abiFALSE-cp311-cp311-linux_x86_64.whl"
    { url = "https://github.com/Dao-AILab/flash-attention/releases/download/v2.7.4.post1/flash_attn-2.7.4.post1+cu12torch2.5cxx11abiFALSE-cp39-cp39-linux_x86_64.whl", marker = "sys_platform == 'linux' and python_version == '3.9'" },
    { url = "https://github.com/Dao-AILab/flash-attention/releases/download/v2.7.4.post1/flash_attn-2.7.4.post1+cu12torch2.5cxx11abiFALSE-cp310-cp310-linux_x86_64.whl", marker = "sys_platform == 'linux' and python_version == '3.10'" },
    { url = "https://github.com/Dao-AILab/flash-attention/releases/download/v2.7.4.post1/flash_attn-2.7.4.post1+cu12torch2.5cxx11abiFALSE-cp311-cp311-linux_x86_64.whl", marker = "sys_platform == 'linux' and python_version == '3.11'" },
    { url = "https://github.com/Dao-AILab/flash-attention/releases/download/v2.7.4.post1/flash_attn-2.7.4.post1+cu12torch2.5cxx11abiFALSE-cp312-cp312-linux_x86_64.whl", marker = "sys_platform == 'linux' and python_version == '3.12'" },
    { url = "https://github.com/Dao-AILab/flash-attention/releases/download/v2.7.4.post1/flash_attn-2.7.4.post1+cu12torch2.5cxx11abiFALSE-cp313-cp313-linux_x86_64.whl", marker = "sys_platform == 'linux' and python_version == '3.13'" },
]
sglang = [
    { git = "https://github.com/DeepAuto-AI/sglang.git", subdirectory = "python", rev = "deepauto/release" },
    # For local devs, you can use this instead:
    # { path = "../sglang/python", editable = true },
]
hip-research = { workspace = true }

[tool.uv]
no-build-isolation-package = ["flash-attn"]

[[tool.uv.index]]
name = "flashinfer_cu124_torch25"
url = "https://flashinfer.ai/whl/cu124/torch2.5/"
explicit = true

[tool.uv.workspace]
members = ["hip-research"]

[dependency-groups]
dev = [
    "hip-attn[sglang]",
    "hip-research",
    "pre-commit>=4.2.0",
]
