from setuptools import setup
from torch.utils.cpp_extension import BuildExtension, CUDAExtension
import os




ENABLE_PROFILING = 0


profiling_flag = f'-DENABLE_PERF_PROFILING={ENABLE_PROFILING}'

setup(
    name='sparse_ops',
    ext_modules=[
        CUDAExtension(
            name='sparse_ops',
            sources=['custom_op.cpp', 'hybrid_sp.cu'],
            extra_compile_args={
                'nvcc': [
                    '-DNDEBUG',
                    '-O3',
                    '-Xcompiler=-Wno-psabi',
                    '-Xcompiler=-fno-strict-aliasing',
                    '--resource-usage',
                    '--expt-relaxed-constexpr',
                    '-gencode=arch=compute_80,code=sm_80',     
                    '-gencode=arch=compute_86,code=sm_86',     
                    '-gencode=arch=compute_90a,code=sm_90a',   
                    profiling_flag,
                ],
                'cxx': ['-DPy_LIMITED_API=0x03090000', profiling_flag],
            },
            libraries=['cuda'],
            library_dirs=['/usr/local/cuda/lib64'],
            py_limited_api=True,
        )
    ],
    cmdclass={
        'build_ext': BuildExtension.with_options(no_python_abi_suffix=True)
    },
    options={'bdist_wheel': {'py_limited_api': 'cp39'}}
)
