task/2.2: Consolidate dependency metadata to pyproject.toml

LessUp · Copilot · LessUp · commit 43299942d838 · 2026-04-29T15:35:17.000+08:00
CHANGES:
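- setup.py: Removed duplicate package metadata (name, version, description,
  author, packages, package_dir, install_requires, extras_require,
  python_requires). Now delegates all metadata to pyproject.toml while keeping
  the CUDA extension compilation logic. CUDA extensions are skipped when
  CUDA_HOME is not set, so the package can be installed without CUDA.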

- requirements.txt: No longer lists core dependencies; it is now a guide file
  that points users to the `pip install -e ".[extra]"` installation pattern.

- pyproject.toml: Remains single source of truth for:
  * Package metadata (name, version, description, classifiers, etc.)
  * Core dependencies (torch, numpy)
  * Optional dependencies (test, benchmark, dev)

VERIFICATION:
- All metadata correctly read from pyproject.toml
- pip install -e . succeeds without CUDA_HOME
- pip install -e ".[test]" correctly installs test dependencies
- python -m compileall cuda_llm_ops tests benchmarks succeeds
- ruff check passes on all modified files

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
diff --git a/requirements.txt b/requirements.txt
@@ -1,8 +1,9 @@
-# Core dependencies
-# For full installation with all optional dependencies, use:
-#   pip install -e ".[dev]"
-#   or
-#   pip install -e ".[test,benchmark,dev]"
+# Development and testing dependencies
+# All project metadata and dependencies are defined in pyproject.toml
+# Use one of the following to install:
+#   pip install -e .              # Install base package only
+#   pip install -e ".[test]"      # Install with test dependencies
+#   pip install -e ".[dev]"       # Install with dev tools (recommended for contributors)
+#   pip install -e ".[benchmark]" # Install with benchmark tools
+#   pip install -e ".[test,dev]"  # Install with multiple extras
 
-torch>=2.0.0
-numpy>=1.20.0
diff --git a/setup.py b/setup.py
@@ -1,101 +1,69 @@
 """
-Setup script for CUDA LLM Kernel Optimization package.
-Version is read from pyproject.toml (single source of truth).
+Setup script for CUDA extension compilation only.
+
+Package metadata, dependencies, and optional-dependencies are defined exclusively
+in pyproject.toml. Setuptools will automatically read them from there.
+This script handles only CUDA extension compilation configuration.
 """
 
 import os
 import platform
-import re
-from pathlib import Path
-from setuptools import setup, find_packages
+
+from setuptools import setup
 from torch.utils.cpp_extension import BuildExtension, CUDAExtension
 
 
-def _read_version() -> str:
-    """Read version from pyproject.toml."""
-    text = Path(__file__).with_name("pyproject.toml").read_text()
-    # Match version = "X.Y.Z" in [project] section
-    match = re.search(r'^version\s*=\s*"([^"]+)"', text, re.MULTILINE)
-    if not match:
-        raise RuntimeError("Cannot find version in pyproject.toml")
-    return match.group(1)
+def _build_cuda_extensions():
+    """Build CUDA extensions with configurable architecture support.
 
-# CUDA architectures to compile for
-CUDA_ARCHS = os.environ.get('CUDA_ARCHS', '70;75;80;86;89;90')
+    Returns empty list if CUDA_HOME is not set (for pip install without CUDA).
+    Set CUDA_HOME to enable CUDA extension compilation.
+    """
+    if not os.environ.get('CUDA_HOME'):
+        return []
 
-# Source files
-cuda_sources = [
-    'src/naive_attention.cu',
-    'src/tiled_attention.cu',
-    'src/flash_attention.cu',
-    'src/tensor_core_gemm.cu',
-    'src/hgemm_kernel.cu',
-    'cuda_llm_ops/bindings.cpp',
-]
+    cuda_archs = os.environ.get('CUDA_ARCHS', '70;75;80;86;89;90')
 
-# Include directories
-include_dirs = [
-    'include',
-]
+    cuda_sources = [
+        'src/naive_attention.cu',
+        'src/tiled_attention.cu',
+        'src/flash_attention.cu',
+        'src/tensor_core_gemm.cu',
+        'src/hgemm_kernel.cu',
+        'cuda_llm_ops/bindings.cpp',
+    ]
 
-# Compiler flags (platform-aware)
-if platform.system() == 'Windows':
-    extra_compile_args = {
-        'cxx': ['/O2', '/std:c++17'],
-        'nvcc': [
-            '-O3',
-            '--use_fast_math',
-            '-std=c++17',
-        ]
-    }
-else:
-    extra_compile_args = {
-        'cxx': ['-O3', '-std=c++17'],
-        'nvcc': [
-            '-O3',
-            '--use_fast_math',
-            '-std=c++17',
-            '-Xcompiler', '-fPIC',
-        ]
-    }
+    include_dirs = ['include']
 
-# Add architecture flags
-for arch in CUDA_ARCHS.split(';'):
-    extra_compile_args['nvcc'].extend([
-        f'-gencode=arch=compute_{arch},code=sm_{arch}',
-    ])
+    # Platform-aware compiler flags
+    if platform.system() == 'Windows':
+        extra_compile_args = {
+            'cxx': ['/O2', '/std:c++17'],
+            'nvcc': ['-O3', '--use_fast_math', '-std=c++17']
+        }
+    else:
+        extra_compile_args = {
+            'cxx': ['-O3', '-std=c++17'],
+            'nvcc': ['-O3', '--use_fast_math', '-std=c++17', '-Xcompiler', '-fPIC']
+        }
 
-setup(
-    name='cuda_llm_ops',
-    version=_read_version(),
-    description='High-performance CUDA kernels for LLM inference',
-    author='CUDA LLM Kernel Optimization',
-    packages=['cuda_llm_ops'],
-    package_dir={'cuda_llm_ops': 'cuda_llm_ops'},
-    ext_modules=[
+    # Add compute capability flags
+    for arch in cuda_archs.split(';'):
+        extra_compile_args['nvcc'].extend([
+            f'-gencode=arch=compute_{arch},code=sm_{arch}',
+        ])
+
+    return [
         CUDAExtension(
             name='cuda_llm_ops._cuda_llm_ops',
             sources=cuda_sources,
             include_dirs=include_dirs,
             extra_compile_args=extra_compile_args,
         )
-    ],
-    cmdclass={
-        'build_ext': BuildExtension
-    },
-    install_requires=[
-        'torch>=2.0.0',
-        'numpy>=1.20.0',
-    ],
-    extras_require={
-        'test': [
-            'pytest',
-            'hypothesis',
-        ],
-        'benchmark': [
-            'matplotlib',
-            'pandas',
-        ],
-    },
-    python_requires='>=3.8',
+    ]
+
+
+setup(
+    ext_modules=_build_cuda_extensions(),
+    cmdclass={'build_ext': BuildExtension},
 )