114 lines
4.1 KiB
Python
114 lines
4.1 KiB
Python
import os
|
|
import subprocess
|
|
import sys
|
|
from pathlib import Path
|
|
|
|
from setuptools import Extension, setup
|
|
from setuptools.command.build_ext import build_ext
|
|
|
|
|
|
# A CMakeExtension needs a sourcedir instead of a file list.
|
|
# The name must be the _single_ output extension from the CMake build.
|
|
# If you need multiple extensions, see scikit-build.
|
|
class CMakeExtension(Extension):
|
|
def __init__(self, name: str, sourcedir: str = "") -> None:
|
|
super().__init__(name, sources=[])
|
|
self.sourcedir = os.fspath(Path(sourcedir).resolve())
|
|
|
|
|
|
class CMakeBuild(build_ext):
|
|
def build_extension(self, ext: CMakeExtension) -> None:
|
|
# Must be in this form due to bug in .resolve() only fixed in Python 3.10+
|
|
ext_fullpath = Path.cwd() / self.get_ext_fullpath(ext.name)
|
|
extdir = ext_fullpath.parent.resolve()
|
|
|
|
# Using this requires trailing slash for auto-detection & inclusion of
|
|
# auxiliary "native" libs
|
|
|
|
debug = int(os.environ.get("DEBUG", 0)) if self.debug is None else self.debug
|
|
cfg = "Debug" if debug else "Release"
|
|
|
|
is_windows = os.name == "nt"
|
|
# Set Python_EXECUTABLE instead if you use PYBIND11_FINDPYTHON
|
|
cmake_args = []
|
|
|
|
if is_windows == False:
|
|
cmake_args += [
|
|
f"-DPython_EXECUTABLE={sys.executable}",
|
|
]
|
|
|
|
cmake_args = [
|
|
f"-DCMAKE_BUILD_TYPE={cfg}", # not used on MSVC, but no harm
|
|
f"-DCUDNN_FRONTEND_BUILD_PYTHON_BINDINGS=ON",
|
|
# There's no need to build cpp samples and tests with python
|
|
f"-DCUDNN_FRONTEND_BUILD_SAMPLES=OFF",
|
|
f"-DCUDNN_FRONTEND_BUILD_TESTS=OFF",
|
|
# All these are handled by pip
|
|
f"-DCMAKE_LIBRARY_OUTPUT_DIRECTORY={extdir}{os.sep}",
|
|
f"-DCUDNN_FRONTEND_KEEP_PYBINDS_IN_BINARY_DIR=OFF",
|
|
]
|
|
|
|
if is_windows:
|
|
cmake_args += [
|
|
f"-DCUDNN_FRONTEND_FETCH_PYBINDS_IN_CMAKE=ON",
|
|
]
|
|
else:
|
|
cmake_args += [
|
|
f"-DCUDNN_FRONTEND_FETCH_PYBINDS_IN_CMAKE=OFF",
|
|
]
|
|
if "CUDA_PATH" in os.environ:
|
|
cmake_args.append(f"-DCUDAToolkit_ROOT={os.environ['CUDA_PATH']}")
|
|
|
|
if "CUDAToolkit_ROOT" in os.environ:
|
|
cmake_args.append(f"-DCUDAToolkit_ROOT={os.environ['CUDAToolkit_ROOT']}")
|
|
|
|
if "CUDNN_PATH" in os.environ:
|
|
cmake_args.append(f"-DCUDNN_PATH={os.environ['CUDNN_PATH']}")
|
|
|
|
# Using Ninja-build since it a) is available as a wheel and b)
|
|
# multithreads automatically. MSVC would require all variables be
|
|
# exported for Ninja to pick it up, which is a little tricky to do.
|
|
# Users can override the generator with CMAKE_GENERATOR in CMake
|
|
# 3.15+.
|
|
if is_windows == False:
|
|
try:
|
|
import ninja
|
|
|
|
ninja_executable_path = Path(ninja.BIN_DIR) / "ninja"
|
|
cmake_args += [
|
|
"-GNinja",
|
|
f"-DCMAKE_MAKE_PROGRAM:FILEPATH={ninja_executable_path}",
|
|
]
|
|
except ImportError:
|
|
pass
|
|
|
|
build_args = []
|
|
if is_windows:
|
|
build_args += [f"--config Release"]
|
|
# Set CMAKE_BUILD_PARALLEL_LEVEL to control the parallel build level
|
|
# across all generators.
|
|
if "CMAKE_BUILD_PARALLEL_LEVEL" not in os.environ:
|
|
# self.parallel is a Python 3 only way to set parallel jobs by hand
|
|
# using -j in the build_ext call, not supported by pip or PyPA-build.
|
|
if hasattr(self, "parallel") and self.parallel:
|
|
# CMake 3.12+ only.
|
|
build_args += [f"-j{self.parallel}"]
|
|
|
|
build_temp = Path(self.build_temp) / ext.name
|
|
if not build_temp.exists():
|
|
build_temp.mkdir(parents=True)
|
|
|
|
print(" ".join(cmake_args))
|
|
subprocess.run(
|
|
["cmake", ext.sourcedir, *cmake_args], cwd=build_temp, check=True
|
|
)
|
|
subprocess.run(
|
|
["cmake", "--build", ".", *build_args], cwd=build_temp, check=True
|
|
)
|
|
|
|
|
|
setup(
|
|
ext_modules=[CMakeExtension("cudnn/_compiled_module")],
|
|
cmdclass={"build_ext": CMakeBuild},
|
|
)
|