# Bazel module extension that declares the CUDA, cuDNN, NCCL and PJRT CUDA plugin repositories.
load("@bazel_skylib//lib:paths.bzl", "paths")
load("@bazel_tools//tools/build_defs/repo:http.bzl", "http_archive")
load("//runtimes/common:packages.bzl", "packages")

# Prelude prepended to the BUILD file content of every repository declared with
# `build_file_content` in this file, making all of its targets publicly visible.
# The backslash after the opening quotes suppresses the leading newline.
_BUILD_FILE_DEFAULT_VISIBILITY = """\
package(default_visibility = ["//visibility:public"])
"""

# Platform key looked up inside each package entry of the redistrib manifests.
ARCH = "linux-x86_64"

# CUDA redistributables: base URL, pinned version, and the SHA-256 of the
# `redistrib_<CUDA_VERSION>.json` manifest fetched from that base URL.
CUDA_REDIST_PREFIX = "https://developer.download.nvidia.com/compute/cuda/redist/"
CUDA_VERSION = "12.9.0"
CUDA_REDIST_JSON_SHA256 = "4e4e17a12adcf8cac40b990e1618406cd7ad52da1817819166af28a9dfe21d4a"

# cuDNN redistributables: base URL, pinned version, and the SHA-256 of the
# `redistrib_<CUDNN_VERSION>.json` manifest fetched from that base URL.
CUDNN_REDIST_PREFIX = "https://developer.download.nvidia.com/compute/cudnn/redist/"
CUDNN_VERSION = "9.10.1"
CUDNN_REDIST_JSON_SHA256 = "2ac8d48d3ab4de1acdce65fa3e8ecfb14750d4e101b05fe3307d2f95f2740563"

# Maps each package key of the CUDA redistrib manifest to the BUILD file
# content generated for its repository. Every key becomes the name of an
# `http_archive` repository; library paths are relative to the archive root
# after its top-level directory has been stripped.
# NOTE(review): the `packages.*` helpers are loaded from
# //runtimes/common:packages.bzl and are assumed to return BUILD snippets as
# strings (they are joined with "\n" and concatenated below) — confirm there.
CUDA_PACKAGES = {
    "cuda_cudart": "\n".join([
        packages.cc_library(
            name = "cudart",
            hdrs = ["include/cuda.h"],
            includes = ["include"],
            deps = [":cudart_so", ":cuda_so"],
        ),
        packages.cc_import(
            name = "cudart_so",
            shared_library = "lib/libcudart.so.12",
        ),
        packages.cc_import(
            name = "cuda_so",
            shared_library = "lib/stubs/libcuda.so",
        ),
    ]),
    "cuda_cupti": packages.cc_import(
        name = "cupti",
        shared_library = "lib/libcupti.so.12",
    ),
    "cuda_nvtx": packages.cc_import_glob_hdrs(
        name = "nvtx",
        hdrs_glob = ["include/nvtx3/**/*.h"],
        shared_library = "lib/libnvtx3interop.so.1",
    ),
    "libcufft": packages.cc_import(
        name = "cufft",
        shared_library = "lib/libcufft.so.11",
    ),
    "libcusolver": packages.cc_import(
        name = "cusolver",
        shared_library = "lib/libcusolver.so.11",
    ),
    "libcusparse": packages.cc_import(
        name = "cusparse",
        shared_library = "lib/libcusparse.so.12",
    ),
    "libnvjitlink": packages.cc_import(
        name = "nvjitlink",
        shared_library = "lib/libnvJitLink.so.12",
    ),
    "cuda_nvcc": "\n".join([
        packages.filegroup(
            name = "ptxas",
            srcs = ["bin/ptxas"],
        ),
        packages.filegroup(
            name = "nvlink",
            srcs = ["bin/nvlink"],
        ),
        packages.filegroup(
            name = "libdevice",
            srcs = ["nvvm/libdevice/libdevice.10.bc"],
        ),
        packages.cc_import(
            name = "nvvm",
            shared_library = "nvvm/lib64/libnvvm.so.4",
        ),
        packages.cc_import(
            name = "nvptxcompiler",
            static_library = "lib/libnvptxcompiler_static.a",
        ),
    ]),
    "cuda_nvrtc": "\n".join([
        packages.cc_import(
            name = "nvrtc",
            shared_library = "lib/libnvrtc.so.12",
            deps = [":nvrtc_builtins"],
        ),
        packages.cc_import(
            name = "nvrtc_builtins",
            shared_library = "lib/libnvrtc-builtins.so.12.9",
        ),
    ]),
    "libcublas": "\n".join([
        packages.cc_import(
            name = "cublasLt",
            shared_library = "lib/libcublasLt.so.12",
        ),
        packages.cc_import(
            name = "cublas",
            shared_library = "lib/libcublas.so.12",
            deps = [":cublasLt"],
        ),
    ]),
}

# Maps each package key of the cuDNN redistrib manifest to the BUILD file
# content generated for its repository. The umbrella `cudnn` target depends on
# every cuDNN sub-library import declared alongside it.
# NOTE(review): the `packages.*` helpers are loaded from
# //runtimes/common:packages.bzl and are assumed to return BUILD snippets as
# strings (they are joined with "\n" below) — confirm there.
CUDNN_PACKAGES = {
    "cudnn": "\n".join([
        packages.cc_import(
            name = "cudnn",
            shared_library = "lib/libcudnn.so.9",
            deps = [
                ":cudnn_adv",
                ":cudnn_ops",
                ":cudnn_cnn",
                ":cudnn_graph",
                ":cudnn_engines_precompiled",
                ":cudnn_engines_runtime_compiled",
                ":cudnn_heuristic",
            ],
        ),
        packages.cc_import(
            name = "cudnn_adv",
            shared_library = "lib/libcudnn_adv.so.9",
        ),
        packages.cc_import(
            name = "cudnn_ops",
            shared_library = "lib/libcudnn_ops.so.9",
        ),
        packages.cc_import(
            name = "cudnn_cnn",
            shared_library = "lib/libcudnn_cnn.so.9",
            deps = [":cudnn_ops"],
        ),
        packages.cc_import(
            name = "cudnn_graph",
            shared_library = "lib/libcudnn_graph.so.9",
        ),
        packages.cc_import(
            name = "cudnn_engines_precompiled",
            shared_library = "lib/libcudnn_engines_precompiled.so.9",
        ),
        packages.cc_import(
            name = "cudnn_engines_runtime_compiled",
            shared_library = "lib/libcudnn_engines_runtime_compiled.so.9",
        ),
        packages.cc_import(
            name = "cudnn_heuristic",
            shared_library = "lib/libcudnn_heuristic.so.9",
        ),
    ]),
}

def _read_redist_json(mctx, url, sha256):
    """Downloads a JSON manifest and returns its decoded content.

    Args:
        mctx: module extension context; its `download` and `read` methods are used.
        url: URL of the JSON document to fetch.
        sha256: expected SHA-256 of the document. It is passed to the download
            for verification and also used to build the local file name.

    Returns:
        The value produced by `json.decode` on the downloaded file's content.
    """

    # Name the local copy after its checksum so that the CUDA and cuDNN
    # manifests are written to different files.
    fname = ".{}.json".format(sha256)
    mctx.download(
        url = url,
        output = fname,
        sha256 = sha256,
    )
    return json.decode(mctx.read(fname))

def _declare_redist_archives(redist, url_prefix, build_files, variant = None):
    """Declares one `http_archive` per package of a decoded redistrib manifest.

    Args:
        redist: decoded manifest, indexed by package name and then by platform.
        url_prefix: base URL that each entry's `relative_path` is appended to.
        build_files: dict mapping package name (also used as the repository
            name) to the BUILD file content for that repository.
        variant: optional key selecting a nested entry inside the platform
            entry (e.g. "cuda12"). When the key is absent from the platform
            entry, the platform entry itself is used.
    """
    for pkg, build_file_content in build_files.items():
        arch_data = redist[pkg].get(ARCH)
        if not arch_data:
            # The manifest has no entry for this platform: nothing to declare.
            continue
        if variant:
            arch_data = arch_data.get(variant, arch_data)
        relative_path = arch_data["relative_path"]
        http_archive(
            name = pkg,
            build_file_content = _BUILD_FILE_DEFAULT_VISIBILITY + build_file_content,
            url = url_prefix + relative_path,
            sha256 = arch_data["sha256"],
            # Strip the top-level directory, which is assumed to be named after
            # the tarball without its ".tar.xz" extension.
            strip_prefix = paths.basename(relative_path).replace(".tar.xz", ""),
        )

def _cuda_impl(mctx):
    """Module extension implementation declaring the CUDA runtime repositories.

    Downloads the CUDA and cuDNN redistrib manifests, declares one repository
    per entry of `CUDA_PACKAGES` and `CUDNN_PACKAGES` that has a build for
    `ARCH`, then declares the `nccl` and `libpjrt_cuda` repositories.

    Args:
        mctx: the module extension context.

    Returns:
        Extension metadata marking the extension as reproducible and listing
        `libpjrt_cuda` as the only direct dependency of the root module.
    """
    cuda_redist = _read_redist_json(
        mctx,
        url = CUDA_REDIST_PREFIX + "redistrib_{}.json".format(CUDA_VERSION),
        sha256 = CUDA_REDIST_JSON_SHA256,
    )
    cudnn_redist = _read_redist_json(
        mctx,
        url = CUDNN_REDIST_PREFIX + "redistrib_{}.json".format(CUDNN_VERSION),
        sha256 = CUDNN_REDIST_JSON_SHA256,
    )

    _declare_redist_archives(cuda_redist, CUDA_REDIST_PREFIX, CUDA_PACKAGES)

    # cuDNN platform entries may be nested one level deeper under a "cuda12"
    # key; the helper falls back to the platform entry when that key is absent.
    _declare_redist_archives(cudnn_redist, CUDNN_REDIST_PREFIX, CUDNN_PACKAGES, variant = "cuda12")

    # NCCL is fetched as a Python wheel and unpacked as a zip archive.
    http_archive(
        name = "nccl",
        urls = ["https://files.pythonhosted.org/packages/48/fb/ec4ac065d9b0d56f72eaf1d9b0df601e33da28197b32ca351dc05b342611/nvidia_nccl_cu12-2.26.5-py3-none-manylinux2014_x86_64.manylinux_2_17_x86_64.whl"],
        type = "zip",
        sha256 = "ea5ed3e053c735f16809bee7111deac62ac35b10128a8c102960a0462ce16cbe",
        build_file_content = _BUILD_FILE_DEFAULT_VISIBILITY + packages.cc_import(
            name = "nccl",
            shared_library = "nvidia/nccl/lib/libnccl.so.2",
        ),
    )

    # The PJRT CUDA plugin uses a checked-in BUILD file instead of generated content.
    http_archive(
        name = "libpjrt_cuda",
        build_file = "libpjrt_cuda.BUILD.bazel",
        url = "https://github.com/zml/pjrt-artifacts/releases/download/v10.0.0/pjrt-cuda_linux-amd64.tar.gz",
        sha256 = "eddf4db325aaeb1692e9eff1b5021dbeda27c08e527cae87295a61d94e654395",
    )

    return mctx.extension_metadata(
        reproducible = True,
        root_module_direct_deps = ["libpjrt_cuda"],
        root_module_direct_dev_deps = [],
    )

# Module extension entry point; it declares no tag classes, so `_cuda_impl`
# takes no configuration from the modules that use it.
cuda_packages = module_extension(
    implementation = _cuda_impl,
)