266 lines
12 KiB
Python
266 lines
12 KiB
Python
# Copyright 2013-2022 Lawrence Livermore National Security, LLC and other
|
|
# Spack Project Developers. See the top-level COPYRIGHT file for details.
|
|
#
|
|
# SPDX-License-Identifier: (Apache-2.0 OR MIT)
|
|
|
|
import os
|
|
|
|
from spack.package import *
|
|
|
|
|
|
class Hydrogen(CMakePackage, CudaPackage, ROCmPackage):
|
|
"""Hydrogen: Distributed-memory dense and sparse-direct linear algebra
|
|
and optimization library. Based on the Elemental library."""
|
|
|
|
homepage = "https://libelemental.org"
|
|
url = "https://github.com/LLNL/Elemental/archive/v1.0.1.tar.gz"
|
|
git = "https://github.com/LLNL/Elemental.git"
|
|
tags = ["ecp", "radiuss"]
|
|
|
|
maintainers = ["bvanessen"]
|
|
|
|
version("develop", branch="hydrogen")
|
|
version("1.5.1", sha256="447da564278f98366906d561d9c8bc4d31678c56d761679c2ff3e59ee7a2895c")
|
|
version("1.5.0", sha256="03dd487fb23b9fdbc715554a8ea48c3196a1021502e61b0172ef3fdfbee75180")
|
|
version("1.4.0", sha256="c13374ff4a6c4d1076e47ba8c8d91a7082588b9958d1ed89cffb12f1d2e1452e")
|
|
version("1.3.4", sha256="7979f6656f698f0bbad6798b39d4b569835b3013ff548d98089fce7c283c6741")
|
|
version("1.3.3", sha256="a51a1cfd40ac74d10923dfce35c2c04a3082477683f6b35e7b558ea9f4bb6d51")
|
|
version("1.3.2", sha256="50bc5e87955f8130003d04dfd9dcad63107e92b82704f8107baf95b0ccf98ed6")
|
|
version("1.3.1", sha256="a8b8521458e9e747f2b24af87c4c2749a06e500019c383e0cefb33e5df6aaa1d")
|
|
version("1.3.0", sha256="0f3006aa1d8235ecdd621e7344c99f56651c6836c2e1bc0cf006331b70126b36")
|
|
version("1.2.0", sha256="8545975139582ee7bfe5d00f8d83a8697afc285bf7026b0761e9943355974806")
|
|
version("1.1.0-1", sha256="73ce05e4166853a186469269cb00a454de71e126b2019f95bbae703b65606808")
|
|
version("1.1.0", sha256="b4c12913acd01c72d31f4522266bfeb8df1d4d3b4aef02e07ccbc9a477894e71")
|
|
version("1.0.1", sha256="27cf76e1ef1d58bd8f9b1e34081a14a682b7ff082fb5d1da56713e5e0040e528")
|
|
version("1.0", sha256="d8a97de3133f2c6b6bb4b80d32b4a4cc25eb25e0df4f0cec0f8cb19bf34ece98")
|
|
|
|
variant("shared", default=True, description="Enables the build of shared libraries")
|
|
variant("openmp", default=True, description="Make use of OpenMP within CPU-kernels")
|
|
variant(
|
|
"openmp_blas", default=False, description="Use OpenMP for threading in the BLAS library"
|
|
)
|
|
variant("quad", default=False, description="Enable quad precision")
|
|
variant("int64", default=False, description="Use 64bit integers")
|
|
variant("int64_blas", default=False, description="Use 64bit integers for BLAS.")
|
|
variant("scalapack", default=False, description="Build with ScaLAPACK library")
|
|
variant(
|
|
"build_type",
|
|
default="Release",
|
|
description="The build type to build",
|
|
values=("Debug", "Release"),
|
|
)
|
|
variant(
|
|
"blas",
|
|
default="openblas",
|
|
values=("openblas", "mkl", "accelerate", "essl", "libsci"),
|
|
description="Enable the use of OpenBlas/MKL/Accelerate/ESSL/LibSci",
|
|
)
|
|
variant(
|
|
"mpfr",
|
|
default=False,
|
|
description="Support GNU MPFR's" "arbitrary-precision floating-point arithmetic",
|
|
)
|
|
variant("test", default=False, description="Builds test suite")
|
|
variant("al", default=False, description="Builds with Aluminum communication library")
|
|
variant(
|
|
"omp_taskloops",
|
|
default=False,
|
|
description="Use OpenMP taskloops instead of parallel for loops.",
|
|
)
|
|
variant("half", default=False, description="Builds with support for FP16 precision data types")
|
|
|
|
conflicts("~openmp", when="+omp_taskloops")
|
|
conflicts("+cuda", when="+rocm", msg="CUDA and ROCm support are mutually exclusive")
|
|
|
|
depends_on("cmake@3.21.0:", type="build", when="@1.5.2:")
|
|
depends_on("cmake@3.17.0:", type="build", when="@:1.5.1")
|
|
depends_on("cmake@3.22.0:", type="build", when="%cce")
|
|
|
|
depends_on("mpi")
|
|
depends_on("hwloc@1.11:")
|
|
depends_on("hwloc +cuda +nvml", when="+cuda")
|
|
depends_on("hwloc@2.3.0:", when="+rocm")
|
|
|
|
# Note that #1712 forces us to enumerate the different blas variants
|
|
depends_on("openblas", when="blas=openblas")
|
|
depends_on("openblas +ilp64", when="blas=openblas +int64_blas")
|
|
depends_on("openblas threads=openmp", when="blas=openblas +openmp_blas")
|
|
|
|
depends_on("intel-mkl", when="blas=mkl")
|
|
depends_on("intel-mkl +ilp64", when="blas=mkl +int64_blas")
|
|
depends_on("intel-mkl threads=openmp", when="blas=mkl +openmp_blas")
|
|
|
|
depends_on("veclibfort", when="blas=accelerate")
|
|
conflicts("blas=accelerate +openmp_blas")
|
|
|
|
depends_on("essl", when="blas=essl")
|
|
depends_on("essl +ilp64", when="blas=essl +int64_blas")
|
|
depends_on("essl threads=openmp", when="blas=essl +openmp_blas")
|
|
depends_on("netlib-lapack +external-blas", when="blas=essl")
|
|
|
|
depends_on("cray-libsci", when="blas=libsci")
|
|
depends_on("cray-libsci +openmp", when="blas=libsci +openmp_blas")
|
|
|
|
# Specify the correct version of Aluminum
|
|
depends_on("aluminum@:0.3", when="@:1.3 +al")
|
|
depends_on("aluminum@0.4.0:0.4", when="@1.4.0:1.4 +al")
|
|
depends_on("aluminum@0.6.0:0.6", when="@1.5.0:1.5.1 +al")
|
|
depends_on("aluminum@0.7.0:", when="@:1.0,1.5.2: +al")
|
|
|
|
# Add Aluminum variants
|
|
depends_on("aluminum +cuda +nccl +cuda_rma", when="+al +cuda")
|
|
depends_on("aluminum +rocm +rccl", when="+al +rocm")
|
|
|
|
for arch in CudaPackage.cuda_arch_values:
|
|
depends_on("aluminum cuda_arch=%s" % arch, when="+al +cuda cuda_arch=%s" % arch)
|
|
|
|
# variants +rocm and amdgpu_targets are not automatically passed to
|
|
# dependencies, so do it manually.
|
|
for val in ROCmPackage.amdgpu_targets:
|
|
depends_on("aluminum amdgpu_target=%s" % val, when="+al +rocm amdgpu_target=%s" % val)
|
|
|
|
# Note that this forces us to use OpenBLAS until #1712 is fixed
|
|
depends_on("lapack", when="blas=openblas ~openmp_blas")
|
|
|
|
depends_on("scalapack", when="+scalapack")
|
|
depends_on("gmp", when="+mpfr")
|
|
depends_on("mpc", when="+mpfr")
|
|
depends_on("mpfr", when="+mpfr")
|
|
|
|
depends_on("cuda", when="+cuda")
|
|
depends_on("cub", when="^cuda@:10")
|
|
depends_on("hipcub", when="+rocm")
|
|
depends_on("half", when="+half")
|
|
|
|
depends_on("llvm-openmp", when="%apple-clang +openmp")
|
|
|
|
conflicts(
|
|
"@0:0.98",
|
|
msg="Hydrogen did not exist before v0.99. " + "Did you mean to use Elemental instead?",
|
|
)
|
|
|
|
generator = "Ninja"
|
|
depends_on("ninja", type="build")
|
|
|
|
@property
|
|
def libs(self):
|
|
shared = True if "+shared" in self.spec else False
|
|
return find_libraries("libEl", root=self.prefix, shared=shared, recursive=True)
|
|
|
|
def cmake_args(self):
|
|
spec = self.spec
|
|
|
|
enable_gpu_fp16 = "+cuda" in spec and "+half" in spec
|
|
|
|
args = [
|
|
"-DCMAKE_CXX_STANDARD=17",
|
|
"-DCMAKE_INSTALL_MESSAGE:STRING=LAZY",
|
|
"-DBUILD_SHARED_LIBS:BOOL=%s" % ("+shared" in spec),
|
|
"-DHydrogen_ENABLE_OPENMP:BOOL=%s" % ("+openmp" in spec),
|
|
"-DHydrogen_ENABLE_QUADMATH:BOOL=%s" % ("+quad" in spec),
|
|
"-DHydrogen_USE_64BIT_INTS:BOOL=%s" % ("+int64" in spec),
|
|
"-DHydrogen_USE_64BIT_BLAS_INTS:BOOL=%s" % ("+int64_blas" in spec),
|
|
"-DHydrogen_ENABLE_MPC:BOOL=%s" % ("+mpfr" in spec),
|
|
"-DHydrogen_GENERAL_LAPACK_FALLBACK=ON",
|
|
"-DHydrogen_ENABLE_ALUMINUM=%s" % ("+al" in spec),
|
|
"-DHydrogen_ENABLE_CUB=%s" % ("+cuda" in spec or "+rocm" in spec),
|
|
"-DHydrogen_ENABLE_CUDA=%s" % ("+cuda" in spec),
|
|
"-DHydrogen_ENABLE_ROCM=%s" % ("+rocm" in spec),
|
|
"-DHydrogen_ENABLE_TESTING=%s" % ("+test" in spec),
|
|
"-DHydrogen_ENABLE_HALF=%s" % ("+half" in spec),
|
|
"-DHydrogen_ENABLE_GPU_FP16=%s" % enable_gpu_fp16,
|
|
]
|
|
|
|
if not spec.satisfies("^cmake@3.23.0"):
|
|
# There is a bug with using Ninja generator in this version
|
|
# of CMake
|
|
args.append("-DCMAKE_EXPORT_COMPILE_COMMANDS=ON")
|
|
|
|
if "+cuda" in spec:
|
|
if self.spec.satisfies("%clang"):
|
|
for flag in self.spec.compiler_flags["cxxflags"]:
|
|
if "gcc-toolchain" in flag:
|
|
args.append("-DCMAKE_CUDA_FLAGS=-Xcompiler={0}".format(flag))
|
|
args.append("-DCMAKE_CUDA_STANDARD=14")
|
|
archs = spec.variants["cuda_arch"].value
|
|
if archs != "none":
|
|
arch_str = ";".join(archs)
|
|
args.append("-DCMAKE_CUDA_ARCHITECTURES=%s" % arch_str)
|
|
|
|
if spec.satisfies("%cce") and spec.satisfies("^cuda+allow-unsupported-compilers"):
|
|
args.append("-DCMAKE_CUDA_FLAGS=-allow-unsupported-compiler")
|
|
|
|
if "+rocm" in spec:
|
|
args.extend(
|
|
[
|
|
"-DCMAKE_CXX_FLAGS=-std=c++17",
|
|
"-DHIP_ROOT_DIR={0}".format(spec["hip"].prefix),
|
|
"-DHIP_CXX_COMPILER={0}".format(self.spec["hip"].hipcc),
|
|
]
|
|
)
|
|
archs = self.spec.variants["amdgpu_target"].value
|
|
if archs != "none":
|
|
arch_str = ",".join(archs)
|
|
cxxflags_str = " ".join(self.spec.compiler_flags["cxxflags"])
|
|
args.append(
|
|
"-DHIP_HIPCC_FLAGS=--amdgpu-target={0}"
|
|
" -g -fsized-deallocation -fPIC {1}"
|
|
" -std=c++17".format(arch_str, cxxflags_str)
|
|
)
|
|
args.extend(
|
|
[
|
|
"-DCMAKE_HIP_ARCHITECTURES=%s" % arch_str,
|
|
"-DAMDGPU_TARGETS=%s" % arch_str,
|
|
"-DGPU_TARGETS=%s" % arch_str,
|
|
]
|
|
)
|
|
|
|
# Add support for OS X to find OpenMP (LLVM installed via brew)
|
|
if self.spec.satisfies("%clang +openmp platform=darwin"):
|
|
clang = self.compiler.cc
|
|
clang_bin = os.path.dirname(clang)
|
|
clang_root = os.path.dirname(clang_bin)
|
|
args.extend(["-DOpenMP_DIR={0}".format(clang_root)])
|
|
|
|
if "blas=openblas" in spec:
|
|
args.extend(
|
|
[
|
|
"-DHydrogen_USE_OpenBLAS:BOOL=%s" % ("blas=openblas" in spec),
|
|
"-DOpenBLAS_DIR:STRING={0}".format(spec["openblas"].prefix),
|
|
]
|
|
)
|
|
elif "blas=mkl" in spec:
|
|
args.extend(["-DHydrogen_USE_MKL:BOOL=%s" % ("blas=mkl" in spec)])
|
|
elif "blas=accelerate" in spec:
|
|
args.extend(["-DHydrogen_USE_ACCELERATE:BOOL=TRUE"])
|
|
elif "blas=essl" in spec:
|
|
# IF IBM ESSL is used it needs help finding the proper LAPACK libraries
|
|
args.extend(
|
|
[
|
|
"-DLAPACK_LIBRARIES=%s;-llapack;-lblas"
|
|
% ";".join("-l{0}".format(lib) for lib in self.spec["essl"].libs.names),
|
|
"-DBLAS_LIBRARIES=%s;-lblas"
|
|
% ";".join("-l{0}".format(lib) for lib in self.spec["essl"].libs.names),
|
|
]
|
|
)
|
|
|
|
if "+omp_taskloops" in spec:
|
|
args.extend(["-DHydrogen_ENABLE_OMP_TASKLOOP:BOOL=%s" % ("+omp_taskloops" in spec)])
|
|
|
|
if "+al" in spec:
|
|
args.extend(
|
|
[
|
|
"-DHydrogen_ENABLE_ALUMINUM:BOOL=%s" % ("+al" in spec),
|
|
"-DALUMINUM_DIR={0}".format(spec["aluminum"].prefix),
|
|
]
|
|
)
|
|
|
|
return args
|
|
|
|
def setup_build_environment(self, env):
|
|
if self.spec.satisfies("%apple-clang +openmp"):
|
|
env.append_flags("CPPFLAGS", self.compiler.openmp_flag)
|
|
env.append_flags("CFLAGS", self.spec["llvm-openmp"].headers.include_flags)
|
|
env.append_flags("CXXFLAGS", self.spec["llvm-openmp"].headers.include_flags)
|
|
env.append_flags("LDFLAGS", self.spec["llvm-openmp"].libs.ld_flags)
|