254 lines
11 KiB
Python
254 lines
11 KiB
Python
# Copyright 2013-2022 Lawrence Livermore National Security, LLC and other
|
|
# Spack Project Developers. See the top-level COPYRIGHT file for details.
|
|
#
|
|
# SPDX-License-Identifier: (Apache-2.0 OR MIT)
|
|
|
|
import os
|
|
|
|
from spack.package import *
|
|
|
|
|
|
class Hydrogen(CMakePackage, CudaPackage, ROCmPackage):
|
|
"""Hydrogen: Distributed-memory dense and sparse-direct linear algebra
|
|
and optimization library. Based on the Elemental library."""
|
|
|
|
homepage = "https://libelemental.org"
|
|
url = "https://github.com/LLNL/Elemental/archive/v1.0.1.tar.gz"
|
|
git = "https://github.com/LLNL/Elemental.git"
|
|
tags = ['ecp', 'radiuss']
|
|
|
|
maintainers = ['bvanessen']
|
|
|
|
version('develop', branch='hydrogen')
|
|
version('1.5.1', sha256='447da564278f98366906d561d9c8bc4d31678c56d761679c2ff3e59ee7a2895c')
|
|
version('1.5.0', sha256='03dd487fb23b9fdbc715554a8ea48c3196a1021502e61b0172ef3fdfbee75180')
|
|
version('1.4.0', sha256='c13374ff4a6c4d1076e47ba8c8d91a7082588b9958d1ed89cffb12f1d2e1452e')
|
|
version('1.3.4', sha256='7979f6656f698f0bbad6798b39d4b569835b3013ff548d98089fce7c283c6741')
|
|
version('1.3.3', sha256='a51a1cfd40ac74d10923dfce35c2c04a3082477683f6b35e7b558ea9f4bb6d51')
|
|
version('1.3.2', sha256='50bc5e87955f8130003d04dfd9dcad63107e92b82704f8107baf95b0ccf98ed6')
|
|
version('1.3.1', sha256='a8b8521458e9e747f2b24af87c4c2749a06e500019c383e0cefb33e5df6aaa1d')
|
|
version('1.3.0', sha256='0f3006aa1d8235ecdd621e7344c99f56651c6836c2e1bc0cf006331b70126b36')
|
|
version('1.2.0', sha256='8545975139582ee7bfe5d00f8d83a8697afc285bf7026b0761e9943355974806')
|
|
version('1.1.0-1', sha256='73ce05e4166853a186469269cb00a454de71e126b2019f95bbae703b65606808')
|
|
version('1.1.0', sha256='b4c12913acd01c72d31f4522266bfeb8df1d4d3b4aef02e07ccbc9a477894e71')
|
|
version('1.0.1', sha256='27cf76e1ef1d58bd8f9b1e34081a14a682b7ff082fb5d1da56713e5e0040e528')
|
|
version('1.0', sha256='d8a97de3133f2c6b6bb4b80d32b4a4cc25eb25e0df4f0cec0f8cb19bf34ece98')
|
|
|
|
variant('shared', default=True,
|
|
description='Enables the build of shared libraries')
|
|
variant('openmp', default=True,
|
|
description='Make use of OpenMP within CPU-kernels')
|
|
variant('openmp_blas', default=False,
|
|
description='Use OpenMP for threading in the BLAS library')
|
|
variant('quad', default=False,
|
|
description='Enable quad precision')
|
|
variant('int64', default=False,
|
|
description='Use 64bit integers')
|
|
variant('int64_blas', default=False,
|
|
description='Use 64bit integers for BLAS.')
|
|
variant('scalapack', default=False,
|
|
description='Build with ScaLAPACK library')
|
|
variant('build_type', default='Release',
|
|
description='The build type to build',
|
|
values=('Debug', 'Release'))
|
|
variant('blas', default='openblas', values=('openblas', 'mkl', 'accelerate', 'essl', 'libsci'),
|
|
description='Enable the use of OpenBlas/MKL/Accelerate/ESSL/LibSci')
|
|
variant('mpfr', default=False,
|
|
description='Support GNU MPFR\'s'
|
|
'arbitrary-precision floating-point arithmetic')
|
|
variant('test', default=False,
|
|
description='Builds test suite')
|
|
variant('al', default=False,
|
|
description='Builds with Aluminum communication library')
|
|
variant('omp_taskloops', default=False,
|
|
description='Use OpenMP taskloops instead of parallel for loops.')
|
|
variant('half', default=False,
|
|
description='Builds with support for FP16 precision data types')
|
|
|
|
conflicts('~openmp', when='+omp_taskloops')
|
|
conflicts('+cuda', when='+rocm', msg='CUDA and ROCm support are mutually exclusive')
|
|
|
|
depends_on('cmake@3.21.0:', type='build', when='@1.5.2:')
|
|
depends_on('cmake@3.17.0:', type='build', when='@:1.5.1')
|
|
depends_on('cmake@3.22.0:', type='build', when='%cce')
|
|
|
|
depends_on('mpi')
|
|
depends_on('hwloc@1.11:')
|
|
depends_on('hwloc +cuda +nvml', when='+cuda')
|
|
depends_on('hwloc@2.3.0:', when='+rocm')
|
|
|
|
# Note that #1712 forces us to enumerate the different blas variants
|
|
depends_on('openblas', when='blas=openblas')
|
|
depends_on('openblas +ilp64', when='blas=openblas +int64_blas')
|
|
depends_on('openblas threads=openmp', when='blas=openblas +openmp_blas')
|
|
|
|
depends_on('intel-mkl', when="blas=mkl")
|
|
depends_on('intel-mkl +ilp64', when="blas=mkl +int64_blas")
|
|
depends_on('intel-mkl threads=openmp', when='blas=mkl +openmp_blas')
|
|
|
|
depends_on('veclibfort', when='blas=accelerate')
|
|
conflicts('blas=accelerate +openmp_blas')
|
|
|
|
depends_on('essl', when='blas=essl')
|
|
depends_on('essl +ilp64', when='blas=essl +int64_blas')
|
|
depends_on('essl threads=openmp', when='blas=essl +openmp_blas')
|
|
depends_on('netlib-lapack +external-blas', when='blas=essl')
|
|
|
|
depends_on('cray-libsci', when='blas=libsci')
|
|
depends_on('cray-libsci +openmp', when='blas=libsci +openmp_blas')
|
|
|
|
# Specify the correct version of Aluminum
|
|
depends_on('aluminum@:0.3', when='@:1.3 +al')
|
|
depends_on('aluminum@0.4.0:0.4', when='@1.4.0:1.4 +al')
|
|
depends_on('aluminum@0.6.0:0.6', when='@1.5.0:1.5.1 +al')
|
|
depends_on('aluminum@0.7.0:', when='@:1.0,1.5.2: +al')
|
|
|
|
# Add Aluminum variants
|
|
depends_on('aluminum +cuda +nccl +cuda_rma', when='+al +cuda')
|
|
depends_on('aluminum +rocm +rccl', when='+al +rocm')
|
|
|
|
for arch in CudaPackage.cuda_arch_values:
|
|
depends_on('aluminum cuda_arch=%s' % arch, when='+al +cuda cuda_arch=%s' % arch)
|
|
|
|
# variants +rocm and amdgpu_targets are not automatically passed to
|
|
# dependencies, so do it manually.
|
|
for val in ROCmPackage.amdgpu_targets:
|
|
depends_on('aluminum amdgpu_target=%s' % val, when='+al +rocm amdgpu_target=%s' % val)
|
|
|
|
# Note that this forces us to use OpenBLAS until #1712 is fixed
|
|
depends_on('lapack', when='blas=openblas ~openmp_blas')
|
|
|
|
depends_on('scalapack', when='+scalapack')
|
|
depends_on('gmp', when='+mpfr')
|
|
depends_on('mpc', when='+mpfr')
|
|
depends_on('mpfr', when='+mpfr')
|
|
|
|
depends_on('cuda', when='+cuda')
|
|
depends_on('cub', when='^cuda@:10')
|
|
depends_on('hipcub', when='+rocm')
|
|
depends_on('half', when='+half')
|
|
|
|
depends_on('llvm-openmp', when='%apple-clang +openmp')
|
|
|
|
conflicts('@0:0.98', msg="Hydrogen did not exist before v0.99. " +
|
|
"Did you mean to use Elemental instead?")
|
|
|
|
generator = 'Ninja'
|
|
depends_on('ninja', type='build')
|
|
|
|
@property
|
|
def libs(self):
|
|
shared = True if '+shared' in self.spec else False
|
|
return find_libraries(
|
|
'libEl', root=self.prefix, shared=shared, recursive=True
|
|
)
|
|
|
|
def cmake_args(self):
|
|
spec = self.spec
|
|
|
|
enable_gpu_fp16 = ('+cuda' in spec and '+half' in spec)
|
|
|
|
args = [
|
|
'-DCMAKE_CXX_STANDARD=17',
|
|
'-DCMAKE_INSTALL_MESSAGE:STRING=LAZY',
|
|
'-DBUILD_SHARED_LIBS:BOOL=%s' % ('+shared' in spec),
|
|
'-DHydrogen_ENABLE_OPENMP:BOOL=%s' % ('+openmp' in spec),
|
|
'-DHydrogen_ENABLE_QUADMATH:BOOL=%s' % ('+quad' in spec),
|
|
'-DHydrogen_USE_64BIT_INTS:BOOL=%s' % ('+int64' in spec),
|
|
'-DHydrogen_USE_64BIT_BLAS_INTS:BOOL=%s' % ('+int64_blas' in spec),
|
|
'-DHydrogen_ENABLE_MPC:BOOL=%s' % ('+mpfr' in spec),
|
|
'-DHydrogen_GENERAL_LAPACK_FALLBACK=ON',
|
|
'-DHydrogen_ENABLE_ALUMINUM=%s' % ('+al' in spec),
|
|
'-DHydrogen_ENABLE_CUB=%s' % ('+cuda' in spec or '+rocm' in spec),
|
|
'-DHydrogen_ENABLE_CUDA=%s' % ('+cuda' in spec),
|
|
'-DHydrogen_ENABLE_ROCM=%s' % ('+rocm' in spec),
|
|
'-DHydrogen_ENABLE_TESTING=%s' % ('+test' in spec),
|
|
'-DHydrogen_ENABLE_HALF=%s' % ('+half' in spec),
|
|
'-DHydrogen_ENABLE_GPU_FP16=%s' % enable_gpu_fp16,
|
|
]
|
|
|
|
if not spec.satisfies('^cmake@3.23.0'):
|
|
# There is a bug with using Ninja generator in this version
|
|
# of CMake
|
|
args.append('-DCMAKE_EXPORT_COMPILE_COMMANDS=ON')
|
|
|
|
if '+cuda' in spec:
|
|
if self.spec.satisfies('%clang'):
|
|
for flag in self.spec.compiler_flags['cxxflags']:
|
|
if 'gcc-toolchain' in flag:
|
|
args.append('-DCMAKE_CUDA_FLAGS=-Xcompiler={0}'.format(flag))
|
|
args.append('-DCMAKE_CUDA_STANDARD=14')
|
|
archs = spec.variants['cuda_arch'].value
|
|
if archs != 'none':
|
|
arch_str = ";".join(archs)
|
|
args.append('-DCMAKE_CUDA_ARCHITECTURES=%s' % arch_str)
|
|
|
|
if (spec.satisfies('%cce') and
|
|
spec.satisfies('^cuda+allow-unsupported-compilers')):
|
|
args.append('-DCMAKE_CUDA_FLAGS=-allow-unsupported-compiler')
|
|
|
|
if '+rocm' in spec:
|
|
args.extend([
|
|
'-DCMAKE_CXX_FLAGS=-std=c++17',
|
|
'-DHIP_ROOT_DIR={0}'.format(spec['hip'].prefix),
|
|
'-DHIP_CXX_COMPILER={0}'.format(self.spec['hip'].hipcc)])
|
|
archs = self.spec.variants['amdgpu_target'].value
|
|
if archs != 'none':
|
|
arch_str = ",".join(archs)
|
|
cxxflags_str = " ".join(self.spec.compiler_flags['cxxflags'])
|
|
args.append(
|
|
'-DHIP_HIPCC_FLAGS=--amdgpu-target={0}'
|
|
' -g -fsized-deallocation -fPIC {1}'
|
|
' -std=c++17'.format(arch_str, cxxflags_str)
|
|
)
|
|
|
|
# Add support for OS X to find OpenMP (LLVM installed via brew)
|
|
if self.spec.satisfies('%clang +openmp platform=darwin'):
|
|
clang = self.compiler.cc
|
|
clang_bin = os.path.dirname(clang)
|
|
clang_root = os.path.dirname(clang_bin)
|
|
args.extend([
|
|
'-DOpenMP_DIR={0}'.format(clang_root)])
|
|
|
|
if 'blas=openblas' in spec:
|
|
args.extend([
|
|
'-DHydrogen_USE_OpenBLAS:BOOL=%s' % ('blas=openblas' in spec),
|
|
'-DOpenBLAS_DIR:STRING={0}'.format(
|
|
spec['openblas'].prefix)])
|
|
elif 'blas=mkl' in spec:
|
|
args.extend([
|
|
'-DHydrogen_USE_MKL:BOOL=%s' % ('blas=mkl' in spec)])
|
|
elif 'blas=accelerate' in spec:
|
|
args.extend(['-DHydrogen_USE_ACCELERATE:BOOL=TRUE'])
|
|
elif 'blas=essl' in spec:
|
|
# IF IBM ESSL is used it needs help finding the proper LAPACK libraries
|
|
args.extend([
|
|
'-DLAPACK_LIBRARIES=%s;-llapack;-lblas' %
|
|
';'.join('-l{0}'.format(lib) for lib in self.spec['essl'].libs.names),
|
|
'-DBLAS_LIBRARIES=%s;-lblas' %
|
|
';'.join('-l{0}'.format(lib) for lib in self.spec['essl'].libs.names)])
|
|
|
|
if '+omp_taskloops' in spec:
|
|
args.extend([
|
|
'-DHydrogen_ENABLE_OMP_TASKLOOP:BOOL=%s' %
|
|
('+omp_taskloops' in spec)])
|
|
|
|
if '+al' in spec:
|
|
args.extend([
|
|
'-DHydrogen_ENABLE_ALUMINUM:BOOL=%s' % ('+al' in spec),
|
|
'-DALUMINUM_DIR={0}'.format(
|
|
spec['aluminum'].prefix)])
|
|
|
|
return args
|
|
|
|
def setup_build_environment(self, env):
|
|
if self.spec.satisfies('%apple-clang +openmp'):
|
|
env.append_flags(
|
|
'CPPFLAGS', self.compiler.openmp_flag)
|
|
env.append_flags(
|
|
'CFLAGS', self.spec['llvm-openmp'].headers.include_flags)
|
|
env.append_flags(
|
|
'CXXFLAGS', self.spec['llvm-openmp'].headers.include_flags)
|
|
env.append_flags(
|
|
'LDFLAGS', self.spec['llvm-openmp'].libs.ld_flags)
|