summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorSreenivasa Murthy Kolam <67086238+srekolam@users.noreply.github.com>2021-10-17 23:48:07 -0700
committerGitHub <noreply@github.com>2021-10-18 08:48:07 +0200
commit1156c7d0a9378e501873bc8f914ee289bdf81474 (patch)
tree23505961086f569016fa40f5429ff082fdd4ba81
parentcab17c4ac3e509e819bdfdc2e4b4152437c317ca (diff)
downloadspack-1156c7d0a9378e501873bc8f914ee289bdf81474.tar.gz
spack-1156c7d0a9378e501873bc8f914ee289bdf81474.tar.bz2
spack-1156c7d0a9378e501873bc8f914ee289bdf81474.tar.xz
spack-1156c7d0a9378e501873bc8f914ee289bdf81474.zip
allow multiple values for tensile_architecture and expand the gpu list for rocm-4.3.1 (#26745)
-rw-r--r--var/spack/repos/builtin/packages/rocblas/package.py29
1 files changed, 20 insertions, 9 deletions
diff --git a/var/spack/repos/builtin/packages/rocblas/package.py b/var/spack/repos/builtin/packages/rocblas/package.py
index ce26e6b72a..606af8f649 100644
--- a/var/spack/repos/builtin/packages/rocblas/package.py
+++ b/var/spack/repos/builtin/packages/rocblas/package.py
@@ -26,9 +26,11 @@ class Rocblas(CMakePackage):
version('3.7.0', sha256='9425db5f8e8b6f7fb172d09e2a360025b63a4e54414607709efc5acb28819642')
version('3.5.0', sha256='8560fabef7f13e8d67da997de2295399f6ec595edfd77e452978c140d5f936f0')
- tensile_architecture = ('all', 'gfx803', 'gfx900', 'gfx906', 'gfx908')
+ tensile_architecture = ('all', 'gfx803', 'gfx900', 'gfx906:xnack-', 'gfx908:xnack-',
+ 'gfx90a:xnack+', 'gfx90a:xnack-', 'gfx1010', 'gfx1011',
+ 'gfx1012', 'gfx1030')
- variant('tensile_architecture', default='all', values=tensile_architecture, multi=False)
+ variant('tensile_architecture', default='all', values=tensile_architecture, multi=True)
depends_on('cmake@3:', type='build')
@@ -80,14 +82,21 @@ class Rocblas(CMakePackage):
def setup_build_environment(self, env):
env.set('CXX', self.spec['hip'].hipcc)
- def cmake_args(self):
+ def get_gpulist_for_tensile_support(self):
arch = self.spec.variants['tensile_architecture'].value
- if self.spec.satisfies('@4.1.0:'):
- if arch == 'gfx906' or arch == 'gfx908':
- arch = arch + ':xnack-'
+ if arch[0] == 'all':
+ if self.spec.satisfies('@:4.0.0'):
+ arch_value = self.tensile_architecture[1:2] + 'gfx906,gfx908'
+ elif self.spec.satisfies('@4.1.0:4.2.0'):
+ arch_value = self.tensile_architecture[1:4]
+ elif self.spec.satisfies('@4.3.0:'):
+ arch_value = self.tensile_architecture[1:]
+ return arch_value
+ else:
+ return arch
+ def cmake_args(self):
tensile = join_path(self.stage.source_path, 'Tensile')
-
args = [
self.define('BUILD_CLIENTS_TESTS', 'OFF'),
self.define('BUILD_CLIENTS_BENCHMARKS', 'OFF'),
@@ -109,9 +118,11 @@ class Rocblas(CMakePackage):
# See https://github.com/ROCmSoftwarePlatform/rocBLAS/commit/c1895ba4bb3f4f5947f3818ebd155cf71a27b634
if self.spec.satisfies('@:4.2.0'):
- args.append(self.define('Tensile_ARCHITECTURE', arch))
+ args.append(self.define('Tensile_ARCHITECTURE',
+ self.get_gpulist_for_tensile_support()))
else:
- args.append(self.define('AMDGPU_TARGETS', arch))
+ args.append(self.define('AMDGPU_TARGETS',
+ self.get_gpulist_for_tensile_support()))
# See https://github.com/ROCmSoftwarePlatform/rocBLAS/issues/1196
if self.spec.satisfies('^cmake@3.21.0:3.21.2'):