summary | refs | log | tree | commit | diff
path: root/var
diff options
context:
space:
mode:
author: Zack Galbreath <zack.galbreath@kitware.com> 2022-11-03 17:26:03 -0400
committer: GitHub <noreply@github.com> 2022-11-03 15:26:03 -0600
commit: ccc716f6173127f00df2016220b45e9b5987a49a (patch)
tree: 24bf1af517b2cce5c81f53e62ba75aa54ea8e0cc /var
parent: b55509ffa89f847df3c24ff2a90ce8a11d154a96 (diff)
download: spack-ccc716f6173127f00df2016220b45e9b5987a49a.tar.gz
spack-ccc716f6173127f00df2016220b45e9b5987a49a.tar.bz2
spack-ccc716f6173127f00df2016220b45e9b5987a49a.tar.xz
spack-ccc716f6173127f00df2016220b45e9b5987a49a.zip
Limit the number of parallel jobs launched by Tensile (#33692)
Diffstat (limited to 'var')
-rw-r--r-- var/spack/repos/builtin/packages/rocblas/package.py | 5
1 files changed, 5 insertions, 0 deletions
diff --git a/var/spack/repos/builtin/packages/rocblas/package.py b/var/spack/repos/builtin/packages/rocblas/package.py
index 84f90cff4b..92844ffda5 100644
--- a/var/spack/repos/builtin/packages/rocblas/package.py
+++ b/var/spack/repos/builtin/packages/rocblas/package.py
@@ -248,6 +248,11 @@ class Rocblas(CMakePackage):
args.append(self.define("Tensile_LIBRARY_FORMAT", "msgpack"))
if self.spec.satisfies("@:4.2.0"):
arch_define_name = "Tensile_ARCHITECTURE"
+ # Restrict the number of jobs Tensile can spawn.
+ # If we don't specify otherwise, Tensile creates a job per available core,
+ # and that consumes a lot of system memory.
+ # https://github.com/ROCmSoftwarePlatform/Tensile/blob/93e10678a0ced7843d9332b80bc17ebf9a166e8e/Tensile/Parallel.py#L38
+ args.append(self.define("Tensile_CPU_THREADS", min(16, make_jobs)))
# See https://github.com/ROCmSoftwarePlatform/rocBLAS/commit/c1895ba4bb3f4f5947f3818ebd155cf71a27b634
if "auto" not in self.spec.variants["amdgpu_target"]: