Limit the number of parallel jobs launched by Tensile (#33692)
This commit is contained in:
		| @@ -248,6 +248,11 @@ def cmake_args(self): | |||||||
|                 args.append(self.define("Tensile_LIBRARY_FORMAT", "msgpack")) |                 args.append(self.define("Tensile_LIBRARY_FORMAT", "msgpack")) | ||||||
|             if self.spec.satisfies("@:4.2.0"): |             if self.spec.satisfies("@:4.2.0"): | ||||||
|                 arch_define_name = "Tensile_ARCHITECTURE" |                 arch_define_name = "Tensile_ARCHITECTURE" | ||||||
|  |             # Restrict the number of jobs Tensile can spawn. | ||||||
|  |             # If we don't specify otherwise, Tensile creates a job per available core, | ||||||
|  |             # and that consumes a lot of system memory. | ||||||
|  |             # https://github.com/ROCmSoftwarePlatform/Tensile/blob/93e10678a0ced7843d9332b80bc17ebf9a166e8e/Tensile/Parallel.py#L38 | ||||||
|  |             args.append(self.define("Tensile_CPU_THREADS", min(16, make_jobs))) | ||||||
| 
 | 
 | ||||||
|         # See https://github.com/ROCmSoftwarePlatform/rocBLAS/commit/c1895ba4bb3f4f5947f3818ebd155cf71a27b634 |         # See https://github.com/ROCmSoftwarePlatform/rocBLAS/commit/c1895ba4bb3f4f5947f3818ebd155cf71a27b634 | ||||||
|         if "auto" not in self.spec.variants["amdgpu_target"]: |         if "auto" not in self.spec.variants["amdgpu_target"]: | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user
	 Zack Galbreath
					Zack Galbreath