summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
-rw-r--r--var/spack/repos/builtin/packages/gptune/package.py201
-rw-r--r--var/spack/repos/builtin/packages/hypre/ij_gptune.patch440
-rw-r--r--var/spack/repos/builtin/packages/hypre/package.py10
-rw-r--r--var/spack/repos/builtin/packages/superlu-dist/CMAKE_INSTALL_LIBDIR.patch59
-rw-r--r--var/spack/repos/builtin/packages/superlu-dist/package.py2
5 files changed, 626 insertions, 86 deletions
diff --git a/var/spack/repos/builtin/packages/gptune/package.py b/var/spack/repos/builtin/packages/gptune/package.py
index eeebd6f40d..d96c86b074 100644
--- a/var/spack/repos/builtin/packages/gptune/package.py
+++ b/var/spack/repos/builtin/packages/gptune/package.py
@@ -18,7 +18,9 @@ class Gptune(CMakePackage):
version('master', branch='master')
- variant('app', default=False, description='Build all HPC application examples')
+ variant('superlu', default=False, description='Build the SuperLU_DIST example')
+ variant('hypre', default=False, description='Build the Hypre example')
+ variant('mpispawn', default=True, description='MPI spawning-based interface')
depends_on('mpi', type=('build', 'link', 'run'))
depends_on('cmake@3.3:', type='build')
@@ -48,9 +50,14 @@ class Gptune(CMakePackage):
depends_on('pygmo', type=('build', 'run'))
depends_on('openturns', type=('build', 'run'))
- depends_on('superlu-dist@develop', when='+app', type=('build', 'run'))
+ depends_on('superlu-dist@develop', when='+superlu', type=('build', 'run'))
+ depends_on('hypre+gptune@2.19.0', when='+hypre', type=('build', 'run'))
- conflicts('openmpi@:3')
+ depends_on('openmpi@4:', when='+mpispawn', type=('build', 'run'))
+ conflicts('mpich', when='+mpispawn')
+ conflicts('spectrum-mpi', when='+mpispawn')
+ conflicts('cray-mpich', when='+mpispawn')
+ conflicts('gcc@:7')
def cmake_args(self):
spec = self.spec
@@ -59,6 +66,7 @@ class Gptune(CMakePackage):
fc_flags.append('-fallow-argument-mismatch')
args = [
+ '-DGPTUNE_INSTALL_PATH=%s' % site_packages_dir,
'-DTPL_BLAS_LIBRARIES=%s' % spec['blas'].libs.joined(";"),
'-DTPL_LAPACK_LIBRARIES=%s' % spec['lapack'].libs.joined(";"),
'-DTPL_SCALAPACK_LIBRARIES=%s' % spec['scalapack'].
@@ -81,96 +89,117 @@ class Gptune(CMakePackage):
def cache_test_sources(self):
"""Copy the example source files after the package is installed to an
install test subdirectory for use during `spack test run`."""
- self.cache_extra_test_sources([self.examples_src_dir, self.src_dir])
+ self.cache_extra_test_sources([self.examples_src_dir])
+
+ def setup_run_environment(self, env):
+ env.set('GPTUNE_INSTALL_PATH', site_packages_dir)
def test(self):
spec = self.spec
comp_name = self.compiler.name
comp_version = str(self.compiler.version).replace('.', ',')
- test_dir = join_path(self.install_test_root, self.examples_src_dir)
+ test_dir = join_path(self.test_suite.current_test_cache_dir,
+ self.examples_src_dir)
- if '+app' in spec:
- superludriver = join_path(spec['superlu-dist'].prefix.bin, 'pddrive_spawn')
+ if '+superlu' in spec:
+ superludriver = join_path(spec['superlu-dist'].prefix.lib,
+ 'EXAMPLE/pddrive_spawn')
op = ['-r', superludriver, '.']
# copy superlu-dist executables to the correct place
- with working_dir(join_path(test_dir, 'SuperLU_DIST'), create=False):
- self.run_test('rm', options=['-rf', 'superlu_dist'], work_dir='.')
- self.run_test('git', options=['clone', 'https://github.com/xiaoyeli/superlu_dist.git'], work_dir='.')
- self.run_test('mkdir', options=['-p',
- 'build'], work_dir='./superlu_dist')
- self.run_test('mkdir', options=['-p', 'EXAMPLE'],
- work_dir='./superlu_dist/build')
- self.run_test('cp', options=op, work_dir='./superlu_dist/build/EXAMPLE')
-
- with working_dir(self.install_test_root, create=False):
- cdir = join_path(self.prefix, 'gptuneclcm')
- self.run_test('cp', options=['-r', cdir, '.'], work_dir='.')
- self.run_test('rm', options=['-rf', 'build'], work_dir='.')
- self.run_test('mv', options=['gptuneclcm', 'build'], work_dir='.')
-
- with open('{0}/run_env.sh'.format(self.install_test_root), 'w') as envfile:
- envfile.write('if [[ $NERSC_HOST = "cori" ]]; then\n')
- envfile.write(' export machine=cori\n')
- envfile.write('elif [[ $(uname -s) = "Darwin" ]]; then\n')
- envfile.write(' export machine=mac\n')
- envfile.write('elif [[ $(dnsdomainname) = ' +
- '"summit.olcf.ornl.gov" ]]; then\n')
- envfile.write(' export machine=summit\n')
- envfile.write('elif [[ $(cat /etc/os-release | grep "PRETTY_NAME") ==' +
- ' *"Ubuntu"* || $(cat /etc/os-release | grep' +
- ' "PRETTY_NAME") == *"Debian"* ]]; then\n')
- envfile.write(' export machine=unknownlinux\n')
- envfile.write('fi\n')
- envfile.write('export GPTUNEROOT=$PWD\n')
- envfile.write('export MPIRUN={0}\n'.format
- (which(spec['mpi'].prefix.bin + '/mpirun')))
- envfile.write('export proc=$(spack arch)\n')
- envfile.write('export mpi={0}\n'.format(spec['mpi'].name))
- envfile.write('export compiler={0}\n'.format(comp_name))
- envfile.write('export nodes={0} \n'.format(self.nodes))
- envfile.write('export cores={0} \n'.format(self.cores))
- envfile.write('export ModuleEnv=$machine-$proc-$mpi-$compiler \n')
- envfile.write('software_json=$(echo ",\\\"software_configuration\\\":' +
- '{\\\"' + spec['blas'].name +
- '\\\":{\\\"version_split\\\":' +
- ' [' + str(spec['blas'].versions).replace('.', ',') +
- ']},\\\"' + spec['mpi'].name +
- '\\\":{\\\"version_split\\\": [' +
- str(spec['mpi'].versions).replace('.', ',') + ']},\\\"' +
- spec['scalapack'].name +
- '\\\":{\\\"version_split\\\": [' +
- str(spec['scalapack'].versions).replace('.', ',') +
- ']},\\\"' +
- str(comp_name) + '\\\":{\\\"version_split\\\": [' +
- str(comp_version) + ']}}") \n')
- envfile.write('loadable_software_json=$(echo ",\\\"loadable_software_' +
- 'configurations\\\":{\\\"' + spec['blas'].name +
- '\\\":{\\\"version_split\\\": [' +
- str(spec['blas'].versions).replace('.', ',') +
- ']},\\\"' + spec['mpi'].name +
- '\\\":{\\\"version_split\\\": [' +
- str(spec['mpi'].versions).replace('.', ',') + ']},\\\"' +
- spec['scalapack'].name +
- '\\\":{\\\"version_split\\\": [' +
- str(spec['scalapack'].versions).replace('.', ',') +
- ']},\\\"' + str(comp_name) +
- '\\\":{\\\"version_split\\\": ['
- + str(comp_version) + ']}}") \n')
- envfile.write('machine_json=$(echo ",\\\"machine_configuration\\\":' +
- '{\\\"machine_name\\\":\\\"$machine\\\",\\\"$proc\\\":' +
- '{\\\"nodes\\\":$nodes,\\\"cores\\\":$cores}}") \n')
- envfile.write('loadable_machine_json=$(echo ",\\\"loadable_machine_' +
- 'configurations\\\":{\\\"$machine\\\":{\\\"$proc\\\":' +
- '{\\\"nodes\\\":$nodes,\\\"cores\\\":$cores}}}") \n')
-
- if '+app' in spec:
- apps = ['GPTune-Demo', 'SuperLU_DIST', 'SuperLU_DIST_RCI',
- 'Scalapack-PDGEQRF', 'Scalapack-PDGEQRF_RCI']
- else:
- apps = ['GPTune-Demo', 'Scalapack-PDGEQRF', 'Scalapack-PDGEQRF_RCI']
+ wd = join_path(test_dir, 'SuperLU_DIST')
+ self.run_test('rm', options=['-rf', 'superlu_dist'], work_dir=wd)
+ self.run_test('git', options=['clone', 'https://github.com/xiaoyeli/superlu_dist.git'], work_dir=wd)
+ self.run_test('mkdir', options=['-p',
+ 'build'], work_dir=wd + '/superlu_dist')
+ self.run_test('mkdir', options=['-p', 'EXAMPLE'],
+ work_dir=wd + '/superlu_dist/build')
+ self.run_test('cp', options=op, work_dir=wd + '/superlu_dist/build/EXAMPLE')
+
+ if '+hypre' in spec:
+ hypredriver = join_path(spec['hypre'].prefix.bin, 'ij')
+ op = ['-r', hypredriver, '.']
+ # copy superlu-dist executables to the correct place
+ wd = join_path(test_dir, 'Hypre')
+ self.run_test('rm', options=['-rf', 'hypre'], work_dir=wd)
+ self.run_test('git', options=['clone', 'https://github.com/hypre-space/hypre.git'], work_dir=wd)
+ self.run_test('cp', options=op, work_dir=wd + '/hypre/src/test/')
+
+ wd = self.test_suite.current_test_cache_dir
+ with open('{0}/run_env.sh'.format(wd), 'w') as envfile:
+ envfile.write('if [[ $NERSC_HOST = "cori" ]]; then\n')
+ envfile.write(' export machine=cori\n')
+ envfile.write('elif [[ $(uname -s) = "Darwin" ]]; then\n')
+ envfile.write(' export machine=mac\n')
+ envfile.write('elif [[ $(dnsdomainname) = ' +
+ '"summit.olcf.ornl.gov" ]]; then\n')
+ envfile.write(' export machine=summit\n')
+ envfile.write('elif [[ $(cat /etc/os-release | grep "PRETTY_NAME") ==' +
+ ' *"Ubuntu"* || $(cat /etc/os-release | grep' +
+ ' "PRETTY_NAME") == *"Debian"* ]]; then\n')
+ envfile.write(' export machine=unknownlinux\n')
+ envfile.write('fi\n')
+ envfile.write('export GPTUNEROOT=$PWD\n')
+ envfile.write('export MPIRUN={0}\n'.format
+ (which(spec['mpi'].prefix.bin + '/mpirun')))
+ envfile.write('export PYTHONPATH={0}:$PYTHONPATH\n'.format
+ (site_packages_dir + '/gptune'))
+ envfile.write('export proc=$(spack arch)\n')
+ envfile.write('export mpi={0}\n'.format(spec['mpi'].name))
+ envfile.write('export compiler={0}\n'.format(comp_name))
+ envfile.write('export nodes={0} \n'.format(self.nodes))
+ envfile.write('export cores={0} \n'.format(self.cores))
+ envfile.write('export ModuleEnv=$machine-$proc-$mpi-$compiler \n')
+ envfile.write('software_json=$(echo ",\\\"software_configuration\\\":' +
+ '{\\\"' + spec['blas'].name +
+ '\\\":{\\\"version_split\\\":' +
+ ' [' + str(spec['blas'].versions).replace('.', ',') +
+ ']},\\\"' + spec['mpi'].name +
+ '\\\":{\\\"version_split\\\": [' +
+ str(spec['mpi'].versions).replace('.', ',') + ']},\\\"' +
+ spec['scalapack'].name +
+ '\\\":{\\\"version_split\\\": [' +
+ str(spec['scalapack'].versions).replace('.', ',') +
+ ']},\\\"' +
+ str(comp_name) + '\\\":{\\\"version_split\\\": [' +
+ str(comp_version) + ']}}") \n')
+ envfile.write('loadable_software_json=$(echo ",\\\"loadable_software_' +
+ 'configurations\\\":{\\\"' + spec['blas'].name +
+ '\\\":{\\\"version_split\\\": [' +
+ str(spec['blas'].versions).replace('.', ',') +
+ ']},\\\"' + spec['mpi'].name +
+ '\\\":{\\\"version_split\\\": [' +
+ str(spec['mpi'].versions).replace('.', ',') + ']},\\\"' +
+ spec['scalapack'].name +
+ '\\\":{\\\"version_split\\\": [' +
+ str(spec['scalapack'].versions).replace('.', ',') +
+ ']},\\\"' + str(comp_name) +
+ '\\\":{\\\"version_split\\\": ['
+ + str(comp_version) + ']}}") \n')
+ envfile.write('machine_json=$(echo ",\\\"machine_configuration\\\":' +
+ '{\\\"machine_name\\\":\\\"$machine\\\",\\\"$proc\\\":' +
+ '{\\\"nodes\\\":$nodes,\\\"cores\\\":$cores}}") \n')
+ envfile.write('loadable_machine_json=$(echo ",\\\"loadable_machine_' +
+ 'configurations\\\":{\\\"$machine\\\":{\\\"$proc\\\":' +
+ '{\\\"nodes\\\":$nodes,\\\"cores\\\":$cores}}}") \n')
+
+ # copy the environment configuration files to non-cache directories
+ op = ['run_env.sh', site_packages_dir + '/gptune/.']
+ self.run_test('cp', options=op, work_dir=wd)
+ op = ['run_env.sh', self.install_test_root + '/.']
+ self.run_test('cp', options=op, work_dir=wd)
+
+ apps = ['Scalapack-PDGEQRF_RCI']
+ if '+mpispawn' in spec:
+ apps = apps + ['GPTune-Demo', 'Scalapack-PDGEQRF']
+ if '+superlu' in spec:
+ apps = apps + ['SuperLU_DIST_RCI']
+ if '+mpispawn' in spec:
+ apps = apps + ['SuperLU_DIST']
+ if '+hypre' in spec:
+ if '+mpispawn' in spec:
+ apps = apps + ['Hypre']
for app in apps:
- with working_dir(join_path(test_dir, app), create=False):
- # PDGEQRF with GPTune
- self.run_test('bash', options=['run_examples.sh'], work_dir='.',
- purpose='gptune smoke test for {0}'.format(app))
+ wd = join_path(test_dir, app)
+ self.run_test('bash', options=['run_examples.sh'], work_dir=wd,
+ purpose='gptune smoke test for {0}'.format(app))
diff --git a/var/spack/repos/builtin/packages/hypre/ij_gptune.patch b/var/spack/repos/builtin/packages/hypre/ij_gptune.patch
new file mode 100644
index 0000000000..36dbf44afb
--- /dev/null
+++ b/var/spack/repos/builtin/packages/hypre/ij_gptune.patch
@@ -0,0 +1,440 @@
+diff --git a/src/test/ij.c b/src/test/ij.c
+old mode 100644
+new mode 100755
+index fcda91898..c43dcf477
+--- a/src/test/ij.c
++++ b/src/test/ij.c
+@@ -85,10 +85,81 @@ extern HYPRE_Int hypre_FlexGMRESModifyPCDefault(void *precond_data, HYPRE_Int it
+ #endif
+ #define SECOND_TIME 0
+
++
++HYPRE_Int
++hypre_fPrintTiming(FILE* fp, const char *heading,
++ MPI_Comm comm )
++{
++ HYPRE_Int ierr = 0;
++
++ HYPRE_Real local_wall_time;
++ HYPRE_Real local_cpu_time;
++ HYPRE_Real wall_time;
++ HYPRE_Real cpu_time;
++ HYPRE_Real wall_mflops;
++ HYPRE_Real cpu_mflops;
++
++ HYPRE_Int i;
++ HYPRE_Int myrank;
++
++ if (hypre_global_timing == NULL)
++ return ierr;
++
++ hypre_MPI_Comm_rank(comm, &myrank );
++
++ /* print heading */
++ if (myrank == 0)
++ {
++ hypre_fprintf(fp, "=============================================\n");
++ hypre_fprintf(fp, "%s:\n", heading);
++ hypre_fprintf(fp, "=============================================\n");
++ }
++
++ for (i = 0; i < (hypre_global_timing -> size); i++)
++ {
++ if (hypre_TimingNumRegs(i) > 0)
++ {
++ local_wall_time = hypre_TimingWallTime(i);
++ local_cpu_time = hypre_TimingCPUTime(i);
++ hypre_MPI_Allreduce(&local_wall_time, &wall_time, 1,
++ hypre_MPI_REAL, hypre_MPI_MAX, comm);
++ hypre_MPI_Allreduce(&local_cpu_time, &cpu_time, 1,
++ hypre_MPI_REAL, hypre_MPI_MAX, comm);
++
++ if (myrank == 0)
++ {
++ hypre_fprintf(fp, "%s:\n", hypre_TimingName(i));
++
++ /* print wall clock info */
++ hypre_fprintf(fp, " wall clock time = %f seconds\n", wall_time);
++ if (wall_time)
++ wall_mflops = hypre_TimingFLOPS(i) / wall_time / 1.0E6;
++ else
++ wall_mflops = 0.0;
++ hypre_fprintf(fp, " wall MFLOPS = %f\n", wall_mflops);
++
++ /* print CPU clock info */
++ hypre_fprintf(fp, " cpu clock time = %f seconds\n", cpu_time);
++ if (cpu_time)
++ cpu_mflops = hypre_TimingFLOPS(i) / cpu_time / 1.0E6;
++ else
++ cpu_mflops = 0.0;
++ hypre_fprintf(fp, " cpu MFLOPS = %f\n\n", cpu_mflops);
++ }
++ }
++ }
++
++ return ierr;
++}
++
++
++
++
+ hypre_int
+ main( hypre_int argc,
+ char *argv[] )
+ {
++ FILE *fplog;
+ HYPRE_Int arg_index;
+ HYPRE_Int print_usage;
+ HYPRE_Int sparsity_known = 0;
+@@ -414,7 +485,9 @@ main( hypre_int argc,
+ size_t mempool_max_cached_bytes = 2000LL * 1024 * 1024;
+
+ /* Initialize MPI */
+- hypre_MPI_Init(&argc, &argv);
++ hypre_MPI_Init(&argc, &argv);MPI_Comm parent; MPI_Comm_get_parent(&parent);
++
++
+
+ hypre_MPI_Comm_size(hypre_MPI_COMM_WORLD, &num_procs );
+ hypre_MPI_Comm_rank(hypre_MPI_COMM_WORLD, &myid );
+@@ -481,6 +554,11 @@ main( hypre_int argc,
+ build_matrix_type = 3;
+ build_matrix_arg_index = arg_index;
+ }
++ else if ( strcmp(argv[arg_index], "-logfile") == 0 )
++ {
++ arg_index++;
++ fplog = fopen(argv[arg_index++], "w");
++ }
+ else if ( strcmp(argv[arg_index], "-27pt") == 0 )
+ {
+ arg_index++;
+@@ -2068,7 +2146,7 @@ main( hypre_int argc,
+ HYPRE_Init();
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Hypre init times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Hypre init times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -2182,7 +2260,7 @@ main( hypre_int argc,
+ local_num_cols = (HYPRE_Int)(last_local_col - first_local_col + 1);
+ }
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Generate Matrix", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Generate Matrix", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -2404,7 +2482,7 @@ main( hypre_int argc,
+ ierr += HYPRE_IJMatrixAssemble( ij_A );
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("IJ Matrix Setup", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "IJ Matrix Setup", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -3032,7 +3110,7 @@ main( hypre_int argc,
+ }
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("IJ Vector Setup", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "IJ Vector Setup", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -3124,7 +3202,7 @@ main( hypre_int argc,
+ #endif
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("MatVec Test", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "MatVec Test", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -3190,7 +3268,7 @@ main( hypre_int argc,
+ HYPRE_ParCSRHybridSetup(amg_solver, parcsr_A, b, x);
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Setup phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Setup phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -3200,7 +3278,7 @@ main( hypre_int argc,
+ HYPRE_ParCSRHybridSolve(amg_solver, parcsr_A, b, x);
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Solve phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Solve phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -3422,7 +3500,7 @@ main( hypre_int argc,
+ #endif
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Setup phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Setup phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -3448,7 +3526,7 @@ main( hypre_int argc,
+ #endif
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Solve phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Solve phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -3638,7 +3716,7 @@ main( hypre_int argc,
+ HYPRE_BoomerAMGSetup(amg_solver, parcsr_A, b, x);
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Setup phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Setup phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -3648,7 +3726,7 @@ main( hypre_int argc,
+ HYPRE_BoomerAMGSolve(amg_solver, parcsr_A, b, x);
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Solve phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Solve phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -4112,7 +4190,7 @@ main( hypre_int argc,
+ HYPRE_PCGSetup(pcg_solver, (HYPRE_Matrix)parcsr_A,
+ (HYPRE_Vector)b, (HYPRE_Vector)x);
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Setup phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Setup phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -4123,7 +4201,7 @@ main( hypre_int argc,
+ (HYPRE_Vector)b, (HYPRE_Vector)x);
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Solve phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Solve phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -4140,7 +4218,7 @@ main( hypre_int argc,
+ (HYPRE_Vector)b, (HYPRE_Vector)x);
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Setup phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Setup phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -4151,7 +4229,7 @@ main( hypre_int argc,
+ (HYPRE_Vector)b, (HYPRE_Vector)x);
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Solve phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Solve phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+ #endif
+@@ -4550,7 +4628,7 @@ main( hypre_int argc,
+ * (HYPRE_Vector)b, (HYPRE_Vector)x); */
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Setup phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Setup phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -4610,7 +4688,7 @@ main( hypre_int argc,
+ HYPRE_LOBPCGSolve(lobpcg_solver, constraints, eigenvectors, eigenvalues );
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Solve phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Solve phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -4942,7 +5020,7 @@ main( hypre_int argc,
+ (HYPRE_Vector)x);
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Setup phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Setup phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -4980,7 +5058,7 @@ main( hypre_int argc,
+ HYPRE_LOBPCGSolve(pcg_solver, constraints, eigenvectors, eigenvalues);
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Solve phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Solve phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -5490,7 +5568,7 @@ main( hypre_int argc,
+ (pcg_solver, (HYPRE_Matrix)parcsr_A, (HYPRE_Vector)b, (HYPRE_Vector)x);
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Setup phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Setup phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -5501,7 +5579,7 @@ main( hypre_int argc,
+ (pcg_solver, (HYPRE_Matrix)parcsr_A, (HYPRE_Vector)b, (HYPRE_Vector)x);
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Solve phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Solve phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -5723,7 +5801,7 @@ main( hypre_int argc,
+ (pcg_solver, (HYPRE_Matrix)parcsr_A, (HYPRE_Vector)b, (HYPRE_Vector)x);
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Setup phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Setup phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -5734,7 +5812,7 @@ main( hypre_int argc,
+ (pcg_solver, (HYPRE_Matrix)parcsr_A, (HYPRE_Vector)b, (HYPRE_Vector)x);
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Solve phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Solve phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -6060,7 +6138,7 @@ main( hypre_int argc,
+ (pcg_solver, (HYPRE_Matrix)parcsr_A, (HYPRE_Vector)b, (HYPRE_Vector)x);
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Setup phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Setup phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -6071,7 +6149,7 @@ main( hypre_int argc,
+ (pcg_solver, (HYPRE_Matrix)parcsr_A, (HYPRE_Vector)b, (HYPRE_Vector)x);
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Solve phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Solve phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -6397,7 +6475,7 @@ main( hypre_int argc,
+ (HYPRE_Vector)b, (HYPRE_Vector)x);
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Setup phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Setup phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -6408,7 +6486,7 @@ main( hypre_int argc,
+ (HYPRE_Vector)b, (HYPRE_Vector)x);
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Solve phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Solve phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -6723,7 +6801,7 @@ main( hypre_int argc,
+ (HYPRE_Vector)b, (HYPRE_Vector)x);
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Setup phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Setup phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -6734,7 +6812,7 @@ main( hypre_int argc,
+ (HYPRE_Vector)b, (HYPRE_Vector)x);
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Solve phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Solve phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -6930,7 +7008,7 @@ main( hypre_int argc,
+ (HYPRE_Vector)x);
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Setup phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Setup phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -6941,7 +7019,7 @@ main( hypre_int argc,
+ (HYPRE_Vector)x);
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Solve phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Solve phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -7073,7 +7151,7 @@ main( hypre_int argc,
+ HYPRE_MGRSetup(mgr_solver, parcsr_A, b, x);
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Setup phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Setup phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -7084,7 +7162,7 @@ main( hypre_int argc,
+ HYPRE_MGRSolve(mgr_solver, parcsr_A, b, x);
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Solve phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Solve phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -7170,7 +7248,7 @@ main( hypre_int argc,
+ HYPRE_ILUSetup(ilu_solver, parcsr_A, b, x);
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Setup phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Setup phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -7181,7 +7259,7 @@ main( hypre_int argc,
+ HYPRE_ILUSolve(ilu_solver, parcsr_A, b, x);
+
+ hypre_EndTiming(time_index);
+- hypre_PrintTiming("Solve phase times", hypre_MPI_COMM_WORLD);
++ hypre_fPrintTiming(fplog, "Solve phase times", hypre_MPI_COMM_WORLD);
+ hypre_FinalizeTiming(time_index);
+ hypre_ClearTiming();
+
+@@ -7286,7 +7364,13 @@ main( hypre_int argc,
+ /* Finalize Hypre */
+ HYPRE_Finalize();
+
++
++ fflush(fplog);
++ fclose(fplog);
++
+ /* Finalize MPI */
++ if(parent!=MPI_COMM_NULL)
++ MPI_Comm_disconnect(&parent);
+ hypre_MPI_Finalize();
+
+ /* when using cuda-memcheck --leak-check full, uncomment this */
diff --git a/var/spack/repos/builtin/packages/hypre/package.py b/var/spack/repos/builtin/packages/hypre/package.py
index dff8419df8..d4dc0d6a39 100644
--- a/var/spack/repos/builtin/packages/hypre/package.py
+++ b/var/spack/repos/builtin/packages/hypre/package.py
@@ -68,6 +68,11 @@ class Hypre(AutotoolsPackage, CudaPackage):
variant('unified-memory', default=False, description='Use unified memory')
variant('fortran', default=True,
description='Enables fortran bindings')
+ variant('gptune', default=False,
+ description='Add the GPTune hookup code')
+
+ # Patch to add gptune hookup codes
+ patch('ij_gptune.patch', when='+gptune@2.19.0')
# Patch to add ppc64le in config.guess
patch('ibm-ppc64le.patch', when='@:2.11.1')
@@ -88,6 +93,7 @@ class Hypre(AutotoolsPackage, CudaPackage):
conflicts('+cuda', when='+int64')
conflicts('+unified-memory', when='~cuda')
+ conflicts('+gptune', when='~mpi')
# Patch to build shared libraries on Darwin does not apply to
# versions before 2.13.0
@@ -228,6 +234,10 @@ class Hypre(AutotoolsPackage, CudaPackage):
sstruct('-in', 'test/sstruct.in.default', '-solver', '40',
'-rhsone')
make("install")
+ if '+gptune' in self.spec:
+ make("test")
+ self.run_test('mkdir', options=['-p', self.prefix.bin])
+ self.run_test('cp', options=['test/ij', self.prefix.bin + '/.'])
extra_install_tests = join_path('src', 'examples')
diff --git a/var/spack/repos/builtin/packages/superlu-dist/CMAKE_INSTALL_LIBDIR.patch b/var/spack/repos/builtin/packages/superlu-dist/CMAKE_INSTALL_LIBDIR.patch
new file mode 100644
index 0000000000..d3d8311863
--- /dev/null
+++ b/var/spack/repos/builtin/packages/superlu-dist/CMAKE_INSTALL_LIBDIR.patch
@@ -0,0 +1,59 @@
+diff --git a/CMakeLists.txt b/CMakeLists.txt
+index 2b2fdf2..f89cf4c 100644
+--- a/CMakeLists.txt
++++ b/CMakeLists.txt
+@@ -456,15 +456,6 @@ endif()
+ #target_compile_features(SuperLU_DIST PUBLIC cxx_std_11)
+
+ # Generate various configure files with proper definitions
+-# configure_file(${CMAKE_SOURCE_DIR}/make.inc.in ${CMAKE_BINARY_DIR}/make.inc)
+-configure_file(${SuperLU_DIST_SOURCE_DIR}/make.inc.in ${SuperLU_DIST_SOURCE_DIR}/make.inc)
+-
+-configure_file(${SuperLU_DIST_SOURCE_DIR}/SRC/superlu_dist_config.h.in ${SuperLU_DIST_BINARY_DIR}/SRC/superlu_dist_config.h)
+-configure_file(${SuperLU_DIST_SOURCE_DIR}/SRC/superlu_dist_config.h.in ${SuperLU_DIST_SOURCE_DIR}/SRC/superlu_dist_config.h)
+-
+-# Following is to configure a file for FORTRAN code
+-configure_file(${SuperLU_DIST_SOURCE_DIR}/SRC/superlu_dist_config.h.in ${SuperLU_DIST_BINARY_DIR}/FORTRAN/superlu_dist_config.h)
+-
+
+ # Add pkg-config support
+ if(IS_ABSOLUTE ${CMAKE_INSTALL_LIBDIR})
+@@ -476,4 +467,13 @@ configure_file(${CMAKE_CURRENT_SOURCE_DIR}/superlu_dist.pc.in ${CMAKE_CURRENT_BI
+ install(FILES ${CMAKE_CURRENT_BINARY_DIR}/superlu_dist.pc
+ DESTINATION ${CMAKE_INSTALL_LIBDIR}/pkgconfig)
+
++# configure_file(${CMAKE_SOURCE_DIR}/make.inc.in ${CMAKE_BINARY_DIR}/make.inc)
++configure_file(${SuperLU_DIST_SOURCE_DIR}/make.inc.in ${SuperLU_DIST_SOURCE_DIR}/make.inc)
++
++configure_file(${SuperLU_DIST_SOURCE_DIR}/SRC/superlu_dist_config.h.in ${SuperLU_DIST_BINARY_DIR}/SRC/superlu_dist_config.h)
++configure_file(${SuperLU_DIST_SOURCE_DIR}/SRC/superlu_dist_config.h.in ${SuperLU_DIST_SOURCE_DIR}/SRC/superlu_dist_config.h)
++
++# Following is to configure a file for FORTRAN code
++configure_file(${SuperLU_DIST_SOURCE_DIR}/SRC/superlu_dist_config.h.in ${SuperLU_DIST_BINARY_DIR}/FORTRAN/superlu_dist_config.h)
++
+ #message("MPI_Fortran_LINK_FLAGS '${MPI_Fortran_LINK_FLAGS}'")
+diff --git a/make.inc.in b/make.inc.in
+index 0beb461..860c0bf 100644
+--- a/make.inc.in
++++ b/make.inc.in
+@@ -18,7 +18,8 @@
+ #
+ SuperLUroot = ${CMAKE_INSTALL_PREFIX}
+ #DSUPERLULIB = $(SuperLUroot)/SRC/${PROJECT_NAME_LIB_EXPORT}
+-DSUPERLULIB = $(SuperLUroot)/@CMAKE_INSTALL_LIBDIR@/${PROJECT_NAME_LIB_EXPORT}
++#DSUPERLULIB = $(SuperLUroot)/@CMAKE_INSTALL_LIBDIR@/${PROJECT_NAME_LIB_EXPORT}
++DSUPERLULIB = @pkgconfig_libdir@/${PROJECT_NAME_LIB_EXPORT}
+ INCLUDEDIR = $(SuperLUroot)/@CMAKE_INSTALL_INCLUDEDIR@
+
+ XSDK_INDEX_SIZE = @XSDK_INDEX_SIZE@
+@@ -29,7 +30,8 @@ HAVE_CUDA = @HAVE_CUDA@
+
+ XSDK_ENABLE_Fortran = @XSDK_ENABLE_Fortran@
+ ifeq ($(XSDK_ENABLE_Fortran),ON)
+- DFORTRANLIB = $(SuperLUroot)/@CMAKE_INSTALL_LIBDIR@/${PROJECT_NAME_LIB_FORTRAN}
++# DFORTRANLIB = $(SuperLUroot)/@CMAKE_INSTALL_LIBDIR@/${PROJECT_NAME_LIB_FORTRAN}
++ DFORTRANLIB = @pkgconfig_libdir@/${PROJECT_NAME_LIB_FORTRAN}
+ LIBS = $(DFORTRANLIB) $(DSUPERLULIB) ${BLAS_LIB_EXPORT} -lm
+ LIBS += ${EXTRA_FLIB_EXPORT}
+ else
+
diff --git a/var/spack/repos/builtin/packages/superlu-dist/package.py b/var/spack/repos/builtin/packages/superlu-dist/package.py
index 9677446893..7af879c45f 100644
--- a/var/spack/repos/builtin/packages/superlu-dist/package.py
+++ b/var/spack/repos/builtin/packages/superlu-dist/package.py
@@ -20,6 +20,7 @@ class SuperluDist(CMakePackage, CudaPackage, ROCmPackage):
version('develop', branch='master')
version('amd', branch='amd')
+ version('7.2.0', sha256='20b60bd8a3d88031c9ce6511ae9700b7a8dcf12e2fd704e74b1af762b3468b8c')
version('7.1.1', sha256='558053b3d4a56eb661c4f04d4fcab6604018ce5db97115394c161b56c9c278ff')
version('7.1.0', sha256='edbea877562be95fb22c7de1ff484f18685bec4baa8e4f703c414d3c035d4a66')
version('6.4.0', sha256='cb9c0b2ba4c28e5ed5817718ba19ae1dd63ccd30bc44c8b8252b54f5f04a44cc')
@@ -58,6 +59,7 @@ class SuperluDist(CMakePackage, CudaPackage, ROCmPackage):
patch('xl-611.patch', when='@:6.1.1 %xl')
patch('xl-611.patch', when='@:6.1.1 %xl_r')
patch('superlu-cray-ftn-case.patch', when='@7.1.1 %cce')
+ patch('CMAKE_INSTALL_LIBDIR.patch', when='@7.0.0:7.2.0')
def cmake_args(self):
spec = self.spec