From c5a515681e9c17c7118283fd450a7e11a8a9b539 Mon Sep 17 00:00:00 2001 From: Samuel Moors Date: Sun, 13 Oct 2024 12:43:18 +0200 Subject: [PATCH 1/6] use mixin class for gromacs --- eessi/testsuite/eessi_mixin.py | 10 ++-- eessi/testsuite/tests/apps/gromacs.py | 69 ++++++++++----------------- 2 files changed, 31 insertions(+), 48 deletions(-) diff --git a/eessi/testsuite/eessi_mixin.py b/eessi/testsuite/eessi_mixin.py index 9396fff6..7d4ce278 100644 --- a/eessi/testsuite/eessi_mixin.py +++ b/eessi/testsuite/eessi_mixin.py @@ -1,4 +1,4 @@ -from reframe.core.builtins import parameter, run_after +from reframe.core.builtins import parameter, run_after, variable from reframe.core.exceptions import ReframeFatalError from reframe.core.pipeline import RegressionMixin from reframe.utility.sanity import make_performance_function @@ -25,18 +25,18 @@ class EESSI_Mixin(RegressionMixin): All EESSI tests should derive from this mixin class unless they have a very good reason not to. To run correctly, tests inheriting from this class need to define variables and parameters that are used here. That definition needs to be done 'on time', i.e. early enough in the execution of the ReFrame pipeline. - Here, we list which class attributes need to be defined by the child class, and by (the end of) what phase: + Here, we list which class attributes must be defined by the child class, and by (the end of) what phase: - - Init phase: device_type, scale, module_name + - Init phase: device_type, scale, module_name, bench_name (if bench_name_ci is set) - Setup phase: compute_unit, required_mem_per_node The child class may also overwrite the following attributes: - - Init phase: time_limit, measure_memory_usage + - Init phase: time_limit, measure_memory_usage, bench_name_ci """ # Set defaults for these class variables, can be overwritten by child class if desired - measure_memory_usage = False + measure_memory_usage = variable(bool, value=False) scale = parameter(SCALES.keys()) bench_name = None bench_name_ci = None diff --git a/eessi/testsuite/tests/apps/gromacs.py b/eessi/testsuite/tests/apps/gromacs.py index c10da7c6..c761a5a5 100644 --- a/eessi/testsuite/tests/apps/gromacs.py +++ b/eessi/testsuite/tests/apps/gromacs.py @@ -35,43 +35,43 @@ from hpctestlib.sciapps.gromacs.benchmarks import gromacs_check from eessi.testsuite import hooks -from eessi.testsuite.constants import SCALES, TAGS +from eessi.testsuite.constants import COMPUTE_UNIT, DEVICE_TYPES, SCALES +from eessi.testsuite.eessi_mixin import EESSI_Mixin from eessi.testsuite.utils import find_modules, log +class EESSI_GROMACS_base(gromacs_check): + @run_after('init') + def set_device_type(self): + self.device_type = self.nb_impl + + @rfm.simple_test -class EESSI_GROMACS(gromacs_check): +class EESSI_GROMACS(EESSI_GROMACS_base, EESSI_Mixin): +# class EESSI_GROMACS(gromacs_check, EESSI_Mixin): scale = parameter(SCALES.keys()) - valid_prog_environs = ['default'] - valid_systems = ['*'] time_limit = '30m' module_name = parameter(find_modules('GROMACS')) + bench_name_ci = 'HECBioSim/Crambin' + # measure_memory_usage = True - @run_after('init') - def run_after_init(self): - """Hooks to run after the init phase""" - - # Filter on which scales are supported by the partitions defined in the ReFrame configuration - hooks.filter_supported_scales(self) - - # Make sure that GPU tests run in partitions that support running on a GPU, - # and that CPU-only tests run in partitions that support running CPU-only. - # Also support setting valid_systems on the cmd line. - hooks.filter_valid_systems_by_device_type(self, required_device_type=self.nb_impl) + def required_mem_per_node(self): + return self.num_tasks_per_node * 1024 - # Support selecting modules on the cmd line. - hooks.set_modules(self) - - # Support selecting scales on the cmd line via tags. - hooks.set_tag_scale(self) + def __init__(self): + # self.device_type must be set before the @run_after('init') hooks of the EESSI_Mixin class + self.device_type = self.nb_impl @run_after('init') - def set_tag_ci(self): - """Set tag CI on smallest benchmark, so it can be selected on the cmd line via --tag CI""" - # Crambin input is smallest input (20K atoms), cfr. https://www.hecbiosim.ac.uk/access-hpc/benchmarks - if self.benchmark_info[0] == 'HECBioSim/Crambin': - self.tags.add(TAGS['CI']) - log(f'tags set to {self.tags}') + def set_compute_unit(self): + """Set the compute unit to which tasks will be assigned""" + if self.device_type == DEVICE_TYPES['CPU']: + self.compute_unit = COMPUTE_UNIT['CPU'] + elif self.device_type == DEVICE_TYPES['GPU']: + self.compute_unit = COMPUTE_UNIT['GPU'] + else: + msg = f"No mapping of device type {self.device_type} to a COMPUTE_UNIT was specified in this test" + raise NotImplementedError(msg) @run_after('setup') def set_executable_opts(self): @@ -86,15 +86,6 @@ def set_executable_opts(self): self.executable_opts += ['-dlb', 'yes', '-npme', '-1'] log(f'executable_opts set to {self.executable_opts}') - @run_after('setup') - def run_after_setup(self): - """Hooks to run after the setup phase""" - - # Calculate default requested resources based on the scale: - # 1 task per CPU for CPU-only tests, 1 task per GPU for GPU tests. - # Also support setting the resources on the cmd line. - hooks.assign_tasks_per_compute_unit(test=self, compute_unit=self.nb_impl) - @run_after('setup') def set_omp_num_threads(self): """ @@ -113,11 +104,3 @@ def set_omp_num_threads(self): self.env_vars['OMP_NUM_THREADS'] = omp_num_threads log(f'env_vars set to {self.env_vars}') - - @run_after('setup') - def set_binding_policy(self): - """ - Default process binding may depend on the launcher used. We've seen some variable performance. - Better set it explicitely to make sure process migration cannot cause such variations. - """ - hooks.set_compact_process_binding(self) From 7619481ce13989931f57e142872fee198447ef83 Mon Sep 17 00:00:00 2001 From: Samuel Moors Date: Sun, 13 Oct 2024 12:56:12 +0200 Subject: [PATCH 2/6] remove old comment --- eessi/testsuite/tests/apps/gromacs.py | 1 - 1 file changed, 1 deletion(-) diff --git a/eessi/testsuite/tests/apps/gromacs.py b/eessi/testsuite/tests/apps/gromacs.py index c761a5a5..65ad14f2 100644 --- a/eessi/testsuite/tests/apps/gromacs.py +++ b/eessi/testsuite/tests/apps/gromacs.py @@ -48,7 +48,6 @@ def set_device_type(self): @rfm.simple_test class EESSI_GROMACS(EESSI_GROMACS_base, EESSI_Mixin): -# class EESSI_GROMACS(gromacs_check, EESSI_Mixin): scale = parameter(SCALES.keys()) time_limit = '30m' module_name = parameter(find_modules('GROMACS')) From 69ca2df253b8d3295f71f239bc8acdc04b0ea8f4 Mon Sep 17 00:00:00 2001 From: Samuel Moors Date: Sun, 13 Oct 2024 14:45:16 +0200 Subject: [PATCH 3/6] fix --- eessi/testsuite/tests/apps/cp2k/cp2k.py | 74 +++++++++++++++++++------ 1 file changed, 56 insertions(+), 18 deletions(-) diff --git a/eessi/testsuite/tests/apps/cp2k/cp2k.py b/eessi/testsuite/tests/apps/cp2k/cp2k.py index 77c1a98b..30fe0867 100644 --- a/eessi/testsuite/tests/apps/cp2k/cp2k.py +++ b/eessi/testsuite/tests/apps/cp2k/cp2k.py @@ -4,13 +4,13 @@ from reframe.core.builtins import parameter, run_after, performance_function, sanity_function import reframe.utility.sanity as sn -from eessi.testsuite.constants import SCALES, COMPUTE_UNIT, DEVICE_TYPES, CPU -from eessi.testsuite.eessi_mixin import EESSI_Mixin -from eessi.testsuite.utils import find_modules +from eessi.testsuite import hooks +from eessi.testsuite.constants import SCALES, TAGS, COMPUTE_UNIT, DEVICE_TYPES, CPU +from eessi.testsuite.utils import find_modules, log @rfm.simple_test -class EESSI_CP2K(rfm.RunOnlyRegressionTest, EESSI_Mixin): +class EESSI_CP2K(rfm.RunOnlyRegressionTest): benchmark_info = parameter([ # (bench_name, energy_ref, energy_tol) @@ -24,18 +24,8 @@ class EESSI_CP2K(rfm.RunOnlyRegressionTest, EESSI_Mixin): executable = 'cp2k.popt' time_limit = '2h' - device_type = DEVICE_TYPES[CPU] - compute_unit = COMPUTE_UNIT[CPU] - bench_name_ci = 'QS/H2O-32' # set CI on smallest benchmark - - def required_mem_per_node(self): - mems = { - 'QS/H2O-32': {'intercept': 0.5, 'slope': 0.15}, - 'QS/H2O-128': {'intercept': 5, 'slope': 0.15}, - 'QS/H2O-512': {'intercept': 34, 'slope': 0.20}, - } - mem = mems[self.bench_name] - return (self.num_tasks_per_node * mem['slope'] + mem['intercept']) * 1024 + valid_systems = ['*'] + valid_prog_environs = ['default'] @run_after('init') def prepare_test(self): @@ -61,9 +51,39 @@ def assert_energy(self): def time(self): return sn.extractsingle(r'^ CP2K(\s+[\d\.]+){4}\s+(?P