diff --git a/var/ramble/repos/builtin/applications/nvidia-hpl/application.py b/var/ramble/repos/builtin/applications/nvidia-hpl/application.py
index 85b0b7c2f..ed4e0d6b8 100644
--- a/var/ramble/repos/builtin/applications/nvidia-hpl/application.py
+++ b/var/ramble/repos/builtin/applications/nvidia-hpl/application.py
@@ -38,12 +38,29 @@ class NvidiaHpl(HplBase):
         "execute", "./hpl.sh --dat {experiment_run_dir}/HPL.dat", use_mpi=True
     )
 
+    executable(
+        "execute-mxp",
+        './hpl-mxp.sh --gpu-affinity "{gpu_affinity}" --n {Ns} --nb {block_size} --nprow {Ps} --npcol {Qs} --nporder {nporder}',
+        use_mpi=True,
+    )
+
     workload("standard", executables=["execute"])
     workload("calculator", executables=["execute"])
 
-    workload_group("standard", workloads=["standard"], mode="append")
-    workload_group("calculator", workloads=["calculator"], mode="append")
-    workload_group("all_workloads", workloads=["standard", "calculator"])
+    workload("standard-mxp", executables=["execute-mxp"])
+    workload("calculator-mxp", executables=["execute-mxp"])
+
+    workload_group(
+        "standard", workloads=["standard", "standard-mxp"], mode="append"
+    )
+    workload_group(
+        "calculator", workloads=["calculator", "calculator-mxp"], mode="append"
+    )
+    workload_group(
+        "all_workloads",
+        workloads=["standard", "standard-mxp", "calculator", "calculator-mxp"],
+    )
+    workload_group("mxp", workloads=["standard-mxp", "calculator-mxp"])
 
     workload_variable(
         "nvshmem_disable_cuda_vmm",
@@ -168,3 +185,18 @@ class NvidiaHpl(HplBase):
         description="Size of each block",
         workload_group="calculator",
     )
+
+    workload_variable(
+        "nporder",
+        default="row",
+        description="Major order to use for matrix",
+        values=["row", "column"],
+        workload_group="mxp",
+    )
+
+    workload_variable(
+        "gpu_affinity",
+        default="0:1:2:3:4:5:6:7",
+        description="Colon delimited list of GPU IDs",
+        workload_group="mxp",
+    )
diff --git a/var/ramble/repos/builtin/base_applications/hpl/base_application.py 
b/var/ramble/repos/builtin/base_applications/hpl/base_application.py index 8613e3a63..e8ad4aeb5 100644 --- a/var/ramble/repos/builtin/base_applications/hpl/base_application.py +++ b/var/ramble/repos/builtin/base_applications/hpl/base_application.py @@ -8,7 +8,6 @@ import os from ramble.appkit import * -from ramble.expander import Expander import math @@ -262,14 +261,8 @@ class Hpl(ExecutableApplication): ) # FOMs: - log_str = os.path.join( - Expander.expansion_str("experiment_run_dir"), - Expander.expansion_str("experiment_name") + ".out", - ) - figure_of_merit( "Time", - log_file=log_str, fom_regex=r".*\s+(?P[0-9]+)\s+(?P[0-9]+)\s+(?P

[0-9]+)\s+(?P[0-9]+)\s+(?P

[0-9]+)\s+(?P[0-9]+)\s+(?P