diff --git a/script/app-mlperf-inference-nvidia/_cm.yaml b/script/app-mlperf-inference-nvidia/_cm.yaml
index d73667184b..67c8a131ef 100644
--- a/script/app-mlperf-inference-nvidia/_cm.yaml
+++ b/script/app-mlperf-inference-nvidia/_cm.yaml
@@ -1025,6 +1025,10 @@ variations:
     default_variations:
       batch-size: batch_size.1
 
+  llama2-70b_,run_harness:
+    env:
+      CM_MLPERF_NVIDIA_HARNESS_USE_FP8: 'True'
+
   gptj_,run_harness:
     deps:
       - tags: install,pytorch,from.src