From 8196595cbcc03b840593924f01fc5a736160b7af Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Micha=C5=82=20Marcinkiewicz?= <43240942+mmarcinkiewicz@users.noreply.github.com> Date: Fri, 10 Oct 2025 19:24:47 +0200 Subject: [PATCH] Add llama31_8b GBS16 RCPs --- .../training_5.1.0/rcps_llama31_8b.json | 21 +++++++++++++++++++ 1 file changed, 21 insertions(+) diff --git a/mlperf_logging/rcp_checker/training_5.1.0/rcps_llama31_8b.json b/mlperf_logging/rcp_checker/training_5.1.0/rcps_llama31_8b.json index 4e5a331b..1b7143f1 100644 --- a/mlperf_logging/rcp_checker/training_5.1.0/rcps_llama31_8b.json +++ b/mlperf_logging/rcp_checker/training_5.1.0/rcps_llama31_8b.json @@ -1,4 +1,24 @@ { + "llama31_8b_ref_16": + { + "Benchmark": "llama31_8b", + "Creator": "NVIDIA", + "When": "Reference RCPs before 5.1 submission", + "Platform": "2xDGX-B200", + "Precision": "BF16", + "BS": 16, + "Hyperparams": { + "opt_base_learning_rate": 4e-04, + "opt_learning_rate_warmup_samples": 256, + "gradient_accumulation_steps": 1 + }, + "Epochs to converge": [ + 159744, 159744, 159744, 159744, 159744, + 159744, 172032, 159744, 172032, 159744, + 172032, 159744, 159744, 159744, 159744, + 159744, 159744, 159744, 159744, 159744 + ] + }, "llama31_8b_ref_32": { @@ -89,3 +109,4 @@ +