diff --git a/mlperf_logging/rcp_checker/training_5.1.0/rcps_llama31_8b.json b/mlperf_logging/rcp_checker/training_5.1.0/rcps_llama31_8b.json index 4e5a331b..1b7143f1 100644 --- a/mlperf_logging/rcp_checker/training_5.1.0/rcps_llama31_8b.json +++ b/mlperf_logging/rcp_checker/training_5.1.0/rcps_llama31_8b.json @@ -1,4 +1,24 @@ { + "llama31_8b_ref_16": + { + "Benchmark": "llama31_8b", + "Creator": "NVIDIA", + "When": "Reference RCPs before 5.1 submission", + "Platform": "2xDGX-B200", + "Precision": "BF16", + "BS": 16, + "Hyperparams": { + "opt_base_learning_rate": 4e-04, + "opt_learning_rate_warmup_samples": 256, + "gradient_accumulation_steps": 1 + }, + "Epochs to converge": [ + 159744, 159744, 159744, 159744, 159744, + 159744, 172032, 159744, 172032, 159744, + 172032, 159744, 159744, 159744, 159744, + 159744, 159744, 159744, 159744, 159744 + ] + }, "llama31_8b_ref_32": { @@ -89,3 +109,4 @@ +