Merge pull request #440 from mmarcinkiewicz/patch-3

ShriyaRishab · web-flow · commit f987d6d85cb7 · 2025-10-08T17:37:13.000+05:30
Update rcps_llama31_8b.json
diff --git a/mlperf_logging/rcp_checker/training_5.1.0/rcps_llama31_8b.json b/mlperf_logging/rcp_checker/training_5.1.0/rcps_llama31_8b.json
@@ -5,19 +5,19 @@
       "Benchmark": "llama31_8b",
       "Creator": "NVIDIA",
       "When": "Reference RCPs before 5.1 submission",
-      "Platform": "2xDGX-B200",
+      "Platform": "4xDGX-B200",
       "Precision": "BF16",
       "BS": 32,
       "Hyperparams": {
-        "opt_base_learning_rate": 1e-03,
-        "opt_learning_rate_warmup_samples": 16348,
-        "gradient_accumulation_steps": 2
+        "opt_base_learning_rate": 8e-04,
+        "opt_learning_rate_warmup_samples": 4096,
+        "gradient_accumulation_steps": 1
       },
       "Epochs to converge": [
-        196608, 221184, 208896, 221184, 221184, 
-        208896, 208896, 196608, 233472, 208896, 
-        233472, 208896, 208896, 221184, 233472, 
-        196608, 208896, 233472, 221184, 208896
+        196608, 172032, 184320, 184320, 172032,
+        172032, 184320, 184320, 184320, 172032,
+        172032, 172032, 184320, 184320, 184320,
+        172032, 172032, 172032, 184320, 184320
       ]
     },
   
@@ -86,3 +86,5 @@
 }
 
 
+
+