Skip to content

Commit f987d6d

Browse files
authored
Merge pull request #440 from mmarcinkiewicz/patch-3
Update rcps_llama31_8b.json
2 parents d91f2e2 + dfa5081 commit f987d6d

File tree

1 file changed

+10
-8
lines changed

1 file changed

+10
-8
lines changed

mlperf_logging/rcp_checker/training_5.1.0/rcps_llama31_8b.json

Lines changed: 10 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -5,19 +5,19 @@
5 5
"Benchmark": "llama31_8b",
6 6
"Creator": "NVIDIA",
7 7
"When": "Reference RCPs before 5.1 submission",
8-
"Platform": "2xDGX-B200",
8+
"Platform": "4xDGX-B200",
9 9
"Precision": "BF16",
10 10
"BS": 32,
11 11
"Hyperparams": {
12-
"opt_base_learning_rate": 1e-03,
13-
"opt_learning_rate_warmup_samples": 16348,
14-
"gradient_accumulation_steps": 2
12+
"opt_base_learning_rate": 8e-04,
13+
"opt_learning_rate_warmup_samples": 4096,
14+
"gradient_accumulation_steps": 1
15 15
},
16 16
"Epochs to converge": [
17-
196608, 221184, 208896, 221184, 221184,
18-
208896, 208896, 196608, 233472, 208896,
19-
233472, 208896, 208896, 221184, 233472,
20-
196608, 208896, 233472, 221184, 208896
17+
196608, 172032, 184320, 184320, 172032,
18+
172032, 184320, 184320, 184320, 172032,
19+
172032, 172032, 184320, 184320, 184320,
20+
172032, 172032, 172032, 184320, 184320
21 21
]
22 22
},
23 23

@@ -86,3 +86,5 @@
86 86
}
87 87

88 88

89+
90+

0 commit comments

Comments
 (0)