Skip to content

Commit 2833aa0

Browse files
authored
Merge pull request #441 from mmarcinkiewicz/patch-4
Update LLAMA3.1 8b GBS64 RCPs
2 parents 82bfae7 + 5a142c8 commit 2833aa0

File tree

1 file changed

+9
-8
lines changed

1 file changed

+9
-8
lines changed

mlperf_logging/rcp_checker/training_5.1.0/rcps_llama31_8b.json

Lines changed: 9 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -26,19 +26,19 @@
2626
"Benchmark": "llama31_8b",
2727
"Creator": "NVIDIA",
2828
"When": "Reference RCPs before 5.1 submission",
29-
"Platform": "2xDGX-B200",
29+
"Platform": "4xDGX-B200",
3030
"Precision": "BF16",
3131
"BS": 64,
3232
"Hyperparams": {
33-
"opt_base_learning_rate": 1e-03,
34-
"opt_learning_rate_warmup_samples": 16348,
35-
"gradient_accumulation_steps": 4
33+
"opt_base_learning_rate": 8e-04,
34+
"opt_learning_rate_warmup_samples": 6144,
35+
"gradient_accumulation_steps": 2
3636
},
3737
"Epochs to converge": [
38-
233472, 221184, 233472, 221184, 221184,
39-
245760, 233472, 233472, 208896, 245760,
40-
233472, 221184, 233472, 233472, 221184,
41-
245760, 221184, 233472, 233472, 233472
38+
233472, 208896, 208896, 233472, 233472,
39+
233472, 233472, 233472, 208896, 233472,
40+
233472, 233472, 245760, 221184, 208896,
41+
233472, 233472, 221184, 221184, 221184
4242
]
4343
},
4444

@@ -88,3 +88,4 @@
8888

8989

9090

91+

0 commit comments

Comments
 (0)