@@ -75,6 +75,7 @@ class OptimalTrainingConfig:
7575 label : str
7676 output_path : str
7777 tokenized : LMMixtureDatasetConfig
78+ seed : int = 0
7879 validation_configs : dict [str , DatasetComponent ] | None = None
7980
8081
@@ -163,6 +164,7 @@ def run_optimal_training(config: OptimalTrainingConfig) -> None:
163164 f"FLOPs={ config .target_budget :.1e} " ,
164165 f"label={ config .label } " ,
165166 f"N={ params :.1e} " ,
167+ f"seed={ config .seed } " ,
166168 ],
167169 ),
168170 mp = jmp .get_policy ("p=f32,c=bfloat16" ),
@@ -181,6 +183,7 @@ def run_optimal_training(config: OptimalTrainingConfig) -> None:
181183 "token_repeat" : (ResourceAxis .REPLICA_DCN , ResourceAxis .REPLICA , ResourceAxis .DATA ),
182184 },
183185 ),
186+ seed = config .seed ,
184187 allow_nondivisible_batch_size = True ,
185188 ),
186189 train_seq_len = SEQ_LEN ,
@@ -215,23 +218,33 @@ def run_optimal_training(config: OptimalTrainingConfig) -> None:
215218}
216219
217220# --- Step 2: Optimal Training Runs ---
# Map each FLOP budget to the RNG seeds it is trained with.  The two cheaper
# budgets (1e21, 1e22) are replicated over three seeds (0, 42, 62746) to get
# run-to-run variance estimates; the expensive 1e23 budget runs seed 0 only.
SEEDS_PER_BUDGET: dict[float, list[int]] = {
    budget: [0, 42, 62746] for budget in (1e21, 1e22)
}
SEEDS_PER_BUDGET[1e23] = [0]
227+
# Fan each compute budget out into one training step per seed.
optimal_runs: list[ExecutorStep] = []
for budget, (tpu_type, batch_size) in TARGET_BUDGETS.items():
    for seed in SEEDS_PER_BUDGET[budget]:
        # Seed 0 keeps the historical, un-suffixed step name so previously
        # launched runs are not invalidated; other seeds get "-seed<N>".
        seed_tag = "" if seed == 0 else f"-seed{seed}"
        run_config = OptimalTrainingConfig(
            analysis_output_path=analysis_step.as_input_name(),
            target_budget=budget,
            tpu_type=tpu_type,
            batch_size=batch_size,
            label=LABEL,
            output_path=this_output_path(),
            tokenized=nemotron_mix,
            seed=seed,
            validation_configs=validation_configs,
        )
        optimal_runs.append(
            ExecutorStep(
                name=f"{EXPERIMENT_NAME}-optimal-{budget:.0e}-v5{seed_tag}",
                fn=run_optimal_training,
                config=run_config,
            )
        )

all_steps = [analysis_step] + optimal_runs
237250