chore: allow setting the tokenizer in the nemo-run script (#884)

marta-sd · web-flow · commit 51c92637749d · 2026-03-24T10:47:00.000Z
This change allows the script to be used for log-probs benchmarks. I tested
it with `piqa` and got the expected accuracy.

Signed-off-by: Marta Stepniewska-Dziubinska <martas@nvidia.com>
diff --git a/scripts/evaluation_with_nemo_run.py b/scripts/evaluation_with_nemo_run.py
@@ -230,6 +230,18 @@ def get_parser():
         default=8,
         help="Number of parallel requests to send to server. Default: use default for the task.",
     )
+    parser.add_argument(
+        "--tokenizer_path",
+        type=str,
+        default=None,
+        help="Path to the tokenizer. Default: None",
+    )
+    parser.add_argument(
+        "--tokenizer_backend",
+        type=str,
+        default="huggingface",
+        help="Backend to use for the tokenizer. Default: huggingface",
+    )
     parser.add_argument(
         "--request_timeout",
         type=int,
@@ -484,11 +496,16 @@ def main():
         model_id="megatron_model",
     )
     eval_target = run.Config(EvaluationTarget, api_endpoint=api_endpoint)
+    extra = {}
+    if args.tokenizer_path:
+        extra["tokenizer"] = args.tokenizer_path
+        extra["tokenizer_backend"] = args.tokenizer_backend
     eval_params = run.Config(
         ConfigParams,
         limit_samples=args.limit,
         parallelism=args.parallel_requests,
         request_timeout=args.request_timeout,
+        extra=extra,
     )
     eval_config = run.Config(
         EvaluationConfig,