Commit 9350f63

Merge pull request #368 from faster-cpython/tighter-perf
Use the new perf_record hook to only include perf in the benchmarking code
2 parents 68c1a0b + 2be4303 commit 9350f63

File tree

5 files changed: +64 -56 lines changed
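What the change amounts to, as a hedged sketch rather than code taken from the repo: previously collect_perf wrapped the entire pyperformance process in perf record, so the profile included harness and setup overhead; now pyperformance is asked to load pyperf's perf_record hook (hence the pyperf 2.9.0 bump below), which records only while benchmark code runs and leaves perf.data.* files behind. The --benchmarks flag and benchmark name here are illustrative:

    import subprocess
    import sys

    # Before: the whole pyperformance process ran under perf, so samples
    # included the harness and setup work, not just the benchmark.
    subprocess.run(
        ["perf", "record", "-o", "perf.data", "--",
         sys.executable, "-m", "pyperformance", "run", "--benchmarks", "nbody"]
    )

    # After: pyperf's perf_record hook starts perf around the benchmark code
    # only, writing perf.data.* files that collect_perf() then globs up.
    subprocess.run(
        [sys.executable, "-m", "pyperformance", "run",
         "--hook", "perf_record", "--benchmarks", "nbody"]
    )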

Diff for: bench_runner/scripts/run_benchmarks.py (+47 -53)

@@ -33,7 +33,7 @@
     "GITHUB_REPOSITORY", "faster-cpython/bench_runner"
 )
 # Environment variables that control the execution of CPython
-ENV_VARS = ["PYTHON_JIT"]
+ENV_VARS = ["PYTHON_JIT", "PYPERF_PERF_RECORD_EXTRA_OPTS"]
 
 
 class NoBenchmarkError(Exception):
@@ -64,7 +64,7 @@ def get_benchmark_names(benchmarks: str) -> list[str]:
 def run_benchmarks(
     python: PathLike,
     benchmarks: str,
-    command_prefix: Iterable[str] | None = None,
+    /,
     test_mode: bool = False,
     extra_args: Iterable[str] | None = None,
 ) -> None:
@@ -74,9 +74,6 @@ def run_benchmarks(
     if BENCHMARK_JSON.is_file():
         BENCHMARK_JSON.unlink()
 
-    if command_prefix is None:
-        command_prefix = []
-
     if test_mode:
         fast_arg = ["--fast"]
     else:
@@ -86,7 +83,6 @@ def run_benchmarks(
         extra_args = []
 
     args = [
-        *command_prefix,
         sys.executable,
         "-m",
         "pyperformance",
@@ -173,19 +169,36 @@ def collect_pystats(
     run_summarize_stats(python, fork, ref, "all", benchmark_links, flags=flags)
 
 
-def perf_to_csv(lines: Iterable[str], output: PathLike):
-    event_count_prefix = "# Event count (approx.): "
-    total = None
+def get_perf_lines(files: Iterable[PathLike]) -> Iterable[str]:
+    for filename in files:
+        p = subprocess.Popen(
+            [
+                "perf",
+                "report",
+                "--stdio",
+                "-g",
+                "none",
+                "--show-total-period",
+                "-s",
+                "pid,symbol,dso",
+                "-i",
+                str(filename),
+            ],
+            encoding="utf-8",
+            stdout=subprocess.PIPE,
+            bufsize=1,
+        )
+        assert p.stdout is not None  # for pyright
+        yield from iter(p.stdout.readline, "")
+        p.kill()
+
 
+def perf_to_csv(lines: Iterable[str], output: PathLike):
     rows = []
     for line in lines:
         line = line.strip()
-        if line.startswith(event_count_prefix):
-            total = int(line[len(event_count_prefix) :].strip())
-        elif line.startswith("#") or line == "":
+        if line.startswith("#") or line == "":
             pass
-        elif total is None:
-            raise ValueError("Could not find total sample count")
         else:
             _, period, command, _, symbol, shared, _ = line.split(maxsplit=6)
             pid, command = command.split(":")
@@ -209,47 +222,28 @@ def collect_perf(python: PathLike, benchmarks: str):
     shutil.rmtree(PROFILING_RESULTS)
     PROFILING_RESULTS.mkdir()
 
-    perf_data = Path("perf.data")
+    perf_data_glob = "perf.data.*"
     for benchmark in all_benchmarks:
-        if perf_data.exists():
-            perf_data.unlink()
-
-        try:
-            run_benchmarks(
-                python,
-                benchmark,
-                command_prefix=[
-                    "perf",
-                    "record",
-                    "-o",
-                    "perf.data",
-                    "--",
-                ],
+        for filename in Path(".").glob(perf_data_glob):
+            filename.unlink()
+
+        run_benchmarks(
+            python,
+            benchmark,
+            extra_args=["--hook", "perf_record"],
+        )
+
+        fileiter = Path(".").glob(perf_data_glob)
+        if util.has_any_element(fileiter):
+            perf_to_csv(
+                get_perf_lines(fileiter),
+                PROFILING_RESULTS / f"{benchmark}.perf.csv",
             )
-        except NoBenchmarkError:
-            pass
         else:
-            if perf_data.exists():
-                output = subprocess.check_output(
-                    [
-                        "perf",
-                        "report",
-                        "--stdio",
-                        "-g",
-                        "none",
-                        "--show-total-period",
-                        "-s",
-                        "pid,symbol,dso",
-                        "-i",
-                        "perf.data",
-                    ],
-                    encoding="utf-8",
-                )
-                perf_to_csv(
-                    output.splitlines(), PROFILING_RESULTS / f"{benchmark}.perf.csv"
-                )
-            else:
-                print(f"No perf.data file generated for {benchmark}", file=sys.stderr)
+            print(f"No perf.data files generated for {benchmark}", file=sys.stderr)
+
+        for filename in Path(".").glob(perf_data_glob):
+            filename.unlink()
 
 
 def update_metadata(
@@ -381,7 +375,7 @@ def _main(
     benchmarks = select_benchmarks(benchmarks)
 
     if mode == "benchmark":
-        run_benchmarks(python, benchmarks, [], test_mode)
+        run_benchmarks(python, benchmarks, test_mode=test_mode)
         update_metadata(BENCHMARK_JSON, fork, ref, run_id=run_id)
         copy_to_directory(BENCHMARK_JSON, python, fork, ref, flags)
     elif mode == "perf":
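A note on the new get_perf_lines(): it streams perf report output instead of buffering it all with subprocess.check_output. The core pattern is iter(p.stdout.readline, ""), which keeps calling readline until it returns an empty string at EOF. A minimal self-contained illustration of that pattern, with a trivial child process standing in for perf:

    import subprocess
    import sys

    # Stream a child's stdout line by line rather than collecting it all,
    # as get_perf_lines() does for `perf report`.
    p = subprocess.Popen(
        [sys.executable, "-c", "print('alpha'); print('beta')"],  # stand-in for perf
        encoding="utf-8",
        stdout=subprocess.PIPE,
        bufsize=1,  # line-buffered, matching the diff
    )
    assert p.stdout is not None
    for line in iter(p.stdout.readline, ""):  # "" signals EOF
        print(line.rstrip())
    p.wait()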

Diff for: bench_runner/templates/_benchmark.src.yml (+1 -1)

@@ -221,7 +221,7 @@ jobs:
       - name: Tune system
         if: ${{ steps.should_run.outputs.should_run != 'false' }}
         run: |
-          sudo LD_LIBRARY_PATH=$LD_LIBRARY_PATH venv/bin/python -m pyperf system tune
+          sudo LD_LIBRARY_PATH=$LD_LIBRARY_PATH venv/bin/python -m pyperf system ${{ inputs.perf && 'reset' || 'tune' }}
       - name: Tune for (Linux) perf
         if: ${{ steps.should_run.outputs.should_run != 'false' && inputs.perf }}
         run: |
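The tune step now picks between pyperf's two system commands: tune applies pyperf's benchmarking tweaks, while reset restores the defaults, presumably because a tuned system is not wanted when profiling under perf. A rough Python equivalent of the conditional (the function name is illustrative, not from the repo):

    import subprocess
    import sys

    def tune_system(perf: bool) -> None:
        # Mirrors ${{ inputs.perf && 'reset' || 'tune' }} from the template:
        # perf runs reset the system configuration, normal runs tune it.
        action = "reset" if perf else "tune"
        subprocess.check_call([sys.executable, "-m", "pyperf", "system", action])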

Diff for: bench_runner/templates/env.yml (+1 -1)

@@ -1,2 +1,2 @@
-PYPERFORMANCE_HASH: 9164273e5504c410a5be08d8753c91be708fdd9a
+PYPERFORMANCE_HASH: 56d12a8fd7cc1432835965d374929bfa7f6f7a07
 PYSTON_BENCHMARKS_HASH: 265655e7f03ace13ec1e00e1ba299179e69f8a00

Diff for: bench_runner/util.py (+14)

@@ -1,5 +1,6 @@
 import functools
 import hashlib
+import itertools
 import os
 from pathlib import Path
 from typing import TypeAlias, Union
@@ -41,3 +42,16 @@ def get_excluded_benchmarks() -> set[str]:
     if key in benchmarks_section:
         return set(benchmarks_section[key])
     return set()
+
+
+def has_any_element(iterable):
+    """
+    Checks if an iterable (like a generator) has at least one element
+    without consuming the original iterable more than necessary.
+    """
+    first, iterable = itertools.tee(iterable, 2)  # Create two independent iterators
+    try:
+        next(first)  # Try to get the first element
+        return True  # If successful, the generator is not empty
+    except StopIteration:
+        return False  # If StopIteration is raised, the generator is empty
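A quick usage sketch for has_any_element(). One subtlety: the itertools.tee documentation warns that the original iterator should not be used again after the split, since advancing the tee copies also advances it; materializing the glob into a list first sidesteps that (a defensive variation, not how collect_perf above calls it):

    from pathlib import Path

    from bench_runner import util  # assumes bench_runner is importable

    # A list can be checked for emptiness and then iterated again safely.
    perf_files = list(Path(".").glob("perf.data.*"))
    if util.has_any_element(perf_files):
        print(f"found {len(perf_files)} perf.data files")
    else:
        print("no perf.data files generated")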

Diff for: pyproject.toml (+1 -1)

@@ -16,7 +16,7 @@ classifiers = [
 ]
 dependencies = [
     "matplotlib==3.10.1",
-    "pyperf==2.8.1",
+    "pyperf==2.9.0",
     "rich==13.9.4",
     "rich-argparse==1.7.0",
     "ruamel.yaml==0.18.10",
