Merge pull request #148 from faster-cpython/precise-perf-timing

mdboom · web-flow · commit 9eb8c05bd4ec · 2024-03-09T16:31:31.000-05:00
More precise perf timings
diff --git a/bench_runner/scripts/profiling_plot.py b/bench_runner/scripts/profiling_plot.py
@@ -200,6 +200,9 @@ def category_for_obj_sym(obj: str, sym: str) -> str:
     if obj.startswith("libc"):
         return "libc"
 
+    if obj == "[JIT]":
+        return "jit"
+
     if re.match(r".+\.so(\..+)?$", obj):
         return "library"
 
@@ -233,14 +236,25 @@ def _main(input_dir: Path, output_prefix: Path):
                 for row in csvreader:
                     break
 
+                # Add up all the JIT entries into a single row
+                rows = []
+                jit_time = 0.0
                 for row in csvreader:
                     self_time, _, obj, sym = row
-
+                    self_time = float(self_time)
+                    if obj == "[JIT]":
+                        jit_time += self_time
+                    else:
+                        rows.append((self_time, obj, sym))
+                if jit_time != 0.0:
+                    rows.append((jit_time, "[JIT]", "jit"))
+                rows.sort(reverse=True)
+
+                for self_time, obj, sym in rows:
                     # python3.8 is the "parent" python orchestrating pyperformance
                     if obj == "python3.8":
                         continue
 
-                    self_time = float(self_time) / 100.0
                     if self_time <= 0.0:
                         break
 
@@ -295,7 +309,7 @@ def _main(input_dir: Path, output_prefix: Path):
             label=f"{category} {val:.2%}",
             left=bottom,
             hatch=hatches[i // 10],
-            color=f"C{i%10}",
+            color=f"C{i % 10}",
         )
         bottom += values
 
@@ -313,10 +327,13 @@ def _main(input_dir: Path, output_prefix: Path):
     labels = [
         i < 10 and f"{x[1]} {x[0]:.2%}" or "" for i, x in enumerate(sorted_categories)
     ]
-    colors = [f"C{i%10}" for i in range(len(values))]
+    colors = [f"C{i % 10}" for i in range(len(values))]
     hatches = [hatches[i // 10] for i in range(len(values))]
 
-    other = 1.0 - sum(values)
+    if sum(values) < 1.0:
+        other = 1.0 - sum(values)
+    else:
+        other = 0.0
     values.append(other)
     labels.append("")
     colors.append("#ddd")
diff --git a/bench_runner/scripts/run_benchmarks.py b/bench_runner/scripts/run_benchmarks.py
@@ -157,16 +157,23 @@ def collect_pystats(
 
 
 def perf_to_csv(lines: Iterable[str], output: Path):
+    event_count_prefix = "# Event count (approx.): "
+    total = None
+
     rows = []
     for line in lines:
         line = line.strip()
+        if line.startswith(event_count_prefix):
+            total = int(line[len(event_count_prefix) :].strip())
+            continue
         if line.startswith("#") or line == "":
             continue
-        children, self_time, _, shared, _, symbol = line.split(maxsplit=5)
-        children = float(children[:-1])
-        self = float(self_time[:-1])
-        if children > 0.0 or self > 0.0:
-            rows.append([self, children, shared, symbol])
+        if total is None:
+            raise ValueError("Could not find total sample count")
+        _, period, _, shared, _, symbol = line.split(maxsplit=5)
+        self_time = float(int(period)) / total
+        if self_time > 0.0:
+            rows.append([self_time, 0.0, shared, symbol])
 
     rows.sort(key=itemgetter(0), reverse=True)
 
@@ -192,7 +199,6 @@ def collect_perf(python: Path, benchmarks: str):
                 command_prefix=[
                     "perf",
                     "record",
-                    "--call-graph=dwarf",
                     "-o",
                     "perf.data",
                     "--",
@@ -209,6 +215,7 @@ def collect_perf(python: Path, benchmarks: str):
                         "--stdio",
                         "-g",
                         "none",
+                        "--show-total-period",
                         "-i",
                         "perf.data",
                     ],