[PATCH v5 45/58] perf stackcollapse: Port stackcollapse to use python module
Ian Rogers
irogers at google.com
Fri Apr 24 09:47:07 PDT 2026
Modernize the legacy stackcollapse.py trace script by refactoring it
into a class-based architecture (StackCollapseAnalyzer).
The script uses perf.session for event processing and aggregates call
stacks to produce output suitable for flame graphs.
Assisted-by: Gemini:gemini-3.1-pro-preview
Signed-off-by: Ian Rogers <irogers at google.com>
---
v2:
- Fixed Callchain Check: Replaced hasattr(sample, "callchain") with
getattr(sample, "callchain", None) and checked if it is not None .
This avoids attempting to iterate over None when a sample lacks a
callchain, which would raise a TypeError.
- Fixed Comm Resolution: The code already used
self.session.process(sample.sample_pid).comm() to resolve the
command name using the session object (if available), avoiding the
missing comm attribute on perf.sample_event.
- Code Cleanup: Broke a long line in process_event to satisfy pylint.
---
tools/perf/python/stackcollapse.py | 126 +++++++++++++++++++++++++++++
1 file changed, 126 insertions(+)
create mode 100755 tools/perf/python/stackcollapse.py
diff --git a/tools/perf/python/stackcollapse.py b/tools/perf/python/stackcollapse.py
new file mode 100755
index 000000000000..fae0f0f503a3
--- /dev/null
+++ b/tools/perf/python/stackcollapse.py
@@ -0,0 +1,126 @@
+#!/usr/bin/env python3
+# SPDX-License-Identifier: GPL-2.0
+"""
+stackcollapse.py - format perf samples with one line per distinct call stack
+
+This script's output has two space-separated fields. The first is a semicolon
+separated stack including the program name (from the "comm" field) and the
+function names from the call stack. The second is a count:
+
+ swapper;start_kernel;rest_init;cpu_idle;default_idle;native_safe_halt 2
+
+The file is sorted according to the first field.
+
+Ported from tools/perf/scripts/python/stackcollapse.py
+"""
+
+import argparse
+from collections import defaultdict
+import sys
+import perf
+
+
+class StackCollapseAnalyzer:
+ """Accumulates call stacks and prints them collapsed."""
+
+ def __init__(self, args: argparse.Namespace) -> None:
+ self.args = args
+ self.lines: dict[str, int] = defaultdict(int)
+
+ def tidy_function_name(self, sym: str, dso: str) -> str:
+ """Beautify function names based on options."""
+ if sym is None:
+ sym = "[unknown]"
+
+ sym = sym.replace(";", ":")
+ if self.args.tidy_java:
+ # Beautify Java signatures
+ sym = sym.replace("<", "")
+ sym = sym.replace(">", "")
+ if sym.startswith("L") and "/" in sym:
+ sym = sym[1:]
+ try:
+ sym = sym[:sym.index("(")]
+ except ValueError:
+ pass
+
+ if self.args.annotate_kernel and dso == "[kernel.kallsyms]":
+ return sym + "_[k]"
+ return sym
+
+ def process_event(self, sample: perf.sample_event) -> None:
+ """Collect call stack for each sample."""
+ stack = []
+ callchain = getattr(sample, "callchain", None)
+ if callchain is not None:
+ for node in callchain:
+ stack.append(self.tidy_function_name(node.symbol, node.dso))
+ else:
+ # Fallback if no callchain
+ sym = getattr(sample, "symbol", "[unknown]")
+ dso = getattr(sample, "dso", "[unknown]")
+ stack.append(self.tidy_function_name(sym, dso))
+
+ if self.args.include_comm:
+ if hasattr(self, 'session') and self.session:
+ comm = self.session.process(sample.sample_pid).comm()
+ else:
+ comm = "Unknown"
+ comm = comm.replace(" ", "_")
+ sep = "-"
+ if self.args.include_pid:
+ comm = f"{comm}{sep}{getattr(sample, 'sample_pid', 0)}"
+ sep = "/"
+ if self.args.include_tid:
+ comm = f"{comm}{sep}{getattr(sample, 'sample_tid', 0)}"
+ stack.append(comm)
+
+ stack_string = ";".join(reversed(stack))
+ self.lines[stack_string] += 1
+
+ def print_totals(self) -> None:
+ """Print sorted collapsed stacks."""
+ for stack in sorted(self.lines):
+ print(f"{stack} {self.lines[stack]}")
+
+
+def main():
+ """Main function."""
+ ap = argparse.ArgumentParser(
+ description="Format perf samples with one line per distinct call stack"
+ )
+ ap.add_argument("-i", "--input", default="perf.data", help="Input file name")
+ ap.add_argument("--include-tid", action="store_true", help="include thread id in stack")
+ ap.add_argument("--include-pid", action="store_true", help="include process id in stack")
+ ap.add_argument("--no-comm", dest="include_comm", action="store_false", default=True,
+ help="do not separate stacks according to comm")
+ ap.add_argument("--tidy-java", action="store_true", help="beautify Java signatures")
+ ap.add_argument("--kernel", dest="annotate_kernel", action="store_true",
+ help="annotate kernel functions with _[k]")
+
+ args = ap.parse_args()
+
+ if args.include_tid and not args.include_comm:
+ print("requesting tid but not comm is invalid", file=sys.stderr)
+ sys.exit(1)
+ if args.include_pid and not args.include_comm:
+ print("requesting pid but not comm is invalid", file=sys.stderr)
+ sys.exit(1)
+
+ analyzer = StackCollapseAnalyzer(args)
+
+ try:
+ session = perf.session(perf.data(args.input), sample=analyzer.process_event)
+ analyzer.session = session
+ session.process_events()
+ except IOError as e:
+ print(f"Error: {e}", file=sys.stderr)
+ sys.exit(1)
+ except KeyboardInterrupt:
+ pass
+
+ analyzer.print_totals()
+
+
+if __name__ == "__main__":
+ main()
--
2.54.0.545.g6539524ca2-goog
More information about the linux-arm-kernel
mailing list