#!/usr/bin/perl -w # # stackcollapse-perf.pl collapse perf samples into single lines. # # Parses a list of multiline stacks generated by "perf script", and # outputs a semicolon separated stack followed by a space and a count. # If memory addresses (+0xd) are present, they are stripped, and resulting # identical stacks are colased with their counts summed. # # USAGE: ./stackcollapse-perf.pl [options] infile > outfile # # Run "./stackcollapse-perf.pl -h" to list options. # # Example input: # # swapper 0 [000] 158665.570607: cpu-clock: # ffffffff8103ce3b native_safe_halt ([kernel.kallsyms]) # ffffffff8101c6a3 default_idle ([kernel.kallsyms]) # ffffffff81013236 cpu_idle ([kernel.kallsyms]) # ffffffff815bf03e rest_init ([kernel.kallsyms]) # ffffffff81aebbfe start_kernel ([kernel.kallsyms].init.text) # [...] # # Example output: # # swapper;start_kernel;rest_init;cpu_idle;default_idle;native_safe_halt 1 # # Input may be created and processed using: # # perf record -a -g -F 997 sleep 60 # perf script | ./stackcollapse-perf.pl > out.stacks-folded # # The output of "perf script" should include stack traces. If these are missing # for you, try manually selecting the perf script output; eg: # # perf script -f comm,pid,tid,cpu,time,event,ip,sym,dso,trace | ... # # This is also required for the --pid or --tid options, so that the output has # both the PID and TID. # # Copyright 2012 Joyent, Inc. All rights reserved. # Copyright 2012 Brendan Gregg. All rights reserved. # # CDDL HEADER START # # The contents of this file are subject to the terms of the # Common Development and Distribution License (the "License"). # You may not use this file except in compliance with the License. # # You can obtain a copy of the license at docs/cddl1.txt or # http://opensource.org/licenses/CDDL-1.0. # See the License for the specific language governing permissions # and limitations under the License. # # When distributing Covered Code, include this CDDL HEADER in each # file and include the License file at docs/cddl1.txt. # If applicable, add the following below this CDDL HEADER, with the # fields enclosed by brackets "[]" replaced with your own identifying # information: Portions Copyright [yyyy] [name of copyright owner] # # CDDL HEADER END # # 02-Mar-2012 Brendan Gregg Created this. # 02-Jul-2014 " " Added process name to stacks. use strict; use Getopt::Long; my %collapsed; sub remember_stack { my ($stack, $count) = @_; $collapsed{$stack} += $count; } my $annotate_kernel = 0; # put an annotation on kernel function my $annotate_jit = 0; # put an annotation on jit symbols my $annotate_all = 0; # enale all annotations my $include_pname = 1; # include process names in stacks my $include_pid = 0; # include process ID with process name my $include_tid = 0; # include process & thread ID with process name my $include_addrs = 0; # include raw address where a symbol can't be found my $tidy_java = 1; # condense Java signatures my $tidy_generic = 1; # clean up function names a little my $target_pname; # target process name from perf invocation my $event_filter = ""; # event type filter, defaults to first encountered event my $event_defaulted = 0; # whether we defaulted to an event (none provided) my $event_warning = 0; # if we printed a warning for the event my $show_inline = 0; my $show_context = 0; GetOptions('inline' => \$show_inline, 'context' => \$show_context, 'pid' => \$include_pid, 'kernel' => \$annotate_kernel, 'jit' => \$annotate_jit, 'all' => \$annotate_all, 'tid' => \$include_tid, 'addrs' => \$include_addrs, 'event-filter=s' => \$event_filter) or die < outfile\n --pid # include PID with process names [1] --tid # include TID and PID with process names [1] --inline # un-inline using addr2line --all # all annotations (--kernel --jit) --kernel # annotate kernel functions with a _[k] --jit # annotate jit functions with a _[j] --context # adds source context to --inline --addrs # include raw addresses where symbols can't be found --event-filter=EVENT # event name filter\n [1] perf script must emit both PID and TIDs for these to work; eg, Linux < 4.1: perf script -f comm,pid,tid,cpu,time,event,ip,sym,dso,trace for Linux >= 4.1: perf script -F comm,pid,tid,cpu,time,event,ip,sym,dso,trace If you save this output add --header on Linux >= 3.14 to include perf info. USAGE_END if ($annotate_all) { $annotate_kernel = $annotate_jit = 1; } # for the --inline option sub inline { my ($pc, $mod) = @_; # capture addr2line output my $a2l_output = `addr2line -a $pc -e $mod -i -f -s -C`; # remove first line $a2l_output =~ s/^(.*\n){1}//; my @fullfunc; my $one_item = ""; for (split /^/, $a2l_output) { chomp $_; # remove discriminator info if exists $_ =~ s/ \(discriminator \S+\)//; if ($one_item eq "") { $one_item = $_; } else { if ($show_context == 1) { unshift @fullfunc, $one_item . ":$_"; } else { unshift @fullfunc, $one_item; } $one_item = ""; } } return join(";", @fullfunc); } my @stack; my $pname; my $m_pid; my $m_tid; # # Main loop # while (defined($_ = <>)) { # find the name of the process launched by perf, by stepping backwards # over the args to find the first non-option (no dash): if (/^# cmdline/) { my @args = split ' ', $_; foreach my $arg (reverse @args) { if ($arg !~ /^-/) { $target_pname = $arg; $target_pname =~ s:.*/::; # strip pathname last; } } } # skip remaining comments next if m/^#/; chomp; # end of stack. save cached data. if (m/^$/) { # ignore filtered samples next if not $pname; if ($include_pname) { if (defined $pname) { unshift @stack, $pname; } else { unshift @stack, ""; } } remember_stack(join(";", @stack), 1) if @stack; undef @stack; undef $pname; next; } # # event record start # if (/^(\S.+?)\s+(\d+)\/*(\d+)*\s+/) { # default "perf script" output has TID but not PID # eg, "java 25607 4794564.109216: cycles:" # eg, "java 12688 [002] 6544038.708352: cpu-clock:" # eg, "V8 WorkerThread 25607 4794564.109216: cycles:" # eg, "java 24636/25607 [000] 4794564.109216: cycles:" # eg, "java 12688/12764 6544038.708352: cpu-clock:" # eg, "V8 WorkerThread 24636/25607 [000] 94564.109216: cycles:" # other combinations possible my ($comm, $pid, $tid) = ($1, $2, $3); if (not $tid) { $tid = $pid; $pid = "?"; } if (/(\S+):\s*$/) { my $event = $1; if ($event_filter eq "") { # By default only show events of the first encountered # event type. Merging together different types, such as # instructions and cycles, produces misleading results. $event_filter = $event; $event_defaulted = 1; } elsif ($event ne $event_filter) { if ($event_defaulted and $event_warning == 0) { # only print this warning if necessary: # when we defaulted and there was # multiple event types. print STDERR "Filtering for events of type: $event\n"; $event_warning = 1; } next; } } ($m_pid, $m_tid) = ($pid, $tid); if ($include_tid) { $pname = "$comm-$m_pid/$m_tid"; } elsif ($include_pid) { $pname = "$comm-$m_pid"; } else { $pname = "$comm"; } $pname =~ tr/ /_/; # # stack line # } elsif (/^\s*(\w+)\s*(.+) \((\S*)\)/) { # ignore filtered samples next if not $pname; my ($pc, $rawfunc, $mod) = ($1, $2, $3); # Linux 4.8 included symbol offsets in perf script output by default, eg: # 7fffb84c9afc cpu_startup_entry+0x800047c022ec ([kernel.kallsyms]) # strip these off: $rawfunc =~ s/\+0x[\da-f]+$//; if ($show_inline == 1 && $mod !~ m/(perf-\d+.map|kernel\.|\[[^\]]+\])/) { unshift @stack, inline($pc, $mod); next; } next if $rawfunc =~ /^\(/; # skip process names my @inline; for (split /\->/, $rawfunc) { my $func = $_; if ($func eq "[unknown]") { if ($mod ne "[unknown]") { # use module name instead, if known $func = $mod; $func =~ s/.*\///; } else { $func = "unknown"; } if ($include_addrs) { $func = "\[$func \<$pc\>\]"; } else { $func = "\[$func\]"; } } if ($tidy_generic) { $func =~ s/;/:/g; if ($func !~ m/\.\(.*\)\./) { # This doesn't look like a Go method name (such as # "net/http.(*Client).Do"), so everything after the first open # paren (that is not part of an "(anonymous namespace)") is # just noise. $func =~ s/\((?!anonymous namespace\)).*//; } # now tidy this horrible thing: # 13a80b608e0a RegExp:[&<>\"\'] (/tmp/perf-7539.map) $func =~ tr/"\'//d; # fall through to $tidy_java } if ($tidy_java and $pname eq "java") { # along with $tidy_generic, converts the following: # Lorg/mozilla/javascript/ContextFactory;.call(Lorg/mozilla/javascript/ContextAction;)Ljava/lang/Object; # Lorg/mozilla/javascript/ContextFactory;.call(Lorg/mozilla/javascript/C # Lorg/mozilla/javascript/MemberBox;.(Ljava/lang/reflect/Method;)V # into: # org/mozilla/javascript/ContextFactory:.call # org/mozilla/javascript/ContextFactory:.call # org/mozilla/javascript/MemberBox:.init $func =~ s/^L// if $func =~ m:/:; } # # Annotations # # detect inlined from the @inline array # detect kernel from the module name; eg, frames to parse include: # ffffffff8103ce3b native_safe_halt ([kernel.kallsyms]) # 8c3453 tcp_sendmsg (/lib/modules/4.3.0-rc1-virtual/build/vmlinux) # 7d8 ipv4_conntrack_local+0x7f8f80b8 ([nf_conntrack_ipv4]) # detect jit from the module name; eg: # 7f722d142778 Ljava/io/PrintStream;::print (/tmp/perf-19982.map) if (scalar(@inline) > 0) { $func .= "_[i]"; # inlined } elsif ($annotate_kernel == 1 && $mod =~ m/(^\[|vmlinux$)/ && $mod !~ /unknown/) { $func .= "_[k]"; # kernel } elsif ($annotate_jit == 1 && $mod =~ m:/tmp/perf-\d+\.map:) { $func .= "_[j]"; # jitted } push @inline, $func; } unshift @stack, @inline; } else { warn "Unrecognized line: $_"; } } foreach my $k (sort { $a cmp $b } keys %collapsed) { print "$k $collapsed{$k}\n"; }