2011-02-04 19:45:46 +08:00
|
|
|
/*
|
|
|
|
* Copyright (C) 2011, Red Hat Inc, Arnaldo Carvalho de Melo <acme@redhat.com>
|
|
|
|
*
|
|
|
|
* Parts came from builtin-annotate.c, see those files for further
|
|
|
|
* copyright notes.
|
|
|
|
*
|
|
|
|
* Released under the GPL v2. (and only v2, not any later version)
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include "util.h"
|
2014-02-20 09:32:53 +08:00
|
|
|
#include "ui/ui.h"
|
|
|
|
#include "sort.h"
|
2011-02-04 19:45:46 +08:00
|
|
|
#include "build-id.h"
|
|
|
|
#include "color.h"
|
|
|
|
#include "cache.h"
|
|
|
|
#include "symbol.h"
|
|
|
|
#include "debug.h"
|
|
|
|
#include "annotate.h"
|
2013-03-05 13:53:21 +08:00
|
|
|
#include "evsel.h"
|
perf annotate: Add branch stack / basic block
I wanted to know the hottest path through a function and figured the
branch-stack (LBR) information should be able to help out with that.
The below uses the branch-stack to create basic blocks and generate
statistics from them.
from to branch_i
* ----> *
|
| block
v
* ----> *
from to branch_i+1
The blocks are broken down into non-overlapping ranges, while tracking
if the start of each range is an entry point and/or the end of a range
is a branch.
Each block iterates all ranges it covers (while splitting where required
to exactly match the block) and increments the 'coverage' count.
For the range including the branch we increment the taken counter, as
well as the pred counter if flags.predicted.
Using these numbers we can find if an instruction:
- had coverage; given by:
br->coverage / br->sym->max_coverage
This metric ensures each symbol has a 100% spot, which reflects the
observation that each symbol must have a most covered/hottest
block.
- is a branch target: br->is_target && br->start == addr
- for targets, how much of a branch's coverages comes from it:
target->entry / branch->coverage
- is a branch: br->is_branch && br->end == addr
- for branches, how often it was taken:
br->taken / br->coverage
after all, all execution that didn't take the branch would have
incremented the coverage and continued onward to a later branch.
- for branches, how often it was predicted:
br->pred / br->taken
The coverage percentage is used to color the address and asm sections;
for low (<1%) coverage we use NORMAL (uncolored), indicating that these
instructions are not 'important'. For high coverage (>75%) we color the
address RED.
For each branch, we add an asm comment after the instruction with
information on how often it was taken and predicted.
Output looks like (sans color, which does lose a lot of the
information :/)
$ perf record --branch-filter u,any -e cycles:p ./branches 27
$ perf annotate branches
Percent | Source code & Disassembly of branches for cycles:pu (217 samples)
---------------------------------------------------------------------------------
: branches():
0.00 : 40057a: push %rbp
0.00 : 40057b: mov %rsp,%rbp
0.00 : 40057e: sub $0x20,%rsp
0.00 : 400582: mov %rdi,-0x18(%rbp)
0.00 : 400586: mov %rsi,-0x20(%rbp)
0.00 : 40058a: mov -0x18(%rbp),%rax
0.00 : 40058e: mov %rax,-0x10(%rbp)
0.00 : 400592: movq $0x0,-0x8(%rbp)
0.00 : 40059a: jmpq 400656 <branches+0xdc>
1.84 : 40059f: mov -0x10(%rbp),%rax # +100.00%
3.23 : 4005a3: and $0x1,%eax
1.84 : 4005a6: test %rax,%rax
0.00 : 4005a9: je 4005bf <branches+0x45> # -54.50% (p:42.00%)
0.46 : 4005ab: mov 0x200bbe(%rip),%rax # 601170 <acc>
12.90 : 4005b2: add $0x1,%rax
2.30 : 4005b6: mov %rax,0x200bb3(%rip) # 601170 <acc>
0.46 : 4005bd: jmp 4005d1 <branches+0x57> # -100.00% (p:100.00%)
0.92 : 4005bf: mov 0x200baa(%rip),%rax # 601170 <acc> # +49.54%
13.82 : 4005c6: sub $0x1,%rax
0.46 : 4005ca: mov %rax,0x200b9f(%rip) # 601170 <acc>
2.30 : 4005d1: mov -0x10(%rbp),%rax # +50.46%
0.46 : 4005d5: mov %rax,%rdi
0.46 : 4005d8: callq 400526 <lfsr> # -100.00% (p:100.00%)
0.00 : 4005dd: mov %rax,-0x10(%rbp) # +100.00%
0.92 : 4005e1: mov -0x18(%rbp),%rax
0.00 : 4005e5: and $0x1,%eax
0.00 : 4005e8: test %rax,%rax
0.00 : 4005eb: je 4005ff <branches+0x85> # -100.00% (p:100.00%)
0.00 : 4005ed: mov 0x200b7c(%rip),%rax # 601170 <acc>
0.00 : 4005f4: shr $0x2,%rax
0.00 : 4005f8: mov %rax,0x200b71(%rip) # 601170 <acc>
0.00 : 4005ff: mov -0x10(%rbp),%rax # +100.00%
7.37 : 400603: and $0x1,%eax
3.69 : 400606: test %rax,%rax
0.00 : 400609: jne 400612 <branches+0x98> # -59.25% (p:42.99%)
1.84 : 40060b: mov $0x1,%eax
14.29 : 400610: jmp 400617 <branches+0x9d> # -100.00% (p:100.00%)
1.38 : 400612: mov $0x0,%eax # +57.65%
10.14 : 400617: test %al,%al # +42.35%
0.00 : 400619: je 40062f <branches+0xb5> # -57.65% (p:100.00%)
0.46 : 40061b: mov 0x200b4e(%rip),%rax # 601170 <acc>
2.76 : 400622: sub $0x1,%rax
0.00 : 400626: mov %rax,0x200b43(%rip) # 601170 <acc>
0.46 : 40062d: jmp 400641 <branches+0xc7> # -100.00% (p:100.00%)
0.92 : 40062f: mov 0x200b3a(%rip),%rax # 601170 <acc> # +56.13%
2.30 : 400636: add $0x1,%rax
0.92 : 40063a: mov %rax,0x200b2f(%rip) # 601170 <acc>
0.92 : 400641: mov -0x10(%rbp),%rax # +43.87%
2.30 : 400645: mov %rax,%rdi
0.00 : 400648: callq 400526 <lfsr> # -100.00% (p:100.00%)
0.00 : 40064d: mov %rax,-0x10(%rbp) # +100.00%
1.84 : 400651: addq $0x1,-0x8(%rbp)
0.92 : 400656: mov -0x8(%rbp),%rax
5.07 : 40065a: cmp -0x20(%rbp),%rax
0.00 : 40065e: jb 40059f <branches+0x25> # -100.00% (p:100.00%)
0.00 : 400664: nop
0.00 : 400665: leaveq
0.00 : 400666: retq
(Note: the --branch-filter u,any was used to avoid spurious target and
branch points due to interrupts/faults, they show up as very small -/+
annotations on 'weird' locations)
Committer note:
Please take a look at:
http://vger.kernel.org/~acme/perf/annotate_basic_blocks.png
To see the colors.
Signed-off-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Tested-by: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Alexander Shishkin <alexander.shishkin@linux.intel.com>
Cc: Andi Kleen <andi@firstfloor.org>
Cc: Anshuman Khandual <khandual@linux.vnet.ibm.com>
Cc: David Carrillo-Cisneros <davidcc@google.com>
Cc: Jiri Olsa <jolsa@kernel.org>
Cc: Kan Liang <kan.liang@intel.com>
Cc: Linus Torvalds <torvalds@linux-foundation.org>
Cc: Namhyung Kim <namhyung@kernel.org>
Cc: Stephane Eranian <eranian@google.com>
[ Moved sym->max_coverage to 'struct annotate', aka symbol__annotate(sym) ]
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2016-09-06 03:08:12 +08:00
|
|
|
#include "block-range.h"
|
2014-11-13 10:05:26 +08:00
|
|
|
#include <regex.h>
|
2011-02-08 23:27:39 +08:00
|
|
|
#include <pthread.h>
|
2012-10-28 05:18:29 +08:00
|
|
|
#include <linux/bitops.h>
|
2011-02-04 19:45:46 +08:00
|
|
|
|
2011-09-16 05:31:41 +08:00
|
|
|
const char *disassembler_style;
|
2012-09-04 18:32:30 +08:00
|
|
|
const char *objdump_path;
|
2014-11-13 10:05:26 +08:00
|
|
|
static regex_t file_lineno;
|
2011-09-16 05:31:41 +08:00
|
|
|
|
2012-05-13 00:15:34 +08:00
|
|
|
static struct ins *ins__find(const char *name);
|
|
|
|
static int disasm_line__parse(char *line, char **namep, char **rawp);
|
|
|
|
|
2012-05-13 00:26:20 +08:00
|
|
|
static void ins__delete(struct ins_operands *ops)
|
|
|
|
{
|
2015-03-06 02:27:28 +08:00
|
|
|
if (ops == NULL)
|
|
|
|
return;
|
2013-12-28 03:55:14 +08:00
|
|
|
zfree(&ops->source.raw);
|
|
|
|
zfree(&ops->source.name);
|
|
|
|
zfree(&ops->target.raw);
|
|
|
|
zfree(&ops->target.name);
|
2012-05-13 00:26:20 +08:00
|
|
|
}
|
|
|
|
|
2012-05-08 05:54:16 +08:00
|
|
|
static int ins__raw_scnprintf(struct ins *ins, char *bf, size_t size,
|
|
|
|
struct ins_operands *ops)
|
|
|
|
{
|
|
|
|
return scnprintf(bf, size, "%-6.6s %s", ins->name, ops->raw);
|
|
|
|
}
|
|
|
|
|
|
|
|
int ins__scnprintf(struct ins *ins, char *bf, size_t size,
|
|
|
|
struct ins_operands *ops)
|
|
|
|
{
|
|
|
|
if (ins->ops->scnprintf)
|
|
|
|
return ins->ops->scnprintf(ins, bf, size, ops);
|
|
|
|
|
|
|
|
return ins__raw_scnprintf(ins, bf, size, ops);
|
|
|
|
}
|
|
|
|
|
perf annotate: Resolve 'call' operands to function names
Before this patch the '_raw_spin_lock_irqsave' and 'update_rq_clock' operands
were appearing just as hexadecimal numbers:
update_blocked_averages /proc/kcore
│ push %r12
│ push %rbx
│ and $0xfffffffffffffff0,%rsp
│ sub $0x40,%rsp
│ add -0x662cac00(,%rdi,8),%rax
│ mov %rax,%rbx
│ mov %rax,%rdi
│ mov %rax,0x38(%rsp)
│ → callq _raw_spin_lock_irqsave
│ mov %rbx,%rdi
│ mov %rax,0x30(%rsp)
│ → callq update_rq_clock
│ mov 0x8d0(%rbx),%rax
│ lea 0x8d0(%rbx),%r11
To check that all is right one can always use the 'o' hotkey and see
the original objdump -dS output, that for this case is:
update_blocked_averages /proc/kcore
│ffffffff990d5489: push %r12
│ffffffff990d548b: push %rbx
│ffffffff990d548c: and $0xfffffffffffffff0,%rsp
│ffffffff990d5490: sub $0x40,%rsp
│ffffffff990d5494: add -0x662cac00(,%rdi,8),%rax
│ffffffff990d549c: mov %rax,%rbx
│ffffffff990d549f: mov %rax,%rdi
│ffffffff990d54a2: mov %rax,0x38(%rsp)
│ffffffff990d54a7: → callq 0xffffffff997eb7a0
│ffffffff990d54ac: mov %rbx,%rdi
│ffffffff990d54af: mov %rax,0x30(%rsp)
│ffffffff990d54b4: → callq 0xffffffff990c7720
│ffffffff990d54b9: mov 0x8d0(%rbx),%rax
│ffffffff990d54c0: lea 0x8d0(%rbx),%r11
Use the 'h' hotkey to see a list of available hotkeys.
More work needed to cover operands for other instructions, such as 'mov',
that can resolve variable names, etc.
Cc: Adrian Hunter <adrian.hunter@intel.com>
Cc: Alexander Shishkin <alexander.shishkin@linux.intel.com>
Cc: Chris Riyder <chris.ryder@arm.com>
Cc: David Ahern <dsahern@gmail.com>
Cc: Hemant Kumar <hemant@linux.vnet.ibm.com>
Cc: Jiri Olsa <jolsa@kernel.org>
Cc: Markus Trippelsdorf <markus@trippelsdorf.de>
Cc: Masami Hiramatsu <mhiramat@kernel.org>
Cc: Michael Ellerman <mpe@ellerman.id.au>
Cc: Namhyung Kim <namhyung@kernel.org>
Cc: Naveen N. Rao <naveen.n.rao@linux.vnet.ibm.com>
Cc: Pawel Moll <pawel.moll@arm.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Ravi Bangoria <ravi.bangoria@linux.vnet.ibm.com>
Cc: Russell King <rmk+kernel@arm.linux.org.uk>
Cc: Taeung Song <treeze.taeung@gmail.com>
Cc: Wang Nan <wangnan0@huawei.com>
Link: http://lkml.kernel.org/n/tip-xqgtw9mzmzcjgwkis9kiiv1p@git.kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2016-09-20 04:26:11 +08:00
|
|
|
static int call__parse(struct ins_operands *ops, struct map *map)
|
2012-04-19 03:07:38 +08:00
|
|
|
{
|
2012-04-21 02:26:47 +08:00
|
|
|
char *endptr, *tok, *name;
|
|
|
|
|
2012-04-25 19:00:23 +08:00
|
|
|
ops->target.addr = strtoull(ops->raw, &endptr, 16);
|
2012-04-21 02:26:47 +08:00
|
|
|
|
|
|
|
name = strchr(endptr, '<');
|
|
|
|
if (name == NULL)
|
|
|
|
goto indirect_call;
|
|
|
|
|
|
|
|
name++;
|
|
|
|
|
2015-12-07 07:07:13 +08:00
|
|
|
#ifdef __arm__
|
|
|
|
if (strchr(name, '+'))
|
|
|
|
return -1;
|
|
|
|
#endif
|
|
|
|
|
2012-04-21 02:26:47 +08:00
|
|
|
tok = strchr(name, '>');
|
|
|
|
if (tok == NULL)
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
*tok = '\0';
|
2012-04-25 19:00:23 +08:00
|
|
|
ops->target.name = strdup(name);
|
2012-04-21 02:26:47 +08:00
|
|
|
*tok = '>';
|
|
|
|
|
2012-04-25 19:00:23 +08:00
|
|
|
return ops->target.name == NULL ? -1 : 0;
|
2012-04-21 02:26:47 +08:00
|
|
|
|
|
|
|
indirect_call:
|
2016-08-19 20:59:35 +08:00
|
|
|
tok = strchr(endptr, '*');
|
|
|
|
if (tok == NULL) {
|
perf annotate: Resolve 'call' operands to function names
Before this patch the '_raw_spin_lock_irqsave' and 'update_rq_clock' operands
were appearing just as hexadecimal numbers:
update_blocked_averages /proc/kcore
│ push %r12
│ push %rbx
│ and $0xfffffffffffffff0,%rsp
│ sub $0x40,%rsp
│ add -0x662cac00(,%rdi,8),%rax
│ mov %rax,%rbx
│ mov %rax,%rdi
│ mov %rax,0x38(%rsp)
│ → callq _raw_spin_lock_irqsave
│ mov %rbx,%rdi
│ mov %rax,0x30(%rsp)
│ → callq update_rq_clock
│ mov 0x8d0(%rbx),%rax
│ lea 0x8d0(%rbx),%r11
To check that all is right one can always use the 'o' hotkey and see
the original objdump -dS output, that for this case is:
update_blocked_averages /proc/kcore
│ffffffff990d5489: push %r12
│ffffffff990d548b: push %rbx
│ffffffff990d548c: and $0xfffffffffffffff0,%rsp
│ffffffff990d5490: sub $0x40,%rsp
│ffffffff990d5494: add -0x662cac00(,%rdi,8),%rax
│ffffffff990d549c: mov %rax,%rbx
│ffffffff990d549f: mov %rax,%rdi
│ffffffff990d54a2: mov %rax,0x38(%rsp)
│ffffffff990d54a7: → callq 0xffffffff997eb7a0
│ffffffff990d54ac: mov %rbx,%rdi
│ffffffff990d54af: mov %rax,0x30(%rsp)
│ffffffff990d54b4: → callq 0xffffffff990c7720
│ffffffff990d54b9: mov 0x8d0(%rbx),%rax
│ffffffff990d54c0: lea 0x8d0(%rbx),%r11
Use the 'h' hotkey to see a list of available hotkeys.
More work needed to cover operands for other instructions, such as 'mov',
that can resolve variable names, etc.
Cc: Adrian Hunter <adrian.hunter@intel.com>
Cc: Alexander Shishkin <alexander.shishkin@linux.intel.com>
Cc: Chris Riyder <chris.ryder@arm.com>
Cc: David Ahern <dsahern@gmail.com>
Cc: Hemant Kumar <hemant@linux.vnet.ibm.com>
Cc: Jiri Olsa <jolsa@kernel.org>
Cc: Markus Trippelsdorf <markus@trippelsdorf.de>
Cc: Masami Hiramatsu <mhiramat@kernel.org>
Cc: Michael Ellerman <mpe@ellerman.id.au>
Cc: Namhyung Kim <namhyung@kernel.org>
Cc: Naveen N. Rao <naveen.n.rao@linux.vnet.ibm.com>
Cc: Pawel Moll <pawel.moll@arm.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Ravi Bangoria <ravi.bangoria@linux.vnet.ibm.com>
Cc: Russell King <rmk+kernel@arm.linux.org.uk>
Cc: Taeung Song <treeze.taeung@gmail.com>
Cc: Wang Nan <wangnan0@huawei.com>
Link: http://lkml.kernel.org/n/tip-xqgtw9mzmzcjgwkis9kiiv1p@git.kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2016-09-20 04:26:11 +08:00
|
|
|
struct symbol *sym = map__find_symbol(map, map->map_ip(map, ops->target.addr));
|
|
|
|
if (sym != NULL)
|
|
|
|
ops->target.name = strdup(sym->name);
|
|
|
|
else
|
|
|
|
ops->target.addr = 0;
|
2012-05-11 23:28:55 +08:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2012-04-25 19:00:23 +08:00
|
|
|
ops->target.addr = strtoull(tok + 1, NULL, 16);
|
2012-04-19 03:07:38 +08:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2012-04-21 02:26:47 +08:00
|
|
|
static int call__scnprintf(struct ins *ins, char *bf, size_t size,
|
2012-05-08 05:54:16 +08:00
|
|
|
struct ins_operands *ops)
|
2012-04-21 02:26:47 +08:00
|
|
|
{
|
2012-04-25 19:00:23 +08:00
|
|
|
if (ops->target.name)
|
|
|
|
return scnprintf(bf, size, "%-6.6s %s", ins->name, ops->target.name);
|
2012-04-21 02:26:47 +08:00
|
|
|
|
2012-05-11 23:28:55 +08:00
|
|
|
if (ops->target.addr == 0)
|
|
|
|
return ins__raw_scnprintf(ins, bf, size, ops);
|
|
|
|
|
2012-04-25 19:00:23 +08:00
|
|
|
return scnprintf(bf, size, "%-6.6s *%" PRIx64, ins->name, ops->target.addr);
|
2012-04-21 02:26:47 +08:00
|
|
|
}
|
|
|
|
|
2012-04-19 03:07:38 +08:00
|
|
|
static struct ins_ops call_ops = {
|
2012-04-21 02:26:47 +08:00
|
|
|
.parse = call__parse,
|
|
|
|
.scnprintf = call__scnprintf,
|
2012-04-19 03:07:38 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
bool ins__is_call(const struct ins *ins)
|
|
|
|
{
|
|
|
|
return ins->ops == &call_ops;
|
|
|
|
}
|
|
|
|
|
2016-09-20 04:18:16 +08:00
|
|
|
/*
 * Parse the operand text of a jump instruction (@ops->raw).
 *
 * ops->target.addr is the leading hexadecimal number.  ops->target.offset is
 * the hexadecimal number following the first '+' in the operand, or
 * UINT64_MAX when the operand contains no '+'.
 *
 * The '+' pointer is only advanced after it is known to be non-NULL, so no
 * arithmetic is performed on a null pointer.
 *
 * Always returns 0; @map is unused.
 */
static int jump__parse(struct ins_operands *ops, struct map *map __maybe_unused)
{
	const char *plus = strchr(ops->raw, '+');

	ops->target.addr = strtoull(ops->raw, NULL, 16);

	if (plus != NULL)
		ops->target.offset = strtoull(plus + 1, NULL, 16);
	else
		ops->target.offset = UINT64_MAX;

	return 0;
}
|
|
|
|
|
2012-04-21 01:38:46 +08:00
|
|
|
static int jump__scnprintf(struct ins *ins, char *bf, size_t size,
|
2012-05-08 05:54:16 +08:00
|
|
|
struct ins_operands *ops)
|
2012-04-19 21:16:27 +08:00
|
|
|
{
|
2012-04-25 19:00:23 +08:00
|
|
|
return scnprintf(bf, size, "%-6.6s %" PRIx64, ins->name, ops->target.offset);
|
2012-04-19 21:16:27 +08:00
|
|
|
}
|
|
|
|
|
2012-04-19 00:58:34 +08:00
|
|
|
static struct ins_ops jump_ops = {
|
2012-04-21 01:38:46 +08:00
|
|
|
.parse = jump__parse,
|
|
|
|
.scnprintf = jump__scnprintf,
|
2012-04-19 00:58:34 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
bool ins__is_jump(const struct ins *ins)
|
|
|
|
{
|
|
|
|
return ins->ops == &jump_ops;
|
|
|
|
}
|
|
|
|
|
2012-05-12 03:48:49 +08:00
|
|
|
/*
 * Extract "<hex addr> <name>" from a disassembly comment for an operand.
 *
 * Nothing is done unless the operand text @raw contains "(%rip)".
 * Otherwise *@addrp receives the hexadecimal number at the start of
 * @comment, and, when a "<...>" pair follows, *@namep receives a strdup()ed
 * copy of the text between the brackets.
 *
 * Returns -1 when no '<' follows the number, 0 in every other case
 * (including a missing '>' and a failed strdup()).
 */
static int comment__symbol(char *raw, char *comment, u64 *addrp, char **namep)
{
	char *after_addr, *sym_begin, *sym_end;

	if (!strstr(raw, "(%rip)"))
		return 0;

	*addrp = strtoull(comment, &after_addr, 16);

	sym_begin = strchr(after_addr, '<');
	if (!sym_begin)
		return -1;
	sym_begin++;

	sym_end = strchr(sym_begin, '>');
	if (sym_end) {
		/* Temporarily terminate at '>' so only the name is copied. */
		*sym_end = '\0';
		*namep = strdup(sym_begin);
		*sym_end = '>';
	}

	return 0;
}
|
|
|
|
|
2016-09-20 04:18:16 +08:00
|
|
|
static int lock__parse(struct ins_operands *ops, struct map *map)
|
2012-05-13 00:15:34 +08:00
|
|
|
{
|
|
|
|
char *name;
|
|
|
|
|
|
|
|
ops->locked.ops = zalloc(sizeof(*ops->locked.ops));
|
|
|
|
if (ops->locked.ops == NULL)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
if (disasm_line__parse(ops->raw, &name, &ops->locked.ops->raw) < 0)
|
|
|
|
goto out_free_ops;
|
|
|
|
|
2012-11-10 01:27:13 +08:00
|
|
|
ops->locked.ins = ins__find(name);
|
2015-01-19 03:00:21 +08:00
|
|
|
free(name);
|
|
|
|
|
2012-11-10 01:27:13 +08:00
|
|
|
if (ops->locked.ins == NULL)
|
|
|
|
goto out_free_ops;
|
2012-05-13 00:15:34 +08:00
|
|
|
|
2012-11-10 01:27:13 +08:00
|
|
|
if (!ops->locked.ins->ops)
|
|
|
|
return 0;
|
2012-05-13 00:15:34 +08:00
|
|
|
|
2015-01-19 03:00:20 +08:00
|
|
|
if (ops->locked.ins->ops->parse &&
|
2016-09-20 04:18:16 +08:00
|
|
|
ops->locked.ins->ops->parse(ops->locked.ops, map) < 0)
|
2015-01-19 03:00:20 +08:00
|
|
|
goto out_free_ops;
|
2012-05-13 00:15:34 +08:00
|
|
|
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
out_free_ops:
|
2013-12-27 04:41:15 +08:00
|
|
|
zfree(&ops->locked.ops);
|
2012-05-13 00:15:34 +08:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
static int lock__scnprintf(struct ins *ins, char *bf, size_t size,
|
|
|
|
struct ins_operands *ops)
|
|
|
|
{
|
|
|
|
int printed;
|
|
|
|
|
|
|
|
if (ops->locked.ins == NULL)
|
|
|
|
return ins__raw_scnprintf(ins, bf, size, ops);
|
|
|
|
|
|
|
|
printed = scnprintf(bf, size, "%-6.6s ", ins->name);
|
|
|
|
return printed + ins__scnprintf(ops->locked.ins, bf + printed,
|
|
|
|
size - printed, ops->locked.ops);
|
|
|
|
}
|
|
|
|
|
2012-05-13 00:26:20 +08:00
|
|
|
static void lock__delete(struct ins_operands *ops)
|
|
|
|
{
|
2015-01-19 03:00:21 +08:00
|
|
|
struct ins *ins = ops->locked.ins;
|
|
|
|
|
|
|
|
if (ins && ins->ops->free)
|
|
|
|
ins->ops->free(ops->locked.ops);
|
|
|
|
else
|
|
|
|
ins__delete(ops->locked.ops);
|
|
|
|
|
2013-12-28 03:55:14 +08:00
|
|
|
zfree(&ops->locked.ops);
|
|
|
|
zfree(&ops->target.raw);
|
|
|
|
zfree(&ops->target.name);
|
2012-05-13 00:26:20 +08:00
|
|
|
}
|
|
|
|
|
2012-05-13 00:15:34 +08:00
|
|
|
static struct ins_ops lock_ops = {
|
2012-05-13 00:26:20 +08:00
|
|
|
.free = lock__delete,
|
2012-05-13 00:15:34 +08:00
|
|
|
.parse = lock__parse,
|
|
|
|
.scnprintf = lock__scnprintf,
|
|
|
|
};
|
|
|
|
|
2016-09-20 04:18:16 +08:00
|
|
|
/*
 * Parse a two-operand instruction of the form "source,target [comment]".
 *
 * ops->source.raw receives a copy of the text before the first ','.
 * ops->target.raw receives a copy of the text after it, up to the comment
 * marker ('#', or ';' on __arm__ builds) or the end of the string, with
 * trailing whitespace removed.
 *
 * When a comment is present it is handed to comment__symbol() for both
 * operands.  The comment marker and the whitespace after it are skipped
 * first so that comment__symbol() sees the hexadecimal address at the start
 * of the text; passing the marker itself would make the address parse as 0.
 *
 * Returns 0 on success, -1 when there is no ',' or a strdup() fails (in which
 * case ops->source.raw is not left allocated).  @map is unused.
 */
static int mov__parse(struct ins_operands *ops, struct map *map __maybe_unused)
{
	char *s = strchr(ops->raw, ','), *target, *comment, prev;

	if (s == NULL)
		return -1;

	/* Temporarily cut the string at the comma to copy the source operand. */
	*s = '\0';
	ops->source.raw = strdup(ops->raw);
	*s = ',';

	if (ops->source.raw == NULL)
		return -1;

	target = ++s;
#ifdef __arm__
	comment = strchr(s, ';');
#else
	comment = strchr(s, '#');
#endif

	if (comment != NULL)
		s = comment - 1;
	else
		s = strchr(s, '\0') - 1;

	/* Walk back over trailing whitespace; cast keeps isspace() well defined. */
	while (s > target && isspace((unsigned char)s[0]))
		--s;
	s++;
	prev = *s;
	*s = '\0';

	ops->target.raw = strdup(target);
	*s = prev;

	if (ops->target.raw == NULL)
		goto out_free_source;

	if (comment == NULL)
		return 0;

	/* Step over the comment marker, then any whitespace following it. */
	++comment;
	while (isspace((unsigned char)comment[0]))
		++comment;

	comment__symbol(ops->source.raw, comment, &ops->source.addr, &ops->source.name);
	comment__symbol(ops->target.raw, comment, &ops->target.addr, &ops->target.name);

	return 0;

out_free_source:
	zfree(&ops->source.raw);
	return -1;
}
|
|
|
|
|
|
|
|
static int mov__scnprintf(struct ins *ins, char *bf, size_t size,
|
|
|
|
struct ins_operands *ops)
|
|
|
|
{
|
|
|
|
return scnprintf(bf, size, "%-6.6s %s,%s", ins->name,
|
|
|
|
ops->source.name ?: ops->source.raw,
|
|
|
|
ops->target.name ?: ops->target.raw);
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct ins_ops mov_ops = {
|
|
|
|
.parse = mov__parse,
|
|
|
|
.scnprintf = mov__scnprintf,
|
|
|
|
};
|
|
|
|
|
2016-09-20 04:18:16 +08:00
|
|
|
/*
 * Parse a single-operand instruction of the form "target [# comment]".
 *
 * ops->target.raw receives a copy of the operand text up to the first
 * whitespace character (or the end of the string).
 *
 * When a '#' comment follows, the marker and the whitespace after it are
 * skipped and the remainder is handed to comment__symbol(), so that it sees
 * the hexadecimal address at the start of the text; passing the marker
 * itself would make the address parse as 0.
 *
 * Returns 0 on success, -1 when strdup() fails.  @map is unused.
 */
static int dec__parse(struct ins_operands *ops, struct map *map __maybe_unused)
{
	char *target, *comment, *s, prev;

	target = s = ops->raw;

	/* Cast keeps isspace() well defined for chars with the high bit set. */
	while (s[0] != '\0' && !isspace((unsigned char)s[0]))
		++s;
	prev = *s;
	*s = '\0';

	ops->target.raw = strdup(target);
	*s = prev;

	if (ops->target.raw == NULL)
		return -1;

	comment = strchr(s, '#');
	if (comment == NULL)
		return 0;

	/* Step over the '#' marker, then any whitespace following it. */
	++comment;
	while (isspace((unsigned char)comment[0]))
		++comment;

	comment__symbol(ops->target.raw, comment, &ops->target.addr, &ops->target.name);

	return 0;
}
|
|
|
|
|
|
|
|
static int dec__scnprintf(struct ins *ins, char *bf, size_t size,
|
|
|
|
struct ins_operands *ops)
|
|
|
|
{
|
|
|
|
return scnprintf(bf, size, "%-6.6s %s", ins->name,
|
|
|
|
ops->target.name ?: ops->target.raw);
|
|
|
|
}
|
|
|
|
|
|
|
|
static struct ins_ops dec_ops = {
|
|
|
|
.parse = dec__parse,
|
|
|
|
.scnprintf = dec__scnprintf,
|
|
|
|
};
|
|
|
|
|
2012-09-11 06:15:03 +08:00
|
|
|
/*
 * Format any nop variant as a plain, six-column "nop"; the instruction and
 * its operands are ignored.
 */
static int nop__scnprintf(struct ins *ins __maybe_unused, char *bf, size_t size,
			  struct ins_operands *ops __maybe_unused)
{
	const char *mnemonic = "nop";

	return scnprintf(bf, size, "%-6.6s", mnemonic);
}
|
|
|
|
|
|
|
|
static struct ins_ops nop_ops = {
|
|
|
|
.scnprintf = nop__scnprintf,
|
|
|
|
};
|
|
|
|
|
2016-06-24 19:53:58 +08:00
|
|
|
static struct ins_ops ret_ops = {
|
|
|
|
.scnprintf = ins__raw_scnprintf,
|
|
|
|
};
|
|
|
|
|
|
|
|
bool ins__is_ret(const struct ins *ins)
|
|
|
|
{
|
|
|
|
return ins->ops == &ret_ops;
|
|
|
|
}
|
|
|
|
|
2012-04-19 00:58:34 +08:00
|
|
|
static struct ins instructions[] = {
|
2012-05-12 03:48:49 +08:00
|
|
|
{ .name = "add", .ops = &mov_ops, },
|
|
|
|
{ .name = "addl", .ops = &mov_ops, },
|
|
|
|
{ .name = "addq", .ops = &mov_ops, },
|
|
|
|
{ .name = "addw", .ops = &mov_ops, },
|
|
|
|
{ .name = "and", .ops = &mov_ops, },
|
2015-12-07 07:07:13 +08:00
|
|
|
#ifdef __arm__
|
|
|
|
{ .name = "b", .ops = &jump_ops, }, // might also be a call
|
|
|
|
{ .name = "bcc", .ops = &jump_ops, },
|
|
|
|
{ .name = "bcs", .ops = &jump_ops, },
|
|
|
|
{ .name = "beq", .ops = &jump_ops, },
|
|
|
|
{ .name = "bge", .ops = &jump_ops, },
|
|
|
|
{ .name = "bgt", .ops = &jump_ops, },
|
|
|
|
{ .name = "bhi", .ops = &jump_ops, },
|
|
|
|
{ .name = "bl", .ops = &call_ops, },
|
|
|
|
{ .name = "bls", .ops = &jump_ops, },
|
2016-05-20 00:59:45 +08:00
|
|
|
{ .name = "blt", .ops = &jump_ops, },
|
2015-12-07 07:07:13 +08:00
|
|
|
{ .name = "blx", .ops = &call_ops, },
|
|
|
|
{ .name = "bne", .ops = &jump_ops, },
|
|
|
|
#endif
|
2012-05-13 00:15:34 +08:00
|
|
|
{ .name = "bts", .ops = &mov_ops, },
|
2012-04-19 03:07:38 +08:00
|
|
|
{ .name = "call", .ops = &call_ops, },
|
|
|
|
{ .name = "callq", .ops = &call_ops, },
|
2012-05-12 03:48:49 +08:00
|
|
|
{ .name = "cmp", .ops = &mov_ops, },
|
|
|
|
{ .name = "cmpb", .ops = &mov_ops, },
|
|
|
|
{ .name = "cmpl", .ops = &mov_ops, },
|
|
|
|
{ .name = "cmpq", .ops = &mov_ops, },
|
|
|
|
{ .name = "cmpw", .ops = &mov_ops, },
|
|
|
|
{ .name = "cmpxch", .ops = &mov_ops, },
|
2012-05-12 04:21:09 +08:00
|
|
|
{ .name = "dec", .ops = &dec_ops, },
|
|
|
|
{ .name = "decl", .ops = &dec_ops, },
|
2012-05-12 03:48:49 +08:00
|
|
|
{ .name = "imul", .ops = &mov_ops, },
|
2012-05-12 04:21:09 +08:00
|
|
|
{ .name = "inc", .ops = &dec_ops, },
|
|
|
|
{ .name = "incl", .ops = &dec_ops, },
|
2012-04-19 00:58:34 +08:00
|
|
|
{ .name = "ja", .ops = &jump_ops, },
|
2012-04-20 04:10:12 +08:00
|
|
|
{ .name = "jae", .ops = &jump_ops, },
|
|
|
|
{ .name = "jb", .ops = &jump_ops, },
|
|
|
|
{ .name = "jbe", .ops = &jump_ops, },
|
|
|
|
{ .name = "jc", .ops = &jump_ops, },
|
|
|
|
{ .name = "jcxz", .ops = &jump_ops, },
|
2012-04-19 00:58:34 +08:00
|
|
|
{ .name = "je", .ops = &jump_ops, },
|
2012-04-20 04:10:12 +08:00
|
|
|
{ .name = "jecxz", .ops = &jump_ops, },
|
|
|
|
{ .name = "jg", .ops = &jump_ops, },
|
|
|
|
{ .name = "jge", .ops = &jump_ops, },
|
|
|
|
{ .name = "jl", .ops = &jump_ops, },
|
|
|
|
{ .name = "jle", .ops = &jump_ops, },
|
2012-04-19 00:58:34 +08:00
|
|
|
{ .name = "jmp", .ops = &jump_ops, },
|
|
|
|
{ .name = "jmpq", .ops = &jump_ops, },
|
2012-04-20 04:10:12 +08:00
|
|
|
{ .name = "jna", .ops = &jump_ops, },
|
|
|
|
{ .name = "jnae", .ops = &jump_ops, },
|
|
|
|
{ .name = "jnb", .ops = &jump_ops, },
|
|
|
|
{ .name = "jnbe", .ops = &jump_ops, },
|
|
|
|
{ .name = "jnc", .ops = &jump_ops, },
|
2012-04-19 00:58:34 +08:00
|
|
|
{ .name = "jne", .ops = &jump_ops, },
|
2012-04-20 04:10:12 +08:00
|
|
|
{ .name = "jng", .ops = &jump_ops, },
|
|
|
|
{ .name = "jnge", .ops = &jump_ops, },
|
|
|
|
{ .name = "jnl", .ops = &jump_ops, },
|
|
|
|
{ .name = "jnle", .ops = &jump_ops, },
|
|
|
|
{ .name = "jno", .ops = &jump_ops, },
|
|
|
|
{ .name = "jnp", .ops = &jump_ops, },
|
|
|
|
{ .name = "jns", .ops = &jump_ops, },
|
|
|
|
{ .name = "jnz", .ops = &jump_ops, },
|
|
|
|
{ .name = "jo", .ops = &jump_ops, },
|
|
|
|
{ .name = "jp", .ops = &jump_ops, },
|
|
|
|
{ .name = "jpe", .ops = &jump_ops, },
|
|
|
|
{ .name = "jpo", .ops = &jump_ops, },
|
|
|
|
{ .name = "jrcxz", .ops = &jump_ops, },
|
2012-04-19 00:58:34 +08:00
|
|
|
{ .name = "js", .ops = &jump_ops, },
|
2012-04-20 04:10:12 +08:00
|
|
|
{ .name = "jz", .ops = &jump_ops, },
|
2012-05-12 03:48:49 +08:00
|
|
|
{ .name = "lea", .ops = &mov_ops, },
|
2012-05-13 00:15:34 +08:00
|
|
|
{ .name = "lock", .ops = &lock_ops, },
|
2012-05-12 03:48:49 +08:00
|
|
|
{ .name = "mov", .ops = &mov_ops, },
|
|
|
|
{ .name = "movb", .ops = &mov_ops, },
|
|
|
|
{ .name = "movdqa",.ops = &mov_ops, },
|
|
|
|
{ .name = "movl", .ops = &mov_ops, },
|
|
|
|
{ .name = "movq", .ops = &mov_ops, },
|
|
|
|
{ .name = "movslq", .ops = &mov_ops, },
|
|
|
|
{ .name = "movzbl", .ops = &mov_ops, },
|
|
|
|
{ .name = "movzwl", .ops = &mov_ops, },
|
2012-05-08 05:57:02 +08:00
|
|
|
{ .name = "nop", .ops = &nop_ops, },
|
|
|
|
{ .name = "nopl", .ops = &nop_ops, },
|
|
|
|
{ .name = "nopw", .ops = &nop_ops, },
|
2012-05-12 03:48:49 +08:00
|
|
|
{ .name = "or", .ops = &mov_ops, },
|
|
|
|
{ .name = "orl", .ops = &mov_ops, },
|
|
|
|
{ .name = "test", .ops = &mov_ops, },
|
|
|
|
{ .name = "testb", .ops = &mov_ops, },
|
|
|
|
{ .name = "testl", .ops = &mov_ops, },
|
2012-05-13 00:15:34 +08:00
|
|
|
{ .name = "xadd", .ops = &mov_ops, },
|
2012-10-31 08:34:08 +08:00
|
|
|
{ .name = "xbeginl", .ops = &jump_ops, },
|
|
|
|
{ .name = "xbeginq", .ops = &jump_ops, },
|
2016-06-24 19:53:58 +08:00
|
|
|
{ .name = "retq", .ops = &ret_ops, },
|
2012-04-19 00:58:34 +08:00
|
|
|
};
|
|
|
|
|
2016-05-20 00:59:46 +08:00
|
|
|
static int ins__key_cmp(const void *name, const void *insp)
|
2012-04-19 00:58:34 +08:00
|
|
|
{
|
|
|
|
const struct ins *ins = insp;
|
|
|
|
|
|
|
|
return strcmp(name, ins->name);
|
|
|
|
}
|
|
|
|
|
2016-05-20 00:59:46 +08:00
|
|
|
static int ins__cmp(const void *a, const void *b)
|
|
|
|
{
|
|
|
|
const struct ins *ia = a;
|
|
|
|
const struct ins *ib = b;
|
|
|
|
|
|
|
|
return strcmp(ia->name, ib->name);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void ins__sort(void)
|
|
|
|
{
|
|
|
|
const int nmemb = ARRAY_SIZE(instructions);
|
|
|
|
|
|
|
|
qsort(instructions, nmemb, sizeof(struct ins), ins__cmp);
|
|
|
|
}
|
|
|
|
|
2012-04-19 00:58:34 +08:00
|
|
|
static struct ins *ins__find(const char *name)
|
|
|
|
{
|
|
|
|
const int nmemb = ARRAY_SIZE(instructions);
|
2016-05-20 00:59:46 +08:00
|
|
|
static bool sorted;
|
|
|
|
|
|
|
|
if (!sorted) {
|
|
|
|
ins__sort();
|
|
|
|
sorted = true;
|
|
|
|
}
|
2012-04-19 00:58:34 +08:00
|
|
|
|
2016-05-20 00:59:46 +08:00
|
|
|
return bsearch(name, instructions, nmemb, sizeof(struct ins), ins__key_cmp);
|
2012-04-19 00:58:34 +08:00
|
|
|
}
|
|
|
|
|
2011-11-12 08:17:32 +08:00
|
|
|
int symbol__alloc_hist(struct symbol *sym)
|
2011-02-08 23:27:39 +08:00
|
|
|
{
|
|
|
|
struct annotation *notes = symbol__annotation(sym);
|
2012-04-19 21:57:06 +08:00
|
|
|
const size_t size = symbol__size(sym);
|
2012-07-20 11:05:25 +08:00
|
|
|
size_t sizeof_sym_hist;
|
|
|
|
|
|
|
|
/* Check for overflow when calculating sizeof_sym_hist */
|
|
|
|
if (size > (SIZE_MAX - sizeof(struct sym_hist)) / sizeof(u64))
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
sizeof_sym_hist = (sizeof(struct sym_hist) + size * sizeof(u64));
|
|
|
|
|
|
|
|
/* Check for overflow in zalloc argument */
|
|
|
|
if (sizeof_sym_hist > (SIZE_MAX - sizeof(*notes->src))
|
|
|
|
/ symbol_conf.nr_events)
|
|
|
|
return -1;
|
2011-02-08 23:27:39 +08:00
|
|
|
|
2011-11-12 08:17:32 +08:00
|
|
|
notes->src = zalloc(sizeof(*notes->src) + symbol_conf.nr_events * sizeof_sym_hist);
|
2011-02-08 23:27:39 +08:00
|
|
|
if (notes->src == NULL)
|
|
|
|
return -1;
|
|
|
|
notes->src->sizeof_sym_hist = sizeof_sym_hist;
|
2011-11-12 08:17:32 +08:00
|
|
|
notes->src->nr_histograms = symbol_conf.nr_events;
|
2011-02-08 23:27:39 +08:00
|
|
|
INIT_LIST_HEAD(¬es->src->source);
|
|
|
|
return 0;
|
2011-02-04 19:45:46 +08:00
|
|
|
}
|
|
|
|
|
2015-07-18 23:24:48 +08:00
|
|
|
/* The cycles histogram is lazily allocated. */
|
|
|
|
static int symbol__alloc_hist_cycles(struct symbol *sym)
|
|
|
|
{
|
|
|
|
struct annotation *notes = symbol__annotation(sym);
|
|
|
|
const size_t size = symbol__size(sym);
|
|
|
|
|
|
|
|
notes->src->cycles_hist = calloc(size, sizeof(struct cyc_hist));
|
|
|
|
if (notes->src->cycles_hist == NULL)
|
|
|
|
return -1;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2011-02-07 00:54:44 +08:00
|
|
|
void symbol__annotate_zero_histograms(struct symbol *sym)
|
|
|
|
{
|
|
|
|
struct annotation *notes = symbol__annotation(sym);
|
|
|
|
|
2011-02-08 23:27:39 +08:00
|
|
|
pthread_mutex_lock(¬es->lock);
|
2015-07-18 23:24:48 +08:00
|
|
|
if (notes->src != NULL) {
|
2011-02-08 23:27:39 +08:00
|
|
|
memset(notes->src->histograms, 0,
|
|
|
|
notes->src->nr_histograms * notes->src->sizeof_sym_hist);
|
2015-07-18 23:24:48 +08:00
|
|
|
if (notes->src->cycles_hist)
|
|
|
|
memset(notes->src->cycles_hist, 0,
|
|
|
|
symbol__size(sym) * sizeof(struct cyc_hist));
|
|
|
|
}
|
2011-02-08 23:27:39 +08:00
|
|
|
pthread_mutex_unlock(¬es->lock);
|
2011-02-07 00:54:44 +08:00
|
|
|
}
|
|
|
|
|
2015-07-18 23:24:48 +08:00
|
|
|
static int __symbol__account_cycles(struct annotation *notes,
|
|
|
|
u64 start,
|
|
|
|
unsigned offset, unsigned cycles,
|
|
|
|
unsigned have_start)
|
|
|
|
{
|
|
|
|
struct cyc_hist *ch;
|
|
|
|
|
|
|
|
ch = notes->src->cycles_hist;
|
|
|
|
/*
|
|
|
|
* For now we can only account one basic block per
|
|
|
|
* final jump. But multiple could be overlapping.
|
|
|
|
* Always account the longest one. So when
|
|
|
|
* a shorter one has been already seen throw it away.
|
|
|
|
*
|
|
|
|
* We separately always account the full cycles.
|
|
|
|
*/
|
|
|
|
ch[offset].num_aggr++;
|
|
|
|
ch[offset].cycles_aggr += cycles;
|
|
|
|
|
|
|
|
if (!have_start && ch[offset].have_start)
|
|
|
|
return 0;
|
|
|
|
if (ch[offset].num) {
|
|
|
|
if (have_start && (!ch[offset].have_start ||
|
|
|
|
ch[offset].start > start)) {
|
|
|
|
ch[offset].have_start = 0;
|
|
|
|
ch[offset].cycles = 0;
|
|
|
|
ch[offset].num = 0;
|
|
|
|
if (ch[offset].reset < 0xffff)
|
|
|
|
ch[offset].reset++;
|
|
|
|
} else if (have_start &&
|
|
|
|
ch[offset].start < start)
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
ch[offset].have_start = have_start;
|
|
|
|
ch[offset].start = start;
|
|
|
|
ch[offset].cycles += cycles;
|
|
|
|
ch[offset].num++;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2013-12-19 02:37:41 +08:00
|
|
|
/*
 * Record one sample hit at @addr in the histogram of event @evidx.
 *
 * @map is only used to print the unmapped address in the debug output.
 *
 * Returns 0 on success, -ERANGE when @addr lies outside
 * [sym->start, sym->end).
 */
static int __symbol__inc_addr_samples(struct symbol *sym, struct map *map,
				      struct annotation *notes, int evidx, u64 addr)
{
	struct sym_hist *hist;
	unsigned idx;

	pr_debug3("%s: addr=%#" PRIx64 "\n", __func__, map->unmap_ip(map, addr));

	if (!(addr >= sym->start && addr < sym->end)) {
		pr_debug("%s(%d): ERANGE! sym->name=%s, start=%#" PRIx64 ", addr=%#" PRIx64 ", end=%#" PRIx64 "\n",
			 __func__, __LINE__, sym->name, sym->start, addr, sym->end);
		return -ERANGE;
	}

	/* Histogram buckets are indexed by offset from the symbol start. */
	idx = addr - sym->start;
	hist = annotation__histogram(notes, evidx);
	hist->sum++;
	hist->addr[idx]++;

	pr_debug3("%#" PRIx64 " %s: period++ [addr: %#" PRIx64 ", %#" PRIx64
		  ", evidx=%d] => %" PRIu64 "\n", sym->start, sym->name,
		  addr, addr - sym->start, evidx, hist->addr[idx]);

	return 0;
}
|
|
|
|
|
2015-07-18 23:24:48 +08:00
|
|
|
static struct annotation *symbol__get_annotation(struct symbol *sym, bool cycles)
|
2015-05-28 01:51:46 +08:00
|
|
|
{
|
|
|
|
struct annotation *notes = symbol__annotation(sym);
|
|
|
|
|
|
|
|
if (notes->src == NULL) {
|
|
|
|
if (symbol__alloc_hist(sym) < 0)
|
|
|
|
return NULL;
|
|
|
|
}
|
2015-07-18 23:24:48 +08:00
|
|
|
if (!notes->src->cycles_hist && cycles) {
|
|
|
|
if (symbol__alloc_hist_cycles(sym) < 0)
|
|
|
|
return NULL;
|
|
|
|
}
|
2015-05-28 01:51:46 +08:00
|
|
|
return notes;
|
|
|
|
}
|
|
|
|
|
2013-12-19 04:12:24 +08:00
|
|
|
/*
 * Count a sample at @addr for event @evidx against @sym.
 *
 * A NULL @sym is silently accepted (returns 0). Returns -ENOMEM when the
 * annotation histograms cannot be allocated, otherwise whatever
 * __symbol__inc_addr_samples() returns.
 */
static int symbol__inc_addr_samples(struct symbol *sym, struct map *map,
				    int evidx, u64 addr)
{
	struct annotation *notes;

	if (!sym)
		return 0;

	notes = symbol__get_annotation(sym, false);
	if (!notes)
		return -ENOMEM;

	return __symbol__inc_addr_samples(sym, map, notes, evidx, addr);
}
|
|
|
|
|
2015-07-18 23:24:48 +08:00
|
|
|
/*
 * Account @cycles for the block ending at @addr inside @sym.
 *
 * @start is the block start, or 0 when unknown. A @start at or beyond
 * @addr is treated as unknown as well.
 *
 * Returns 0 for a NULL @sym, -ENOMEM if the annotation cannot be
 * allocated, -ERANGE if @addr or a non-zero @start falls outside
 * [sym->start, sym->end), otherwise the result of
 * __symbol__account_cycles().
 */
static int symbol__account_cycles(u64 addr, u64 start,
				  struct symbol *sym, unsigned cycles)
{
	struct annotation *notes;
	unsigned offset;
	unsigned have_start;
	u64 rel_start = 0;

	if (!sym)
		return 0;

	notes = symbol__get_annotation(sym, true);
	if (!notes)
		return -ENOMEM;

	if (addr < sym->start || addr >= sym->end)
		return -ERANGE;

	if (start != 0) {
		if (start < sym->start || start >= sym->end)
			return -ERANGE;
		/* A start that is not before the end address is unusable. */
		if (start >= addr)
			start = 0;
	}

	have_start = start != 0;
	if (have_start)
		rel_start = start - sym->start;

	/* Both addresses are passed on as offsets from the symbol start. */
	offset = addr - sym->start;

	return __symbol__account_cycles(notes, rel_start, offset, cycles,
					have_start);
}
|
|
|
|
|
|
|
|
int addr_map_symbol__account_cycles(struct addr_map_symbol *ams,
|
|
|
|
struct addr_map_symbol *start,
|
|
|
|
unsigned cycles)
|
|
|
|
{
|
2015-08-14 15:11:34 +08:00
|
|
|
u64 saddr = 0;
|
2015-07-18 23:24:48 +08:00
|
|
|
int err;
|
|
|
|
|
|
|
|
if (!cycles)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Only set start when IPC can be computed. We can only
|
|
|
|
* compute it when the basic block is completely in a single
|
|
|
|
* function.
|
|
|
|
* Special case the case when the jump is elsewhere, but
|
|
|
|
* it starts on the function start.
|
|
|
|
*/
|
|
|
|
if (start &&
|
|
|
|
(start->sym == ams->sym ||
|
|
|
|
(ams->sym &&
|
|
|
|
start->addr == ams->sym->start + ams->map->start)))
|
|
|
|
saddr = start->al_addr;
|
|
|
|
if (saddr == 0)
|
2015-08-14 15:11:34 +08:00
|
|
|
pr_debug2("BB with bad start: addr %"PRIx64" start %"PRIx64" sym %"PRIx64" saddr %"PRIx64"\n",
|
2015-07-18 23:24:48 +08:00
|
|
|
ams->addr,
|
|
|
|
start ? start->addr : 0,
|
|
|
|
ams->sym ? ams->sym->start + ams->map->start : 0,
|
|
|
|
saddr);
|
|
|
|
err = symbol__account_cycles(ams->al_addr, saddr, ams->sym, cycles);
|
|
|
|
if (err)
|
|
|
|
pr_debug2("account_cycles failed %d\n", err);
|
|
|
|
return err;
|
|
|
|
}
|
|
|
|
|
2013-12-19 03:48:29 +08:00
|
|
|
int addr_map_symbol__inc_samples(struct addr_map_symbol *ams, int evidx)
|
|
|
|
{
|
|
|
|
return symbol__inc_addr_samples(ams->sym, ams->map, evidx, ams->al_addr);
|
|
|
|
}
|
|
|
|
|
2013-12-19 04:10:15 +08:00
|
|
|
/*
 * Count one sample for event @evidx at @ip, using the symbol and map of
 * the hist entry @he. Returns symbol__inc_addr_samples()'s result.
 */
int hist_entry__inc_addr_samples(struct hist_entry *he, int evidx, u64 ip)
{
	struct symbol *sym = he->ms.sym;
	struct map *map = he->ms.map;

	return symbol__inc_addr_samples(sym, map, evidx, ip);
}
|
|
|
|
|
2016-09-20 04:18:16 +08:00
|
|
|
static void disasm_line__init_ins(struct disasm_line *dl, struct map *map)
|
2012-04-19 00:58:34 +08:00
|
|
|
{
|
|
|
|
dl->ins = ins__find(dl->name);
|
|
|
|
|
|
|
|
if (dl->ins == NULL)
|
|
|
|
return;
|
|
|
|
|
|
|
|
if (!dl->ins->ops)
|
|
|
|
return;
|
|
|
|
|
2016-09-20 04:18:16 +08:00
|
|
|
if (dl->ins->ops->parse && dl->ins->ops->parse(&dl->ops, map) < 0)
|
2015-01-19 03:00:20 +08:00
|
|
|
dl->ins = NULL;
|
2012-04-19 00:58:34 +08:00
|
|
|
}
|
|
|
|
|
2012-05-13 00:15:34 +08:00
|
|
|
/*
 * Split a disassembly line into instruction name and raw operands.
 *
 * @line:  NUL-terminated, writable text; it is modified temporarily but
 *         is unchanged on return, on success and on failure alike
 * @namep: receives a strdup()ed copy of the first whitespace-delimited
 *         word; the caller owns and frees it. Set to NULL if the copy
 *         cannot be allocated.
 * @rawp:  receives a pointer into @line at the first non-blank character
 *         after the name (or at the terminating NUL if there is none)
 *
 * Returns 0 on success, -1 when @line is empty/blank (outputs untouched)
 * or when the name cannot be duplicated.
 */
static int disasm_line__parse(char *line, char **namep, char **rawp)
{
	char *name = line, tmp;

	/* <ctype.h> classifiers take an unsigned char value, hence the casts. */
	while (isspace((unsigned char)name[0]))
		++name;

	if (name[0] == '\0')
		return -1;

	*rawp = name + 1;

	while ((*rawp)[0] != '\0' && !isspace((unsigned char)(*rawp)[0]))
		++*rawp;

	/* Terminate the name in place just long enough to duplicate it. */
	tmp = (*rawp)[0];
	(*rawp)[0] = '\0';
	*namep = strdup(name);
	(*rawp)[0] = tmp;

	if (*namep == NULL)
		return -1;

	if ((*rawp)[0] != '\0') {
		(*rawp)++;
		while (isspace((unsigned char)(*rawp)[0]))
			++(*rawp);
	}

	return 0;
}
|
|
|
|
|
2014-11-13 10:05:26 +08:00
|
|
|
/*
 * Allocate a disasm_line for @line, followed by @privsize private bytes.
 *
 * @line is duplicated. When @offset is not -1 the copy is additionally
 * split into name and raw operands and the matching instruction is
 * looked up via disasm_line__init_ins().
 *
 * Returns the new line, or NULL on allocation or parse failure.
 */
static struct disasm_line *disasm_line__new(s64 offset, char *line,
					    size_t privsize, int line_nr,
					    struct map *map)
{
	struct disasm_line *dl = zalloc(sizeof(*dl) + privsize);

	if (dl == NULL)
		return NULL;

	dl->offset = offset;
	dl->line = strdup(line);
	dl->line_nr = line_nr;
	if (dl->line == NULL)
		goto out_delete;

	/* Lines with offset -1 are kept as plain text and not parsed. */
	if (offset == -1)
		return dl;

	if (disasm_line__parse(dl->line, &dl->name, &dl->ops.raw) < 0)
		goto out_free_line;

	disasm_line__init_ins(dl, map);

	return dl;

out_free_line:
	zfree(&dl->line);
out_delete:
	free(dl);
	return NULL;
}
|
|
|
|
|
2012-04-16 02:24:39 +08:00
|
|
|
void disasm_line__free(struct disasm_line *dl)
|
2011-02-04 19:45:46 +08:00
|
|
|
{
|
2013-12-28 03:55:14 +08:00
|
|
|
zfree(&dl->line);
|
|
|
|
zfree(&dl->name);
|
2012-05-13 00:26:20 +08:00
|
|
|
if (dl->ins && dl->ins->ops->free)
|
|
|
|
dl->ins->ops->free(&dl->ops);
|
|
|
|
else
|
|
|
|
ins__delete(&dl->ops);
|
2012-04-16 02:24:39 +08:00
|
|
|
free(dl);
|
2011-02-04 19:45:46 +08:00
|
|
|
}
|
|
|
|
|
2012-05-08 05:54:16 +08:00
|
|
|
int disasm_line__scnprintf(struct disasm_line *dl, char *bf, size_t size, bool raw)
|
|
|
|
{
|
|
|
|
if (raw || !dl->ins)
|
|
|
|
return scnprintf(bf, size, "%-6.6s %s", dl->name, dl->ops.raw);
|
|
|
|
|
|
|
|
return ins__scnprintf(dl->ins, bf, size, &dl->ops);
|
|
|
|
}
|
|
|
|
|
2012-04-16 02:24:39 +08:00
|
|
|
static void disasm__add(struct list_head *head, struct disasm_line *line)
|
2011-02-04 19:45:46 +08:00
|
|
|
{
|
|
|
|
list_add_tail(&line->node, head);
|
|
|
|
}
|
|
|
|
|
2012-04-16 02:24:39 +08:00
|
|
|
struct disasm_line *disasm__get_next_ip_line(struct list_head *head, struct disasm_line *pos)
|
2011-02-04 19:45:46 +08:00
|
|
|
{
|
|
|
|
list_for_each_entry_continue(pos, head, node)
|
|
|
|
if (pos->offset >= 0)
|
|
|
|
return pos;
|
|
|
|
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2013-03-05 13:53:30 +08:00
|
|
|
/*
 * Sum the percentage and sample count of event @evidx over the offsets
 * [@offset, @end).
 *
 * @path:       when notes->src->lines is available and *@path is NULL,
 *              it is set to the path of the first source line visited
 * @nr_samples: receives the number of samples found in the range
 *
 * When per-source-line data exists (notes->src->lines) the precomputed
 * per-line percent/nr values are added up. Otherwise the raw histogram
 * is used and the percentage is computed against h->sum; both outputs
 * stay 0 when h->sum is 0.
 *
 * Returns the accumulated percentage.
 */
double disasm__calc_percent(struct annotation *notes, int evidx, s64 offset,
			    s64 end, const char **path, u64 *nr_samples)
{
	struct source_line *src_line = notes->src->lines;
	double percent = 0.0;

	*nr_samples = 0;

	if (src_line) {
		/*
		 * Entries are variable sized: the struct already accounts
		 * for one samples[] element, the other nr_pcnt - 1 follow it.
		 */
		size_t sizeof_src_line = sizeof(*src_line) +
				sizeof(src_line->samples) * (src_line->nr_pcnt - 1);

		while (offset < end) {
			src_line = (void *)notes->src->lines +
					(sizeof_src_line * offset);

			if (*path == NULL)
				*path = src_line->path;

			percent += src_line->samples[evidx].percent;
			*nr_samples += src_line->samples[evidx].nr;
			offset++;
		}
	} else {
		struct sym_hist *h = annotation__histogram(notes, evidx);
		/* Same width as *nr_samples so large hit counts are not truncated. */
		u64 hits = 0;

		while (offset < end)
			hits += h->addr[offset++];

		if (h->sum) {
			*nr_samples = hits;
			percent = 100.0 * hits / h->sum;
		}
	}

	return percent;
}
|
|
|
|
|
perf annotate: Add branch stack / basic block
I wanted to know the hottest path through a function and figured the
branch-stack (LBR) information should be able to help out with that.
The below uses the branch-stack to create basic blocks and generate
statistics from them.
from to branch_i
* ----> *
|
| block
v
* ----> *
from to branch_i+1
The blocks are broken down into non-overlapping ranges, while tracking
if the start of each range is an entry point and/or the end of a range
is a branch.
Each block iterates all ranges it covers (while splitting where required
to exactly match the block) and increments the 'coverage' count.
For the range including the branch we increment the taken counter, as
well as the pred counter if flags.predicted.
Using these numbers we can find if an instruction:
- had coverage; given by:
br->coverage / br->sym->max_coverage
This metric ensures each symbol has a 100% spot, which reflects the
observation that each symbol must have a most covered/hottest
block.
- is a branch target: br->is_target && br->start == addr
- for targets, how much of a branch's coverages comes from it:
target->entry / branch->coverage
- is a branch: br->is_branch && br->end == addr
- for branches, how often it was taken:
br->taken / br->coverage
after all, all execution that didn't take the branch would have
incremented the coverage and continued onward to a later branch.
- for branches, how often it was predicted:
br->pred / br->taken
The coverage percentage is used to color the address and asm sections;
for low (<1%) coverage we use NORMAL (uncolored), indicating that these
instructions are not 'important'. For high coverage (>75%) we color the
address RED.
For each branch, we add an asm comment after the instruction with
information on how often it was taken and predicted.
Output looks like (sans color, which does lose a lot of the
information :/)
$ perf record --branch-filter u,any -e cycles:p ./branches 27
$ perf annotate branches
Percent | Source code & Disassembly of branches for cycles:pu (217 samples)
---------------------------------------------------------------------------------
: branches():
0.00 : 40057a: push %rbp
0.00 : 40057b: mov %rsp,%rbp
0.00 : 40057e: sub $0x20,%rsp
0.00 : 400582: mov %rdi,-0x18(%rbp)
0.00 : 400586: mov %rsi,-0x20(%rbp)
0.00 : 40058a: mov -0x18(%rbp),%rax
0.00 : 40058e: mov %rax,-0x10(%rbp)
0.00 : 400592: movq $0x0,-0x8(%rbp)
0.00 : 40059a: jmpq 400656 <branches+0xdc>
1.84 : 40059f: mov -0x10(%rbp),%rax # +100.00%
3.23 : 4005a3: and $0x1,%eax
1.84 : 4005a6: test %rax,%rax
0.00 : 4005a9: je 4005bf <branches+0x45> # -54.50% (p:42.00%)
0.46 : 4005ab: mov 0x200bbe(%rip),%rax # 601170 <acc>
12.90 : 4005b2: add $0x1,%rax
2.30 : 4005b6: mov %rax,0x200bb3(%rip) # 601170 <acc>
0.46 : 4005bd: jmp 4005d1 <branches+0x57> # -100.00% (p:100.00%)
0.92 : 4005bf: mov 0x200baa(%rip),%rax # 601170 <acc> # +49.54%
13.82 : 4005c6: sub $0x1,%rax
0.46 : 4005ca: mov %rax,0x200b9f(%rip) # 601170 <acc>
2.30 : 4005d1: mov -0x10(%rbp),%rax # +50.46%
0.46 : 4005d5: mov %rax,%rdi
0.46 : 4005d8: callq 400526 <lfsr> # -100.00% (p:100.00%)
0.00 : 4005dd: mov %rax,-0x10(%rbp) # +100.00%
0.92 : 4005e1: mov -0x18(%rbp),%rax
0.00 : 4005e5: and $0x1,%eax
0.00 : 4005e8: test %rax,%rax
0.00 : 4005eb: je 4005ff <branches+0x85> # -100.00% (p:100.00%)
0.00 : 4005ed: mov 0x200b7c(%rip),%rax # 601170 <acc>
0.00 : 4005f4: shr $0x2,%rax
0.00 : 4005f8: mov %rax,0x200b71(%rip) # 601170 <acc>
0.00 : 4005ff: mov -0x10(%rbp),%rax # +100.00%
7.37 : 400603: and $0x1,%eax
3.69 : 400606: test %rax,%rax
0.00 : 400609: jne 400612 <branches+0x98> # -59.25% (p:42.99%)
1.84 : 40060b: mov $0x1,%eax
14.29 : 400610: jmp 400617 <branches+0x9d> # -100.00% (p:100.00%)
1.38 : 400612: mov $0x0,%eax # +57.65%
10.14 : 400617: test %al,%al # +42.35%
0.00 : 400619: je 40062f <branches+0xb5> # -57.65% (p:100.00%)
0.46 : 40061b: mov 0x200b4e(%rip),%rax # 601170 <acc>
2.76 : 400622: sub $0x1,%rax
0.00 : 400626: mov %rax,0x200b43(%rip) # 601170 <acc>
0.46 : 40062d: jmp 400641 <branches+0xc7> # -100.00% (p:100.00%)
0.92 : 40062f: mov 0x200b3a(%rip),%rax # 601170 <acc> # +56.13%
2.30 : 400636: add $0x1,%rax
0.92 : 40063a: mov %rax,0x200b2f(%rip) # 601170 <acc>
0.92 : 400641: mov -0x10(%rbp),%rax # +43.87%
2.30 : 400645: mov %rax,%rdi
0.00 : 400648: callq 400526 <lfsr> # -100.00% (p:100.00%)
0.00 : 40064d: mov %rax,-0x10(%rbp) # +100.00%
1.84 : 400651: addq $0x1,-0x8(%rbp)
0.92 : 400656: mov -0x8(%rbp),%rax
5.07 : 40065a: cmp -0x20(%rbp),%rax
0.00 : 40065e: jb 40059f <branches+0x25> # -100.00% (p:100.00%)
0.00 : 400664: nop
0.00 : 400665: leaveq
0.00 : 400666: retq
(Note: the --branch-filter u,any was used to avoid spurious target and
branch points due to interrupts/faults, they show up as very small -/+
annotations on 'weird' locations)
Committer note:
Please take a look at:
http://vger.kernel.org/~acme/perf/annotate_basic_blocks.png
To see the colors.
Signed-off-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Tested-by: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Alexander Shishkin <alexander.shishkin@linux.intel.com>
Cc: Andi Kleen <andi@firstfloor.org>
Cc: Anshuman Khandual <khandual@linux.vnet.ibm.com>
Cc: David Carrillo-Cisneros <davidcc@google.com>
Cc: Jiri Olsa <jolsa@kernel.org>
Cc: Kan Liang <kan.liang@intel.com>
Cc: Linus Torvalds <torvalds@linux-foundation.org>
Cc: Namhyung Kim <namhyung@kernel.org>
Cc: Stephane Eranian <eranian@google.com>
[ Moved sym->max_coverage to 'struct annotate', aka symbol__annotate(sym) ]
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2016-09-06 03:08:12 +08:00
|
|
|
static const char *annotate__address_color(struct block_range *br)
|
|
|
|
{
|
|
|
|
double cov = block_range__coverage(br);
|
|
|
|
|
|
|
|
if (cov >= 0) {
|
|
|
|
/* mark red for >75% coverage */
|
|
|
|
if (cov > 0.75)
|
|
|
|
return PERF_COLOR_RED;
|
|
|
|
|
|
|
|
/* mark dull for <1% coverage */
|
|
|
|
if (cov < 0.01)
|
|
|
|
return PERF_COLOR_NORMAL;
|
|
|
|
}
|
|
|
|
|
|
|
|
return PERF_COLOR_MAGENTA;
|
|
|
|
}
|
|
|
|
|
|
|
|
static const char *annotate__asm_color(struct block_range *br)
|
|
|
|
{
|
|
|
|
double cov = block_range__coverage(br);
|
|
|
|
|
|
|
|
if (cov >= 0) {
|
|
|
|
/* mark dull for <1% coverage */
|
|
|
|
if (cov < 0.01)
|
|
|
|
return PERF_COLOR_NORMAL;
|
|
|
|
}
|
|
|
|
|
|
|
|
return PERF_COLOR_BLUE;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * Print the branch annotations for the instruction at @addr as a
 * trailing "\t# ..." comment on stdout.
 *
 *  " +P%"        when @addr is the start of a branch-target range: the
 *                share of the following branch's coverage entering here
 *  " -P% (p:Q%)" when @addr is the end of a branch range: how often the
 *                branch was taken and how often that was predicted
 *
 * Values of 0.1% or less are not printed. Nothing is printed for a
 * NULL @br.
 */
static void annotate__branch_printf(struct block_range *br, u64 addr)
{
	bool need_prefix = true;

	if (br == NULL)
		return;

	if (br->is_target && br->start == addr) {
		struct block_range *branch;
		double entry_pct;

		/* Walk forward to the range that ends in the matching branch. */
		for (branch = br; !branch->is_branch;
		     branch = block_range__next(branch))
			;

		entry_pct = 100 *(double)br->entry / branch->coverage;

		if (entry_pct > 0.1) {
			if (need_prefix) {
				need_prefix = false;
				printf("\t#");
			}

			/* Coverage joining at this target, relative to the next branch. */
			printf(" +%.2f%%", entry_pct);
		}
	}

	if (br->is_branch && br->end == addr) {
		double taken_pct = 100*(double)br->taken / br->coverage;

		if (taken_pct > 0.1) {
			if (need_prefix) {
				need_prefix = false;
				printf("\t#");
			}

			/* Coverage leaving at this branch, and its prediction ratio. */
			printf(" -%.2f%% (p:%.2f%%)", taken_pct, 100*(double)br->pred / br->taken);
		}
	}
}
|
|
|
|
|
|
|
|
|
2012-04-16 02:24:39 +08:00
|
|
|
static int disasm_line__print(struct disasm_line *dl, struct symbol *sym, u64 start,
|
2013-03-05 13:53:21 +08:00
|
|
|
struct perf_evsel *evsel, u64 len, int min_pcnt, int printed,
|
2012-04-16 02:24:39 +08:00
|
|
|
int max_lines, struct disasm_line *queue)
|
2011-02-04 19:45:46 +08:00
|
|
|
{
|
|
|
|
static const char *prev_line;
|
|
|
|
static const char *prev_color;
|
|
|
|
|
2012-04-16 02:24:39 +08:00
|
|
|
if (dl->offset != -1) {
|
2011-02-04 19:45:46 +08:00
|
|
|
const char *path = NULL;
|
2015-06-20 03:10:43 +08:00
|
|
|
u64 nr_samples;
|
perf annotate: Add basic support to event group view
Add --group option to enable event grouping. When enabled, all the
group members information will be shown with the leader so skip
non-leader events.
It only supports --stdio output currently. Later patches will extend
additional features.
$ perf annotate --group --stdio
...
Percent | Source code & Disassembly of libpthread-2.15.so
--------------------------------------------------------------------------------
:
:
:
: Disassembly of section .text:
:
: 000000387dc0aa50 <__pthread_mutex_unlock_usercnt>:
8.08 2.40 5.29 : 387dc0aa50: mov %rdi,%rdx
0.00 0.00 0.00 : 387dc0aa53: mov 0x10(%rdi),%edi
0.00 0.00 0.00 : 387dc0aa56: mov %edi,%eax
0.00 0.80 0.00 : 387dc0aa58: and $0x7f,%eax
3.03 2.40 3.53 : 387dc0aa5b: test $0x7c,%dil
0.00 0.00 0.00 : 387dc0aa5f: jne 387dc0aaa9 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa61: test %eax,%eax
0.00 0.00 0.00 : 387dc0aa63: jne 387dc0aa85 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa65: and $0x80,%edi
0.00 0.00 0.00 : 387dc0aa6b: test %esi,%esi
3.03 5.60 7.06 : 387dc0aa6d: movl $0x0,0x8(%rdx)
0.00 0.00 0.59 : 387dc0aa74: je 387dc0aa7a <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa76: subl $0x1,0xc(%rdx)
2.02 5.60 1.18 : 387dc0aa7a: mov %edi,%esi
0.00 0.00 0.00 : 387dc0aa7c: lock decl (%rdx)
83.84 83.20 82.35 : 387dc0aa7f: jne 387dc0aada <_L_unlock_586>
0.00 0.00 0.00 : 387dc0aa81: nop
0.00 0.00 0.00 : 387dc0aa82: xor %eax,%eax
0.00 0.00 0.00 : 387dc0aa84: retq
...
Signed-off-by: Namhyung Kim <namhyung@kernel.org>
Cc: Andi Kleen <andi@firstfloor.org>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Pekka Enberg <penberg@kernel.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Link: http://lkml.kernel.org/r/1362462812-30885-6-git-send-email-namhyung@kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2013-03-05 13:53:25 +08:00
|
|
|
double percent, max_percent = 0.0;
|
|
|
|
double *ppercents = &percent;
|
2015-06-20 03:10:43 +08:00
|
|
|
u64 *psamples = &nr_samples;
|
perf annotate: Add basic support to event group view
Add --group option to enable event grouping. When enabled, all the
group members information will be shown with the leader so skip
non-leader events.
It only supports --stdio output currently. Later patches will extend
additional features.
$ perf annotate --group --stdio
...
Percent | Source code & Disassembly of libpthread-2.15.so
--------------------------------------------------------------------------------
:
:
:
: Disassembly of section .text:
:
: 000000387dc0aa50 <__pthread_mutex_unlock_usercnt>:
8.08 2.40 5.29 : 387dc0aa50: mov %rdi,%rdx
0.00 0.00 0.00 : 387dc0aa53: mov 0x10(%rdi),%edi
0.00 0.00 0.00 : 387dc0aa56: mov %edi,%eax
0.00 0.80 0.00 : 387dc0aa58: and $0x7f,%eax
3.03 2.40 3.53 : 387dc0aa5b: test $0x7c,%dil
0.00 0.00 0.00 : 387dc0aa5f: jne 387dc0aaa9 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa61: test %eax,%eax
0.00 0.00 0.00 : 387dc0aa63: jne 387dc0aa85 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa65: and $0x80,%edi
0.00 0.00 0.00 : 387dc0aa6b: test %esi,%esi
3.03 5.60 7.06 : 387dc0aa6d: movl $0x0,0x8(%rdx)
0.00 0.00 0.59 : 387dc0aa74: je 387dc0aa7a <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa76: subl $0x1,0xc(%rdx)
2.02 5.60 1.18 : 387dc0aa7a: mov %edi,%esi
0.00 0.00 0.00 : 387dc0aa7c: lock decl (%rdx)
83.84 83.20 82.35 : 387dc0aa7f: jne 387dc0aada <_L_unlock_586>
0.00 0.00 0.00 : 387dc0aa81: nop
0.00 0.00 0.00 : 387dc0aa82: xor %eax,%eax
0.00 0.00 0.00 : 387dc0aa84: retq
...
Signed-off-by: Namhyung Kim <namhyung@kernel.org>
Cc: Andi Kleen <andi@firstfloor.org>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Pekka Enberg <penberg@kernel.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Link: http://lkml.kernel.org/r/1362462812-30885-6-git-send-email-namhyung@kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2013-03-05 13:53:25 +08:00
|
|
|
int i, nr_percent = 1;
|
2011-02-04 19:45:46 +08:00
|
|
|
const char *color;
|
|
|
|
struct annotation *notes = symbol__annotation(sym);
|
2012-04-16 02:24:39 +08:00
|
|
|
s64 offset = dl->offset;
|
2012-04-02 23:59:01 +08:00
|
|
|
const u64 addr = start + offset;
|
2012-04-16 02:24:39 +08:00
|
|
|
struct disasm_line *next;
|
perf annotate: Add branch stack / basic block
I wanted to know the hottest path through a function and figured the
branch-stack (LBR) information should be able to help out with that.
The below uses the branch-stack to create basic blocks and generate
statistics from them.
from to branch_i
* ----> *
|
| block
v
* ----> *
from to branch_i+1
The blocks are broken down into non-overlapping ranges, while tracking
if the start of each range is an entry point and/or the end of a range
is a branch.
Each block iterates all ranges it covers (while splitting where required
to exactly match the block) and increments the 'coverage' count.
For the range including the branch we increment the taken counter, as
well as the pred counter if flags.predicted.
Using these numbers we can find if an instruction:
- had coverage; given by:
br->coverage / br->sym->max_coverage
This metric ensures each symbol has a 100% spot, which reflects the
observation that each symbol must have a most covered/hottest
block.
- is a branch target: br->is_target && br->start == addr
- for targets, how much of a branch's coverages comes from it:
target->entry / branch->coverage
- is a branch: br->is_branch && br->end == addr
- for branches, how often it was taken:
br->taken / br->coverage
after all, all execution that didn't take the branch would have
incremented the coverage and continued onward to a later branch.
- for branches, how often it was predicted:
br->pred / br->taken
The coverage percentage is used to color the address and asm sections;
for low (<1%) coverage we use NORMAL (uncolored), indicating that these
instructions are not 'important'. For high coverage (>75%) we color the
address RED.
For each branch, we add an asm comment after the instruction with
information on how often it was taken and predicted.
Output looks like (sans color, which does lose a lot of the
information :/)
$ perf record --branch-filter u,any -e cycles:p ./branches 27
$ perf annotate branches
Percent | Source code & Disassembly of branches for cycles:pu (217 samples)
---------------------------------------------------------------------------------
: branches():
0.00 : 40057a: push %rbp
0.00 : 40057b: mov %rsp,%rbp
0.00 : 40057e: sub $0x20,%rsp
0.00 : 400582: mov %rdi,-0x18(%rbp)
0.00 : 400586: mov %rsi,-0x20(%rbp)
0.00 : 40058a: mov -0x18(%rbp),%rax
0.00 : 40058e: mov %rax,-0x10(%rbp)
0.00 : 400592: movq $0x0,-0x8(%rbp)
0.00 : 40059a: jmpq 400656 <branches+0xdc>
1.84 : 40059f: mov -0x10(%rbp),%rax # +100.00%
3.23 : 4005a3: and $0x1,%eax
1.84 : 4005a6: test %rax,%rax
0.00 : 4005a9: je 4005bf <branches+0x45> # -54.50% (p:42.00%)
0.46 : 4005ab: mov 0x200bbe(%rip),%rax # 601170 <acc>
12.90 : 4005b2: add $0x1,%rax
2.30 : 4005b6: mov %rax,0x200bb3(%rip) # 601170 <acc>
0.46 : 4005bd: jmp 4005d1 <branches+0x57> # -100.00% (p:100.00%)
0.92 : 4005bf: mov 0x200baa(%rip),%rax # 601170 <acc> # +49.54%
13.82 : 4005c6: sub $0x1,%rax
0.46 : 4005ca: mov %rax,0x200b9f(%rip) # 601170 <acc>
2.30 : 4005d1: mov -0x10(%rbp),%rax # +50.46%
0.46 : 4005d5: mov %rax,%rdi
0.46 : 4005d8: callq 400526 <lfsr> # -100.00% (p:100.00%)
0.00 : 4005dd: mov %rax,-0x10(%rbp) # +100.00%
0.92 : 4005e1: mov -0x18(%rbp),%rax
0.00 : 4005e5: and $0x1,%eax
0.00 : 4005e8: test %rax,%rax
0.00 : 4005eb: je 4005ff <branches+0x85> # -100.00% (p:100.00%)
0.00 : 4005ed: mov 0x200b7c(%rip),%rax # 601170 <acc>
0.00 : 4005f4: shr $0x2,%rax
0.00 : 4005f8: mov %rax,0x200b71(%rip) # 601170 <acc>
0.00 : 4005ff: mov -0x10(%rbp),%rax # +100.00%
7.37 : 400603: and $0x1,%eax
3.69 : 400606: test %rax,%rax
0.00 : 400609: jne 400612 <branches+0x98> # -59.25% (p:42.99%)
1.84 : 40060b: mov $0x1,%eax
14.29 : 400610: jmp 400617 <branches+0x9d> # -100.00% (p:100.00%)
1.38 : 400612: mov $0x0,%eax # +57.65%
10.14 : 400617: test %al,%al # +42.35%
0.00 : 400619: je 40062f <branches+0xb5> # -57.65% (p:100.00%)
0.46 : 40061b: mov 0x200b4e(%rip),%rax # 601170 <acc>
2.76 : 400622: sub $0x1,%rax
0.00 : 400626: mov %rax,0x200b43(%rip) # 601170 <acc>
0.46 : 40062d: jmp 400641 <branches+0xc7> # -100.00% (p:100.00%)
0.92 : 40062f: mov 0x200b3a(%rip),%rax # 601170 <acc> # +56.13%
2.30 : 400636: add $0x1,%rax
0.92 : 40063a: mov %rax,0x200b2f(%rip) # 601170 <acc>
0.92 : 400641: mov -0x10(%rbp),%rax # +43.87%
2.30 : 400645: mov %rax,%rdi
0.00 : 400648: callq 400526 <lfsr> # -100.00% (p:100.00%)
0.00 : 40064d: mov %rax,-0x10(%rbp) # +100.00%
1.84 : 400651: addq $0x1,-0x8(%rbp)
0.92 : 400656: mov -0x8(%rbp),%rax
5.07 : 40065a: cmp -0x20(%rbp),%rax
0.00 : 40065e: jb 40059f <branches+0x25> # -100.00% (p:100.00%)
0.00 : 400664: nop
0.00 : 400665: leaveq
0.00 : 400666: retq
(Note: the --branch-filter u,any was used to avoid spurious target and
branch points due to interrupts/faults, they show up as very small -/+
annotations on 'weird' locations)
Committer note:
Please take a look at:
http://vger.kernel.org/~acme/perf/annotate_basic_blocks.png
To see the colors.
Signed-off-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Tested-by: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Alexander Shishkin <alexander.shishkin@linux.intel.com>
Cc: Andi Kleen <andi@firstfloor.org>
Cc: Anshuman Khandual <khandual@linux.vnet.ibm.com>
Cc: David Carrillo-Cisneros <davidcc@google.com>
Cc: Jiri Olsa <jolsa@kernel.org>
Cc: Kan Liang <kan.liang@intel.com>
Cc: Linus Torvalds <torvalds@linux-foundation.org>
Cc: Namhyung Kim <namhyung@kernel.org>
Cc: Stephane Eranian <eranian@google.com>
[ Moved sym->max_coverage to 'struct annotate', aka symbol__annotate(sym) ]
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2016-09-06 03:08:12 +08:00
|
|
|
struct block_range *br;
|
2011-02-08 23:27:39 +08:00
|
|
|
|
2012-04-16 02:24:39 +08:00
|
|
|
next = disasm__get_next_ip_line(&notes->src->source, dl);
|
2011-02-04 19:45:46 +08:00
|
|
|
|
2013-03-05 13:53:26 +08:00
|
|
|
if (perf_evsel__is_group_event(evsel)) {
|
perf annotate: Add basic support to event group view
Add --group option to enable event grouping. When enabled, all the
group members information will be shown with the leader so skip
non-leader events.
It only supports --stdio output currently. Later patches will extend
additional features.
$ perf annotate --group --stdio
...
Percent | Source code & Disassembly of libpthread-2.15.so
--------------------------------------------------------------------------------
:
:
:
: Disassembly of section .text:
:
: 000000387dc0aa50 <__pthread_mutex_unlock_usercnt>:
8.08 2.40 5.29 : 387dc0aa50: mov %rdi,%rdx
0.00 0.00 0.00 : 387dc0aa53: mov 0x10(%rdi),%edi
0.00 0.00 0.00 : 387dc0aa56: mov %edi,%eax
0.00 0.80 0.00 : 387dc0aa58: and $0x7f,%eax
3.03 2.40 3.53 : 387dc0aa5b: test $0x7c,%dil
0.00 0.00 0.00 : 387dc0aa5f: jne 387dc0aaa9 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa61: test %eax,%eax
0.00 0.00 0.00 : 387dc0aa63: jne 387dc0aa85 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa65: and $0x80,%edi
0.00 0.00 0.00 : 387dc0aa6b: test %esi,%esi
3.03 5.60 7.06 : 387dc0aa6d: movl $0x0,0x8(%rdx)
0.00 0.00 0.59 : 387dc0aa74: je 387dc0aa7a <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa76: subl $0x1,0xc(%rdx)
2.02 5.60 1.18 : 387dc0aa7a: mov %edi,%esi
0.00 0.00 0.00 : 387dc0aa7c: lock decl (%rdx)
83.84 83.20 82.35 : 387dc0aa7f: jne 387dc0aada <_L_unlock_586>
0.00 0.00 0.00 : 387dc0aa81: nop
0.00 0.00 0.00 : 387dc0aa82: xor %eax,%eax
0.00 0.00 0.00 : 387dc0aa84: retq
...
Signed-off-by: Namhyung Kim <namhyung@kernel.org>
Cc: Andi Kleen <andi@firstfloor.org>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Pekka Enberg <penberg@kernel.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Link: http://lkml.kernel.org/r/1362462812-30885-6-git-send-email-namhyung@kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2013-03-05 13:53:25 +08:00
|
|
|
nr_percent = evsel->nr_members;
|
|
|
|
ppercents = calloc(nr_percent, sizeof(double));
|
2015-06-20 03:10:43 +08:00
|
|
|
psamples = calloc(nr_percent, sizeof(u64));
|
|
|
|
if (ppercents == NULL || psamples == NULL) {
|
perf annotate: Add basic support to event group view
Add --group option to enable event grouping. When enabled, all the
group members information will be shown with the leader so skip
non-leader events.
It only supports --stdio output currently. Later patches will extend
additional features.
$ perf annotate --group --stdio
...
Percent | Source code & Disassembly of libpthread-2.15.so
--------------------------------------------------------------------------------
:
:
:
: Disassembly of section .text:
:
: 000000387dc0aa50 <__pthread_mutex_unlock_usercnt>:
8.08 2.40 5.29 : 387dc0aa50: mov %rdi,%rdx
0.00 0.00 0.00 : 387dc0aa53: mov 0x10(%rdi),%edi
0.00 0.00 0.00 : 387dc0aa56: mov %edi,%eax
0.00 0.80 0.00 : 387dc0aa58: and $0x7f,%eax
3.03 2.40 3.53 : 387dc0aa5b: test $0x7c,%dil
0.00 0.00 0.00 : 387dc0aa5f: jne 387dc0aaa9 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa61: test %eax,%eax
0.00 0.00 0.00 : 387dc0aa63: jne 387dc0aa85 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa65: and $0x80,%edi
0.00 0.00 0.00 : 387dc0aa6b: test %esi,%esi
3.03 5.60 7.06 : 387dc0aa6d: movl $0x0,0x8(%rdx)
0.00 0.00 0.59 : 387dc0aa74: je 387dc0aa7a <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa76: subl $0x1,0xc(%rdx)
2.02 5.60 1.18 : 387dc0aa7a: mov %edi,%esi
0.00 0.00 0.00 : 387dc0aa7c: lock decl (%rdx)
83.84 83.20 82.35 : 387dc0aa7f: jne 387dc0aada <_L_unlock_586>
0.00 0.00 0.00 : 387dc0aa81: nop
0.00 0.00 0.00 : 387dc0aa82: xor %eax,%eax
0.00 0.00 0.00 : 387dc0aa84: retq
...
Signed-off-by: Namhyung Kim <namhyung@kernel.org>
Cc: Andi Kleen <andi@firstfloor.org>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Pekka Enberg <penberg@kernel.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Link: http://lkml.kernel.org/r/1362462812-30885-6-git-send-email-namhyung@kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2013-03-05 13:53:25 +08:00
|
|
|
return -1;
|
2015-06-20 03:10:43 +08:00
|
|
|
}
|
perf annotate: Add basic support to event group view
Add --group option to enable event grouping. When enabled, all the
group members information will be shown with the leader so skip
non-leader events.
It only supports --stdio output currently. Later patches will extend
additional features.
$ perf annotate --group --stdio
...
Percent | Source code & Disassembly of libpthread-2.15.so
--------------------------------------------------------------------------------
:
:
:
: Disassembly of section .text:
:
: 000000387dc0aa50 <__pthread_mutex_unlock_usercnt>:
8.08 2.40 5.29 : 387dc0aa50: mov %rdi,%rdx
0.00 0.00 0.00 : 387dc0aa53: mov 0x10(%rdi),%edi
0.00 0.00 0.00 : 387dc0aa56: mov %edi,%eax
0.00 0.80 0.00 : 387dc0aa58: and $0x7f,%eax
3.03 2.40 3.53 : 387dc0aa5b: test $0x7c,%dil
0.00 0.00 0.00 : 387dc0aa5f: jne 387dc0aaa9 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa61: test %eax,%eax
0.00 0.00 0.00 : 387dc0aa63: jne 387dc0aa85 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa65: and $0x80,%edi
0.00 0.00 0.00 : 387dc0aa6b: test %esi,%esi
3.03 5.60 7.06 : 387dc0aa6d: movl $0x0,0x8(%rdx)
0.00 0.00 0.59 : 387dc0aa74: je 387dc0aa7a <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa76: subl $0x1,0xc(%rdx)
2.02 5.60 1.18 : 387dc0aa7a: mov %edi,%esi
0.00 0.00 0.00 : 387dc0aa7c: lock decl (%rdx)
83.84 83.20 82.35 : 387dc0aa7f: jne 387dc0aada <_L_unlock_586>
0.00 0.00 0.00 : 387dc0aa81: nop
0.00 0.00 0.00 : 387dc0aa82: xor %eax,%eax
0.00 0.00 0.00 : 387dc0aa84: retq
...
Signed-off-by: Namhyung Kim <namhyung@kernel.org>
Cc: Andi Kleen <andi@firstfloor.org>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Pekka Enberg <penberg@kernel.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Link: http://lkml.kernel.org/r/1362462812-30885-6-git-send-email-namhyung@kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2013-03-05 13:53:25 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
for (i = 0; i < nr_percent; i++) {
|
|
|
|
percent = disasm__calc_percent(notes,
|
2013-03-05 13:53:28 +08:00
|
|
|
notes->src->lines ? i : evsel->idx + i,
|
|
|
|
offset,
|
|
|
|
next ? next->offset : (s64) len,
|
2015-06-20 03:10:43 +08:00
|
|
|
&path, &nr_samples);
|
perf annotate: Add basic support to event group view
Add --group option to enable event grouping. When enabled, all the
group members information will be shown with the leader so skip
non-leader events.
It only supports --stdio output currently. Later patches will extend
additional features.
$ perf annotate --group --stdio
...
Percent | Source code & Disassembly of libpthread-2.15.so
--------------------------------------------------------------------------------
:
:
:
: Disassembly of section .text:
:
: 000000387dc0aa50 <__pthread_mutex_unlock_usercnt>:
8.08 2.40 5.29 : 387dc0aa50: mov %rdi,%rdx
0.00 0.00 0.00 : 387dc0aa53: mov 0x10(%rdi),%edi
0.00 0.00 0.00 : 387dc0aa56: mov %edi,%eax
0.00 0.80 0.00 : 387dc0aa58: and $0x7f,%eax
3.03 2.40 3.53 : 387dc0aa5b: test $0x7c,%dil
0.00 0.00 0.00 : 387dc0aa5f: jne 387dc0aaa9 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa61: test %eax,%eax
0.00 0.00 0.00 : 387dc0aa63: jne 387dc0aa85 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa65: and $0x80,%edi
0.00 0.00 0.00 : 387dc0aa6b: test %esi,%esi
3.03 5.60 7.06 : 387dc0aa6d: movl $0x0,0x8(%rdx)
0.00 0.00 0.59 : 387dc0aa74: je 387dc0aa7a <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa76: subl $0x1,0xc(%rdx)
2.02 5.60 1.18 : 387dc0aa7a: mov %edi,%esi
0.00 0.00 0.00 : 387dc0aa7c: lock decl (%rdx)
83.84 83.20 82.35 : 387dc0aa7f: jne 387dc0aada <_L_unlock_586>
0.00 0.00 0.00 : 387dc0aa81: nop
0.00 0.00 0.00 : 387dc0aa82: xor %eax,%eax
0.00 0.00 0.00 : 387dc0aa84: retq
...
Signed-off-by: Namhyung Kim <namhyung@kernel.org>
Cc: Andi Kleen <andi@firstfloor.org>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Pekka Enberg <penberg@kernel.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Link: http://lkml.kernel.org/r/1362462812-30885-6-git-send-email-namhyung@kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2013-03-05 13:53:25 +08:00
|
|
|
|
|
|
|
ppercents[i] = percent;
|
2015-06-20 03:10:43 +08:00
|
|
|
psamples[i] = nr_samples;
|
perf annotate: Add basic support to event group view
Add --group option to enable event grouping. When enabled, all the
group members information will be shown with the leader so skip
non-leader events.
It only supports --stdio output currently. Later patches will extend
additional features.
$ perf annotate --group --stdio
...
Percent | Source code & Disassembly of libpthread-2.15.so
--------------------------------------------------------------------------------
:
:
:
: Disassembly of section .text:
:
: 000000387dc0aa50 <__pthread_mutex_unlock_usercnt>:
8.08 2.40 5.29 : 387dc0aa50: mov %rdi,%rdx
0.00 0.00 0.00 : 387dc0aa53: mov 0x10(%rdi),%edi
0.00 0.00 0.00 : 387dc0aa56: mov %edi,%eax
0.00 0.80 0.00 : 387dc0aa58: and $0x7f,%eax
3.03 2.40 3.53 : 387dc0aa5b: test $0x7c,%dil
0.00 0.00 0.00 : 387dc0aa5f: jne 387dc0aaa9 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa61: test %eax,%eax
0.00 0.00 0.00 : 387dc0aa63: jne 387dc0aa85 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa65: and $0x80,%edi
0.00 0.00 0.00 : 387dc0aa6b: test %esi,%esi
3.03 5.60 7.06 : 387dc0aa6d: movl $0x0,0x8(%rdx)
0.00 0.00 0.59 : 387dc0aa74: je 387dc0aa7a <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa76: subl $0x1,0xc(%rdx)
2.02 5.60 1.18 : 387dc0aa7a: mov %edi,%esi
0.00 0.00 0.00 : 387dc0aa7c: lock decl (%rdx)
83.84 83.20 82.35 : 387dc0aa7f: jne 387dc0aada <_L_unlock_586>
0.00 0.00 0.00 : 387dc0aa81: nop
0.00 0.00 0.00 : 387dc0aa82: xor %eax,%eax
0.00 0.00 0.00 : 387dc0aa84: retq
...
Signed-off-by: Namhyung Kim <namhyung@kernel.org>
Cc: Andi Kleen <andi@firstfloor.org>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Pekka Enberg <penberg@kernel.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Link: http://lkml.kernel.org/r/1362462812-30885-6-git-send-email-namhyung@kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2013-03-05 13:53:25 +08:00
|
|
|
if (percent > max_percent)
|
|
|
|
max_percent = percent;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (max_percent < min_pcnt)
|
2011-02-07 00:54:44 +08:00
|
|
|
return -1;
|
|
|
|
|
2011-02-09 01:01:39 +08:00
|
|
|
if (max_lines && printed >= max_lines)
|
2011-02-07 00:54:44 +08:00
|
|
|
return 1;
|
2011-02-06 01:37:31 +08:00
|
|
|
|
2011-02-09 01:29:25 +08:00
|
|
|
if (queue != NULL) {
|
|
|
|
list_for_each_entry_from(queue, &notes->src->source, node) {
|
2012-04-16 02:24:39 +08:00
|
|
|
if (queue == dl)
|
2011-02-09 01:29:25 +08:00
|
|
|
break;
|
2013-03-05 13:53:21 +08:00
|
|
|
disasm_line__print(queue, sym, start, evsel, len,
|
2011-02-09 01:29:25 +08:00
|
|
|
0, 0, 1, NULL);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
perf annotate: Add basic support to event group view
Add --group option to enable event grouping. When enabled, all the
group members information will be shown with the leader so skip
non-leader events.
It only supports --stdio output currently. Later patches will extend
additional features.
$ perf annotate --group --stdio
...
Percent | Source code & Disassembly of libpthread-2.15.so
--------------------------------------------------------------------------------
:
:
:
: Disassembly of section .text:
:
: 000000387dc0aa50 <__pthread_mutex_unlock_usercnt>:
8.08 2.40 5.29 : 387dc0aa50: mov %rdi,%rdx
0.00 0.00 0.00 : 387dc0aa53: mov 0x10(%rdi),%edi
0.00 0.00 0.00 : 387dc0aa56: mov %edi,%eax
0.00 0.80 0.00 : 387dc0aa58: and $0x7f,%eax
3.03 2.40 3.53 : 387dc0aa5b: test $0x7c,%dil
0.00 0.00 0.00 : 387dc0aa5f: jne 387dc0aaa9 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa61: test %eax,%eax
0.00 0.00 0.00 : 387dc0aa63: jne 387dc0aa85 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa65: and $0x80,%edi
0.00 0.00 0.00 : 387dc0aa6b: test %esi,%esi
3.03 5.60 7.06 : 387dc0aa6d: movl $0x0,0x8(%rdx)
0.00 0.00 0.59 : 387dc0aa74: je 387dc0aa7a <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa76: subl $0x1,0xc(%rdx)
2.02 5.60 1.18 : 387dc0aa7a: mov %edi,%esi
0.00 0.00 0.00 : 387dc0aa7c: lock decl (%rdx)
83.84 83.20 82.35 : 387dc0aa7f: jne 387dc0aada <_L_unlock_586>
0.00 0.00 0.00 : 387dc0aa81: nop
0.00 0.00 0.00 : 387dc0aa82: xor %eax,%eax
0.00 0.00 0.00 : 387dc0aa84: retq
...
Signed-off-by: Namhyung Kim <namhyung@kernel.org>
Cc: Andi Kleen <andi@firstfloor.org>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Pekka Enberg <penberg@kernel.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Link: http://lkml.kernel.org/r/1362462812-30885-6-git-send-email-namhyung@kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2013-03-05 13:53:25 +08:00
|
|
|
color = get_percent_color(max_percent);
|
2011-02-04 19:45:46 +08:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Also color the filename and line if needed, with
|
|
|
|
* the same color as the percentage. Don't print it
|
|
|
|
* twice for close colored addr with the same filename:line
|
|
|
|
*/
|
|
|
|
if (path) {
|
|
|
|
if (!prev_line || strcmp(prev_line, path)
|
|
|
|
|| color != prev_color) {
|
|
|
|
color_fprintf(stdout, color, " %s", path);
|
|
|
|
prev_line = path;
|
|
|
|
prev_color = color;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
perf annotate: Add basic support to event group view
Add --group option to enable event grouping. When enabled, all the
group members information will be shown with the leader so skip
non-leader events.
It only supports --stdio output currently. Later patches will extend
additional features.
$ perf annotate --group --stdio
...
Percent | Source code & Disassembly of libpthread-2.15.so
--------------------------------------------------------------------------------
:
:
:
: Disassembly of section .text:
:
: 000000387dc0aa50 <__pthread_mutex_unlock_usercnt>:
8.08 2.40 5.29 : 387dc0aa50: mov %rdi,%rdx
0.00 0.00 0.00 : 387dc0aa53: mov 0x10(%rdi),%edi
0.00 0.00 0.00 : 387dc0aa56: mov %edi,%eax
0.00 0.80 0.00 : 387dc0aa58: and $0x7f,%eax
3.03 2.40 3.53 : 387dc0aa5b: test $0x7c,%dil
0.00 0.00 0.00 : 387dc0aa5f: jne 387dc0aaa9 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa61: test %eax,%eax
0.00 0.00 0.00 : 387dc0aa63: jne 387dc0aa85 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa65: and $0x80,%edi
0.00 0.00 0.00 : 387dc0aa6b: test %esi,%esi
3.03 5.60 7.06 : 387dc0aa6d: movl $0x0,0x8(%rdx)
0.00 0.00 0.59 : 387dc0aa74: je 387dc0aa7a <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa76: subl $0x1,0xc(%rdx)
2.02 5.60 1.18 : 387dc0aa7a: mov %edi,%esi
0.00 0.00 0.00 : 387dc0aa7c: lock decl (%rdx)
83.84 83.20 82.35 : 387dc0aa7f: jne 387dc0aada <_L_unlock_586>
0.00 0.00 0.00 : 387dc0aa81: nop
0.00 0.00 0.00 : 387dc0aa82: xor %eax,%eax
0.00 0.00 0.00 : 387dc0aa84: retq
...
Signed-off-by: Namhyung Kim <namhyung@kernel.org>
Cc: Andi Kleen <andi@firstfloor.org>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Pekka Enberg <penberg@kernel.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Link: http://lkml.kernel.org/r/1362462812-30885-6-git-send-email-namhyung@kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2013-03-05 13:53:25 +08:00
|
|
|
for (i = 0; i < nr_percent; i++) {
|
|
|
|
percent = ppercents[i];
|
2015-06-20 03:10:43 +08:00
|
|
|
nr_samples = psamples[i];
|
perf annotate: Add basic support to event group view
Add --group option to enable event grouping. When enabled, all the
group members information will be shown with the leader so skip
non-leader events.
It only supports --stdio output currently. Later patches will extend
additional features.
$ perf annotate --group --stdio
...
Percent | Source code & Disassembly of libpthread-2.15.so
--------------------------------------------------------------------------------
:
:
:
: Disassembly of section .text:
:
: 000000387dc0aa50 <__pthread_mutex_unlock_usercnt>:
8.08 2.40 5.29 : 387dc0aa50: mov %rdi,%rdx
0.00 0.00 0.00 : 387dc0aa53: mov 0x10(%rdi),%edi
0.00 0.00 0.00 : 387dc0aa56: mov %edi,%eax
0.00 0.80 0.00 : 387dc0aa58: and $0x7f,%eax
3.03 2.40 3.53 : 387dc0aa5b: test $0x7c,%dil
0.00 0.00 0.00 : 387dc0aa5f: jne 387dc0aaa9 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa61: test %eax,%eax
0.00 0.00 0.00 : 387dc0aa63: jne 387dc0aa85 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa65: and $0x80,%edi
0.00 0.00 0.00 : 387dc0aa6b: test %esi,%esi
3.03 5.60 7.06 : 387dc0aa6d: movl $0x0,0x8(%rdx)
0.00 0.00 0.59 : 387dc0aa74: je 387dc0aa7a <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa76: subl $0x1,0xc(%rdx)
2.02 5.60 1.18 : 387dc0aa7a: mov %edi,%esi
0.00 0.00 0.00 : 387dc0aa7c: lock decl (%rdx)
83.84 83.20 82.35 : 387dc0aa7f: jne 387dc0aada <_L_unlock_586>
0.00 0.00 0.00 : 387dc0aa81: nop
0.00 0.00 0.00 : 387dc0aa82: xor %eax,%eax
0.00 0.00 0.00 : 387dc0aa84: retq
...
Signed-off-by: Namhyung Kim <namhyung@kernel.org>
Cc: Andi Kleen <andi@firstfloor.org>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Pekka Enberg <penberg@kernel.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Link: http://lkml.kernel.org/r/1362462812-30885-6-git-send-email-namhyung@kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2013-03-05 13:53:25 +08:00
|
|
|
color = get_percent_color(percent);
|
2015-06-20 03:10:43 +08:00
|
|
|
|
|
|
|
if (symbol_conf.show_total_period)
|
|
|
|
color_fprintf(stdout, color, " %7" PRIu64,
|
|
|
|
nr_samples);
|
|
|
|
else
|
|
|
|
color_fprintf(stdout, color, " %7.2f", percent);
|
perf annotate: Add basic support to event group view
Add --group option to enable event grouping. When enabled, all the
group members information will be shown with the leader so skip
non-leader events.
It only supports --stdio output currently. Later patches will extend
additional features.
$ perf annotate --group --stdio
...
Percent | Source code & Disassembly of libpthread-2.15.so
--------------------------------------------------------------------------------
:
:
:
: Disassembly of section .text:
:
: 000000387dc0aa50 <__pthread_mutex_unlock_usercnt>:
8.08 2.40 5.29 : 387dc0aa50: mov %rdi,%rdx
0.00 0.00 0.00 : 387dc0aa53: mov 0x10(%rdi),%edi
0.00 0.00 0.00 : 387dc0aa56: mov %edi,%eax
0.00 0.80 0.00 : 387dc0aa58: and $0x7f,%eax
3.03 2.40 3.53 : 387dc0aa5b: test $0x7c,%dil
0.00 0.00 0.00 : 387dc0aa5f: jne 387dc0aaa9 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa61: test %eax,%eax
0.00 0.00 0.00 : 387dc0aa63: jne 387dc0aa85 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa65: and $0x80,%edi
0.00 0.00 0.00 : 387dc0aa6b: test %esi,%esi
3.03 5.60 7.06 : 387dc0aa6d: movl $0x0,0x8(%rdx)
0.00 0.00 0.59 : 387dc0aa74: je 387dc0aa7a <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa76: subl $0x1,0xc(%rdx)
2.02 5.60 1.18 : 387dc0aa7a: mov %edi,%esi
0.00 0.00 0.00 : 387dc0aa7c: lock decl (%rdx)
83.84 83.20 82.35 : 387dc0aa7f: jne 387dc0aada <_L_unlock_586>
0.00 0.00 0.00 : 387dc0aa81: nop
0.00 0.00 0.00 : 387dc0aa82: xor %eax,%eax
0.00 0.00 0.00 : 387dc0aa84: retq
...
Signed-off-by: Namhyung Kim <namhyung@kernel.org>
Cc: Andi Kleen <andi@firstfloor.org>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Pekka Enberg <penberg@kernel.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Link: http://lkml.kernel.org/r/1362462812-30885-6-git-send-email-namhyung@kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2013-03-05 13:53:25 +08:00
|
|
|
}
|
|
|
|
|
2011-02-04 19:45:46 +08:00
|
|
|
printf(" : ");
|
perf annotate: Add branch stack / basic block
I wanted to know the hottest path through a function and figured the
branch-stack (LBR) information should be able to help out with that.
The below uses the branch-stack to create basic blocks and generate
statistics from them.
from to branch_i
* ----> *
|
| block
v
* ----> *
from to branch_i+1
The blocks are broken down into non-overlapping ranges, while tracking
if the start of each range is an entry point and/or the end of a range
is a branch.
Each block iterates all ranges it covers (while splitting where required
to exactly match the block) and increments the 'coverage' count.
For the range including the branch we increment the taken counter, as
well as the pred counter if flags.predicted.
Using these numbers we can find if an instruction:
- had coverage; given by:
br->coverage / br->sym->max_coverage
This metric ensures each symbol has a 100% spot, which reflects the
observation that each symbol must have a most covered/hottest
block.
- is a branch target: br->is_target && br->start == addr
- for targets, how much of a branch's coverage comes from it:
target->entry / branch->coverage
- is a branch: br->is_branch && br->end == addr
- for branches, how often it was taken:
br->taken / br->coverage
after all, all execution that didn't take the branch would have
incremented the coverage and continued onward to a later branch.
- for branches, how often it was predicted:
br->pred / br->taken
The coverage percentage is used to color the address and asm sections;
for low (<1%) coverage we use NORMAL (uncolored), indicating that these
instructions are not 'important'. For high coverage (>75%) we color the
address RED.
For each branch, we add an asm comment after the instruction with
information on how often it was taken and predicted.
Output looks like (sans color, which does lose a lot of the
information :/)
$ perf record --branch-filter u,any -e cycles:p ./branches 27
$ perf annotate branches
Percent | Source code & Disassembly of branches for cycles:pu (217 samples)
---------------------------------------------------------------------------------
: branches():
0.00 : 40057a: push %rbp
0.00 : 40057b: mov %rsp,%rbp
0.00 : 40057e: sub $0x20,%rsp
0.00 : 400582: mov %rdi,-0x18(%rbp)
0.00 : 400586: mov %rsi,-0x20(%rbp)
0.00 : 40058a: mov -0x18(%rbp),%rax
0.00 : 40058e: mov %rax,-0x10(%rbp)
0.00 : 400592: movq $0x0,-0x8(%rbp)
0.00 : 40059a: jmpq 400656 <branches+0xdc>
1.84 : 40059f: mov -0x10(%rbp),%rax # +100.00%
3.23 : 4005a3: and $0x1,%eax
1.84 : 4005a6: test %rax,%rax
0.00 : 4005a9: je 4005bf <branches+0x45> # -54.50% (p:42.00%)
0.46 : 4005ab: mov 0x200bbe(%rip),%rax # 601170 <acc>
12.90 : 4005b2: add $0x1,%rax
2.30 : 4005b6: mov %rax,0x200bb3(%rip) # 601170 <acc>
0.46 : 4005bd: jmp 4005d1 <branches+0x57> # -100.00% (p:100.00%)
0.92 : 4005bf: mov 0x200baa(%rip),%rax # 601170 <acc> # +49.54%
13.82 : 4005c6: sub $0x1,%rax
0.46 : 4005ca: mov %rax,0x200b9f(%rip) # 601170 <acc>
2.30 : 4005d1: mov -0x10(%rbp),%rax # +50.46%
0.46 : 4005d5: mov %rax,%rdi
0.46 : 4005d8: callq 400526 <lfsr> # -100.00% (p:100.00%)
0.00 : 4005dd: mov %rax,-0x10(%rbp) # +100.00%
0.92 : 4005e1: mov -0x18(%rbp),%rax
0.00 : 4005e5: and $0x1,%eax
0.00 : 4005e8: test %rax,%rax
0.00 : 4005eb: je 4005ff <branches+0x85> # -100.00% (p:100.00%)
0.00 : 4005ed: mov 0x200b7c(%rip),%rax # 601170 <acc>
0.00 : 4005f4: shr $0x2,%rax
0.00 : 4005f8: mov %rax,0x200b71(%rip) # 601170 <acc>
0.00 : 4005ff: mov -0x10(%rbp),%rax # +100.00%
7.37 : 400603: and $0x1,%eax
3.69 : 400606: test %rax,%rax
0.00 : 400609: jne 400612 <branches+0x98> # -59.25% (p:42.99%)
1.84 : 40060b: mov $0x1,%eax
14.29 : 400610: jmp 400617 <branches+0x9d> # -100.00% (p:100.00%)
1.38 : 400612: mov $0x0,%eax # +57.65%
10.14 : 400617: test %al,%al # +42.35%
0.00 : 400619: je 40062f <branches+0xb5> # -57.65% (p:100.00%)
0.46 : 40061b: mov 0x200b4e(%rip),%rax # 601170 <acc>
2.76 : 400622: sub $0x1,%rax
0.00 : 400626: mov %rax,0x200b43(%rip) # 601170 <acc>
0.46 : 40062d: jmp 400641 <branches+0xc7> # -100.00% (p:100.00%)
0.92 : 40062f: mov 0x200b3a(%rip),%rax # 601170 <acc> # +56.13%
2.30 : 400636: add $0x1,%rax
0.92 : 40063a: mov %rax,0x200b2f(%rip) # 601170 <acc>
0.92 : 400641: mov -0x10(%rbp),%rax # +43.87%
2.30 : 400645: mov %rax,%rdi
0.00 : 400648: callq 400526 <lfsr> # -100.00% (p:100.00%)
0.00 : 40064d: mov %rax,-0x10(%rbp) # +100.00%
1.84 : 400651: addq $0x1,-0x8(%rbp)
0.92 : 400656: mov -0x8(%rbp),%rax
5.07 : 40065a: cmp -0x20(%rbp),%rax
0.00 : 40065e: jb 40059f <branches+0x25> # -100.00% (p:100.00%)
0.00 : 400664: nop
0.00 : 400665: leaveq
0.00 : 400666: retq
(Note: the --branch-filter u,any was used to avoid spurious target and
branch points due to interrupts/faults, they show up as very small -/+
annotations on 'weird' locations)
Committer note:
Please take a look at:
http://vger.kernel.org/~acme/perf/annotate_basic_blocks.png
To see the colors.
Signed-off-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Tested-by: Arnaldo Carvalho de Melo <acme@redhat.com>
Cc: Alexander Shishkin <alexander.shishkin@linux.intel.com>
Cc: Andi Kleen <andi@firstfloor.org>
Cc: Anshuman Khandual <khandual@linux.vnet.ibm.com>
Cc: David Carrillo-Cisneros <davidcc@google.com>
Cc: Jiri Olsa <jolsa@kernel.org>
Cc: Kan Liang <kan.liang@intel.com>
Cc: Linus Torvalds <torvalds@linux-foundation.org>
Cc: Namhyung Kim <namhyung@kernel.org>
Cc: Stephane Eranian <eranian@google.com>
[ Moved sym->max_coverage to 'struct annotate', aka symbol__annotate(sym) ]
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2016-09-06 03:08:12 +08:00
|
|
|
|
|
|
|
br = block_range__find(addr);
|
|
|
|
color_fprintf(stdout, annotate__address_color(br), " %" PRIx64 ":", addr);
|
|
|
|
color_fprintf(stdout, annotate__asm_color(br), "%s", dl->line);
|
|
|
|
annotate__branch_printf(br, addr);
|
|
|
|
printf("\n");
|
perf annotate: Add basic support to event group view
Add --group option to enable event grouping. When enabled, all the
group members information will be shown with the leader so skip
non-leader events.
It only supports --stdio output currently. Later patches will extend
additional features.
$ perf annotate --group --stdio
...
Percent | Source code & Disassembly of libpthread-2.15.so
--------------------------------------------------------------------------------
:
:
:
: Disassembly of section .text:
:
: 000000387dc0aa50 <__pthread_mutex_unlock_usercnt>:
8.08 2.40 5.29 : 387dc0aa50: mov %rdi,%rdx
0.00 0.00 0.00 : 387dc0aa53: mov 0x10(%rdi),%edi
0.00 0.00 0.00 : 387dc0aa56: mov %edi,%eax
0.00 0.80 0.00 : 387dc0aa58: and $0x7f,%eax
3.03 2.40 3.53 : 387dc0aa5b: test $0x7c,%dil
0.00 0.00 0.00 : 387dc0aa5f: jne 387dc0aaa9 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa61: test %eax,%eax
0.00 0.00 0.00 : 387dc0aa63: jne 387dc0aa85 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa65: and $0x80,%edi
0.00 0.00 0.00 : 387dc0aa6b: test %esi,%esi
3.03 5.60 7.06 : 387dc0aa6d: movl $0x0,0x8(%rdx)
0.00 0.00 0.59 : 387dc0aa74: je 387dc0aa7a <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa76: subl $0x1,0xc(%rdx)
2.02 5.60 1.18 : 387dc0aa7a: mov %edi,%esi
0.00 0.00 0.00 : 387dc0aa7c: lock decl (%rdx)
83.84 83.20 82.35 : 387dc0aa7f: jne 387dc0aada <_L_unlock_586>
0.00 0.00 0.00 : 387dc0aa81: nop
0.00 0.00 0.00 : 387dc0aa82: xor %eax,%eax
0.00 0.00 0.00 : 387dc0aa84: retq
...
Signed-off-by: Namhyung Kim <namhyung@kernel.org>
Cc: Andi Kleen <andi@firstfloor.org>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Pekka Enberg <penberg@kernel.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Link: http://lkml.kernel.org/r/1362462812-30885-6-git-send-email-namhyung@kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2013-03-05 13:53:25 +08:00
|
|
|
|
|
|
|
if (ppercents != &percent)
|
|
|
|
free(ppercents);
|
|
|
|
|
2015-06-20 03:10:43 +08:00
|
|
|
if (psamples != &nr_samples)
|
|
|
|
free(psamples);
|
|
|
|
|
2011-02-09 01:01:39 +08:00
|
|
|
} else if (max_lines && printed >= max_lines)
|
2011-02-07 00:54:44 +08:00
|
|
|
return 1;
|
|
|
|
else {
|
perf annotate: Add basic support to event group view
Add --group option to enable event grouping. When enabled, all the
group members information will be shown with the leader so skip
non-leader events.
It only supports --stdio output currently. Later patches will extend
additional features.
$ perf annotate --group --stdio
...
Percent | Source code & Disassembly of libpthread-2.15.so
--------------------------------------------------------------------------------
:
:
:
: Disassembly of section .text:
:
: 000000387dc0aa50 <__pthread_mutex_unlock_usercnt>:
8.08 2.40 5.29 : 387dc0aa50: mov %rdi,%rdx
0.00 0.00 0.00 : 387dc0aa53: mov 0x10(%rdi),%edi
0.00 0.00 0.00 : 387dc0aa56: mov %edi,%eax
0.00 0.80 0.00 : 387dc0aa58: and $0x7f,%eax
3.03 2.40 3.53 : 387dc0aa5b: test $0x7c,%dil
0.00 0.00 0.00 : 387dc0aa5f: jne 387dc0aaa9 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa61: test %eax,%eax
0.00 0.00 0.00 : 387dc0aa63: jne 387dc0aa85 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa65: and $0x80,%edi
0.00 0.00 0.00 : 387dc0aa6b: test %esi,%esi
3.03 5.60 7.06 : 387dc0aa6d: movl $0x0,0x8(%rdx)
0.00 0.00 0.59 : 387dc0aa74: je 387dc0aa7a <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa76: subl $0x1,0xc(%rdx)
2.02 5.60 1.18 : 387dc0aa7a: mov %edi,%esi
0.00 0.00 0.00 : 387dc0aa7c: lock decl (%rdx)
83.84 83.20 82.35 : 387dc0aa7f: jne 387dc0aada <_L_unlock_586>
0.00 0.00 0.00 : 387dc0aa81: nop
0.00 0.00 0.00 : 387dc0aa82: xor %eax,%eax
0.00 0.00 0.00 : 387dc0aa84: retq
...
Signed-off-by: Namhyung Kim <namhyung@kernel.org>
Cc: Andi Kleen <andi@firstfloor.org>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Pekka Enberg <penberg@kernel.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Link: http://lkml.kernel.org/r/1362462812-30885-6-git-send-email-namhyung@kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2013-03-05 13:53:25 +08:00
|
|
|
int width = 8;
|
|
|
|
|
2011-02-09 01:29:25 +08:00
|
|
|
if (queue)
|
|
|
|
return -1;
|
|
|
|
|
2013-03-05 13:53:26 +08:00
|
|
|
if (perf_evsel__is_group_event(evsel))
|
perf annotate: Add basic support to event group view
Add --group option to enable event grouping. When enabled, all the
group members information will be shown with the leader so skip
non-leader events.
It only supports --stdio output currently. Later patches will extend
additional features.
$ perf annotate --group --stdio
...
Percent | Source code & Disassembly of libpthread-2.15.so
--------------------------------------------------------------------------------
:
:
:
: Disassembly of section .text:
:
: 000000387dc0aa50 <__pthread_mutex_unlock_usercnt>:
8.08 2.40 5.29 : 387dc0aa50: mov %rdi,%rdx
0.00 0.00 0.00 : 387dc0aa53: mov 0x10(%rdi),%edi
0.00 0.00 0.00 : 387dc0aa56: mov %edi,%eax
0.00 0.80 0.00 : 387dc0aa58: and $0x7f,%eax
3.03 2.40 3.53 : 387dc0aa5b: test $0x7c,%dil
0.00 0.00 0.00 : 387dc0aa5f: jne 387dc0aaa9 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa61: test %eax,%eax
0.00 0.00 0.00 : 387dc0aa63: jne 387dc0aa85 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa65: and $0x80,%edi
0.00 0.00 0.00 : 387dc0aa6b: test %esi,%esi
3.03 5.60 7.06 : 387dc0aa6d: movl $0x0,0x8(%rdx)
0.00 0.00 0.59 : 387dc0aa74: je 387dc0aa7a <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa76: subl $0x1,0xc(%rdx)
2.02 5.60 1.18 : 387dc0aa7a: mov %edi,%esi
0.00 0.00 0.00 : 387dc0aa7c: lock decl (%rdx)
83.84 83.20 82.35 : 387dc0aa7f: jne 387dc0aada <_L_unlock_586>
0.00 0.00 0.00 : 387dc0aa81: nop
0.00 0.00 0.00 : 387dc0aa82: xor %eax,%eax
0.00 0.00 0.00 : 387dc0aa84: retq
...
Signed-off-by: Namhyung Kim <namhyung@kernel.org>
Cc: Andi Kleen <andi@firstfloor.org>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Pekka Enberg <penberg@kernel.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Link: http://lkml.kernel.org/r/1362462812-30885-6-git-send-email-namhyung@kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2013-03-05 13:53:25 +08:00
|
|
|
width *= evsel->nr_members;
|
|
|
|
|
2012-04-16 02:24:39 +08:00
|
|
|
if (!*dl->line)
|
perf annotate: Add basic support to event group view
Add --group option to enable event grouping. When enabled, all the
group members information will be shown with the leader so skip
non-leader events.
It only supports --stdio output currently. Later patches will extend
additional features.
$ perf annotate --group --stdio
...
Percent | Source code & Disassembly of libpthread-2.15.so
--------------------------------------------------------------------------------
:
:
:
: Disassembly of section .text:
:
: 000000387dc0aa50 <__pthread_mutex_unlock_usercnt>:
8.08 2.40 5.29 : 387dc0aa50: mov %rdi,%rdx
0.00 0.00 0.00 : 387dc0aa53: mov 0x10(%rdi),%edi
0.00 0.00 0.00 : 387dc0aa56: mov %edi,%eax
0.00 0.80 0.00 : 387dc0aa58: and $0x7f,%eax
3.03 2.40 3.53 : 387dc0aa5b: test $0x7c,%dil
0.00 0.00 0.00 : 387dc0aa5f: jne 387dc0aaa9 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa61: test %eax,%eax
0.00 0.00 0.00 : 387dc0aa63: jne 387dc0aa85 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa65: and $0x80,%edi
0.00 0.00 0.00 : 387dc0aa6b: test %esi,%esi
3.03 5.60 7.06 : 387dc0aa6d: movl $0x0,0x8(%rdx)
0.00 0.00 0.59 : 387dc0aa74: je 387dc0aa7a <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa76: subl $0x1,0xc(%rdx)
2.02 5.60 1.18 : 387dc0aa7a: mov %edi,%esi
0.00 0.00 0.00 : 387dc0aa7c: lock decl (%rdx)
83.84 83.20 82.35 : 387dc0aa7f: jne 387dc0aada <_L_unlock_586>
0.00 0.00 0.00 : 387dc0aa81: nop
0.00 0.00 0.00 : 387dc0aa82: xor %eax,%eax
0.00 0.00 0.00 : 387dc0aa84: retq
...
Signed-off-by: Namhyung Kim <namhyung@kernel.org>
Cc: Andi Kleen <andi@firstfloor.org>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Pekka Enberg <penberg@kernel.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Link: http://lkml.kernel.org/r/1362462812-30885-6-git-send-email-namhyung@kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2013-03-05 13:53:25 +08:00
|
|
|
printf(" %*s:\n", width, " ");
|
2011-02-04 19:45:46 +08:00
|
|
|
else
|
perf annotate: Add basic support to event group view
Add --group option to enable event grouping. When enabled, all the
group members information will be shown with the leader so skip
non-leader events.
It only supports --stdio output currently. Later patches will extend
additional features.
$ perf annotate --group --stdio
...
Percent | Source code & Disassembly of libpthread-2.15.so
--------------------------------------------------------------------------------
:
:
:
: Disassembly of section .text:
:
: 000000387dc0aa50 <__pthread_mutex_unlock_usercnt>:
8.08 2.40 5.29 : 387dc0aa50: mov %rdi,%rdx
0.00 0.00 0.00 : 387dc0aa53: mov 0x10(%rdi),%edi
0.00 0.00 0.00 : 387dc0aa56: mov %edi,%eax
0.00 0.80 0.00 : 387dc0aa58: and $0x7f,%eax
3.03 2.40 3.53 : 387dc0aa5b: test $0x7c,%dil
0.00 0.00 0.00 : 387dc0aa5f: jne 387dc0aaa9 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa61: test %eax,%eax
0.00 0.00 0.00 : 387dc0aa63: jne 387dc0aa85 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa65: and $0x80,%edi
0.00 0.00 0.00 : 387dc0aa6b: test %esi,%esi
3.03 5.60 7.06 : 387dc0aa6d: movl $0x0,0x8(%rdx)
0.00 0.00 0.59 : 387dc0aa74: je 387dc0aa7a <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa76: subl $0x1,0xc(%rdx)
2.02 5.60 1.18 : 387dc0aa7a: mov %edi,%esi
0.00 0.00 0.00 : 387dc0aa7c: lock decl (%rdx)
83.84 83.20 82.35 : 387dc0aa7f: jne 387dc0aada <_L_unlock_586>
0.00 0.00 0.00 : 387dc0aa81: nop
0.00 0.00 0.00 : 387dc0aa82: xor %eax,%eax
0.00 0.00 0.00 : 387dc0aa84: retq
...
Signed-off-by: Namhyung Kim <namhyung@kernel.org>
Cc: Andi Kleen <andi@firstfloor.org>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Pekka Enberg <penberg@kernel.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Link: http://lkml.kernel.org/r/1362462812-30885-6-git-send-email-namhyung@kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2013-03-05 13:53:25 +08:00
|
|
|
printf(" %*s: %s\n", width, " ", dl->line);
|
2011-02-04 19:45:46 +08:00
|
|
|
}
|
2011-02-07 00:54:44 +08:00
|
|
|
|
|
|
|
return 0;
|
2011-02-04 19:45:46 +08:00
|
|
|
}
|
|
|
|
|
2013-03-05 13:53:22 +08:00
|
|
|
/*
|
|
|
|
* symbol__parse_objdump_line() parses objdump output (with -d --no-show-raw)
|
|
|
|
* which looks like following
|
|
|
|
*
|
|
|
|
* 0000000000415500 <_init>:
|
|
|
|
* 415500: sub $0x8,%rsp
|
|
|
|
* 415504: mov 0x2f5ad5(%rip),%rax # 70afe0 <_DYNAMIC+0x2f8>
|
|
|
|
* 41550b: test %rax,%rax
|
|
|
|
* 41550e: je 415515 <_init+0x15>
|
|
|
|
* 415510: callq 416e70 <__gmon_start__@plt>
|
|
|
|
* 415515: add $0x8,%rsp
|
|
|
|
* 415519: retq
|
|
|
|
*
|
|
|
|
* it will be parsed and saved into struct disasm_line as
|
|
|
|
* <offset> <name> <ops.raw>
|
|
|
|
*
|
|
|
|
* The offset will be a relative offset from the start of the symbol and -1
|
|
|
|
* means that it's not a disassembly line so should be treated differently.
|
|
|
|
* The ops.raw part will be parsed further according to type of the instruction.
|
|
|
|
*/
|
2011-02-08 23:27:39 +08:00
|
|
|
static int symbol__parse_objdump_line(struct symbol *sym, struct map *map,
|
2014-11-13 10:05:26 +08:00
|
|
|
FILE *file, size_t privsize,
|
|
|
|
int *line_nr)
|
2011-02-04 19:45:46 +08:00
|
|
|
{
|
2011-02-08 23:27:39 +08:00
|
|
|
struct annotation *notes = symbol__annotation(sym);
|
2012-04-16 02:24:39 +08:00
|
|
|
struct disasm_line *dl;
|
2012-04-02 23:59:01 +08:00
|
|
|
char *line = NULL, *parsed_line, *tmp, *tmp2, *c;
|
2011-02-04 19:45:46 +08:00
|
|
|
size_t line_len;
|
|
|
|
s64 line_ip, offset = -1;
|
2014-11-13 10:05:26 +08:00
|
|
|
regmatch_t match[2];
|
2011-02-04 19:45:46 +08:00
|
|
|
|
|
|
|
if (getline(&line, &line_len, file) < 0)
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
if (!line)
|
|
|
|
return -1;
|
|
|
|
|
|
|
|
while (line_len != 0 && isspace(line[line_len - 1]))
|
|
|
|
line[--line_len] = '\0';
|
|
|
|
|
|
|
|
c = strchr(line, '\n');
|
|
|
|
if (c)
|
|
|
|
*c = 0;
|
|
|
|
|
|
|
|
line_ip = -1;
|
2012-04-12 04:04:59 +08:00
|
|
|
parsed_line = line;
|
2011-02-04 19:45:46 +08:00
|
|
|
|
2014-11-13 10:05:26 +08:00
|
|
|
/* /filename:linenr ? Save line number and ignore. */
|
|
|
|
if (regexec(&file_lineno, line, 2, match, 0) == 0) {
|
|
|
|
*line_nr = atoi(line + match[1].rm_so);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2011-02-04 19:45:46 +08:00
|
|
|
/*
|
|
|
|
* Strip leading spaces:
|
|
|
|
*/
|
|
|
|
tmp = line;
|
|
|
|
while (*tmp) {
|
|
|
|
if (*tmp != ' ')
|
|
|
|
break;
|
|
|
|
tmp++;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (*tmp) {
|
|
|
|
/*
|
|
|
|
* Parse hexa addresses followed by ':'
|
|
|
|
*/
|
|
|
|
line_ip = strtoull(tmp, &tmp2, 16);
|
|
|
|
if (*tmp2 != ':' || tmp == tmp2 || tmp2[1] == '\0')
|
|
|
|
line_ip = -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (line_ip != -1) {
|
|
|
|
u64 start = map__rip_2objdump(map, sym->start),
|
|
|
|
end = map__rip_2objdump(map, sym->end);
|
|
|
|
|
|
|
|
offset = line_ip - start;
|
2014-10-15 04:19:44 +08:00
|
|
|
if ((u64)line_ip < start || (u64)line_ip >= end)
|
2011-02-04 19:45:46 +08:00
|
|
|
offset = -1;
|
2012-04-02 23:59:01 +08:00
|
|
|
else
|
|
|
|
parsed_line = tmp2 + 1;
|
2012-04-12 04:04:59 +08:00
|
|
|
}
|
2011-02-04 19:45:46 +08:00
|
|
|
|
2016-09-20 04:18:16 +08:00
|
|
|
dl = disasm_line__new(offset, parsed_line, privsize, *line_nr, map);
|
2012-04-02 23:59:01 +08:00
|
|
|
free(line);
|
2014-11-13 10:05:26 +08:00
|
|
|
(*line_nr)++;
|
2012-04-02 23:59:01 +08:00
|
|
|
|
2012-04-16 02:24:39 +08:00
|
|
|
if (dl == NULL)
|
2011-02-04 19:45:46 +08:00
|
|
|
return -1;
|
2012-04-02 23:59:01 +08:00
|
|
|
|
2013-08-07 19:38:54 +08:00
|
|
|
if (dl->ops.target.offset == UINT64_MAX)
|
|
|
|
dl->ops.target.offset = dl->ops.target.addr -
|
|
|
|
map__rip_2objdump(map, sym->start);
|
|
|
|
|
2013-10-14 18:43:40 +08:00
|
|
|
/* kcore has no symbols, so add the call target name */
|
2013-08-07 19:38:57 +08:00
|
|
|
if (dl->ins && ins__is_call(dl->ins) && !dl->ops.target.name) {
|
2013-10-14 18:43:40 +08:00
|
|
|
struct addr_map_symbol target = {
|
|
|
|
.map = map,
|
|
|
|
.addr = dl->ops.target.addr,
|
|
|
|
};
|
|
|
|
|
2016-09-02 06:25:52 +08:00
|
|
|
if (!map_groups__find_ams(&target) &&
|
2013-10-14 18:43:40 +08:00
|
|
|
target.sym->start == target.al_addr)
|
|
|
|
dl->ops.target.name = strdup(target.sym->name);
|
2013-08-07 19:38:57 +08:00
|
|
|
}
|
|
|
|
|
2012-04-16 02:24:39 +08:00
|
|
|
disasm__add(¬es->src->source, dl);
|
2011-02-04 19:45:46 +08:00
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2014-11-13 10:05:26 +08:00
|
|
|
static __attribute__((constructor)) void symbol__init_regexpr(void)
|
|
|
|
{
|
|
|
|
regcomp(&file_lineno, "^/[^:]+:([0-9]+)", REG_EXTENDED);
|
|
|
|
}
|
|
|
|
|
2013-08-07 19:38:56 +08:00
|
|
|
static void delete_last_nop(struct symbol *sym)
|
|
|
|
{
|
|
|
|
struct annotation *notes = symbol__annotation(sym);
|
|
|
|
struct list_head *list = ¬es->src->source;
|
|
|
|
struct disasm_line *dl;
|
|
|
|
|
|
|
|
while (!list_empty(list)) {
|
|
|
|
dl = list_entry(list->prev, struct disasm_line, node);
|
|
|
|
|
|
|
|
if (dl->ins && dl->ins->ops) {
|
|
|
|
if (dl->ins->ops != &nop_ops)
|
|
|
|
return;
|
|
|
|
} else {
|
|
|
|
if (!strstr(dl->line, " nop ") &&
|
|
|
|
!strstr(dl->line, " nopl ") &&
|
|
|
|
!strstr(dl->line, " nopw "))
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
list_del(&dl->node);
|
|
|
|
disasm_line__free(dl);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-07-30 03:27:18 +08:00
|
|
|
/*
 * Format a message for an error code produced by the disassemble path.
 *
 * @errnum >= 0 is handed to str_error_r().  Negative values are looked up
 * here: SYMBOL_ANNOTATE_ERRNO__NO_VMLINUX gets a hint on how to provide a
 * vmlinux (including the dso build id when it has one), anything else is
 * reported as an invalid internal error code.
 *
 * @buflen must not be 0.  Always returns 0.
 */
int symbol__strerror_disassemble(struct symbol *sym __maybe_unused, struct map *map,
				 int errnum, char *buf, size_t buflen)
{
	struct dso *dso = map->dso;

	BUG_ON(buflen == 0);

	if (errnum >= 0) {
		str_error_r(errnum, buf, buflen);
		return 0;
	}

	if (errnum == SYMBOL_ANNOTATE_ERRNO__NO_VMLINUX) {
		/* 15 == strlen(" with build id "); the id is appended right after it */
		char bf[SBUILD_ID_SIZE + 15] = " with build id ";
		const char *build_id_msg = "";

		if (dso->has_build_id) {
			build_id__sprintf(dso->build_id,
					  sizeof(dso->build_id), bf + 15);
			build_id_msg = bf;
		}

		scnprintf(buf, buflen,
			  "No vmlinux file%s\nwas found in the path.\n\n"
			  "Note that annotation using /proc/kcore requires CAP_SYS_RAWIO capability.\n\n"
			  "Please use:\n\n"
			  "  perf buildid-cache -vu vmlinux\n\n"
			  "or:\n\n"
			  "  --vmlinux vmlinux\n", build_id_msg);
	} else {
		scnprintf(buf, buflen, "Internal error: Invalid %d error code\n", errnum);
	}

	return 0;
}
|
|
|
|
|
2016-08-10 02:32:53 +08:00
|
|
|
static int dso__disassemble_filename(struct dso *dso, char *filename, size_t filename_size)
|
2011-02-04 19:45:46 +08:00
|
|
|
{
|
2016-08-10 02:32:53 +08:00
|
|
|
char linkname[PATH_MAX];
|
|
|
|
char *build_id_filename;
|
2011-02-04 19:45:46 +08:00
|
|
|
|
2016-08-10 01:56:13 +08:00
|
|
|
if (dso->symtab_type == DSO_BINARY_TYPE__KALLSYMS &&
|
|
|
|
!dso__is_kcore(dso))
|
2016-08-10 02:32:53 +08:00
|
|
|
return SYMBOL_ANNOTATE_ERRNO__NO_VMLINUX;
|
2016-08-10 01:56:13 +08:00
|
|
|
|
2016-08-10 02:32:53 +08:00
|
|
|
build_id_filename = dso__build_id_filename(dso, NULL, 0);
|
|
|
|
if (build_id_filename) {
|
|
|
|
__symbol__join_symfs(filename, filename_size, build_id_filename);
|
|
|
|
free(build_id_filename);
|
2016-08-10 02:16:37 +08:00
|
|
|
} else {
|
2016-07-30 03:27:18 +08:00
|
|
|
if (dso->has_build_id)
|
|
|
|
return ENOMEM;
|
2011-02-04 19:45:46 +08:00
|
|
|
goto fallback;
|
2016-08-10 02:16:37 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
if (dso__is_kcore(dso) ||
|
2016-08-10 02:32:53 +08:00
|
|
|
readlink(filename, linkname, sizeof(linkname)) < 0 ||
|
|
|
|
strstr(linkname, DSO__NAME_KALLSYMS) ||
|
|
|
|
access(filename, R_OK)) {
|
2011-02-04 19:45:46 +08:00
|
|
|
fallback:
|
|
|
|
/*
|
|
|
|
* If we don't have build-ids or the build-id file isn't in the
|
|
|
|
* cache, or is just a kallsyms file, well, lets hope that this
|
|
|
|
* DSO is the same as when 'perf record' ran.
|
|
|
|
*/
|
2016-08-10 02:32:53 +08:00
|
|
|
__symbol__join_symfs(filename, filename_size, dso->long_name);
|
2011-02-04 19:45:46 +08:00
|
|
|
}
|
|
|
|
|
2016-08-10 02:32:53 +08:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
int symbol__disassemble(struct symbol *sym, struct map *map, size_t privsize)
|
|
|
|
{
|
|
|
|
struct dso *dso = map->dso;
|
|
|
|
char command[PATH_MAX * 2];
|
|
|
|
FILE *file;
|
|
|
|
char symfs_filename[PATH_MAX];
|
|
|
|
struct kcore_extract kce;
|
|
|
|
bool delete_extract = false;
|
|
|
|
int stdout_fd[2];
|
|
|
|
int lineno = 0;
|
|
|
|
int nline;
|
|
|
|
pid_t pid;
|
|
|
|
int err = dso__disassemble_filename(dso, symfs_filename, sizeof(symfs_filename));
|
|
|
|
|
|
|
|
if (err)
|
|
|
|
return err;
|
|
|
|
|
2011-02-04 19:45:46 +08:00
|
|
|
pr_debug("%s: filename=%s, sym=%s, start=%#" PRIx64 ", end=%#" PRIx64 "\n", __func__,
|
2016-08-10 02:16:37 +08:00
|
|
|
symfs_filename, sym->name, map->unmap_ip(map, sym->start),
|
2011-02-04 19:45:46 +08:00
|
|
|
map->unmap_ip(map, sym->end));
|
|
|
|
|
|
|
|
pr_debug("annotating [%p] %30s : [%p] %30s\n",
|
|
|
|
dso, dso->long_name, sym, sym->name);
|
|
|
|
|
2013-10-09 20:01:12 +08:00
|
|
|
if (dso__is_kcore(dso)) {
|
|
|
|
kce.kcore_filename = symfs_filename;
|
|
|
|
kce.addr = map__rip_2objdump(map, sym->start);
|
|
|
|
kce.offs = sym->start;
|
2014-10-15 04:19:44 +08:00
|
|
|
kce.len = sym->end - sym->start;
|
2013-10-09 20:01:12 +08:00
|
|
|
if (!kcore_extract__create(&kce)) {
|
|
|
|
delete_extract = true;
|
|
|
|
strlcpy(symfs_filename, kce.extract_filename,
|
|
|
|
sizeof(symfs_filename));
|
|
|
|
}
|
2015-03-03 01:56:12 +08:00
|
|
|
} else if (dso__needs_decompress(dso)) {
|
|
|
|
char tmp[PATH_MAX];
|
|
|
|
struct kmod_path m;
|
|
|
|
int fd;
|
|
|
|
bool ret;
|
|
|
|
|
|
|
|
if (kmod_path__parse_ext(&m, symfs_filename))
|
2016-08-10 02:16:37 +08:00
|
|
|
goto out;
|
2015-03-03 01:56:12 +08:00
|
|
|
|
|
|
|
snprintf(tmp, PATH_MAX, "/tmp/perf-kmod-XXXXXX");
|
|
|
|
|
|
|
|
fd = mkstemp(tmp);
|
|
|
|
if (fd < 0) {
|
|
|
|
free(m.ext);
|
2016-08-10 02:16:37 +08:00
|
|
|
goto out;
|
2015-03-03 01:56:12 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
ret = decompress_to_file(m.ext, symfs_filename, fd);
|
|
|
|
|
2015-11-06 11:06:07 +08:00
|
|
|
if (ret)
|
|
|
|
pr_err("Cannot decompress %s %s\n", m.ext, symfs_filename);
|
|
|
|
|
2015-03-03 01:56:12 +08:00
|
|
|
free(m.ext);
|
|
|
|
close(fd);
|
|
|
|
|
|
|
|
if (!ret)
|
2016-08-10 02:16:37 +08:00
|
|
|
goto out;
|
2015-03-03 01:56:12 +08:00
|
|
|
|
|
|
|
strcpy(symfs_filename, tmp);
|
2013-10-09 20:01:12 +08:00
|
|
|
}
|
|
|
|
|
2011-02-04 19:45:46 +08:00
|
|
|
snprintf(command, sizeof(command),
|
2012-09-04 18:32:30 +08:00
|
|
|
"%s %s%s --start-address=0x%016" PRIx64
|
2011-05-17 23:32:07 +08:00
|
|
|
" --stop-address=0x%016" PRIx64
|
2014-11-13 10:05:26 +08:00
|
|
|
" -l -d %s %s -C %s 2>/dev/null|grep -v %s|expand",
|
2012-09-04 18:32:30 +08:00
|
|
|
objdump_path ? objdump_path : "objdump",
|
2011-09-16 05:31:41 +08:00
|
|
|
disassembler_style ? "-M " : "",
|
|
|
|
disassembler_style ? disassembler_style : "",
|
2011-02-04 19:45:46 +08:00
|
|
|
map__rip_2objdump(map, sym->start),
|
2014-10-15 04:19:44 +08:00
|
|
|
map__rip_2objdump(map, sym->end),
|
2011-05-17 23:32:07 +08:00
|
|
|
symbol_conf.annotate_asm_raw ? "" : "--no-show-raw",
|
|
|
|
symbol_conf.annotate_src ? "-S" : "",
|
2016-08-10 02:16:37 +08:00
|
|
|
symfs_filename, symfs_filename);
|
2011-02-04 19:45:46 +08:00
|
|
|
|
|
|
|
pr_debug("Executing: %s\n", command);
|
|
|
|
|
2016-06-16 02:48:08 +08:00
|
|
|
err = -1;
|
|
|
|
if (pipe(stdout_fd) < 0) {
|
|
|
|
pr_err("Failure creating the pipe to run %s\n", command);
|
|
|
|
goto out_remove_tmp;
|
|
|
|
}
|
|
|
|
|
|
|
|
pid = fork();
|
|
|
|
if (pid < 0) {
|
|
|
|
pr_err("Failure forking to run %s\n", command);
|
|
|
|
goto out_close_stdout;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (pid == 0) {
|
|
|
|
close(stdout_fd[0]);
|
|
|
|
dup2(stdout_fd[1], 1);
|
|
|
|
close(stdout_fd[1]);
|
|
|
|
execl("/bin/sh", "sh", "-c", command, NULL);
|
|
|
|
perror(command);
|
|
|
|
exit(-1);
|
|
|
|
}
|
|
|
|
|
|
|
|
close(stdout_fd[1]);
|
|
|
|
|
|
|
|
file = fdopen(stdout_fd[0], "r");
|
2015-11-06 11:06:07 +08:00
|
|
|
if (!file) {
|
2016-06-16 02:48:08 +08:00
|
|
|
pr_err("Failure creating FILE stream for %s\n", command);
|
2015-11-06 11:06:07 +08:00
|
|
|
/*
|
|
|
|
* If we were using debug info should retry with
|
|
|
|
* original binary.
|
|
|
|
*/
|
2015-03-03 01:56:12 +08:00
|
|
|
goto out_remove_tmp;
|
2015-11-06 11:06:07 +08:00
|
|
|
}
|
2011-02-04 19:45:46 +08:00
|
|
|
|
2015-11-06 11:06:07 +08:00
|
|
|
nline = 0;
|
|
|
|
while (!feof(file)) {
|
2014-11-13 10:05:26 +08:00
|
|
|
if (symbol__parse_objdump_line(sym, map, file, privsize,
|
|
|
|
&lineno) < 0)
|
2011-02-04 19:45:46 +08:00
|
|
|
break;
|
2015-11-06 11:06:07 +08:00
|
|
|
nline++;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (nline == 0)
|
|
|
|
pr_err("No output from %s\n", command);
|
2011-02-04 19:45:46 +08:00
|
|
|
|
2013-08-07 19:38:56 +08:00
|
|
|
/*
|
|
|
|
* kallsyms does not have symbol sizes so there may a nop at the end.
|
|
|
|
* Remove it.
|
|
|
|
*/
|
|
|
|
if (dso__is_kcore(dso))
|
|
|
|
delete_last_nop(sym);
|
|
|
|
|
2016-06-16 02:48:08 +08:00
|
|
|
fclose(file);
|
|
|
|
err = 0;
|
2015-03-03 01:56:12 +08:00
|
|
|
out_remove_tmp:
|
2016-06-16 02:48:08 +08:00
|
|
|
close(stdout_fd[0]);
|
|
|
|
|
2015-03-03 01:56:12 +08:00
|
|
|
if (dso__needs_decompress(dso))
|
|
|
|
unlink(symfs_filename);
|
2016-08-10 02:16:37 +08:00
|
|
|
|
2013-10-09 20:01:12 +08:00
|
|
|
if (delete_extract)
|
|
|
|
kcore_extract__delete(&kce);
|
2016-08-10 01:56:13 +08:00
|
|
|
out:
|
2011-02-04 19:45:46 +08:00
|
|
|
return err;
|
2016-06-16 02:48:08 +08:00
|
|
|
|
|
|
|
out_close_stdout:
|
|
|
|
close(stdout_fd[1]);
|
|
|
|
goto out_remove_tmp;
|
2011-02-04 19:45:46 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static void insert_source_line(struct rb_root *root, struct source_line *src_line)
|
|
|
|
{
|
|
|
|
struct source_line *iter;
|
|
|
|
struct rb_node **p = &root->rb_node;
|
|
|
|
struct rb_node *parent = NULL;
|
2013-03-05 13:53:28 +08:00
|
|
|
int i, ret;
|
2011-02-04 19:45:46 +08:00
|
|
|
|
|
|
|
while (*p != NULL) {
|
|
|
|
parent = *p;
|
|
|
|
iter = rb_entry(parent, struct source_line, node);
|
|
|
|
|
2012-11-09 13:58:49 +08:00
|
|
|
ret = strcmp(iter->path, src_line->path);
|
|
|
|
if (ret == 0) {
|
2013-03-05 13:53:28 +08:00
|
|
|
for (i = 0; i < src_line->nr_pcnt; i++)
|
2015-06-20 03:36:12 +08:00
|
|
|
iter->samples[i].percent_sum += src_line->samples[i].percent;
|
2012-11-09 13:58:49 +08:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (ret < 0)
|
|
|
|
p = &(*p)->rb_left;
|
|
|
|
else
|
|
|
|
p = &(*p)->rb_right;
|
|
|
|
}
|
|
|
|
|
2013-03-05 13:53:28 +08:00
|
|
|
for (i = 0; i < src_line->nr_pcnt; i++)
|
2015-06-20 03:36:12 +08:00
|
|
|
src_line->samples[i].percent_sum = src_line->samples[i].percent;
|
2012-11-09 13:58:49 +08:00
|
|
|
|
|
|
|
rb_link_node(&src_line->node, parent, p);
|
|
|
|
rb_insert_color(&src_line->node, root);
|
|
|
|
}
|
|
|
|
|
2013-03-05 13:53:28 +08:00
|
|
|
static int cmp_source_line(struct source_line *a, struct source_line *b)
|
|
|
|
{
|
|
|
|
int i;
|
|
|
|
|
|
|
|
for (i = 0; i < a->nr_pcnt; i++) {
|
2015-06-20 03:36:12 +08:00
|
|
|
if (a->samples[i].percent_sum == b->samples[i].percent_sum)
|
2013-03-05 13:53:28 +08:00
|
|
|
continue;
|
2015-06-20 03:36:12 +08:00
|
|
|
return a->samples[i].percent_sum > b->samples[i].percent_sum;
|
2013-03-05 13:53:28 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2012-11-09 13:58:49 +08:00
|
|
|
static void __resort_source_line(struct rb_root *root, struct source_line *src_line)
|
|
|
|
{
|
|
|
|
struct source_line *iter;
|
|
|
|
struct rb_node **p = &root->rb_node;
|
|
|
|
struct rb_node *parent = NULL;
|
|
|
|
|
|
|
|
while (*p != NULL) {
|
|
|
|
parent = *p;
|
|
|
|
iter = rb_entry(parent, struct source_line, node);
|
|
|
|
|
2013-03-05 13:53:28 +08:00
|
|
|
if (cmp_source_line(src_line, iter))
|
2011-02-04 19:45:46 +08:00
|
|
|
p = &(*p)->rb_left;
|
|
|
|
else
|
|
|
|
p = &(*p)->rb_right;
|
|
|
|
}
|
|
|
|
|
|
|
|
rb_link_node(&src_line->node, parent, p);
|
|
|
|
rb_insert_color(&src_line->node, root);
|
|
|
|
}
|
|
|
|
|
2012-11-09 13:58:49 +08:00
|
|
|
static void resort_source_line(struct rb_root *dest_root, struct rb_root *src_root)
|
|
|
|
{
|
|
|
|
struct source_line *src_line;
|
|
|
|
struct rb_node *node;
|
|
|
|
|
|
|
|
node = rb_first(src_root);
|
|
|
|
while (node) {
|
|
|
|
struct rb_node *next;
|
|
|
|
|
|
|
|
src_line = rb_entry(node, struct source_line, node);
|
|
|
|
next = rb_next(node);
|
|
|
|
rb_erase(node, src_root);
|
|
|
|
|
|
|
|
__resort_source_line(dest_root, src_line);
|
|
|
|
node = next;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2011-02-04 19:45:46 +08:00
|
|
|
static void symbol__free_source_line(struct symbol *sym, int len)
|
|
|
|
{
|
|
|
|
struct annotation *notes = symbol__annotation(sym);
|
2011-02-08 23:27:39 +08:00
|
|
|
struct source_line *src_line = notes->src->lines;
|
2013-03-05 13:53:28 +08:00
|
|
|
size_t sizeof_src_line;
|
2011-02-04 19:45:46 +08:00
|
|
|
int i;
|
|
|
|
|
2013-03-05 13:53:28 +08:00
|
|
|
sizeof_src_line = sizeof(*src_line) +
|
2015-06-20 03:36:12 +08:00
|
|
|
(sizeof(src_line->samples) * (src_line->nr_pcnt - 1));
|
2011-02-04 19:45:46 +08:00
|
|
|
|
2013-03-05 13:53:28 +08:00
|
|
|
for (i = 0; i < len; i++) {
|
2013-09-11 13:09:28 +08:00
|
|
|
free_srcline(src_line->path);
|
2013-03-05 13:53:28 +08:00
|
|
|
src_line = (void *)src_line + sizeof_src_line;
|
|
|
|
}
|
|
|
|
|
2013-12-27 04:41:15 +08:00
|
|
|
zfree(¬es->src->lines);
|
2011-02-04 19:45:46 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/* Get the filename:line for the colored entries */
|
|
|
|
static int symbol__get_source_line(struct symbol *sym, struct map *map,
|
2013-03-05 13:53:21 +08:00
|
|
|
struct perf_evsel *evsel,
|
2013-09-11 13:09:30 +08:00
|
|
|
struct rb_root *root, int len)
|
2011-02-04 19:45:46 +08:00
|
|
|
{
|
|
|
|
u64 start;
|
2013-03-05 13:53:28 +08:00
|
|
|
int i, k;
|
|
|
|
int evidx = evsel->idx;
|
2011-02-04 19:45:46 +08:00
|
|
|
struct source_line *src_line;
|
|
|
|
struct annotation *notes = symbol__annotation(sym);
|
2013-03-05 13:53:28 +08:00
|
|
|
struct sym_hist *h = annotation__histogram(notes, evidx);
|
2012-11-09 13:58:49 +08:00
|
|
|
struct rb_root tmp_root = RB_ROOT;
|
2013-03-05 13:53:28 +08:00
|
|
|
int nr_pcnt = 1;
|
|
|
|
u64 h_sum = h->sum;
|
|
|
|
size_t sizeof_src_line = sizeof(struct source_line);
|
|
|
|
|
|
|
|
if (perf_evsel__is_group_event(evsel)) {
|
|
|
|
for (i = 1; i < evsel->nr_members; i++) {
|
|
|
|
h = annotation__histogram(notes, evidx + i);
|
|
|
|
h_sum += h->sum;
|
|
|
|
}
|
|
|
|
nr_pcnt = evsel->nr_members;
|
2015-06-20 03:36:12 +08:00
|
|
|
sizeof_src_line += (nr_pcnt - 1) * sizeof(src_line->samples);
|
2013-03-05 13:53:28 +08:00
|
|
|
}
|
2011-02-04 19:45:46 +08:00
|
|
|
|
2013-03-05 13:53:28 +08:00
|
|
|
if (!h_sum)
|
2011-02-04 19:45:46 +08:00
|
|
|
return 0;
|
|
|
|
|
2013-03-05 13:53:28 +08:00
|
|
|
src_line = notes->src->lines = calloc(len, sizeof_src_line);
|
2011-02-08 23:27:39 +08:00
|
|
|
if (!notes->src->lines)
|
2011-02-04 19:45:46 +08:00
|
|
|
return -1;
|
|
|
|
|
2012-03-26 04:28:12 +08:00
|
|
|
start = map__rip_2objdump(map, sym->start);
|
2011-02-04 19:45:46 +08:00
|
|
|
|
|
|
|
for (i = 0; i < len; i++) {
|
|
|
|
u64 offset;
|
2013-03-05 13:53:28 +08:00
|
|
|
double percent_max = 0.0;
|
2011-02-04 19:45:46 +08:00
|
|
|
|
2013-03-05 13:53:28 +08:00
|
|
|
src_line->nr_pcnt = nr_pcnt;
|
|
|
|
|
|
|
|
for (k = 0; k < nr_pcnt; k++) {
|
|
|
|
h = annotation__histogram(notes, evidx + k);
|
2015-06-20 03:36:12 +08:00
|
|
|
src_line->samples[k].percent = 100.0 * h->addr[i] / h->sum;
|
2013-03-05 13:53:28 +08:00
|
|
|
|
2015-06-20 03:36:12 +08:00
|
|
|
if (src_line->samples[k].percent > percent_max)
|
|
|
|
percent_max = src_line->samples[k].percent;
|
2013-03-05 13:53:28 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
if (percent_max <= 0.5)
|
|
|
|
goto next;
|
2011-02-04 19:45:46 +08:00
|
|
|
|
|
|
|
offset = start + i;
|
2014-11-13 10:05:27 +08:00
|
|
|
src_line->path = get_srcline(map->dso, offset, NULL, false);
|
2013-03-05 13:53:28 +08:00
|
|
|
insert_source_line(&tmp_root, src_line);
|
2011-02-04 19:45:46 +08:00
|
|
|
|
2013-03-05 13:53:28 +08:00
|
|
|
next:
|
|
|
|
src_line = (void *)src_line + sizeof_src_line;
|
2011-02-04 19:45:46 +08:00
|
|
|
}
|
|
|
|
|
2012-11-09 13:58:49 +08:00
|
|
|
resort_source_line(root, &tmp_root);
|
2011-02-04 19:45:46 +08:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void print_summary(struct rb_root *root, const char *filename)
|
|
|
|
{
|
|
|
|
struct source_line *src_line;
|
|
|
|
struct rb_node *node;
|
|
|
|
|
|
|
|
printf("\nSorted summary for file %s\n", filename);
|
|
|
|
printf("----------------------------------------------\n\n");
|
|
|
|
|
|
|
|
if (RB_EMPTY_ROOT(root)) {
|
|
|
|
printf(" Nothing higher than %1.1f%%\n", MIN_GREEN);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
node = rb_first(root);
|
|
|
|
while (node) {
|
2013-03-05 13:53:28 +08:00
|
|
|
double percent, percent_max = 0.0;
|
2011-02-04 19:45:46 +08:00
|
|
|
const char *color;
|
|
|
|
char *path;
|
2013-03-05 13:53:28 +08:00
|
|
|
int i;
|
2011-02-04 19:45:46 +08:00
|
|
|
|
|
|
|
src_line = rb_entry(node, struct source_line, node);
|
2013-03-05 13:53:28 +08:00
|
|
|
for (i = 0; i < src_line->nr_pcnt; i++) {
|
2015-06-20 03:36:12 +08:00
|
|
|
percent = src_line->samples[i].percent_sum;
|
2013-03-05 13:53:28 +08:00
|
|
|
color = get_percent_color(percent);
|
|
|
|
color_fprintf(stdout, color, " %7.2f", percent);
|
|
|
|
|
|
|
|
if (percent > percent_max)
|
|
|
|
percent_max = percent;
|
|
|
|
}
|
|
|
|
|
2011-02-04 19:45:46 +08:00
|
|
|
path = src_line->path;
|
2013-03-05 13:53:28 +08:00
|
|
|
color = get_percent_color(percent_max);
|
2013-09-11 13:09:28 +08:00
|
|
|
color_fprintf(stdout, color, " %s\n", path);
|
2011-02-04 19:45:46 +08:00
|
|
|
|
|
|
|
node = rb_next(node);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2013-03-05 13:53:21 +08:00
|
|
|
static void symbol__annotate_hits(struct symbol *sym, struct perf_evsel *evsel)
|
2011-02-04 19:45:46 +08:00
|
|
|
{
|
|
|
|
struct annotation *notes = symbol__annotation(sym);
|
2013-03-05 13:53:21 +08:00
|
|
|
struct sym_hist *h = annotation__histogram(notes, evsel->idx);
|
2012-04-19 21:57:06 +08:00
|
|
|
u64 len = symbol__size(sym), offset;
|
2011-02-04 19:45:46 +08:00
|
|
|
|
|
|
|
for (offset = 0; offset < len; ++offset)
|
|
|
|
if (h->addr[offset] != 0)
|
|
|
|
printf("%*" PRIx64 ": %" PRIu64 "\n", BITS_PER_LONG / 2,
|
|
|
|
sym->start + offset, h->addr[offset]);
|
|
|
|
printf("%*s: %" PRIu64 "\n", BITS_PER_LONG / 2, "h->sum", h->sum);
|
|
|
|
}
|
|
|
|
|
2013-03-05 13:53:21 +08:00
|
|
|
int symbol__annotate_printf(struct symbol *sym, struct map *map,
|
|
|
|
struct perf_evsel *evsel, bool full_paths,
|
|
|
|
int min_pcnt, int max_lines, int context)
|
2011-02-04 19:45:46 +08:00
|
|
|
{
|
|
|
|
struct dso *dso = map->dso;
|
2012-09-08 23:06:50 +08:00
|
|
|
char *filename;
|
|
|
|
const char *d_filename;
|
2014-03-18 22:50:21 +08:00
|
|
|
const char *evsel_name = perf_evsel__name(evsel);
|
2011-02-08 23:27:39 +08:00
|
|
|
struct annotation *notes = symbol__annotation(sym);
|
2016-06-30 16:29:55 +08:00
|
|
|
struct sym_hist *h = annotation__histogram(notes, evsel->idx);
|
2012-04-16 02:24:39 +08:00
|
|
|
struct disasm_line *pos, *queue = NULL;
|
2012-04-02 23:59:01 +08:00
|
|
|
u64 start = map__rip_2objdump(map, sym->start);
|
2011-02-09 01:29:25 +08:00
|
|
|
int printed = 2, queue_len = 0;
|
2011-02-07 00:54:44 +08:00
|
|
|
int more = 0;
|
2011-02-04 19:45:46 +08:00
|
|
|
u64 len;
|
perf annotate: Add basic support to event group view
Add --group option to enable event grouping. When enabled, all the
group members information will be shown with the leader so skip
non-leader events.
It only supports --stdio output currently. Later patches will extend
additional features.
$ perf annotate --group --stdio
...
Percent | Source code & Disassembly of libpthread-2.15.so
--------------------------------------------------------------------------------
:
:
:
: Disassembly of section .text:
:
: 000000387dc0aa50 <__pthread_mutex_unlock_usercnt>:
8.08 2.40 5.29 : 387dc0aa50: mov %rdi,%rdx
0.00 0.00 0.00 : 387dc0aa53: mov 0x10(%rdi),%edi
0.00 0.00 0.00 : 387dc0aa56: mov %edi,%eax
0.00 0.80 0.00 : 387dc0aa58: and $0x7f,%eax
3.03 2.40 3.53 : 387dc0aa5b: test $0x7c,%dil
0.00 0.00 0.00 : 387dc0aa5f: jne 387dc0aaa9 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa61: test %eax,%eax
0.00 0.00 0.00 : 387dc0aa63: jne 387dc0aa85 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa65: and $0x80,%edi
0.00 0.00 0.00 : 387dc0aa6b: test %esi,%esi
3.03 5.60 7.06 : 387dc0aa6d: movl $0x0,0x8(%rdx)
0.00 0.00 0.59 : 387dc0aa74: je 387dc0aa7a <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa76: subl $0x1,0xc(%rdx)
2.02 5.60 1.18 : 387dc0aa7a: mov %edi,%esi
0.00 0.00 0.00 : 387dc0aa7c: lock decl (%rdx)
83.84 83.20 82.35 : 387dc0aa7f: jne 387dc0aada <_L_unlock_586>
0.00 0.00 0.00 : 387dc0aa81: nop
0.00 0.00 0.00 : 387dc0aa82: xor %eax,%eax
0.00 0.00 0.00 : 387dc0aa84: retq
...
Signed-off-by: Namhyung Kim <namhyung@kernel.org>
Cc: Andi Kleen <andi@firstfloor.org>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Pekka Enberg <penberg@kernel.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Link: http://lkml.kernel.org/r/1362462812-30885-6-git-send-email-namhyung@kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2013-03-05 13:53:25 +08:00
|
|
|
int width = 8;
|
2016-06-30 20:17:26 +08:00
|
|
|
int graph_dotted_len;
|
2011-02-04 19:45:46 +08:00
|
|
|
|
2012-09-08 23:06:50 +08:00
|
|
|
filename = strdup(dso->long_name);
|
|
|
|
if (!filename)
|
|
|
|
return -ENOMEM;
|
|
|
|
|
2011-02-04 19:45:46 +08:00
|
|
|
if (full_paths)
|
|
|
|
d_filename = filename;
|
|
|
|
else
|
|
|
|
d_filename = basename(filename);
|
|
|
|
|
2012-04-19 21:57:06 +08:00
|
|
|
len = symbol__size(sym);
|
perf annotate: Add basic support to event group view
Add --group option to enable event grouping. When enabled, all the
group members information will be shown with the leader so skip
non-leader events.
It only supports --stdio output currently. Later patches will extend
additional features.
$ perf annotate --group --stdio
...
Percent | Source code & Disassembly of libpthread-2.15.so
--------------------------------------------------------------------------------
:
:
:
: Disassembly of section .text:
:
: 000000387dc0aa50 <__pthread_mutex_unlock_usercnt>:
8.08 2.40 5.29 : 387dc0aa50: mov %rdi,%rdx
0.00 0.00 0.00 : 387dc0aa53: mov 0x10(%rdi),%edi
0.00 0.00 0.00 : 387dc0aa56: mov %edi,%eax
0.00 0.80 0.00 : 387dc0aa58: and $0x7f,%eax
3.03 2.40 3.53 : 387dc0aa5b: test $0x7c,%dil
0.00 0.00 0.00 : 387dc0aa5f: jne 387dc0aaa9 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa61: test %eax,%eax
0.00 0.00 0.00 : 387dc0aa63: jne 387dc0aa85 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa65: and $0x80,%edi
0.00 0.00 0.00 : 387dc0aa6b: test %esi,%esi
3.03 5.60 7.06 : 387dc0aa6d: movl $0x0,0x8(%rdx)
0.00 0.00 0.59 : 387dc0aa74: je 387dc0aa7a <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa76: subl $0x1,0xc(%rdx)
2.02 5.60 1.18 : 387dc0aa7a: mov %edi,%esi
0.00 0.00 0.00 : 387dc0aa7c: lock decl (%rdx)
83.84 83.20 82.35 : 387dc0aa7f: jne 387dc0aada <_L_unlock_586>
0.00 0.00 0.00 : 387dc0aa81: nop
0.00 0.00 0.00 : 387dc0aa82: xor %eax,%eax
0.00 0.00 0.00 : 387dc0aa84: retq
...
Signed-off-by: Namhyung Kim <namhyung@kernel.org>
Cc: Andi Kleen <andi@firstfloor.org>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Pekka Enberg <penberg@kernel.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Link: http://lkml.kernel.org/r/1362462812-30885-6-git-send-email-namhyung@kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2013-03-05 13:53:25 +08:00
|
|
|
|
2013-03-05 13:53:26 +08:00
|
|
|
if (perf_evsel__is_group_event(evsel))
|
perf annotate: Add basic support to event group view
Add --group option to enable event grouping. When enabled, all the
group members information will be shown with the leader so skip
non-leader events.
It only supports --stdio output currently. Later patches will extend
additional features.
$ perf annotate --group --stdio
...
Percent | Source code & Disassembly of libpthread-2.15.so
--------------------------------------------------------------------------------
:
:
:
: Disassembly of section .text:
:
: 000000387dc0aa50 <__pthread_mutex_unlock_usercnt>:
8.08 2.40 5.29 : 387dc0aa50: mov %rdi,%rdx
0.00 0.00 0.00 : 387dc0aa53: mov 0x10(%rdi),%edi
0.00 0.00 0.00 : 387dc0aa56: mov %edi,%eax
0.00 0.80 0.00 : 387dc0aa58: and $0x7f,%eax
3.03 2.40 3.53 : 387dc0aa5b: test $0x7c,%dil
0.00 0.00 0.00 : 387dc0aa5f: jne 387dc0aaa9 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa61: test %eax,%eax
0.00 0.00 0.00 : 387dc0aa63: jne 387dc0aa85 <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa65: and $0x80,%edi
0.00 0.00 0.00 : 387dc0aa6b: test %esi,%esi
3.03 5.60 7.06 : 387dc0aa6d: movl $0x0,0x8(%rdx)
0.00 0.00 0.59 : 387dc0aa74: je 387dc0aa7a <__pthread_mutex_unlock_use
0.00 0.00 0.00 : 387dc0aa76: subl $0x1,0xc(%rdx)
2.02 5.60 1.18 : 387dc0aa7a: mov %edi,%esi
0.00 0.00 0.00 : 387dc0aa7c: lock decl (%rdx)
83.84 83.20 82.35 : 387dc0aa7f: jne 387dc0aada <_L_unlock_586>
0.00 0.00 0.00 : 387dc0aa81: nop
0.00 0.00 0.00 : 387dc0aa82: xor %eax,%eax
0.00 0.00 0.00 : 387dc0aa84: retq
...
Signed-off-by: Namhyung Kim <namhyung@kernel.org>
Cc: Andi Kleen <andi@firstfloor.org>
Cc: Ingo Molnar <mingo@kernel.org>
Cc: Jiri Olsa <jolsa@redhat.com>
Cc: Paul Mackerras <paulus@samba.org>
Cc: Pekka Enberg <penberg@kernel.org>
Cc: Peter Zijlstra <a.p.zijlstra@chello.nl>
Link: http://lkml.kernel.org/r/1362462812-30885-6-git-send-email-namhyung@kernel.org
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
2013-03-05 13:53:25 +08:00
|
|
|
width *= evsel->nr_members;
|
2011-02-04 19:45:46 +08:00
|
|
|
|
2016-06-30 16:29:55 +08:00
|
|
|
graph_dotted_len = printf(" %-*.*s| Source code & Disassembly of %s for %s (%" PRIu64 " samples)\n",
|
|
|
|
width, width, "Percent", d_filename, evsel_name, h->sum);
|
2014-03-18 22:50:21 +08:00
|
|
|
|
2016-06-30 20:17:26 +08:00
|
|
|
printf("%-*.*s----\n",
|
2014-03-18 22:50:21 +08:00
|
|
|
graph_dotted_len, graph_dotted_len, graph_dotted_line);
|
2011-02-04 19:45:46 +08:00
|
|
|
|
|
|
|
if (verbose)
|
2013-03-05 13:53:21 +08:00
|
|
|
symbol__annotate_hits(sym, evsel);
|
2011-02-04 19:45:46 +08:00
|
|
|
|
2011-02-08 23:27:39 +08:00
|
|
|
list_for_each_entry(pos, ¬es->src->source, node) {
|
2011-02-09 01:29:25 +08:00
|
|
|
if (context && queue == NULL) {
|
|
|
|
queue = pos;
|
|
|
|
queue_len = 0;
|
|
|
|
}
|
|
|
|
|
2013-03-05 13:53:21 +08:00
|
|
|
switch (disasm_line__print(pos, sym, start, evsel, len,
|
2012-04-02 23:59:01 +08:00
|
|
|
min_pcnt, printed, max_lines,
|
|
|
|
queue)) {
|
2011-02-07 00:54:44 +08:00
|
|
|
case 0:
|
|
|
|
++printed;
|
2011-02-09 01:29:25 +08:00
|
|
|
if (context) {
|
|
|
|
printed += queue_len;
|
|
|
|
queue = NULL;
|
|
|
|
queue_len = 0;
|
|
|
|
}
|
2011-02-07 00:54:44 +08:00
|
|
|
break;
|
|
|
|
case 1:
|
|
|
|
/* filtered by max_lines */
|
|
|
|
++more;
|
2011-02-06 01:37:31 +08:00
|
|
|
break;
|
2011-02-07 00:54:44 +08:00
|
|
|
case -1:
|
|
|
|
default:
|
2011-02-09 01:29:25 +08:00
|
|
|
/*
|
|
|
|
* Filtered by min_pcnt or non IP lines when
|
|
|
|
* context != 0
|
|
|
|
*/
|
|
|
|
if (!context)
|
|
|
|
break;
|
|
|
|
if (queue_len == context)
|
|
|
|
queue = list_entry(queue->node.next, typeof(*queue), node);
|
|
|
|
else
|
|
|
|
++queue_len;
|
2011-02-07 00:54:44 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2012-09-08 23:06:50 +08:00
|
|
|
free(filename);
|
|
|
|
|
2011-02-07 00:54:44 +08:00
|
|
|
return more;
|
|
|
|
}
|
2011-02-06 04:51:38 +08:00
|
|
|
|
2011-02-07 00:54:44 +08:00
|
|
|
void symbol__annotate_zero_histogram(struct symbol *sym, int evidx)
|
|
|
|
{
|
|
|
|
struct annotation *notes = symbol__annotation(sym);
|
|
|
|
struct sym_hist *h = annotation__histogram(notes, evidx);
|
|
|
|
|
2011-02-08 23:27:39 +08:00
|
|
|
memset(h, 0, notes->src->sizeof_sym_hist);
|
2011-02-07 00:54:44 +08:00
|
|
|
}
|
|
|
|
|
2011-02-08 23:27:39 +08:00
|
|
|
void symbol__annotate_decay_histogram(struct symbol *sym, int evidx)
|
2011-02-07 00:54:44 +08:00
|
|
|
{
|
|
|
|
struct annotation *notes = symbol__annotation(sym);
|
|
|
|
struct sym_hist *h = annotation__histogram(notes, evidx);
|
2012-04-19 21:57:06 +08:00
|
|
|
int len = symbol__size(sym), offset;
|
2011-02-07 00:54:44 +08:00
|
|
|
|
|
|
|
h->sum = 0;
|
2012-04-06 03:15:59 +08:00
|
|
|
for (offset = 0; offset < len; ++offset) {
|
|
|
|
h->addr[offset] = h->addr[offset] * 7 / 8;
|
|
|
|
h->sum += h->addr[offset];
|
2011-02-06 04:51:38 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2012-04-16 02:24:39 +08:00
|
|
|
void disasm__purge(struct list_head *head)
|
2011-02-06 04:51:38 +08:00
|
|
|
{
|
2012-04-16 02:24:39 +08:00
|
|
|
struct disasm_line *pos, *n;
|
2011-02-06 04:51:38 +08:00
|
|
|
|
|
|
|
list_for_each_entry_safe(pos, n, head, node) {
|
|
|
|
list_del(&pos->node);
|
2012-04-16 02:24:39 +08:00
|
|
|
disasm_line__free(pos);
|
2011-02-06 04:51:38 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2012-04-16 02:52:18 +08:00
|
|
|
static size_t disasm_line__fprintf(struct disasm_line *dl, FILE *fp)
|
|
|
|
{
|
|
|
|
size_t printed;
|
|
|
|
|
|
|
|
if (dl->offset == -1)
|
|
|
|
return fprintf(fp, "%s\n", dl->line);
|
|
|
|
|
|
|
|
printed = fprintf(fp, "%#" PRIx64 " %s", dl->offset, dl->name);
|
|
|
|
|
2012-04-21 01:38:46 +08:00
|
|
|
if (dl->ops.raw[0] != '\0') {
|
2012-04-16 02:52:18 +08:00
|
|
|
printed += fprintf(fp, "%.*s %s\n", 6 - (int)printed, " ",
|
2012-04-21 01:38:46 +08:00
|
|
|
dl->ops.raw);
|
2012-04-16 02:52:18 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
return printed + fprintf(fp, "\n");
|
|
|
|
}
|
|
|
|
|
|
|
|
size_t disasm__fprintf(struct list_head *head, FILE *fp)
|
|
|
|
{
|
|
|
|
struct disasm_line *pos;
|
|
|
|
size_t printed = 0;
|
|
|
|
|
|
|
|
list_for_each_entry(pos, head, node)
|
|
|
|
printed += disasm_line__fprintf(pos, fp);
|
|
|
|
|
|
|
|
return printed;
|
|
|
|
}
|
|
|
|
|
2013-03-05 13:53:21 +08:00
|
|
|
int symbol__tty_annotate(struct symbol *sym, struct map *map,
|
|
|
|
struct perf_evsel *evsel, bool print_lines,
|
|
|
|
bool full_paths, int min_pcnt, int max_lines)
|
2011-02-06 04:51:38 +08:00
|
|
|
{
|
|
|
|
struct dso *dso = map->dso;
|
|
|
|
struct rb_root source_line = RB_ROOT;
|
|
|
|
u64 len;
|
|
|
|
|
2016-07-30 03:44:56 +08:00
|
|
|
if (symbol__disassemble(sym, map, 0) < 0)
|
2011-02-06 04:51:38 +08:00
|
|
|
return -1;
|
|
|
|
|
2012-04-19 21:57:06 +08:00
|
|
|
len = symbol__size(sym);
|
2011-02-06 04:51:38 +08:00
|
|
|
|
|
|
|
if (print_lines) {
|
2015-11-09 23:33:31 +08:00
|
|
|
srcline_full_filename = full_paths;
|
2013-09-11 13:09:30 +08:00
|
|
|
symbol__get_source_line(sym, map, evsel, &source_line, len);
|
|
|
|
print_summary(&source_line, dso->long_name);
|
2011-02-04 19:45:46 +08:00
|
|
|
}
|
|
|
|
|
2013-03-05 13:53:21 +08:00
|
|
|
symbol__annotate_printf(sym, map, evsel, full_paths,
|
2011-02-09 01:29:25 +08:00
|
|
|
min_pcnt, max_lines, 0);
|
2011-02-04 19:45:46 +08:00
|
|
|
if (print_lines)
|
|
|
|
symbol__free_source_line(sym, len);
|
|
|
|
|
2012-04-16 02:24:39 +08:00
|
|
|
disasm__purge(&symbol__annotation(sym)->src->source);
|
2011-02-06 04:51:38 +08:00
|
|
|
|
2011-02-04 19:45:46 +08:00
|
|
|
return 0;
|
|
|
|
}
|
2013-12-19 04:10:15 +08:00
|
|
|
|
2014-02-20 09:32:53 +08:00
|
|
|
bool ui__has_annotation(void)
|
|
|
|
{
|
2016-05-03 19:54:44 +08:00
|
|
|
return use_browser == 1 && perf_hpp_list.sym;
|
2014-02-20 09:32:53 +08:00
|
|
|
}
|