]> git.kernelconcepts.de Git - karo-tx-linux.git/blob - tools/perf/util/annotate.c
Merge tag 'renesas-fixes-for-v4.12' of https://git.kernel.org/pub/scm/linux/kernel...
[karo-tx-linux.git] / tools / perf / util / annotate.c
1 /*
2  * Copyright (C) 2011, Red Hat Inc, Arnaldo Carvalho de Melo <acme@redhat.com>
3  *
4  * Parts came from builtin-annotate.c, see those files for further
5  * copyright notes.
6  *
7  * Released under the GPL v2. (and only v2, not any later version)
8  */
9
10 #include <errno.h>
11 #include <inttypes.h>
12 #include "util.h"
13 #include "ui/ui.h"
14 #include "sort.h"
15 #include "build-id.h"
16 #include "color.h"
17 #include "cache.h"
18 #include "symbol.h"
19 #include "debug.h"
20 #include "annotate.h"
21 #include "evsel.h"
22 #include "block-range.h"
23 #include "string2.h"
24 #include "arch/common.h"
25 #include <regex.h>
26 #include <pthread.h>
27 #include <linux/bitops.h>
28 #include <linux/kernel.h>
29 #include <sys/utsname.h>
30
31 #include "sane_ctype.h"
32
/* Disassembler syntax selection; not assigned in this part of the file -- presumably forwarded to objdump, TODO confirm. */
const char      *disassembler_style;
/* Path of the objdump binary; not assigned in this part of the file -- presumably a user override, TODO confirm. */
const char      *objdump_path;
/* Compiled regular expression; the name suggests it matches "file:line" output -- verify at the regcomp() site. */
static regex_t   file_lineno;

/* Forward declarations: these helpers are used before their definitions further down. */
static struct ins_ops *ins__find(struct arch *arch, const char *name);
static void ins__sort(struct arch *arch);
static int disasm_line__parse(char *line, const char **namep, char **rawp);
40
/* Per-architecture description used while parsing disassembler output. */
struct arch {
        /* lookup key compared by arch__key_cmp()/arch__cmp() */
        const char      *name;
        /* mnemonic -> ins_ops table, sorted by ins__sort() and searched by __ins__find() */
        struct ins      *instructions;
        /* number of entries currently used in the table */
        size_t          nr_instructions;
        /* heap capacity of the table; 0 while the table has not been heap-allocated */
        size_t          nr_instructions_allocated;
        /* optional fallback called by ins__find() when the table has no entry for a mnemonic */
        struct ins_ops  *(*associate_instruction_ops)(struct arch *arch, const char *name);
        /* set by __ins__find() once it has sorted the table */
        bool            sorted_instructions;
        /* not used in this part of the file -- presumably records that init() already ran; TODO confirm */
        bool            initialized;
        /* not used in this part of the file -- presumably arch-private data; TODO confirm */
        void            *priv;
        /* optional setup hook; its call site is not in this part of the file */
        int             (*init)(struct arch *arch);
        struct          {
                /* character searched for by mov__parse()/dec__parse() to find a trailing comment */
                char comment_char;
                /* when non-zero, call__parse() rejects call targets whose name contains it */
                char skip_functions_char;
        } objdump;
};
56
/*
 * Tentative definitions of the per-instruction-class operation tables.
 * call_ops, jump_ops, mov_ops, dec_ops, nop_ops, lock_ops and ret_ops are
 * all initialized further down in this file; they are declared here so code
 * that appears earlier (e.g. the arch instruction tables included below) can
 * take their addresses.
 */
static struct ins_ops call_ops;
static struct ins_ops dec_ops;
static struct ins_ops jump_ops;
static struct ins_ops mov_ops;
static struct ins_ops nop_ops;
static struct ins_ops lock_ops;
static struct ins_ops ret_ops;
64
65 static int arch__grow_instructions(struct arch *arch)
66 {
67         struct ins *new_instructions;
68         size_t new_nr_allocated;
69
70         if (arch->nr_instructions_allocated == 0 && arch->instructions)
71                 goto grow_from_non_allocated_table;
72
73         new_nr_allocated = arch->nr_instructions_allocated + 128;
74         new_instructions = realloc(arch->instructions, new_nr_allocated * sizeof(struct ins));
75         if (new_instructions == NULL)
76                 return -1;
77
78 out_update_instructions:
79         arch->instructions = new_instructions;
80         arch->nr_instructions_allocated = new_nr_allocated;
81         return 0;
82
83 grow_from_non_allocated_table:
84         new_nr_allocated = arch->nr_instructions + 128;
85         new_instructions = calloc(new_nr_allocated, sizeof(struct ins));
86         if (new_instructions == NULL)
87                 return -1;
88
89         memcpy(new_instructions, arch->instructions, arch->nr_instructions);
90         goto out_update_instructions;
91 }
92
93 static int arch__associate_ins_ops(struct arch* arch, const char *name, struct ins_ops *ops)
94 {
95         struct ins *ins;
96
97         if (arch->nr_instructions == arch->nr_instructions_allocated &&
98             arch__grow_instructions(arch))
99                 return -1;
100
101         ins = &arch->instructions[arch->nr_instructions];
102         ins->name = strdup(name);
103         if (!ins->name)
104                 return -1;
105
106         ins->ops  = ops;
107         arch->nr_instructions++;
108
109         ins__sort(arch);
110         return 0;
111 }
112
113 #include "arch/arm/annotate/instructions.c"
114 #include "arch/arm64/annotate/instructions.c"
115 #include "arch/x86/annotate/instructions.c"
116 #include "arch/powerpc/annotate/instructions.c"
117 #include "arch/s390/annotate/instructions.c"
118
/*
 * Table of supported architectures.  arch__find() sorts it by name on first
 * use and then looks entries up with bsearch(), so the order here does not
 * matter.  Only x86 provides a static instruction table; the other entries
 * provide an init hook instead.
 */
static struct arch architectures[] = {
        {
                .name = "arm",
                .init = arm__annotate_init,
        },
        {
                .name = "arm64",
                .init = arm64__annotate_init,
        },
        {
                .name = "x86",
                .instructions = x86__instructions,
                .nr_instructions = ARRAY_SIZE(x86__instructions),
                .objdump =  {
                        .comment_char = '#',
                },
        },
        {
                .name = "powerpc",
                .init = powerpc__annotate_init,
        },
        {
                .name = "s390",
                .init = s390__annotate_init,
                .objdump =  {
                        .comment_char = '#',
                },
        },
};
148
149 static void ins__delete(struct ins_operands *ops)
150 {
151         if (ops == NULL)
152                 return;
153         zfree(&ops->source.raw);
154         zfree(&ops->source.name);
155         zfree(&ops->target.raw);
156         zfree(&ops->target.name);
157 }
158
159 static int ins__raw_scnprintf(struct ins *ins, char *bf, size_t size,
160                               struct ins_operands *ops)
161 {
162         return scnprintf(bf, size, "%-6.6s %s", ins->name, ops->raw);
163 }
164
165 int ins__scnprintf(struct ins *ins, char *bf, size_t size,
166                   struct ins_operands *ops)
167 {
168         if (ins->ops->scnprintf)
169                 return ins->ops->scnprintf(ins, bf, size, ops);
170
171         return ins__raw_scnprintf(ins, bf, size, ops);
172 }
173
174 static int call__parse(struct arch *arch, struct ins_operands *ops, struct map *map)
175 {
176         char *endptr, *tok, *name;
177
178         ops->target.addr = strtoull(ops->raw, &endptr, 16);
179
180         name = strchr(endptr, '<');
181         if (name == NULL)
182                 goto indirect_call;
183
184         name++;
185
186         if (arch->objdump.skip_functions_char &&
187             strchr(name, arch->objdump.skip_functions_char))
188                 return -1;
189
190         tok = strchr(name, '>');
191         if (tok == NULL)
192                 return -1;
193
194         *tok = '\0';
195         ops->target.name = strdup(name);
196         *tok = '>';
197
198         return ops->target.name == NULL ? -1 : 0;
199
200 indirect_call:
201         tok = strchr(endptr, '*');
202         if (tok == NULL) {
203                 struct symbol *sym = map__find_symbol(map, map->map_ip(map, ops->target.addr));
204                 if (sym != NULL)
205                         ops->target.name = strdup(sym->name);
206                 else
207                         ops->target.addr = 0;
208                 return 0;
209         }
210
211         ops->target.addr = strtoull(tok + 1, NULL, 16);
212         return 0;
213 }
214
215 static int call__scnprintf(struct ins *ins, char *bf, size_t size,
216                            struct ins_operands *ops)
217 {
218         if (ops->target.name)
219                 return scnprintf(bf, size, "%-6.6s %s", ins->name, ops->target.name);
220
221         if (ops->target.addr == 0)
222                 return ins__raw_scnprintf(ins, bf, size, ops);
223
224         return scnprintf(bf, size, "%-6.6s *%" PRIx64, ins->name, ops->target.addr);
225 }
226
/* Operations for call instructions; ins__is_call() identifies them by this table's address. */
static struct ins_ops call_ops = {
        .parse     = call__parse,
        .scnprintf = call__scnprintf,
};
231
232 bool ins__is_call(const struct ins *ins)
233 {
234         return ins->ops == &call_ops;
235 }
236
237 static int jump__parse(struct arch *arch __maybe_unused, struct ins_operands *ops, struct map *map __maybe_unused)
238 {
239         const char *s = strchr(ops->raw, '+');
240         const char *c = strchr(ops->raw, ',');
241
242         if (c++ != NULL)
243                 ops->target.addr = strtoull(c, NULL, 16);
244         else
245                 ops->target.addr = strtoull(ops->raw, NULL, 16);
246
247         if (s++ != NULL) {
248                 ops->target.offset = strtoull(s, NULL, 16);
249                 ops->target.offset_avail = true;
250         } else {
251                 ops->target.offset_avail = false;
252         }
253
254         return 0;
255 }
256
257 static int jump__scnprintf(struct ins *ins, char *bf, size_t size,
258                            struct ins_operands *ops)
259 {
260         if (!ops->target.addr || ops->target.offset < 0)
261                 return ins__raw_scnprintf(ins, bf, size, ops);
262
263         return scnprintf(bf, size, "%-6.6s %" PRIx64, ins->name, ops->target.offset);
264 }
265
/* Operations for jump instructions; ins__is_jump() identifies them by this table's address. */
static struct ins_ops jump_ops = {
        .parse     = jump__parse,
        .scnprintf = jump__scnprintf,
};
270
271 bool ins__is_jump(const struct ins *ins)
272 {
273         return ins->ops == &jump_ops;
274 }
275
276 static int comment__symbol(char *raw, char *comment, u64 *addrp, char **namep)
277 {
278         char *endptr, *name, *t;
279
280         if (strstr(raw, "(%rip)") == NULL)
281                 return 0;
282
283         *addrp = strtoull(comment, &endptr, 16);
284         name = strchr(endptr, '<');
285         if (name == NULL)
286                 return -1;
287
288         name++;
289
290         t = strchr(name, '>');
291         if (t == NULL)
292                 return 0;
293
294         *t = '\0';
295         *namep = strdup(name);
296         *t = '>';
297
298         return 0;
299 }
300
301 static int lock__parse(struct arch *arch, struct ins_operands *ops, struct map *map)
302 {
303         ops->locked.ops = zalloc(sizeof(*ops->locked.ops));
304         if (ops->locked.ops == NULL)
305                 return 0;
306
307         if (disasm_line__parse(ops->raw, &ops->locked.ins.name, &ops->locked.ops->raw) < 0)
308                 goto out_free_ops;
309
310         ops->locked.ins.ops = ins__find(arch, ops->locked.ins.name);
311
312         if (ops->locked.ins.ops == NULL)
313                 goto out_free_ops;
314
315         if (ops->locked.ins.ops->parse &&
316             ops->locked.ins.ops->parse(arch, ops->locked.ops, map) < 0)
317                 goto out_free_ops;
318
319         return 0;
320
321 out_free_ops:
322         zfree(&ops->locked.ops);
323         return 0;
324 }
325
326 static int lock__scnprintf(struct ins *ins, char *bf, size_t size,
327                            struct ins_operands *ops)
328 {
329         int printed;
330
331         if (ops->locked.ins.ops == NULL)
332                 return ins__raw_scnprintf(ins, bf, size, ops);
333
334         printed = scnprintf(bf, size, "%-6.6s ", ins->name);
335         return printed + ins__scnprintf(&ops->locked.ins, bf + printed,
336                                         size - printed, ops->locked.ops);
337 }
338
339 static void lock__delete(struct ins_operands *ops)
340 {
341         struct ins *ins = &ops->locked.ins;
342
343         if (ins->ops && ins->ops->free)
344                 ins->ops->free(ops->locked.ops);
345         else
346                 ins__delete(ops->locked.ops);
347
348         zfree(&ops->locked.ops);
349         zfree(&ops->target.raw);
350         zfree(&ops->target.name);
351 }
352
/* Operations for lock-prefixed instructions; the only table in this part of the file with a free callback. */
static struct ins_ops lock_ops = {
        .free      = lock__delete,
        .parse     = lock__parse,
        .scnprintf = lock__scnprintf,
};
358
/*
 * Parse a two-operand "source,target" instruction.
 *
 * The text before the first ',' is duplicated into ops->source.raw.  The
 * text after it, up to the arch's comment character (or the end of the
 * string) with trailing whitespace removed, is duplicated into
 * ops->target.raw.  When a comment is present it is passed to
 * comment__symbol() for both operands to resolve "(%rip)" references.
 *
 * ops->raw is patched with temporary NUL bytes while duplicating and is
 * restored before returning.
 *
 * Returns 0 on success, -1 when there is no ',' or a strdup() fails (in which
 * case nothing stays allocated).
 */
static int mov__parse(struct arch *arch, struct ins_operands *ops, struct map *map __maybe_unused)
{
        char *s = strchr(ops->raw, ','), *target, *comment, prev;

        if (s == NULL)
                return -1;

        /* cut at the comma just long enough to copy the source operand */
        *s = '\0';
        ops->source.raw = strdup(ops->raw);
        *s = ',';

        if (ops->source.raw == NULL)
                return -1;

        target = ++s;
        comment = strchr(s, arch->objdump.comment_char);

        /* s = last character of the target operand, before trimming */
        if (comment != NULL)
                s = comment - 1;
        else
                s = strchr(s, '\0') - 1;

        /* drop trailing whitespace, then step to one past the operand's end */
        while (s > target && isspace(s[0]))
                --s;
        s++;
        prev = *s;
        *s = '\0';

        ops->target.raw = strdup(target);
        *s = prev;

        if (ops->target.raw == NULL)
                goto out_free_source;

        if (comment == NULL)
                return 0;

        /* the results of comment__symbol() are deliberately ignored: names are optional */
        comment = ltrim(comment);
        comment__symbol(ops->source.raw, comment, &ops->source.addr, &ops->source.name);
        comment__symbol(ops->target.raw, comment, &ops->target.addr, &ops->target.name);

        return 0;

out_free_source:
        zfree(&ops->source.raw);
        return -1;
}
406
407 static int mov__scnprintf(struct ins *ins, char *bf, size_t size,
408                            struct ins_operands *ops)
409 {
410         return scnprintf(bf, size, "%-6.6s %s,%s", ins->name,
411                          ops->source.name ?: ops->source.raw,
412                          ops->target.name ?: ops->target.raw);
413 }
414
/* Operations for instructions parsed as "source,target" operand pairs. */
static struct ins_ops mov_ops = {
        .parse     = mov__parse,
        .scnprintf = mov__scnprintf,
};
419
420 static int dec__parse(struct arch *arch __maybe_unused, struct ins_operands *ops, struct map *map __maybe_unused)
421 {
422         char *target, *comment, *s, prev;
423
424         target = s = ops->raw;
425
426         while (s[0] != '\0' && !isspace(s[0]))
427                 ++s;
428         prev = *s;
429         *s = '\0';
430
431         ops->target.raw = strdup(target);
432         *s = prev;
433
434         if (ops->target.raw == NULL)
435                 return -1;
436
437         comment = strchr(s, arch->objdump.comment_char);
438         if (comment == NULL)
439                 return 0;
440
441         comment = ltrim(comment);
442         comment__symbol(ops->target.raw, comment, &ops->target.addr, &ops->target.name);
443
444         return 0;
445 }
446
447 static int dec__scnprintf(struct ins *ins, char *bf, size_t size,
448                            struct ins_operands *ops)
449 {
450         return scnprintf(bf, size, "%-6.6s %s", ins->name,
451                          ops->target.name ?: ops->target.raw);
452 }
453
/* Operations for instructions parsed as a single target operand. */
static struct ins_ops dec_ops = {
        .parse     = dec__parse,
        .scnprintf = dec__scnprintf,
};
458
459 static int nop__scnprintf(struct ins *ins __maybe_unused, char *bf, size_t size,
460                           struct ins_operands *ops __maybe_unused)
461 {
462         return scnprintf(bf, size, "%-6.6s", "nop");
463 }
464
/* Operations for nop-class instructions: no parsing, fixed "nop" output. */
static struct ins_ops nop_ops = {
        .scnprintf = nop__scnprintf,
};

/* Operations for return instructions: raw output; ins__is_ret() identifies them by this table's address. */
static struct ins_ops ret_ops = {
        .scnprintf = ins__raw_scnprintf,
};
472
473 bool ins__is_ret(const struct ins *ins)
474 {
475         return ins->ops == &ret_ops;
476 }
477
478 static int ins__key_cmp(const void *name, const void *insp)
479 {
480         const struct ins *ins = insp;
481
482         return strcmp(name, ins->name);
483 }
484
485 static int ins__cmp(const void *a, const void *b)
486 {
487         const struct ins *ia = a;
488         const struct ins *ib = b;
489
490         return strcmp(ia->name, ib->name);
491 }
492
493 static void ins__sort(struct arch *arch)
494 {
495         const int nmemb = arch->nr_instructions;
496
497         qsort(arch->instructions, nmemb, sizeof(struct ins), ins__cmp);
498 }
499
500 static struct ins_ops *__ins__find(struct arch *arch, const char *name)
501 {
502         struct ins *ins;
503         const int nmemb = arch->nr_instructions;
504
505         if (!arch->sorted_instructions) {
506                 ins__sort(arch);
507                 arch->sorted_instructions = true;
508         }
509
510         ins = bsearch(name, arch->instructions, nmemb, sizeof(struct ins), ins__key_cmp);
511         return ins ? ins->ops : NULL;
512 }
513
514 static struct ins_ops *ins__find(struct arch *arch, const char *name)
515 {
516         struct ins_ops *ops = __ins__find(arch, name);
517
518         if (!ops && arch->associate_instruction_ops)
519                 ops = arch->associate_instruction_ops(arch, name);
520
521         return ops;
522 }
523
524 static int arch__key_cmp(const void *name, const void *archp)
525 {
526         const struct arch *arch = archp;
527
528         return strcmp(name, arch->name);
529 }
530
531 static int arch__cmp(const void *a, const void *b)
532 {
533         const struct arch *aa = a;
534         const struct arch *ab = b;
535
536         return strcmp(aa->name, ab->name);
537 }
538
539 static void arch__sort(void)
540 {
541         const int nmemb = ARRAY_SIZE(architectures);
542
543         qsort(architectures, nmemb, sizeof(struct arch), arch__cmp);
544 }
545
546 static struct arch *arch__find(const char *name)
547 {
548         const int nmemb = ARRAY_SIZE(architectures);
549         static bool sorted;
550
551         if (!sorted) {
552                 arch__sort();
553                 sorted = true;
554         }
555
556         return bsearch(name, architectures, nmemb, sizeof(struct arch), arch__key_cmp);
557 }
558
559 int symbol__alloc_hist(struct symbol *sym)
560 {
561         struct annotation *notes = symbol__annotation(sym);
562         const size_t size = symbol__size(sym);
563         size_t sizeof_sym_hist;
564
565         /* Check for overflow when calculating sizeof_sym_hist */
566         if (size > (SIZE_MAX - sizeof(struct sym_hist)) / sizeof(u64))
567                 return -1;
568
569         sizeof_sym_hist = (sizeof(struct sym_hist) + size * sizeof(u64));
570
571         /* Check for overflow in zalloc argument */
572         if (sizeof_sym_hist > (SIZE_MAX - sizeof(*notes->src))
573                                 / symbol_conf.nr_events)
574                 return -1;
575
576         notes->src = zalloc(sizeof(*notes->src) + symbol_conf.nr_events * sizeof_sym_hist);
577         if (notes->src == NULL)
578                 return -1;
579         notes->src->sizeof_sym_hist = sizeof_sym_hist;
580         notes->src->nr_histograms   = symbol_conf.nr_events;
581         INIT_LIST_HEAD(&notes->src->source);
582         return 0;
583 }
584
585 /* The cycles histogram is lazily allocated. */
586 static int symbol__alloc_hist_cycles(struct symbol *sym)
587 {
588         struct annotation *notes = symbol__annotation(sym);
589         const size_t size = symbol__size(sym);
590
591         notes->src->cycles_hist = calloc(size, sizeof(struct cyc_hist));
592         if (notes->src->cycles_hist == NULL)
593                 return -1;
594         return 0;
595 }
596
597 void symbol__annotate_zero_histograms(struct symbol *sym)
598 {
599         struct annotation *notes = symbol__annotation(sym);
600
601         pthread_mutex_lock(&notes->lock);
602         if (notes->src != NULL) {
603                 memset(notes->src->histograms, 0,
604                        notes->src->nr_histograms * notes->src->sizeof_sym_hist);
605                 if (notes->src->cycles_hist)
606                         memset(notes->src->cycles_hist, 0,
607                                 symbol__size(sym) * sizeof(struct cyc_hist));
608         }
609         pthread_mutex_unlock(&notes->lock);
610 }
611
612 static int __symbol__account_cycles(struct annotation *notes,
613                                     u64 start,
614                                     unsigned offset, unsigned cycles,
615                                     unsigned have_start)
616 {
617         struct cyc_hist *ch;
618
619         ch = notes->src->cycles_hist;
620         /*
621          * For now we can only account one basic block per
622          * final jump. But multiple could be overlapping.
623          * Always account the longest one. So when
624          * a shorter one has been already seen throw it away.
625          *
626          * We separately always account the full cycles.
627          */
628         ch[offset].num_aggr++;
629         ch[offset].cycles_aggr += cycles;
630
631         if (!have_start && ch[offset].have_start)
632                 return 0;
633         if (ch[offset].num) {
634                 if (have_start && (!ch[offset].have_start ||
635                                    ch[offset].start > start)) {
636                         ch[offset].have_start = 0;
637                         ch[offset].cycles = 0;
638                         ch[offset].num = 0;
639                         if (ch[offset].reset < 0xffff)
640                                 ch[offset].reset++;
641                 } else if (have_start &&
642                            ch[offset].start < start)
643                         return 0;
644         }
645         ch[offset].have_start = have_start;
646         ch[offset].start = start;
647         ch[offset].cycles += cycles;
648         ch[offset].num++;
649         return 0;
650 }
651
652 static int __symbol__inc_addr_samples(struct symbol *sym, struct map *map,
653                                       struct annotation *notes, int evidx, u64 addr)
654 {
655         unsigned offset;
656         struct sym_hist *h;
657
658         pr_debug3("%s: addr=%#" PRIx64 "\n", __func__, map->unmap_ip(map, addr));
659
660         if ((addr < sym->start || addr >= sym->end) &&
661             (addr != sym->end || sym->start != sym->end)) {
662                 pr_debug("%s(%d): ERANGE! sym->name=%s, start=%#" PRIx64 ", addr=%#" PRIx64 ", end=%#" PRIx64 "\n",
663                        __func__, __LINE__, sym->name, sym->start, addr, sym->end);
664                 return -ERANGE;
665         }
666
667         offset = addr - sym->start;
668         h = annotation__histogram(notes, evidx);
669         h->sum++;
670         h->addr[offset]++;
671
672         pr_debug3("%#" PRIx64 " %s: period++ [addr: %#" PRIx64 ", %#" PRIx64
673                   ", evidx=%d] => %" PRIu64 "\n", sym->start, sym->name,
674                   addr, addr - sym->start, evidx, h->addr[offset]);
675         return 0;
676 }
677
678 static struct annotation *symbol__get_annotation(struct symbol *sym, bool cycles)
679 {
680         struct annotation *notes = symbol__annotation(sym);
681
682         if (notes->src == NULL) {
683                 if (symbol__alloc_hist(sym) < 0)
684                         return NULL;
685         }
686         if (!notes->src->cycles_hist && cycles) {
687                 if (symbol__alloc_hist_cycles(sym) < 0)
688                         return NULL;
689         }
690         return notes;
691 }
692
693 static int symbol__inc_addr_samples(struct symbol *sym, struct map *map,
694                                     int evidx, u64 addr)
695 {
696         struct annotation *notes;
697
698         if (sym == NULL)
699                 return 0;
700         notes = symbol__get_annotation(sym, false);
701         if (notes == NULL)
702                 return -ENOMEM;
703         return __symbol__inc_addr_samples(sym, map, notes, evidx, addr);
704 }
705
706 static int symbol__account_cycles(u64 addr, u64 start,
707                                   struct symbol *sym, unsigned cycles)
708 {
709         struct annotation *notes;
710         unsigned offset;
711
712         if (sym == NULL)
713                 return 0;
714         notes = symbol__get_annotation(sym, true);
715         if (notes == NULL)
716                 return -ENOMEM;
717         if (addr < sym->start || addr >= sym->end)
718                 return -ERANGE;
719
720         if (start) {
721                 if (start < sym->start || start >= sym->end)
722                         return -ERANGE;
723                 if (start >= addr)
724                         start = 0;
725         }
726         offset = addr - sym->start;
727         return __symbol__account_cycles(notes,
728                                         start ? start - sym->start : 0,
729                                         offset, cycles,
730                                         !!start);
731 }
732
733 int addr_map_symbol__account_cycles(struct addr_map_symbol *ams,
734                                     struct addr_map_symbol *start,
735                                     unsigned cycles)
736 {
737         u64 saddr = 0;
738         int err;
739
740         if (!cycles)
741                 return 0;
742
743         /*
744          * Only set start when IPC can be computed. We can only
745          * compute it when the basic block is completely in a single
746          * function.
747          * Special case the case when the jump is elsewhere, but
748          * it starts on the function start.
749          */
750         if (start &&
751                 (start->sym == ams->sym ||
752                  (ams->sym &&
753                    start->addr == ams->sym->start + ams->map->start)))
754                 saddr = start->al_addr;
755         if (saddr == 0)
756                 pr_debug2("BB with bad start: addr %"PRIx64" start %"PRIx64" sym %"PRIx64" saddr %"PRIx64"\n",
757                         ams->addr,
758                         start ? start->addr : 0,
759                         ams->sym ? ams->sym->start + ams->map->start : 0,
760                         saddr);
761         err = symbol__account_cycles(ams->al_addr, saddr, ams->sym, cycles);
762         if (err)
763                 pr_debug2("account_cycles failed %d\n", err);
764         return err;
765 }
766
767 int addr_map_symbol__inc_samples(struct addr_map_symbol *ams, int evidx)
768 {
769         return symbol__inc_addr_samples(ams->sym, ams->map, evidx, ams->al_addr);
770 }
771
772 int hist_entry__inc_addr_samples(struct hist_entry *he, int evidx, u64 ip)
773 {
774         return symbol__inc_addr_samples(he->ms.sym, he->ms.map, evidx, ip);
775 }
776
777 static void disasm_line__init_ins(struct disasm_line *dl, struct arch *arch, struct map *map)
778 {
779         dl->ins.ops = ins__find(arch, dl->ins.name);
780
781         if (!dl->ins.ops)
782                 return;
783
784         if (dl->ins.ops->parse && dl->ins.ops->parse(arch, &dl->ops, map) < 0)
785                 dl->ins.ops = NULL;
786 }
787
/*
 * Split a disassembly line into mnemonic and operand text.
 *
 * @line:  the text to split; it is patched with a temporary NUL while the
 *         mnemonic is copied and is always restored before returning
 * @namep: receives a strdup()ed copy of the first whitespace-delimited word
 *         (the caller owns it); set to NULL when the copy fails
 * @rawp:  receives a pointer INTO @line, at the first non-blank character
 *         after the mnemonic
 *
 * Returns 0 on success, -1 when the line is blank or strdup() fails.
 */
static int disasm_line__parse(char *line, const char **namep, char **rawp)
{
        char tmp, *name = ltrim(line);

        if (name[0] == '\0')
                return -1;

        *rawp = name + 1;

        while ((*rawp)[0] != '\0' && !isspace((*rawp)[0]))
                ++*rawp;

        tmp = (*rawp)[0];
        (*rawp)[0] = '\0';
        *namep = strdup(name);
        /* undo the temporary terminator on every path, including failure */
        (*rawp)[0] = tmp;

        /*
         * Nothing to free here: *namep is NULL.  (Freeing namep itself, the
         * address of the caller's variable, would be an invalid free.)
         */
        if (*namep == NULL)
                return -1;

        *rawp = ltrim(*rawp);

        return 0;
}
817
818 static struct disasm_line *disasm_line__new(s64 offset, char *line,
819                                             size_t privsize, int line_nr,
820                                             struct arch *arch,
821                                             struct map *map)
822 {
823         struct disasm_line *dl = zalloc(sizeof(*dl) + privsize);
824
825         if (dl != NULL) {
826                 dl->offset = offset;
827                 dl->line = strdup(line);
828                 dl->line_nr = line_nr;
829                 if (dl->line == NULL)
830                         goto out_delete;
831
832                 if (offset != -1) {
833                         if (disasm_line__parse(dl->line, &dl->ins.name, &dl->ops.raw) < 0)
834                                 goto out_free_line;
835
836                         disasm_line__init_ins(dl, arch, map);
837                 }
838         }
839
840         return dl;
841
842 out_free_line:
843         zfree(&dl->line);
844 out_delete:
845         free(dl);
846         return NULL;
847 }
848
849 void disasm_line__free(struct disasm_line *dl)
850 {
851         zfree(&dl->line);
852         if (dl->ins.ops && dl->ins.ops->free)
853                 dl->ins.ops->free(&dl->ops);
854         else
855                 ins__delete(&dl->ops);
856         free((void *)dl->ins.name);
857         dl->ins.name = NULL;
858         free(dl);
859 }
860
861 int disasm_line__scnprintf(struct disasm_line *dl, char *bf, size_t size, bool raw)
862 {
863         if (raw || !dl->ins.ops)
864                 return scnprintf(bf, size, "%-6.6s %s", dl->ins.name, dl->ops.raw);
865
866         return ins__scnprintf(&dl->ins, bf, size, &dl->ops);
867 }
868
869 static void disasm__add(struct list_head *head, struct disasm_line *line)
870 {
871         list_add_tail(&line->node, head);
872 }
873
874 struct disasm_line *disasm__get_next_ip_line(struct list_head *head, struct disasm_line *pos)
875 {
876         list_for_each_entry_continue(pos, head, node)
877                 if (pos->offset >= 0)
878                         return pos;
879
880         return NULL;
881 }
882
883 double disasm__calc_percent(struct annotation *notes, int evidx, s64 offset,
884                             s64 end, const char **path, u64 *nr_samples)
885 {
886         struct source_line *src_line = notes->src->lines;
887         double percent = 0.0;
888         *nr_samples = 0;
889
890         if (src_line) {
891                 size_t sizeof_src_line = sizeof(*src_line) +
892                                 sizeof(src_line->samples) * (src_line->nr_pcnt - 1);
893
894                 while (offset < end) {
895                         src_line = (void *)notes->src->lines +
896                                         (sizeof_src_line * offset);
897
898                         if (*path == NULL)
899                                 *path = src_line->path;
900
901                         percent += src_line->samples[evidx].percent;
902                         *nr_samples += src_line->samples[evidx].nr;
903                         offset++;
904                 }
905         } else {
906                 struct sym_hist *h = annotation__histogram(notes, evidx);
907                 unsigned int hits = 0;
908
909                 while (offset < end)
910                         hits += h->addr[offset++];
911
912                 if (h->sum) {
913                         *nr_samples = hits;
914                         percent = 100.0 * hits / h->sum;
915                 }
916         }
917
918         return percent;
919 }
920
921 static const char *annotate__address_color(struct block_range *br)
922 {
923         double cov = block_range__coverage(br);
924
925         if (cov >= 0) {
926                 /* mark red for >75% coverage */
927                 if (cov > 0.75)
928                         return PERF_COLOR_RED;
929
930                 /* mark dull for <1% coverage */
931                 if (cov < 0.01)
932                         return PERF_COLOR_NORMAL;
933         }
934
935         return PERF_COLOR_MAGENTA;
936 }
937
938 static const char *annotate__asm_color(struct block_range *br)
939 {
940         double cov = block_range__coverage(br);
941
942         if (cov >= 0) {
943                 /* mark dull for <1% coverage */
944                 if (cov < 0.01)
945                         return PERF_COLOR_NORMAL;
946         }
947
948         return PERF_COLOR_BLUE;
949 }
950
951 static void annotate__branch_printf(struct block_range *br, u64 addr)
952 {
953         bool emit_comment = true;
954
955         if (!br)
956                 return;
957
958 #if 1
959         if (br->is_target && br->start == addr) {
960                 struct block_range *branch = br;
961                 double p;
962
963                 /*
964                  * Find matching branch to our target.
965                  */
966                 while (!branch->is_branch)
967                         branch = block_range__next(branch);
968
969                 p = 100 *(double)br->entry / branch->coverage;
970
971                 if (p > 0.1) {
972                         if (emit_comment) {
973                                 emit_comment = false;
974                                 printf("\t#");
975                         }
976
977                         /*
978                          * The percentage of coverage joined at this target in relation
979                          * to the next branch.
980                          */
981                         printf(" +%.2f%%", p);
982                 }
983         }
984 #endif
985         if (br->is_branch && br->end == addr) {
986                 double p = 100*(double)br->taken / br->coverage;
987
988                 if (p > 0.1) {
989                         if (emit_comment) {
990                                 emit_comment = false;
991                                 printf("\t#");
992                         }
993
994                         /*
995                          * The percentage of coverage leaving at this branch, and
996                          * its prediction ratio.
997                          */
998                         printf(" -%.2f%% (p:%.2f%%)", p, 100*(double)br->pred  / br->taken);
999                 }
1000         }
1001 }
1002
1003
1004 static int disasm_line__print(struct disasm_line *dl, struct symbol *sym, u64 start,
1005                       struct perf_evsel *evsel, u64 len, int min_pcnt, int printed,
1006                       int max_lines, struct disasm_line *queue)
1007 {
1008         static const char *prev_line;
1009         static const char *prev_color;
1010
1011         if (dl->offset != -1) {
1012                 const char *path = NULL;
1013                 u64 nr_samples;
1014                 double percent, max_percent = 0.0;
1015                 double *ppercents = &percent;
1016                 u64 *psamples = &nr_samples;
1017                 int i, nr_percent = 1;
1018                 const char *color;
1019                 struct annotation *notes = symbol__annotation(sym);
1020                 s64 offset = dl->offset;
1021                 const u64 addr = start + offset;
1022                 struct disasm_line *next;
1023                 struct block_range *br;
1024
1025                 next = disasm__get_next_ip_line(&notes->src->source, dl);
1026
1027                 if (perf_evsel__is_group_event(evsel)) {
1028                         nr_percent = evsel->nr_members;
1029                         ppercents = calloc(nr_percent, sizeof(double));
1030                         psamples = calloc(nr_percent, sizeof(u64));
1031                         if (ppercents == NULL || psamples == NULL) {
1032                                 return -1;
1033                         }
1034                 }
1035
1036                 for (i = 0; i < nr_percent; i++) {
1037                         percent = disasm__calc_percent(notes,
1038                                         notes->src->lines ? i : evsel->idx + i,
1039                                         offset,
1040                                         next ? next->offset : (s64) len,
1041                                         &path, &nr_samples);
1042
1043                         ppercents[i] = percent;
1044                         psamples[i] = nr_samples;
1045                         if (percent > max_percent)
1046                                 max_percent = percent;
1047                 }
1048
1049                 if (max_percent < min_pcnt)
1050                         return -1;
1051
1052                 if (max_lines && printed >= max_lines)
1053                         return 1;
1054
1055                 if (queue != NULL) {
1056                         list_for_each_entry_from(queue, &notes->src->source, node) {
1057                                 if (queue == dl)
1058                                         break;
1059                                 disasm_line__print(queue, sym, start, evsel, len,
1060                                                     0, 0, 1, NULL);
1061                         }
1062                 }
1063
1064                 color = get_percent_color(max_percent);
1065
1066                 /*
1067                  * Also color the filename and line if needed, with
1068                  * the same color than the percentage. Don't print it
1069                  * twice for close colored addr with the same filename:line
1070                  */
1071                 if (path) {
1072                         if (!prev_line || strcmp(prev_line, path)
1073                                        || color != prev_color) {
1074                                 color_fprintf(stdout, color, " %s", path);
1075                                 prev_line = path;
1076                                 prev_color = color;
1077                         }
1078                 }
1079
1080                 for (i = 0; i < nr_percent; i++) {
1081                         percent = ppercents[i];
1082                         nr_samples = psamples[i];
1083                         color = get_percent_color(percent);
1084
1085                         if (symbol_conf.show_total_period)
1086                                 color_fprintf(stdout, color, " %7" PRIu64,
1087                                               nr_samples);
1088                         else
1089                                 color_fprintf(stdout, color, " %7.2f", percent);
1090                 }
1091
1092                 printf(" :      ");
1093
1094                 br = block_range__find(addr);
1095                 color_fprintf(stdout, annotate__address_color(br), "  %" PRIx64 ":", addr);
1096                 color_fprintf(stdout, annotate__asm_color(br), "%s", dl->line);
1097                 annotate__branch_printf(br, addr);
1098                 printf("\n");
1099
1100                 if (ppercents != &percent)
1101                         free(ppercents);
1102
1103                 if (psamples != &nr_samples)
1104                         free(psamples);
1105
1106         } else if (max_lines && printed >= max_lines)
1107                 return 1;
1108         else {
1109                 int width = 8;
1110
1111                 if (queue)
1112                         return -1;
1113
1114                 if (perf_evsel__is_group_event(evsel))
1115                         width *= evsel->nr_members;
1116
1117                 if (!*dl->line)
1118                         printf(" %*s:\n", width, " ");
1119                 else
1120                         printf(" %*s:   %s\n", width, " ", dl->line);
1121         }
1122
1123         return 0;
1124 }
1125
1126 /*
1127  * symbol__parse_objdump_line() parses objdump output (with -d --no-show-raw)
1128  * which looks like following
1129  *
1130  *  0000000000415500 <_init>:
1131  *    415500:       sub    $0x8,%rsp
1132  *    415504:       mov    0x2f5ad5(%rip),%rax        # 70afe0 <_DYNAMIC+0x2f8>
1133  *    41550b:       test   %rax,%rax
1134  *    41550e:       je     415515 <_init+0x15>
1135  *    415510:       callq  416e70 <__gmon_start__@plt>
1136  *    415515:       add    $0x8,%rsp
1137  *    415519:       retq
1138  *
1139  * it will be parsed and saved into struct disasm_line as
1140  *  <offset>       <name>  <ops.raw>
1141  *
1142  * The offset will be a relative offset from the start of the symbol and -1
1143  * means that it's not a disassembly line so should be treated differently.
1144  * The ops.raw part will be parsed further according to type of the instruction.
1145  */
1146 static int symbol__parse_objdump_line(struct symbol *sym, struct map *map,
1147                                       struct arch *arch,
1148                                       FILE *file, size_t privsize,
1149                                       int *line_nr)
1150 {
1151         struct annotation *notes = symbol__annotation(sym);
1152         struct disasm_line *dl;
1153         char *line = NULL, *parsed_line, *tmp, *tmp2;
1154         size_t line_len;
1155         s64 line_ip, offset = -1;
1156         regmatch_t match[2];
1157
1158         if (getline(&line, &line_len, file) < 0)
1159                 return -1;
1160
1161         if (!line)
1162                 return -1;
1163
1164         line_ip = -1;
1165         parsed_line = rtrim(line);
1166
1167         /* /filename:linenr ? Save line number and ignore. */
1168         if (regexec(&file_lineno, parsed_line, 2, match, 0) == 0) {
1169                 *line_nr = atoi(parsed_line + match[1].rm_so);
1170                 return 0;
1171         }
1172
1173         tmp = ltrim(parsed_line);
1174         if (*tmp) {
1175                 /*
1176                  * Parse hexa addresses followed by ':'
1177                  */
1178                 line_ip = strtoull(tmp, &tmp2, 16);
1179                 if (*tmp2 != ':' || tmp == tmp2 || tmp2[1] == '\0')
1180                         line_ip = -1;
1181         }
1182
1183         if (line_ip != -1) {
1184                 u64 start = map__rip_2objdump(map, sym->start),
1185                     end = map__rip_2objdump(map, sym->end);
1186
1187                 offset = line_ip - start;
1188                 if ((u64)line_ip < start || (u64)line_ip >= end)
1189                         offset = -1;
1190                 else
1191                         parsed_line = tmp2 + 1;
1192         }
1193
1194         dl = disasm_line__new(offset, parsed_line, privsize, *line_nr, arch, map);
1195         free(line);
1196         (*line_nr)++;
1197
1198         if (dl == NULL)
1199                 return -1;
1200
1201         if (!disasm_line__has_offset(dl)) {
1202                 dl->ops.target.offset = dl->ops.target.addr -
1203                                         map__rip_2objdump(map, sym->start);
1204                 dl->ops.target.offset_avail = true;
1205         }
1206
1207         /* kcore has no symbols, so add the call target name */
1208         if (dl->ins.ops && ins__is_call(&dl->ins) && !dl->ops.target.name) {
1209                 struct addr_map_symbol target = {
1210                         .map = map,
1211                         .addr = dl->ops.target.addr,
1212                 };
1213
1214                 if (!map_groups__find_ams(&target) &&
1215                     target.sym->start == target.al_addr)
1216                         dl->ops.target.name = strdup(target.sym->name);
1217         }
1218
1219         disasm__add(&notes->src->source, dl);
1220
1221         return 0;
1222 }
1223
1224 static __attribute__((constructor)) void symbol__init_regexpr(void)
1225 {
1226         regcomp(&file_lineno, "^/[^:]+:([0-9]+)", REG_EXTENDED);
1227 }
1228
1229 static void delete_last_nop(struct symbol *sym)
1230 {
1231         struct annotation *notes = symbol__annotation(sym);
1232         struct list_head *list = &notes->src->source;
1233         struct disasm_line *dl;
1234
1235         while (!list_empty(list)) {
1236                 dl = list_entry(list->prev, struct disasm_line, node);
1237
1238                 if (dl->ins.ops) {
1239                         if (dl->ins.ops != &nop_ops)
1240                                 return;
1241                 } else {
1242                         if (!strstr(dl->line, " nop ") &&
1243                             !strstr(dl->line, " nopl ") &&
1244                             !strstr(dl->line, " nopw "))
1245                                 return;
1246                 }
1247
1248                 list_del(&dl->node);
1249                 disasm_line__free(dl);
1250         }
1251 }
1252
1253 int symbol__strerror_disassemble(struct symbol *sym __maybe_unused, struct map *map,
1254                               int errnum, char *buf, size_t buflen)
1255 {
1256         struct dso *dso = map->dso;
1257
1258         BUG_ON(buflen == 0);
1259
1260         if (errnum >= 0) {
1261                 str_error_r(errnum, buf, buflen);
1262                 return 0;
1263         }
1264
1265         switch (errnum) {
1266         case SYMBOL_ANNOTATE_ERRNO__NO_VMLINUX: {
1267                 char bf[SBUILD_ID_SIZE + 15] = " with build id ";
1268                 char *build_id_msg = NULL;
1269
1270                 if (dso->has_build_id) {
1271                         build_id__sprintf(dso->build_id,
1272                                           sizeof(dso->build_id), bf + 15);
1273                         build_id_msg = bf;
1274                 }
1275                 scnprintf(buf, buflen,
1276                           "No vmlinux file%s\nwas found in the path.\n\n"
1277                           "Note that annotation using /proc/kcore requires CAP_SYS_RAWIO capability.\n\n"
1278                           "Please use:\n\n"
1279                           "  perf buildid-cache -vu vmlinux\n\n"
1280                           "or:\n\n"
1281                           "  --vmlinux vmlinux\n", build_id_msg ?: "");
1282         }
1283                 break;
1284         default:
1285                 scnprintf(buf, buflen, "Internal error: Invalid %d error code\n", errnum);
1286                 break;
1287         }
1288
1289         return 0;
1290 }
1291
1292 static int dso__disassemble_filename(struct dso *dso, char *filename, size_t filename_size)
1293 {
1294         char linkname[PATH_MAX];
1295         char *build_id_filename;
1296         char *build_id_path = NULL;
1297
1298         if (dso->symtab_type == DSO_BINARY_TYPE__KALLSYMS &&
1299             !dso__is_kcore(dso))
1300                 return SYMBOL_ANNOTATE_ERRNO__NO_VMLINUX;
1301
1302         build_id_filename = dso__build_id_filename(dso, NULL, 0);
1303         if (build_id_filename) {
1304                 __symbol__join_symfs(filename, filename_size, build_id_filename);
1305                 free(build_id_filename);
1306         } else {
1307                 if (dso->has_build_id)
1308                         return ENOMEM;
1309                 goto fallback;
1310         }
1311
1312         build_id_path = strdup(filename);
1313         if (!build_id_path)
1314                 return -1;
1315
1316         dirname(build_id_path);
1317
1318         if (dso__is_kcore(dso) ||
1319             readlink(build_id_path, linkname, sizeof(linkname)) < 0 ||
1320             strstr(linkname, DSO__NAME_KALLSYMS) ||
1321             access(filename, R_OK)) {
1322 fallback:
1323                 /*
1324                  * If we don't have build-ids or the build-id file isn't in the
1325                  * cache, or is just a kallsyms file, well, lets hope that this
1326                  * DSO is the same as when 'perf record' ran.
1327                  */
1328                 __symbol__join_symfs(filename, filename_size, dso->long_name);
1329         }
1330
1331         free(build_id_path);
1332         return 0;
1333 }
1334
/*
 * Return the normalized architecture name for @arch_name. When @arch_name
 * is NULL the machine name reported by uname() is used instead. Returns
 * NULL when uname() fails.
 */
static const char *annotate__norm_arch(const char *arch_name)
{
	/*
	 * Static storage: the result of normalize_arch() is returned to the
	 * caller, and it may be the very pointer passed in (normalize_arch()
	 * is not visible here - presumably it returns its argument for names
	 * it does not recognise). Pointing it at an automatic buffer would
	 * then hand out a dangling pointer.
	 */
	static struct utsname uts;

	if (!arch_name) { /* Assume we are annotating locally. */
		if (uname(&uts) < 0)
			return NULL;
		arch_name = uts.machine;
	}
	return normalize_arch((char *)arch_name);
}
1346
1347 int symbol__disassemble(struct symbol *sym, struct map *map, const char *arch_name, size_t privsize)
1348 {
1349         struct dso *dso = map->dso;
1350         char command[PATH_MAX * 2];
1351         struct arch *arch = NULL;
1352         FILE *file;
1353         char symfs_filename[PATH_MAX];
1354         struct kcore_extract kce;
1355         bool delete_extract = false;
1356         int stdout_fd[2];
1357         int lineno = 0;
1358         int nline;
1359         pid_t pid;
1360         int err = dso__disassemble_filename(dso, symfs_filename, sizeof(symfs_filename));
1361
1362         if (err)
1363                 return err;
1364
1365         arch_name = annotate__norm_arch(arch_name);
1366         if (!arch_name)
1367                 return -1;
1368
1369         arch = arch__find(arch_name);
1370         if (arch == NULL)
1371                 return -ENOTSUP;
1372
1373         if (arch->init) {
1374                 err = arch->init(arch);
1375                 if (err) {
1376                         pr_err("%s: failed to initialize %s arch priv area\n", __func__, arch->name);
1377                         return err;
1378                 }
1379         }
1380
1381         pr_debug("%s: filename=%s, sym=%s, start=%#" PRIx64 ", end=%#" PRIx64 "\n", __func__,
1382                  symfs_filename, sym->name, map->unmap_ip(map, sym->start),
1383                  map->unmap_ip(map, sym->end));
1384
1385         pr_debug("annotating [%p] %30s : [%p] %30s\n",
1386                  dso, dso->long_name, sym, sym->name);
1387
1388         if (dso__is_kcore(dso)) {
1389                 kce.kcore_filename = symfs_filename;
1390                 kce.addr = map__rip_2objdump(map, sym->start);
1391                 kce.offs = sym->start;
1392                 kce.len = sym->end - sym->start;
1393                 if (!kcore_extract__create(&kce)) {
1394                         delete_extract = true;
1395                         strlcpy(symfs_filename, kce.extract_filename,
1396                                 sizeof(symfs_filename));
1397                 }
1398         } else if (dso__needs_decompress(dso)) {
1399                 char tmp[PATH_MAX];
1400                 struct kmod_path m;
1401                 int fd;
1402                 bool ret;
1403
1404                 if (kmod_path__parse_ext(&m, symfs_filename))
1405                         goto out;
1406
1407                 snprintf(tmp, PATH_MAX, "/tmp/perf-kmod-XXXXXX");
1408
1409                 fd = mkstemp(tmp);
1410                 if (fd < 0) {
1411                         free(m.ext);
1412                         goto out;
1413                 }
1414
1415                 ret = decompress_to_file(m.ext, symfs_filename, fd);
1416
1417                 if (ret)
1418                         pr_err("Cannot decompress %s %s\n", m.ext, symfs_filename);
1419
1420                 free(m.ext);
1421                 close(fd);
1422
1423                 if (!ret)
1424                         goto out;
1425
1426                 strcpy(symfs_filename, tmp);
1427         }
1428
1429         snprintf(command, sizeof(command),
1430                  "%s %s%s --start-address=0x%016" PRIx64
1431                  " --stop-address=0x%016" PRIx64
1432                  " -l -d %s %s -C %s 2>/dev/null|grep -v %s:|expand",
1433                  objdump_path ? objdump_path : "objdump",
1434                  disassembler_style ? "-M " : "",
1435                  disassembler_style ? disassembler_style : "",
1436                  map__rip_2objdump(map, sym->start),
1437                  map__rip_2objdump(map, sym->end),
1438                  symbol_conf.annotate_asm_raw ? "" : "--no-show-raw",
1439                  symbol_conf.annotate_src ? "-S" : "",
1440                  symfs_filename, symfs_filename);
1441
1442         pr_debug("Executing: %s\n", command);
1443
1444         err = -1;
1445         if (pipe(stdout_fd) < 0) {
1446                 pr_err("Failure creating the pipe to run %s\n", command);
1447                 goto out_remove_tmp;
1448         }
1449
1450         pid = fork();
1451         if (pid < 0) {
1452                 pr_err("Failure forking to run %s\n", command);
1453                 goto out_close_stdout;
1454         }
1455
1456         if (pid == 0) {
1457                 close(stdout_fd[0]);
1458                 dup2(stdout_fd[1], 1);
1459                 close(stdout_fd[1]);
1460                 execl("/bin/sh", "sh", "-c", command, NULL);
1461                 perror(command);
1462                 exit(-1);
1463         }
1464
1465         close(stdout_fd[1]);
1466
1467         file = fdopen(stdout_fd[0], "r");
1468         if (!file) {
1469                 pr_err("Failure creating FILE stream for %s\n", command);
1470                 /*
1471                  * If we were using debug info should retry with
1472                  * original binary.
1473                  */
1474                 goto out_remove_tmp;
1475         }
1476
1477         nline = 0;
1478         while (!feof(file)) {
1479                 /*
1480                  * The source code line number (lineno) needs to be kept in
1481                  * accross calls to symbol__parse_objdump_line(), so that it
1482                  * can associate it with the instructions till the next one.
1483                  * See disasm_line__new() and struct disasm_line::line_nr.
1484                  */
1485                 if (symbol__parse_objdump_line(sym, map, arch, file, privsize,
1486                             &lineno) < 0)
1487                         break;
1488                 nline++;
1489         }
1490
1491         if (nline == 0)
1492                 pr_err("No output from %s\n", command);
1493
1494         /*
1495          * kallsyms does not have symbol sizes so there may a nop at the end.
1496          * Remove it.
1497          */
1498         if (dso__is_kcore(dso))
1499                 delete_last_nop(sym);
1500
1501         fclose(file);
1502         err = 0;
1503 out_remove_tmp:
1504         close(stdout_fd[0]);
1505
1506         if (dso__needs_decompress(dso))
1507                 unlink(symfs_filename);
1508
1509         if (delete_extract)
1510                 kcore_extract__delete(&kce);
1511 out:
1512         return err;
1513
1514 out_close_stdout:
1515         close(stdout_fd[1]);
1516         goto out_remove_tmp;
1517 }
1518
1519 static void insert_source_line(struct rb_root *root, struct source_line *src_line)
1520 {
1521         struct source_line *iter;
1522         struct rb_node **p = &root->rb_node;
1523         struct rb_node *parent = NULL;
1524         int i, ret;
1525
1526         while (*p != NULL) {
1527                 parent = *p;
1528                 iter = rb_entry(parent, struct source_line, node);
1529
1530                 ret = strcmp(iter->path, src_line->path);
1531                 if (ret == 0) {
1532                         for (i = 0; i < src_line->nr_pcnt; i++)
1533                                 iter->samples[i].percent_sum += src_line->samples[i].percent;
1534                         return;
1535                 }
1536
1537                 if (ret < 0)
1538                         p = &(*p)->rb_left;
1539                 else
1540                         p = &(*p)->rb_right;
1541         }
1542
1543         for (i = 0; i < src_line->nr_pcnt; i++)
1544                 src_line->samples[i].percent_sum = src_line->samples[i].percent;
1545
1546         rb_link_node(&src_line->node, parent, p);
1547         rb_insert_color(&src_line->node, root);
1548 }
1549
1550 static int cmp_source_line(struct source_line *a, struct source_line *b)
1551 {
1552         int i;
1553
1554         for (i = 0; i < a->nr_pcnt; i++) {
1555                 if (a->samples[i].percent_sum == b->samples[i].percent_sum)
1556                         continue;
1557                 return a->samples[i].percent_sum > b->samples[i].percent_sum;
1558         }
1559
1560         return 0;
1561 }
1562
1563 static void __resort_source_line(struct rb_root *root, struct source_line *src_line)
1564 {
1565         struct source_line *iter;
1566         struct rb_node **p = &root->rb_node;
1567         struct rb_node *parent = NULL;
1568
1569         while (*p != NULL) {
1570                 parent = *p;
1571                 iter = rb_entry(parent, struct source_line, node);
1572
1573                 if (cmp_source_line(src_line, iter))
1574                         p = &(*p)->rb_left;
1575                 else
1576                         p = &(*p)->rb_right;
1577         }
1578
1579         rb_link_node(&src_line->node, parent, p);
1580         rb_insert_color(&src_line->node, root);
1581 }
1582
1583 static void resort_source_line(struct rb_root *dest_root, struct rb_root *src_root)
1584 {
1585         struct source_line *src_line;
1586         struct rb_node *node;
1587
1588         node = rb_first(src_root);
1589         while (node) {
1590                 struct rb_node *next;
1591
1592                 src_line = rb_entry(node, struct source_line, node);
1593                 next = rb_next(node);
1594                 rb_erase(node, src_root);
1595
1596                 __resort_source_line(dest_root, src_line);
1597                 node = next;
1598         }
1599 }
1600
1601 static void symbol__free_source_line(struct symbol *sym, int len)
1602 {
1603         struct annotation *notes = symbol__annotation(sym);
1604         struct source_line *src_line = notes->src->lines;
1605         size_t sizeof_src_line;
1606         int i;
1607
1608         sizeof_src_line = sizeof(*src_line) +
1609                           (sizeof(src_line->samples) * (src_line->nr_pcnt - 1));
1610
1611         for (i = 0; i < len; i++) {
1612                 free_srcline(src_line->path);
1613                 src_line = (void *)src_line + sizeof_src_line;
1614         }
1615
1616         zfree(&notes->src->lines);
1617 }
1618
1619 /* Get the filename:line for the colored entries */
1620 static int symbol__get_source_line(struct symbol *sym, struct map *map,
1621                                    struct perf_evsel *evsel,
1622                                    struct rb_root *root, int len)
1623 {
1624         u64 start;
1625         int i, k;
1626         int evidx = evsel->idx;
1627         struct source_line *src_line;
1628         struct annotation *notes = symbol__annotation(sym);
1629         struct sym_hist *h = annotation__histogram(notes, evidx);
1630         struct rb_root tmp_root = RB_ROOT;
1631         int nr_pcnt = 1;
1632         u64 h_sum = h->sum;
1633         size_t sizeof_src_line = sizeof(struct source_line);
1634
1635         if (perf_evsel__is_group_event(evsel)) {
1636                 for (i = 1; i < evsel->nr_members; i++) {
1637                         h = annotation__histogram(notes, evidx + i);
1638                         h_sum += h->sum;
1639                 }
1640                 nr_pcnt = evsel->nr_members;
1641                 sizeof_src_line += (nr_pcnt - 1) * sizeof(src_line->samples);
1642         }
1643
1644         if (!h_sum)
1645                 return 0;
1646
1647         src_line = notes->src->lines = calloc(len, sizeof_src_line);
1648         if (!notes->src->lines)
1649                 return -1;
1650
1651         start = map__rip_2objdump(map, sym->start);
1652
1653         for (i = 0; i < len; i++) {
1654                 u64 offset, nr_samples;
1655                 double percent_max = 0.0;
1656
1657                 src_line->nr_pcnt = nr_pcnt;
1658
1659                 for (k = 0; k < nr_pcnt; k++) {
1660                         double percent = 0.0;
1661
1662                         h = annotation__histogram(notes, evidx + k);
1663                         nr_samples = h->addr[i];
1664                         if (h->sum)
1665                                 percent = 100.0 * nr_samples / h->sum;
1666
1667                         if (percent > percent_max)
1668                                 percent_max = percent;
1669                         src_line->samples[k].percent = percent;
1670                         src_line->samples[k].nr = nr_samples;
1671                 }
1672
1673                 if (percent_max <= 0.5)
1674                         goto next;
1675
1676                 offset = start + i;
1677                 src_line->path = get_srcline(map->dso, offset, NULL,
1678                                              false, true);
1679                 insert_source_line(&tmp_root, src_line);
1680
1681         next:
1682                 src_line = (void *)src_line + sizeof_src_line;
1683         }
1684
1685         resort_source_line(root, &tmp_root);
1686         return 0;
1687 }
1688
1689 static void print_summary(struct rb_root *root, const char *filename)
1690 {
1691         struct source_line *src_line;
1692         struct rb_node *node;
1693
1694         printf("\nSorted summary for file %s\n", filename);
1695         printf("----------------------------------------------\n\n");
1696
1697         if (RB_EMPTY_ROOT(root)) {
1698                 printf(" Nothing higher than %1.1f%%\n", MIN_GREEN);
1699                 return;
1700         }
1701
1702         node = rb_first(root);
1703         while (node) {
1704                 double percent, percent_max = 0.0;
1705                 const char *color;
1706                 char *path;
1707                 int i;
1708
1709                 src_line = rb_entry(node, struct source_line, node);
1710                 for (i = 0; i < src_line->nr_pcnt; i++) {
1711                         percent = src_line->samples[i].percent_sum;
1712                         color = get_percent_color(percent);
1713                         color_fprintf(stdout, color, " %7.2f", percent);
1714
1715                         if (percent > percent_max)
1716                                 percent_max = percent;
1717                 }
1718
1719                 path = src_line->path;
1720                 color = get_percent_color(percent_max);
1721                 color_fprintf(stdout, color, " %s\n", path);
1722
1723                 node = rb_next(node);
1724         }
1725 }
1726
1727 static void symbol__annotate_hits(struct symbol *sym, struct perf_evsel *evsel)
1728 {
1729         struct annotation *notes = symbol__annotation(sym);
1730         struct sym_hist *h = annotation__histogram(notes, evsel->idx);
1731         u64 len = symbol__size(sym), offset;
1732
1733         for (offset = 0; offset < len; ++offset)
1734                 if (h->addr[offset] != 0)
1735                         printf("%*" PRIx64 ": %" PRIu64 "\n", BITS_PER_LONG / 2,
1736                                sym->start + offset, h->addr[offset]);
1737         printf("%*s: %" PRIu64 "\n", BITS_PER_LONG / 2, "h->sum", h->sum);
1738 }
1739
1740 int symbol__annotate_printf(struct symbol *sym, struct map *map,
1741                             struct perf_evsel *evsel, bool full_paths,
1742                             int min_pcnt, int max_lines, int context)
1743 {
1744         struct dso *dso = map->dso;
1745         char *filename;
1746         const char *d_filename;
1747         const char *evsel_name = perf_evsel__name(evsel);
1748         struct annotation *notes = symbol__annotation(sym);
1749         struct sym_hist *h = annotation__histogram(notes, evsel->idx);
1750         struct disasm_line *pos, *queue = NULL;
1751         u64 start = map__rip_2objdump(map, sym->start);
1752         int printed = 2, queue_len = 0;
1753         int more = 0;
1754         u64 len;
1755         int width = 8;
1756         int graph_dotted_len;
1757
1758         filename = strdup(dso->long_name);
1759         if (!filename)
1760                 return -ENOMEM;
1761
1762         if (full_paths)
1763                 d_filename = filename;
1764         else
1765                 d_filename = basename(filename);
1766
1767         len = symbol__size(sym);
1768
1769         if (perf_evsel__is_group_event(evsel))
1770                 width *= evsel->nr_members;
1771
1772         graph_dotted_len = printf(" %-*.*s|     Source code & Disassembly of %s for %s (%" PRIu64 " samples)\n",
1773                width, width, "Percent", d_filename, evsel_name, h->sum);
1774
1775         printf("%-*.*s----\n",
1776                graph_dotted_len, graph_dotted_len, graph_dotted_line);
1777
1778         if (verbose > 0)
1779                 symbol__annotate_hits(sym, evsel);
1780
1781         list_for_each_entry(pos, &notes->src->source, node) {
1782                 if (context && queue == NULL) {
1783                         queue = pos;
1784                         queue_len = 0;
1785                 }
1786
1787                 switch (disasm_line__print(pos, sym, start, evsel, len,
1788                                             min_pcnt, printed, max_lines,
1789                                             queue)) {
1790                 case 0:
1791                         ++printed;
1792                         if (context) {
1793                                 printed += queue_len;
1794                                 queue = NULL;
1795                                 queue_len = 0;
1796                         }
1797                         break;
1798                 case 1:
1799                         /* filtered by max_lines */
1800                         ++more;
1801                         break;
1802                 case -1:
1803                 default:
1804                         /*
1805                          * Filtered by min_pcnt or non IP lines when
1806                          * context != 0
1807                          */
1808                         if (!context)
1809                                 break;
1810                         if (queue_len == context)
1811                                 queue = list_entry(queue->node.next, typeof(*queue), node);
1812                         else
1813                                 ++queue_len;
1814                         break;
1815                 }
1816         }
1817
1818         free(filename);
1819
1820         return more;
1821 }
1822
1823 void symbol__annotate_zero_histogram(struct symbol *sym, int evidx)
1824 {
1825         struct annotation *notes = symbol__annotation(sym);
1826         struct sym_hist *h = annotation__histogram(notes, evidx);
1827
1828         memset(h, 0, notes->src->sizeof_sym_hist);
1829 }
1830
1831 void symbol__annotate_decay_histogram(struct symbol *sym, int evidx)
1832 {
1833         struct annotation *notes = symbol__annotation(sym);
1834         struct sym_hist *h = annotation__histogram(notes, evidx);
1835         int len = symbol__size(sym), offset;
1836
1837         h->sum = 0;
1838         for (offset = 0; offset < len; ++offset) {
1839                 h->addr[offset] = h->addr[offset] * 7 / 8;
1840                 h->sum += h->addr[offset];
1841         }
1842 }
1843
1844 void disasm__purge(struct list_head *head)
1845 {
1846         struct disasm_line *pos, *n;
1847
1848         list_for_each_entry_safe(pos, n, head, node) {
1849                 list_del(&pos->node);
1850                 disasm_line__free(pos);
1851         }
1852 }
1853
1854 static size_t disasm_line__fprintf(struct disasm_line *dl, FILE *fp)
1855 {
1856         size_t printed;
1857
1858         if (dl->offset == -1)
1859                 return fprintf(fp, "%s\n", dl->line);
1860
1861         printed = fprintf(fp, "%#" PRIx64 " %s", dl->offset, dl->ins.name);
1862
1863         if (dl->ops.raw[0] != '\0') {
1864                 printed += fprintf(fp, "%.*s %s\n", 6 - (int)printed, " ",
1865                                    dl->ops.raw);
1866         }
1867
1868         return printed + fprintf(fp, "\n");
1869 }
1870
1871 size_t disasm__fprintf(struct list_head *head, FILE *fp)
1872 {
1873         struct disasm_line *pos;
1874         size_t printed = 0;
1875
1876         list_for_each_entry(pos, head, node)
1877                 printed += disasm_line__fprintf(pos, fp);
1878
1879         return printed;
1880 }
1881
1882 int symbol__tty_annotate(struct symbol *sym, struct map *map,
1883                          struct perf_evsel *evsel, bool print_lines,
1884                          bool full_paths, int min_pcnt, int max_lines)
1885 {
1886         struct dso *dso = map->dso;
1887         struct rb_root source_line = RB_ROOT;
1888         u64 len;
1889
1890         if (symbol__disassemble(sym, map, perf_evsel__env_arch(evsel), 0) < 0)
1891                 return -1;
1892
1893         len = symbol__size(sym);
1894
1895         if (print_lines) {
1896                 srcline_full_filename = full_paths;
1897                 symbol__get_source_line(sym, map, evsel, &source_line, len);
1898                 print_summary(&source_line, dso->long_name);
1899         }
1900
1901         symbol__annotate_printf(sym, map, evsel, full_paths,
1902                                 min_pcnt, max_lines, 0);
1903         if (print_lines)
1904                 symbol__free_source_line(sym, len);
1905
1906         disasm__purge(&symbol__annotation(sym)->src->source);
1907
1908         return 0;
1909 }
1910
1911 bool ui__has_annotation(void)
1912 {
1913         return use_browser == 1 && perf_hpp_list.sym;
1914 }