Linux Audio

Check our new training course

Loading...
v5.4
   1// SPDX-License-Identifier: GPL-2.0
   2/*
   3 * Copyright (C) 2009-2011, Frederic Weisbecker <fweisbec@gmail.com>
   4 *
   5 * Handle the callchains from the stream in an ad-hoc radix tree and then
   6 * sort them in an rbtree.
   7 *
   8 * Using a radix for code path provides a fast retrieval and factorizes
   9 * memory use. Also that lets us use the paths in a hierarchical graph view.
  10 *
  11 */
  12
  13#include <inttypes.h>
  14#include <stdlib.h>
  15#include <stdio.h>
  16#include <stdbool.h>
  17#include <errno.h>
  18#include <math.h>
  19#include <linux/string.h>
  20#include <linux/zalloc.h>
  21
  22#include "asm/bug.h"
  23
  24#include "debug.h"
  25#include "dso.h"
  26#include "event.h"
  27#include "hist.h"
  28#include "sort.h"
  29#include "machine.h"
  30#include "map.h"
  31#include "callchain.h"
  32#include "branch.h"
  33#include "symbol.h"
 
  34#include "../perf.h"
  35
  36#define CALLCHAIN_PARAM_DEFAULT			\
  37	.mode		= CHAIN_GRAPH_ABS,	\
  38	.min_percent	= 0.5,			\
  39	.order		= ORDER_CALLEE,		\
  40	.key		= CCKEY_FUNCTION,	\
  41	.value		= CCVAL_PERCENT,	\
  42
  43struct callchain_param callchain_param = {
  44	CALLCHAIN_PARAM_DEFAULT
  45};
  46
  47/*
  48 * Are there any events usind DWARF callchains?
  49 *
  50 * I.e.
  51 *
  52 * -e cycles/call-graph=dwarf/
  53 */
  54bool dwarf_callchain_users;
  55
  56struct callchain_param callchain_param_default = {
  57	CALLCHAIN_PARAM_DEFAULT
  58};
  59
  60__thread struct callchain_cursor callchain_cursor;
 
  61
  62int parse_callchain_record_opt(const char *arg, struct callchain_param *param)
  63{
  64	return parse_callchain_record(arg, param);
  65}
  66
  67static int parse_callchain_mode(const char *value)
  68{
  69	if (!strncmp(value, "graph", strlen(value))) {
  70		callchain_param.mode = CHAIN_GRAPH_ABS;
  71		return 0;
  72	}
  73	if (!strncmp(value, "flat", strlen(value))) {
  74		callchain_param.mode = CHAIN_FLAT;
  75		return 0;
  76	}
  77	if (!strncmp(value, "fractal", strlen(value))) {
  78		callchain_param.mode = CHAIN_GRAPH_REL;
  79		return 0;
  80	}
  81	if (!strncmp(value, "folded", strlen(value))) {
  82		callchain_param.mode = CHAIN_FOLDED;
  83		return 0;
  84	}
  85	return -1;
  86}
  87
  88static int parse_callchain_order(const char *value)
  89{
  90	if (!strncmp(value, "caller", strlen(value))) {
  91		callchain_param.order = ORDER_CALLER;
  92		callchain_param.order_set = true;
  93		return 0;
  94	}
  95	if (!strncmp(value, "callee", strlen(value))) {
  96		callchain_param.order = ORDER_CALLEE;
  97		callchain_param.order_set = true;
  98		return 0;
  99	}
 100	return -1;
 101}
 102
 103static int parse_callchain_sort_key(const char *value)
 104{
 105	if (!strncmp(value, "function", strlen(value))) {
 106		callchain_param.key = CCKEY_FUNCTION;
 107		return 0;
 108	}
 109	if (!strncmp(value, "address", strlen(value))) {
 110		callchain_param.key = CCKEY_ADDRESS;
 111		return 0;
 112	}
 113	if (!strncmp(value, "srcline", strlen(value))) {
 114		callchain_param.key = CCKEY_SRCLINE;
 115		return 0;
 116	}
 117	if (!strncmp(value, "branch", strlen(value))) {
 118		callchain_param.branch_callstack = 1;
 119		return 0;
 120	}
 121	return -1;
 122}
 123
 124static int parse_callchain_value(const char *value)
 125{
 126	if (!strncmp(value, "percent", strlen(value))) {
 127		callchain_param.value = CCVAL_PERCENT;
 128		return 0;
 129	}
 130	if (!strncmp(value, "period", strlen(value))) {
 131		callchain_param.value = CCVAL_PERIOD;
 132		return 0;
 133	}
 134	if (!strncmp(value, "count", strlen(value))) {
 135		callchain_param.value = CCVAL_COUNT;
 136		return 0;
 137	}
 138	return -1;
 139}
 140
 141static int get_stack_size(const char *str, unsigned long *_size)
 142{
 143	char *endptr;
 144	unsigned long size;
 145	unsigned long max_size = round_down(USHRT_MAX, sizeof(u64));
 146
 147	size = strtoul(str, &endptr, 0);
 148
 149	do {
 150		if (*endptr)
 151			break;
 152
 153		size = round_up(size, sizeof(u64));
 154		if (!size || size > max_size)
 155			break;
 156
 157		*_size = size;
 158		return 0;
 159
 160	} while (0);
 161
 162	pr_err("callchain: Incorrect stack dump size (max %ld): %s\n",
 163	       max_size, str);
 164	return -1;
 165}
 166
 167static int
 168__parse_callchain_report_opt(const char *arg, bool allow_record_opt)
 169{
 170	char *tok;
 171	char *endptr, *saveptr = NULL;
 172	bool minpcnt_set = false;
 173	bool record_opt_set = false;
 174	bool try_stack_size = false;
 175
 176	callchain_param.enabled = true;
 177	symbol_conf.use_callchain = true;
 178
 179	if (!arg)
 180		return 0;
 181
 182	while ((tok = strtok_r((char *)arg, ",", &saveptr)) != NULL) {
 183		if (!strncmp(tok, "none", strlen(tok))) {
 184			callchain_param.mode = CHAIN_NONE;
 185			callchain_param.enabled = false;
 186			symbol_conf.use_callchain = false;
 187			return 0;
 188		}
 189
 190		if (!parse_callchain_mode(tok) ||
 191		    !parse_callchain_order(tok) ||
 192		    !parse_callchain_sort_key(tok) ||
 193		    !parse_callchain_value(tok)) {
 194			/* parsing ok - move on to the next */
 195			try_stack_size = false;
 196			goto next;
 197		} else if (allow_record_opt && !record_opt_set) {
 198			if (parse_callchain_record(tok, &callchain_param))
 199				goto try_numbers;
 200
 201			/* assume that number followed by 'dwarf' is stack size */
 202			if (callchain_param.record_mode == CALLCHAIN_DWARF)
 203				try_stack_size = true;
 204
 205			record_opt_set = true;
 206			goto next;
 207		}
 208
 209try_numbers:
 210		if (try_stack_size) {
 211			unsigned long size = 0;
 212
 213			if (get_stack_size(tok, &size) < 0)
 214				return -1;
 215			callchain_param.dump_size = size;
 216			try_stack_size = false;
 217		} else if (!minpcnt_set) {
 218			/* try to get the min percent */
 219			callchain_param.min_percent = strtod(tok, &endptr);
 220			if (tok == endptr)
 221				return -1;
 222			minpcnt_set = true;
 223		} else {
 224			/* try print limit at last */
 225			callchain_param.print_limit = strtoul(tok, &endptr, 0);
 226			if (tok == endptr)
 227				return -1;
 228		}
 229next:
 230		arg = NULL;
 231	}
 232
 233	if (callchain_register_param(&callchain_param) < 0) {
 234		pr_err("Can't register callchain params\n");
 235		return -1;
 236	}
 237	return 0;
 238}
 239
 240int parse_callchain_report_opt(const char *arg)
 241{
 242	return __parse_callchain_report_opt(arg, false);
 243}
 244
 245int parse_callchain_top_opt(const char *arg)
 246{
 247	return __parse_callchain_report_opt(arg, true);
 248}
 249
 250int parse_callchain_record(const char *arg, struct callchain_param *param)
 251{
 252	char *tok, *name, *saveptr = NULL;
 253	char *buf;
 254	int ret = -1;
 255
 256	/* We need buffer that we know we can write to. */
 257	buf = malloc(strlen(arg) + 1);
 258	if (!buf)
 259		return -ENOMEM;
 260
 261	strcpy(buf, arg);
 262
 263	tok = strtok_r((char *)buf, ",", &saveptr);
 264	name = tok ? : (char *)buf;
 265
 266	do {
 267		/* Framepointer style */
 268		if (!strncmp(name, "fp", sizeof("fp"))) {
 269			if (!strtok_r(NULL, ",", &saveptr)) {
 270				param->record_mode = CALLCHAIN_FP;
 271				ret = 0;
 272			} else
 273				pr_err("callchain: No more arguments "
 274				       "needed for --call-graph fp\n");
 
 
 
 
 
 275			break;
 276
 277		/* Dwarf style */
 278		} else if (!strncmp(name, "dwarf", sizeof("dwarf"))) {
 279			const unsigned long default_stack_dump_size = 8192;
 280
 281			ret = 0;
 282			param->record_mode = CALLCHAIN_DWARF;
 283			param->dump_size = default_stack_dump_size;
 284			dwarf_callchain_users = true;
 285
 286			tok = strtok_r(NULL, ",", &saveptr);
 287			if (tok) {
 288				unsigned long size = 0;
 289
 290				ret = get_stack_size(tok, &size);
 291				param->dump_size = size;
 292			}
 293		} else if (!strncmp(name, "lbr", sizeof("lbr"))) {
 294			if (!strtok_r(NULL, ",", &saveptr)) {
 295				param->record_mode = CALLCHAIN_LBR;
 296				ret = 0;
 297			} else
 298				pr_err("callchain: No more arguments "
 299					"needed for --call-graph lbr\n");
 300			break;
 301		} else {
 302			pr_err("callchain: Unknown --call-graph option "
 303			       "value: %s\n", arg);
 304			break;
 305		}
 306
 307	} while (0);
 308
 309	free(buf);
 310	return ret;
 311}
 312
 313int perf_callchain_config(const char *var, const char *value)
 314{
 315	char *endptr;
 316
 317	if (!strstarts(var, "call-graph."))
 318		return 0;
 319	var += sizeof("call-graph.") - 1;
 320
 321	if (!strcmp(var, "record-mode"))
 322		return parse_callchain_record_opt(value, &callchain_param);
 323	if (!strcmp(var, "dump-size")) {
 324		unsigned long size = 0;
 325		int ret;
 326
 327		ret = get_stack_size(value, &size);
 328		callchain_param.dump_size = size;
 329
 330		return ret;
 331	}
 332	if (!strcmp(var, "print-type")){
 333		int ret;
 334		ret = parse_callchain_mode(value);
 335		if (ret == -1)
 336			pr_err("Invalid callchain mode: %s\n", value);
 337		return ret;
 338	}
 339	if (!strcmp(var, "order")){
 340		int ret;
 341		ret = parse_callchain_order(value);
 342		if (ret == -1)
 343			pr_err("Invalid callchain order: %s\n", value);
 344		return ret;
 345	}
 346	if (!strcmp(var, "sort-key")){
 347		int ret;
 348		ret = parse_callchain_sort_key(value);
 349		if (ret == -1)
 350			pr_err("Invalid callchain sort key: %s\n", value);
 351		return ret;
 352	}
 353	if (!strcmp(var, "threshold")) {
 354		callchain_param.min_percent = strtod(value, &endptr);
 355		if (value == endptr) {
 356			pr_err("Invalid callchain threshold: %s\n", value);
 357			return -1;
 358		}
 359	}
 360	if (!strcmp(var, "print-limit")) {
 361		callchain_param.print_limit = strtod(value, &endptr);
 362		if (value == endptr) {
 363			pr_err("Invalid callchain print limit: %s\n", value);
 364			return -1;
 365		}
 366	}
 367
 368	return 0;
 369}
 370
 371static void
 372rb_insert_callchain(struct rb_root *root, struct callchain_node *chain,
 373		    enum chain_mode mode)
 374{
 375	struct rb_node **p = &root->rb_node;
 376	struct rb_node *parent = NULL;
 377	struct callchain_node *rnode;
 378	u64 chain_cumul = callchain_cumul_hits(chain);
 379
 380	while (*p) {
 381		u64 rnode_cumul;
 382
 383		parent = *p;
 384		rnode = rb_entry(parent, struct callchain_node, rb_node);
 385		rnode_cumul = callchain_cumul_hits(rnode);
 386
 387		switch (mode) {
 388		case CHAIN_FLAT:
 389		case CHAIN_FOLDED:
 390			if (rnode->hit < chain->hit)
 391				p = &(*p)->rb_left;
 392			else
 393				p = &(*p)->rb_right;
 394			break;
 395		case CHAIN_GRAPH_ABS: /* Falldown */
 396		case CHAIN_GRAPH_REL:
 397			if (rnode_cumul < chain_cumul)
 398				p = &(*p)->rb_left;
 399			else
 400				p = &(*p)->rb_right;
 401			break;
 402		case CHAIN_NONE:
 403		default:
 404			break;
 405		}
 406	}
 407
 408	rb_link_node(&chain->rb_node, parent, p);
 409	rb_insert_color(&chain->rb_node, root);
 410}
 411
 412static void
 413__sort_chain_flat(struct rb_root *rb_root, struct callchain_node *node,
 414		  u64 min_hit)
 415{
 416	struct rb_node *n;
 417	struct callchain_node *child;
 418
 419	n = rb_first(&node->rb_root_in);
 420	while (n) {
 421		child = rb_entry(n, struct callchain_node, rb_node_in);
 422		n = rb_next(n);
 423
 424		__sort_chain_flat(rb_root, child, min_hit);
 425	}
 426
 427	if (node->hit && node->hit >= min_hit)
 428		rb_insert_callchain(rb_root, node, CHAIN_FLAT);
 429}
 430
 431/*
 432 * Once we get every callchains from the stream, we can now
 433 * sort them by hit
 434 */
 435static void
 436sort_chain_flat(struct rb_root *rb_root, struct callchain_root *root,
 437		u64 min_hit, struct callchain_param *param __maybe_unused)
 438{
 439	*rb_root = RB_ROOT;
 440	__sort_chain_flat(rb_root, &root->node, min_hit);
 441}
 442
 443static void __sort_chain_graph_abs(struct callchain_node *node,
 444				   u64 min_hit)
 445{
 446	struct rb_node *n;
 447	struct callchain_node *child;
 448
 449	node->rb_root = RB_ROOT;
 450	n = rb_first(&node->rb_root_in);
 451
 452	while (n) {
 453		child = rb_entry(n, struct callchain_node, rb_node_in);
 454		n = rb_next(n);
 455
 456		__sort_chain_graph_abs(child, min_hit);
 457		if (callchain_cumul_hits(child) >= min_hit)
 458			rb_insert_callchain(&node->rb_root, child,
 459					    CHAIN_GRAPH_ABS);
 460	}
 461}
 462
 463static void
 464sort_chain_graph_abs(struct rb_root *rb_root, struct callchain_root *chain_root,
 465		     u64 min_hit, struct callchain_param *param __maybe_unused)
 466{
 467	__sort_chain_graph_abs(&chain_root->node, min_hit);
 468	rb_root->rb_node = chain_root->node.rb_root.rb_node;
 469}
 470
 471static void __sort_chain_graph_rel(struct callchain_node *node,
 472				   double min_percent)
 473{
 474	struct rb_node *n;
 475	struct callchain_node *child;
 476	u64 min_hit;
 477
 478	node->rb_root = RB_ROOT;
 479	min_hit = ceil(node->children_hit * min_percent);
 480
 481	n = rb_first(&node->rb_root_in);
 482	while (n) {
 483		child = rb_entry(n, struct callchain_node, rb_node_in);
 484		n = rb_next(n);
 485
 486		__sort_chain_graph_rel(child, min_percent);
 487		if (callchain_cumul_hits(child) >= min_hit)
 488			rb_insert_callchain(&node->rb_root, child,
 489					    CHAIN_GRAPH_REL);
 490	}
 491}
 492
 493static void
 494sort_chain_graph_rel(struct rb_root *rb_root, struct callchain_root *chain_root,
 495		     u64 min_hit __maybe_unused, struct callchain_param *param)
 496{
 497	__sort_chain_graph_rel(&chain_root->node, param->min_percent / 100.0);
 498	rb_root->rb_node = chain_root->node.rb_root.rb_node;
 499}
 500
 501int callchain_register_param(struct callchain_param *param)
 502{
 503	switch (param->mode) {
 504	case CHAIN_GRAPH_ABS:
 505		param->sort = sort_chain_graph_abs;
 506		break;
 507	case CHAIN_GRAPH_REL:
 508		param->sort = sort_chain_graph_rel;
 509		break;
 510	case CHAIN_FLAT:
 511	case CHAIN_FOLDED:
 512		param->sort = sort_chain_flat;
 513		break;
 514	case CHAIN_NONE:
 515	default:
 516		return -1;
 517	}
 518	return 0;
 519}
 520
 521/*
 522 * Create a child for a parent. If inherit_children, then the new child
 523 * will become the new parent of it's parent children
 524 */
 525static struct callchain_node *
 526create_child(struct callchain_node *parent, bool inherit_children)
 527{
 528	struct callchain_node *new;
 529
 530	new = zalloc(sizeof(*new));
 531	if (!new) {
 532		perror("not enough memory to create child for code path tree");
 533		return NULL;
 534	}
 535	new->parent = parent;
 536	INIT_LIST_HEAD(&new->val);
 537	INIT_LIST_HEAD(&new->parent_val);
 538
 539	if (inherit_children) {
 540		struct rb_node *n;
 541		struct callchain_node *child;
 542
 543		new->rb_root_in = parent->rb_root_in;
 544		parent->rb_root_in = RB_ROOT;
 545
 546		n = rb_first(&new->rb_root_in);
 547		while (n) {
 548			child = rb_entry(n, struct callchain_node, rb_node_in);
 549			child->parent = new;
 550			n = rb_next(n);
 551		}
 552
 553		/* make it the first child */
 554		rb_link_node(&new->rb_node_in, NULL, &parent->rb_root_in.rb_node);
 555		rb_insert_color(&new->rb_node_in, &parent->rb_root_in);
 556	}
 557
 558	return new;
 559}
 560
 561
 562/*
 563 * Fill the node with callchain values
 564 */
 565static int
 566fill_node(struct callchain_node *node, struct callchain_cursor *cursor)
 567{
 568	struct callchain_cursor_node *cursor_node;
 569
 570	node->val_nr = cursor->nr - cursor->pos;
 571	if (!node->val_nr)
 572		pr_warning("Warning: empty node in callchain tree\n");
 573
 574	cursor_node = callchain_cursor_current(cursor);
 575
 576	while (cursor_node) {
 577		struct callchain_list *call;
 578
 579		call = zalloc(sizeof(*call));
 580		if (!call) {
 581			perror("not enough memory for the code path tree");
 582			return -1;
 583		}
 584		call->ip = cursor_node->ip;
 585		call->ms.sym = cursor_node->sym;
 586		call->ms.map = map__get(cursor_node->map);
 
 587		call->srcline = cursor_node->srcline;
 588
 589		if (cursor_node->branch) {
 590			call->branch_count = 1;
 591
 592			if (cursor_node->branch_from) {
 593				/*
 594				 * branch_from is set with value somewhere else
 595				 * to imply it's "to" of a branch.
 596				 */
 597				call->brtype_stat.branch_to = true;
 
 
 
 
 
 
 
 
 598
 599				if (cursor_node->branch_flags.predicted)
 600					call->predicted_count = 1;
 601
 602				if (cursor_node->branch_flags.abort)
 603					call->abort_count = 1;
 604
 605				branch_type_count(&call->brtype_stat,
 606						  &cursor_node->branch_flags,
 607						  cursor_node->branch_from,
 608						  cursor_node->ip);
 609			} else {
 610				/*
 611				 * It's "from" of a branch
 612				 */
 613				call->brtype_stat.branch_to = false;
 
 614				call->cycles_count =
 615					cursor_node->branch_flags.cycles;
 616				call->iter_count = cursor_node->nr_loop_iter;
 617				call->iter_cycles = cursor_node->iter_cycles;
 618			}
 619		}
 620
 621		list_add_tail(&call->list, &node->val);
 622
 623		callchain_cursor_advance(cursor);
 624		cursor_node = callchain_cursor_current(cursor);
 625	}
 626	return 0;
 627}
 628
 629static struct callchain_node *
 630add_child(struct callchain_node *parent,
 631	  struct callchain_cursor *cursor,
 632	  u64 period)
 633{
 634	struct callchain_node *new;
 635
 636	new = create_child(parent, false);
 637	if (new == NULL)
 638		return NULL;
 639
 640	if (fill_node(new, cursor) < 0) {
 641		struct callchain_list *call, *tmp;
 642
 643		list_for_each_entry_safe(call, tmp, &new->val, list) {
 644			list_del_init(&call->list);
 645			map__zput(call->ms.map);
 
 646			free(call);
 647		}
 648		free(new);
 649		return NULL;
 650	}
 651
 652	new->children_hit = 0;
 653	new->hit = period;
 654	new->children_count = 0;
 655	new->count = 1;
 656	return new;
 657}
 658
 659enum match_result {
 660	MATCH_ERROR  = -1,
 661	MATCH_EQ,
 662	MATCH_LT,
 663	MATCH_GT,
 664};
 665
 666static enum match_result match_chain_strings(const char *left,
 667					     const char *right)
 668{
 669	enum match_result ret = MATCH_EQ;
 670	int cmp;
 671
 672	if (left && right)
 673		cmp = strcmp(left, right);
 674	else if (!left && right)
 675		cmp = 1;
 676	else if (left && !right)
 677		cmp = -1;
 678	else
 679		return MATCH_ERROR;
 680
 681	if (cmp != 0)
 682		ret = cmp < 0 ? MATCH_LT : MATCH_GT;
 683
 684	return ret;
 685}
 686
 687/*
 688 * We need to always use relative addresses because we're aggregating
 689 * callchains from multiple threads, i.e. different address spaces, so
 690 * comparing absolute addresses make no sense as a symbol in a DSO may end up
 691 * in a different address when used in a different binary or even the same
 692 * binary but with some sort of address randomization technique, thus we need
 693 * to compare just relative addresses. -acme
 694 */
 695static enum match_result match_chain_dso_addresses(struct map *left_map, u64 left_ip,
 696						   struct map *right_map, u64 right_ip)
 697{
 698	struct dso *left_dso = left_map ? left_map->dso : NULL;
 699	struct dso *right_dso = right_map ? right_map->dso : NULL;
 700
 701	if (left_dso != right_dso)
 702		return left_dso < right_dso ? MATCH_LT : MATCH_GT;
 703
 704	if (left_ip != right_ip)
 705 		return left_ip < right_ip ? MATCH_LT : MATCH_GT;
 706
 707	return MATCH_EQ;
 708}
 709
 710static enum match_result match_chain(struct callchain_cursor_node *node,
 711				     struct callchain_list *cnode)
 712{
 713	enum match_result match = MATCH_ERROR;
 714
 715	switch (callchain_param.key) {
 716	case CCKEY_SRCLINE:
 717		match = match_chain_strings(cnode->srcline, node->srcline);
 718		if (match != MATCH_ERROR)
 719			break;
 720		/* otherwise fall-back to symbol-based comparison below */
 721		__fallthrough;
 722	case CCKEY_FUNCTION:
 723		if (node->sym && cnode->ms.sym) {
 724			/*
 725			 * Compare inlined frames based on their symbol name
 726			 * because different inlined frames will have the same
 727			 * symbol start. Otherwise do a faster comparison based
 728			 * on the symbol start address.
 729			 */
 730			if (cnode->ms.sym->inlined || node->sym->inlined) {
 731				match = match_chain_strings(cnode->ms.sym->name,
 732							    node->sym->name);
 733				if (match != MATCH_ERROR)
 734					break;
 735			} else {
 736				match = match_chain_dso_addresses(cnode->ms.map, cnode->ms.sym->start,
 737								  node->map, node->sym->start);
 738				break;
 739			}
 740		}
 741		/* otherwise fall-back to IP-based comparison below */
 742		__fallthrough;
 743	case CCKEY_ADDRESS:
 744	default:
 745		match = match_chain_dso_addresses(cnode->ms.map, cnode->ip, node->map, node->ip);
 746		break;
 747	}
 748
 749	if (match == MATCH_EQ && node->branch) {
 750		cnode->branch_count++;
 751
 752		if (node->branch_from) {
 753			/*
 754			 * It's "to" of a branch
 755			 */
 756			cnode->brtype_stat.branch_to = true;
 
 
 
 
 
 
 
 757
 758			if (node->branch_flags.predicted)
 759				cnode->predicted_count++;
 760
 761			if (node->branch_flags.abort)
 762				cnode->abort_count++;
 763
 764			branch_type_count(&cnode->brtype_stat,
 765					  &node->branch_flags,
 766					  node->branch_from,
 767					  node->ip);
 768		} else {
 769			/*
 770			 * It's "from" of a branch
 771			 */
 772			cnode->brtype_stat.branch_to = false;
 
 773			cnode->cycles_count += node->branch_flags.cycles;
 774			cnode->iter_count += node->nr_loop_iter;
 775			cnode->iter_cycles += node->iter_cycles;
 776			cnode->from_count++;
 777		}
 778	}
 779
 780	return match;
 781}
 782
 783/*
 784 * Split the parent in two parts (a new child is created) and
 785 * give a part of its callchain to the created child.
 786 * Then create another child to host the given callchain of new branch
 787 */
 788static int
 789split_add_child(struct callchain_node *parent,
 790		struct callchain_cursor *cursor,
 791		struct callchain_list *to_split,
 792		u64 idx_parents, u64 idx_local, u64 period)
 793{
 794	struct callchain_node *new;
 795	struct list_head *old_tail;
 796	unsigned int idx_total = idx_parents + idx_local;
 797
 798	/* split */
 799	new = create_child(parent, true);
 800	if (new == NULL)
 801		return -1;
 802
 803	/* split the callchain and move a part to the new child */
 804	old_tail = parent->val.prev;
 805	list_del_range(&to_split->list, old_tail);
 806	new->val.next = &to_split->list;
 807	new->val.prev = old_tail;
 808	to_split->list.prev = &new->val;
 809	old_tail->next = &new->val;
 810
 811	/* split the hits */
 812	new->hit = parent->hit;
 813	new->children_hit = parent->children_hit;
 814	parent->children_hit = callchain_cumul_hits(new);
 815	new->val_nr = parent->val_nr - idx_local;
 816	parent->val_nr = idx_local;
 817	new->count = parent->count;
 818	new->children_count = parent->children_count;
 819	parent->children_count = callchain_cumul_counts(new);
 820
 821	/* create a new child for the new branch if any */
 822	if (idx_total < cursor->nr) {
 823		struct callchain_node *first;
 824		struct callchain_list *cnode;
 825		struct callchain_cursor_node *node;
 826		struct rb_node *p, **pp;
 827
 828		parent->hit = 0;
 829		parent->children_hit += period;
 830		parent->count = 0;
 831		parent->children_count += 1;
 832
 833		node = callchain_cursor_current(cursor);
 834		new = add_child(parent, cursor, period);
 835		if (new == NULL)
 836			return -1;
 837
 838		/*
 839		 * This is second child since we moved parent's children
 840		 * to new (first) child above.
 841		 */
 842		p = parent->rb_root_in.rb_node;
 843		first = rb_entry(p, struct callchain_node, rb_node_in);
 844		cnode = list_first_entry(&first->val, struct callchain_list,
 845					 list);
 846
 847		if (match_chain(node, cnode) == MATCH_LT)
 848			pp = &p->rb_left;
 849		else
 850			pp = &p->rb_right;
 851
 852		rb_link_node(&new->rb_node_in, p, pp);
 853		rb_insert_color(&new->rb_node_in, &parent->rb_root_in);
 854	} else {
 855		parent->hit = period;
 856		parent->count = 1;
 857	}
 858	return 0;
 859}
 860
 861static enum match_result
 862append_chain(struct callchain_node *root,
 863	     struct callchain_cursor *cursor,
 864	     u64 period);
 865
 866static int
 867append_chain_children(struct callchain_node *root,
 868		      struct callchain_cursor *cursor,
 869		      u64 period)
 870{
 871	struct callchain_node *rnode;
 872	struct callchain_cursor_node *node;
 873	struct rb_node **p = &root->rb_root_in.rb_node;
 874	struct rb_node *parent = NULL;
 875
 876	node = callchain_cursor_current(cursor);
 877	if (!node)
 878		return -1;
 879
 880	/* lookup in childrens */
 881	while (*p) {
 882		enum match_result ret;
 883
 884		parent = *p;
 885		rnode = rb_entry(parent, struct callchain_node, rb_node_in);
 886
 887		/* If at least first entry matches, rely to children */
 888		ret = append_chain(rnode, cursor, period);
 889		if (ret == MATCH_EQ)
 890			goto inc_children_hit;
 891		if (ret == MATCH_ERROR)
 892			return -1;
 893
 894		if (ret == MATCH_LT)
 895			p = &parent->rb_left;
 896		else
 897			p = &parent->rb_right;
 898	}
 899	/* nothing in children, add to the current node */
 900	rnode = add_child(root, cursor, period);
 901	if (rnode == NULL)
 902		return -1;
 903
 904	rb_link_node(&rnode->rb_node_in, parent, p);
 905	rb_insert_color(&rnode->rb_node_in, &root->rb_root_in);
 906
 907inc_children_hit:
 908	root->children_hit += period;
 909	root->children_count++;
 910	return 0;
 911}
 912
 913static enum match_result
 914append_chain(struct callchain_node *root,
 915	     struct callchain_cursor *cursor,
 916	     u64 period)
 917{
 918	struct callchain_list *cnode;
 919	u64 start = cursor->pos;
 920	bool found = false;
 921	u64 matches;
 922	enum match_result cmp = MATCH_ERROR;
 923
 924	/*
 925	 * Lookup in the current node
 926	 * If we have a symbol, then compare the start to match
 927	 * anywhere inside a function, unless function
 928	 * mode is disabled.
 929	 */
 930	list_for_each_entry(cnode, &root->val, list) {
 931		struct callchain_cursor_node *node;
 932
 933		node = callchain_cursor_current(cursor);
 934		if (!node)
 935			break;
 936
 937		cmp = match_chain(node, cnode);
 938		if (cmp != MATCH_EQ)
 939			break;
 940
 941		found = true;
 942
 943		callchain_cursor_advance(cursor);
 944	}
 945
 946	/* matches not, relay no the parent */
 947	if (!found) {
 948		WARN_ONCE(cmp == MATCH_ERROR, "Chain comparison error\n");
 949		return cmp;
 950	}
 951
 952	matches = cursor->pos - start;
 953
 954	/* we match only a part of the node. Split it and add the new chain */
 955	if (matches < root->val_nr) {
 956		if (split_add_child(root, cursor, cnode, start, matches,
 957				    period) < 0)
 958			return MATCH_ERROR;
 959
 960		return MATCH_EQ;
 961	}
 962
 963	/* we match 100% of the path, increment the hit */
 964	if (matches == root->val_nr && cursor->pos == cursor->nr) {
 965		root->hit += period;
 966		root->count++;
 967		return MATCH_EQ;
 968	}
 969
 970	/* We match the node and still have a part remaining */
 971	if (append_chain_children(root, cursor, period) < 0)
 972		return MATCH_ERROR;
 973
 974	return MATCH_EQ;
 975}
 976
 977int callchain_append(struct callchain_root *root,
 978		     struct callchain_cursor *cursor,
 979		     u64 period)
 980{
 
 
 
 981	if (!cursor->nr)
 982		return 0;
 983
 984	callchain_cursor_commit(cursor);
 985
 986	if (append_chain_children(&root->node, cursor, period) < 0)
 987		return -1;
 988
 989	if (cursor->nr > root->max_depth)
 990		root->max_depth = cursor->nr;
 991
 992	return 0;
 993}
 994
 995static int
 996merge_chain_branch(struct callchain_cursor *cursor,
 997		   struct callchain_node *dst, struct callchain_node *src)
 998{
 999	struct callchain_cursor_node **old_last = cursor->last;
1000	struct callchain_node *child;
1001	struct callchain_list *list, *next_list;
1002	struct rb_node *n;
1003	int old_pos = cursor->nr;
1004	int err = 0;
1005
1006	list_for_each_entry_safe(list, next_list, &src->val, list) {
1007		callchain_cursor_append(cursor, list->ip,
1008					list->ms.map, list->ms.sym,
1009					false, NULL, 0, 0, 0, list->srcline);
 
 
1010		list_del_init(&list->list);
1011		map__zput(list->ms.map);
 
 
1012		free(list);
1013	}
1014
1015	if (src->hit) {
1016		callchain_cursor_commit(cursor);
1017		if (append_chain_children(dst, cursor, src->hit) < 0)
1018			return -1;
1019	}
1020
1021	n = rb_first(&src->rb_root_in);
1022	while (n) {
1023		child = container_of(n, struct callchain_node, rb_node_in);
1024		n = rb_next(n);
1025		rb_erase(&child->rb_node_in, &src->rb_root_in);
1026
1027		err = merge_chain_branch(cursor, dst, child);
1028		if (err)
1029			break;
1030
1031		free(child);
1032	}
1033
1034	cursor->nr = old_pos;
1035	cursor->last = old_last;
1036
1037	return err;
1038}
1039
1040int callchain_merge(struct callchain_cursor *cursor,
1041		    struct callchain_root *dst, struct callchain_root *src)
1042{
1043	return merge_chain_branch(cursor, &dst->node, &src->node);
1044}
1045
1046int callchain_cursor_append(struct callchain_cursor *cursor,
1047			    u64 ip, struct map *map, struct symbol *sym,
1048			    bool branch, struct branch_flags *flags,
1049			    int nr_loop_iter, u64 iter_cycles, u64 branch_from,
1050			    const char *srcline)
1051{
1052	struct callchain_cursor_node *node = *cursor->last;
1053
1054	if (!node) {
1055		node = calloc(1, sizeof(*node));
1056		if (!node)
1057			return -ENOMEM;
1058
1059		*cursor->last = node;
1060	}
1061
1062	node->ip = ip;
1063	map__zput(node->map);
1064	node->map = map__get(map);
1065	node->sym = sym;
 
1066	node->branch = branch;
1067	node->nr_loop_iter = nr_loop_iter;
1068	node->iter_cycles = iter_cycles;
1069	node->srcline = srcline;
1070
1071	if (flags)
1072		memcpy(&node->branch_flags, flags,
1073			sizeof(struct branch_flags));
1074
1075	node->branch_from = branch_from;
1076	cursor->nr++;
1077
1078	cursor->last = &node->next;
1079
1080	return 0;
1081}
1082
1083int sample__resolve_callchain(struct perf_sample *sample,
1084			      struct callchain_cursor *cursor, struct symbol **parent,
1085			      struct evsel *evsel, struct addr_location *al,
1086			      int max_stack)
1087{
1088	if (sample->callchain == NULL && !symbol_conf.show_branchflag_count)
1089		return 0;
1090
1091	if (symbol_conf.use_callchain || symbol_conf.cumulate_callchain ||
1092	    perf_hpp_list.parent || symbol_conf.show_branchflag_count) {
1093		return thread__resolve_callchain(al->thread, cursor, evsel, sample,
1094						 parent, al, max_stack);
1095	}
1096	return 0;
1097}
1098
1099int hist_entry__append_callchain(struct hist_entry *he, struct perf_sample *sample)
1100{
1101	if ((!symbol_conf.use_callchain || sample->callchain == NULL) &&
1102		!symbol_conf.show_branchflag_count)
1103		return 0;
1104	return callchain_append(he->callchain, &callchain_cursor, sample->period);
1105}
1106
1107int fill_callchain_info(struct addr_location *al, struct callchain_cursor_node *node,
1108			bool hide_unresolved)
1109{
1110	al->map = node->map;
1111	al->sym = node->sym;
 
 
 
 
 
1112	al->srcline = node->srcline;
1113	al->addr = node->ip;
1114
1115	if (al->sym == NULL) {
1116		if (hide_unresolved)
1117			return 0;
1118		if (al->map == NULL)
1119			goto out;
1120	}
1121
1122	if (al->map->groups == &al->machine->kmaps) {
1123		if (machine__is_host(al->machine)) {
1124			al->cpumode = PERF_RECORD_MISC_KERNEL;
1125			al->level = 'k';
1126		} else {
1127			al->cpumode = PERF_RECORD_MISC_GUEST_KERNEL;
1128			al->level = 'g';
1129		}
1130	} else {
1131		if (machine__is_host(al->machine)) {
1132			al->cpumode = PERF_RECORD_MISC_USER;
1133			al->level = '.';
1134		} else if (perf_guest) {
1135			al->cpumode = PERF_RECORD_MISC_GUEST_USER;
1136			al->level = 'u';
1137		} else {
1138			al->cpumode = PERF_RECORD_MISC_HYPERVISOR;
1139			al->level = 'H';
1140		}
1141	}
1142
1143out:
1144	return 1;
1145}
1146
1147char *callchain_list__sym_name(struct callchain_list *cl,
1148			       char *bf, size_t bfsize, bool show_dso)
1149{
1150	bool show_addr = callchain_param.key == CCKEY_ADDRESS;
1151	bool show_srcline = show_addr || callchain_param.key == CCKEY_SRCLINE;
1152	int printed;
1153
1154	if (cl->ms.sym) {
1155		const char *inlined = cl->ms.sym->inlined ? " (inlined)" : "";
1156
1157		if (show_srcline && cl->srcline)
1158			printed = scnprintf(bf, bfsize, "%s %s%s",
1159					    cl->ms.sym->name, cl->srcline,
1160					    inlined);
1161		else
1162			printed = scnprintf(bf, bfsize, "%s%s",
1163					    cl->ms.sym->name, inlined);
1164	} else
1165		printed = scnprintf(bf, bfsize, "%#" PRIx64, cl->ip);
1166
1167	if (show_dso)
1168		scnprintf(bf + printed, bfsize - printed, " %s",
1169			  cl->ms.map ?
1170			  cl->ms.map->dso->short_name :
1171			  "unknown");
1172
1173	return bf;
1174}
1175
1176char *callchain_node__scnprintf_value(struct callchain_node *node,
1177				      char *bf, size_t bfsize, u64 total)
1178{
1179	double percent = 0.0;
1180	u64 period = callchain_cumul_hits(node);
1181	unsigned count = callchain_cumul_counts(node);
1182
1183	if (callchain_param.mode == CHAIN_FOLDED) {
1184		period = node->hit;
1185		count = node->count;
1186	}
1187
1188	switch (callchain_param.value) {
1189	case CCVAL_PERIOD:
1190		scnprintf(bf, bfsize, "%"PRIu64, period);
1191		break;
1192	case CCVAL_COUNT:
1193		scnprintf(bf, bfsize, "%u", count);
1194		break;
1195	case CCVAL_PERCENT:
1196	default:
1197		if (total)
1198			percent = period * 100.0 / total;
1199		scnprintf(bf, bfsize, "%.2f%%", percent);
1200		break;
1201	}
1202	return bf;
1203}
1204
1205int callchain_node__fprintf_value(struct callchain_node *node,
1206				 FILE *fp, u64 total)
1207{
1208	double percent = 0.0;
1209	u64 period = callchain_cumul_hits(node);
1210	unsigned count = callchain_cumul_counts(node);
1211
1212	if (callchain_param.mode == CHAIN_FOLDED) {
1213		period = node->hit;
1214		count = node->count;
1215	}
1216
1217	switch (callchain_param.value) {
1218	case CCVAL_PERIOD:
1219		return fprintf(fp, "%"PRIu64, period);
1220	case CCVAL_COUNT:
1221		return fprintf(fp, "%u", count);
1222	case CCVAL_PERCENT:
1223	default:
1224		if (total)
1225			percent = period * 100.0 / total;
1226		return percent_color_fprintf(fp, "%.2f%%", percent);
1227	}
1228	return 0;
1229}
1230
1231static void callchain_counts_value(struct callchain_node *node,
1232				   u64 *branch_count, u64 *predicted_count,
1233				   u64 *abort_count, u64 *cycles_count)
1234{
1235	struct callchain_list *clist;
1236
1237	list_for_each_entry(clist, &node->val, list) {
1238		if (branch_count)
1239			*branch_count += clist->branch_count;
1240
1241		if (predicted_count)
1242			*predicted_count += clist->predicted_count;
1243
1244		if (abort_count)
1245			*abort_count += clist->abort_count;
1246
1247		if (cycles_count)
1248			*cycles_count += clist->cycles_count;
1249	}
1250}
1251
1252static int callchain_node_branch_counts_cumul(struct callchain_node *node,
1253					      u64 *branch_count,
1254					      u64 *predicted_count,
1255					      u64 *abort_count,
1256					      u64 *cycles_count)
1257{
1258	struct callchain_node *child;
1259	struct rb_node *n;
1260
1261	n = rb_first(&node->rb_root_in);
1262	while (n) {
1263		child = rb_entry(n, struct callchain_node, rb_node_in);
1264		n = rb_next(n);
1265
1266		callchain_node_branch_counts_cumul(child, branch_count,
1267						   predicted_count,
1268						   abort_count,
1269						   cycles_count);
1270
1271		callchain_counts_value(child, branch_count,
1272				       predicted_count, abort_count,
1273				       cycles_count);
1274	}
1275
1276	return 0;
1277}
1278
1279int callchain_branch_counts(struct callchain_root *root,
1280			    u64 *branch_count, u64 *predicted_count,
1281			    u64 *abort_count, u64 *cycles_count)
1282{
1283	if (branch_count)
1284		*branch_count = 0;
1285
1286	if (predicted_count)
1287		*predicted_count = 0;
1288
1289	if (abort_count)
1290		*abort_count = 0;
1291
1292	if (cycles_count)
1293		*cycles_count = 0;
1294
1295	return callchain_node_branch_counts_cumul(&root->node,
1296						  branch_count,
1297						  predicted_count,
1298						  abort_count,
1299						  cycles_count);
1300}
1301
1302static int count_pri64_printf(int idx, const char *str, u64 value, char *bf, int bfsize)
1303{
1304	int printed;
1305
1306	printed = scnprintf(bf, bfsize, "%s%s:%" PRId64 "", (idx) ? " " : " (", str, value);
1307
1308	return printed;
1309}
1310
1311static int count_float_printf(int idx, const char *str, float value,
1312			      char *bf, int bfsize, float threshold)
1313{
1314	int printed;
1315
1316	if (threshold != 0.0 && value < threshold)
1317		return 0;
1318
1319	printed = scnprintf(bf, bfsize, "%s%s:%.1f%%", (idx) ? " " : " (", str, value);
1320
1321	return printed;
1322}
1323
1324static int branch_to_str(char *bf, int bfsize,
1325			 u64 branch_count, u64 predicted_count,
1326			 u64 abort_count,
1327			 struct branch_type_stat *brtype_stat)
1328{
1329	int printed, i = 0;
1330
1331	printed = branch_type_str(brtype_stat, bf, bfsize);
1332	if (printed)
1333		i++;
1334
1335	if (predicted_count < branch_count) {
1336		printed += count_float_printf(i++, "predicted",
1337				predicted_count * 100.0 / branch_count,
1338				bf + printed, bfsize - printed, 0.0);
1339	}
1340
1341	if (abort_count) {
1342		printed += count_float_printf(i++, "abort",
1343				abort_count * 100.0 / branch_count,
1344				bf + printed, bfsize - printed, 0.1);
1345	}
1346
1347	if (i)
1348		printed += scnprintf(bf + printed, bfsize - printed, ")");
1349
1350	return printed;
1351}
1352
1353static int branch_from_str(char *bf, int bfsize,
1354			   u64 branch_count,
1355			   u64 cycles_count, u64 iter_count,
1356			   u64 iter_cycles, u64 from_count)
1357{
1358	int printed = 0, i = 0;
1359	u64 cycles, v = 0;
1360
1361	cycles = cycles_count / branch_count;
1362	if (cycles) {
1363		printed += count_pri64_printf(i++, "cycles",
1364				cycles,
1365				bf + printed, bfsize - printed);
1366	}
1367
1368	if (iter_count && from_count) {
1369		v = iter_count / from_count;
1370		if (v) {
1371			printed += count_pri64_printf(i++, "iter",
1372					v, bf + printed, bfsize - printed);
1373
1374			printed += count_pri64_printf(i++, "avg_cycles",
1375					iter_cycles / iter_count,
1376					bf + printed, bfsize - printed);
1377		}
1378	}
1379
1380	if (i)
1381		printed += scnprintf(bf + printed, bfsize - printed, ")");
1382
1383	return printed;
1384}
1385
1386static int counts_str_build(char *bf, int bfsize,
1387			     u64 branch_count, u64 predicted_count,
1388			     u64 abort_count, u64 cycles_count,
1389			     u64 iter_count, u64 iter_cycles,
1390			     u64 from_count,
1391			     struct branch_type_stat *brtype_stat)
1392{
1393	int printed;
1394
1395	if (branch_count == 0)
1396		return scnprintf(bf, bfsize, " (calltrace)");
1397
1398	if (brtype_stat->branch_to) {
1399		printed = branch_to_str(bf, bfsize, branch_count,
1400				predicted_count, abort_count, brtype_stat);
1401	} else {
1402		printed = branch_from_str(bf, bfsize, branch_count,
1403				cycles_count, iter_count, iter_cycles,
1404				from_count);
1405	}
1406
1407	if (!printed)
1408		bf[0] = 0;
1409
1410	return printed;
1411}
1412
1413static int callchain_counts_printf(FILE *fp, char *bf, int bfsize,
1414				   u64 branch_count, u64 predicted_count,
1415				   u64 abort_count, u64 cycles_count,
1416				   u64 iter_count, u64 iter_cycles,
1417				   u64 from_count,
1418				   struct branch_type_stat *brtype_stat)
1419{
1420	char str[256];
1421
1422	counts_str_build(str, sizeof(str), branch_count,
1423			 predicted_count, abort_count, cycles_count,
1424			 iter_count, iter_cycles, from_count, brtype_stat);
1425
1426	if (fp)
1427		return fprintf(fp, "%s", str);
1428
1429	return scnprintf(bf, bfsize, "%s", str);
1430}
1431
1432int callchain_list_counts__printf_value(struct callchain_list *clist,
1433					FILE *fp, char *bf, int bfsize)
1434{
 
 
1435	u64 branch_count, predicted_count;
1436	u64 abort_count, cycles_count;
1437	u64 iter_count, iter_cycles;
1438	u64 from_count;
1439
 
1440	branch_count = clist->branch_count;
1441	predicted_count = clist->predicted_count;
1442	abort_count = clist->abort_count;
1443	cycles_count = clist->cycles_count;
1444	iter_count = clist->iter_count;
1445	iter_cycles = clist->iter_cycles;
1446	from_count = clist->from_count;
1447
1448	return callchain_counts_printf(fp, bf, bfsize, branch_count,
1449				       predicted_count, abort_count,
1450				       cycles_count, iter_count, iter_cycles,
1451				       from_count, &clist->brtype_stat);
1452}
1453
1454static void free_callchain_node(struct callchain_node *node)
1455{
1456	struct callchain_list *list, *tmp;
1457	struct callchain_node *child;
1458	struct rb_node *n;
1459
1460	list_for_each_entry_safe(list, tmp, &node->parent_val, list) {
1461		list_del_init(&list->list);
1462		map__zput(list->ms.map);
 
1463		free(list);
1464	}
1465
1466	list_for_each_entry_safe(list, tmp, &node->val, list) {
1467		list_del_init(&list->list);
1468		map__zput(list->ms.map);
 
1469		free(list);
1470	}
1471
1472	n = rb_first(&node->rb_root_in);
1473	while (n) {
1474		child = container_of(n, struct callchain_node, rb_node_in);
1475		n = rb_next(n);
1476		rb_erase(&child->rb_node_in, &node->rb_root_in);
1477
1478		free_callchain_node(child);
1479		free(child);
1480	}
1481}
1482
1483void free_callchain(struct callchain_root *root)
1484{
1485	if (!symbol_conf.use_callchain)
1486		return;
1487
1488	free_callchain_node(&root->node);
1489}
1490
1491static u64 decay_callchain_node(struct callchain_node *node)
1492{
1493	struct callchain_node *child;
1494	struct rb_node *n;
1495	u64 child_hits = 0;
1496
1497	n = rb_first(&node->rb_root_in);
1498	while (n) {
1499		child = container_of(n, struct callchain_node, rb_node_in);
1500
1501		child_hits += decay_callchain_node(child);
1502		n = rb_next(n);
1503	}
1504
1505	node->hit = (node->hit * 7) / 8;
1506	node->children_hit = child_hits;
1507
1508	return node->hit;
1509}
1510
1511void decay_callchain(struct callchain_root *root)
1512{
1513	if (!symbol_conf.use_callchain)
1514		return;
1515
1516	decay_callchain_node(&root->node);
1517}
1518
1519int callchain_node__make_parent_list(struct callchain_node *node)
1520{
1521	struct callchain_node *parent = node->parent;
1522	struct callchain_list *chain, *new;
1523	LIST_HEAD(head);
1524
1525	while (parent) {
1526		list_for_each_entry_reverse(chain, &parent->val, list) {
1527			new = malloc(sizeof(*new));
1528			if (new == NULL)
1529				goto out;
1530			*new = *chain;
1531			new->has_children = false;
1532			map__get(new->ms.map);
1533			list_add_tail(&new->list, &head);
1534		}
1535		parent = parent->parent;
1536	}
1537
1538	list_for_each_entry_safe_reverse(chain, new, &head, list)
1539		list_move_tail(&chain->list, &node->parent_val);
1540
1541	if (!list_empty(&node->parent_val)) {
1542		chain = list_first_entry(&node->parent_val, struct callchain_list, list);
1543		chain->has_children = rb_prev(&node->rb_node) || rb_next(&node->rb_node);
1544
1545		chain = list_first_entry(&node->val, struct callchain_list, list);
1546		chain->has_children = false;
1547	}
1548	return 0;
1549
1550out:
1551	list_for_each_entry_safe(chain, new, &head, list) {
1552		list_del_init(&chain->list);
1553		map__zput(chain->ms.map);
 
1554		free(chain);
1555	}
1556	return -ENOMEM;
1557}
1558
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1559int callchain_cursor__copy(struct callchain_cursor *dst,
1560			   struct callchain_cursor *src)
1561{
1562	int rc = 0;
1563
1564	callchain_cursor_reset(dst);
1565	callchain_cursor_commit(src);
1566
1567	while (true) {
1568		struct callchain_cursor_node *node;
1569
1570		node = callchain_cursor_current(src);
1571		if (node == NULL)
1572			break;
1573
1574		rc = callchain_cursor_append(dst, node->ip, node->map, node->sym,
1575					     node->branch, &node->branch_flags,
1576					     node->nr_loop_iter,
1577					     node->iter_cycles,
1578					     node->branch_from, node->srcline);
1579		if (rc)
1580			break;
1581
1582		callchain_cursor_advance(src);
1583	}
1584
1585	return rc;
1586}
1587
1588/*
1589 * Initialize a cursor before adding entries inside, but keep
1590 * the previously allocated entries as a cache.
1591 */
1592void callchain_cursor_reset(struct callchain_cursor *cursor)
1593{
1594	struct callchain_cursor_node *node;
1595
1596	cursor->nr = 0;
1597	cursor->last = &cursor->first;
1598
1599	for (node = cursor->first; node != NULL; node = node->next)
1600		map__zput(node->map);
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1601}
v6.8
   1// SPDX-License-Identifier: GPL-2.0
   2/*
   3 * Copyright (C) 2009-2011, Frederic Weisbecker <fweisbec@gmail.com>
   4 *
   5 * Handle the callchains from the stream in an ad-hoc radix tree and then
   6 * sort them in an rbtree.
   7 *
   8 * Using a radix for code path provides a fast retrieval and factorizes
   9 * memory use. Also that lets us use the paths in a hierarchical graph view.
  10 *
  11 */
  12
  13#include <inttypes.h>
  14#include <stdlib.h>
  15#include <stdio.h>
  16#include <stdbool.h>
  17#include <errno.h>
  18#include <math.h>
  19#include <linux/string.h>
  20#include <linux/zalloc.h>
  21
  22#include "asm/bug.h"
  23
  24#include "debug.h"
  25#include "dso.h"
  26#include "event.h"
  27#include "hist.h"
  28#include "sort.h"
  29#include "machine.h"
  30#include "map.h"
  31#include "callchain.h"
  32#include "branch.h"
  33#include "symbol.h"
  34#include "util.h"
  35#include "../perf.h"
  36
  37#define CALLCHAIN_PARAM_DEFAULT			\
  38	.mode		= CHAIN_GRAPH_ABS,	\
  39	.min_percent	= 0.5,			\
  40	.order		= ORDER_CALLEE,		\
  41	.key		= CCKEY_FUNCTION,	\
  42	.value		= CCVAL_PERCENT,	\
  43
  44struct callchain_param callchain_param = {
  45	CALLCHAIN_PARAM_DEFAULT
  46};
  47
  48/*
  49 * Are there any events usind DWARF callchains?
  50 *
  51 * I.e.
  52 *
  53 * -e cycles/call-graph=dwarf/
  54 */
  55bool dwarf_callchain_users;
  56
  57struct callchain_param callchain_param_default = {
  58	CALLCHAIN_PARAM_DEFAULT
  59};
  60
  61/* Used for thread-local struct callchain_cursor. */
  62static pthread_key_t callchain_cursor;
  63
  64int parse_callchain_record_opt(const char *arg, struct callchain_param *param)
  65{
  66	return parse_callchain_record(arg, param);
  67}
  68
  69static int parse_callchain_mode(const char *value)
  70{
  71	if (!strncmp(value, "graph", strlen(value))) {
  72		callchain_param.mode = CHAIN_GRAPH_ABS;
  73		return 0;
  74	}
  75	if (!strncmp(value, "flat", strlen(value))) {
  76		callchain_param.mode = CHAIN_FLAT;
  77		return 0;
  78	}
  79	if (!strncmp(value, "fractal", strlen(value))) {
  80		callchain_param.mode = CHAIN_GRAPH_REL;
  81		return 0;
  82	}
  83	if (!strncmp(value, "folded", strlen(value))) {
  84		callchain_param.mode = CHAIN_FOLDED;
  85		return 0;
  86	}
  87	return -1;
  88}
  89
  90static int parse_callchain_order(const char *value)
  91{
  92	if (!strncmp(value, "caller", strlen(value))) {
  93		callchain_param.order = ORDER_CALLER;
  94		callchain_param.order_set = true;
  95		return 0;
  96	}
  97	if (!strncmp(value, "callee", strlen(value))) {
  98		callchain_param.order = ORDER_CALLEE;
  99		callchain_param.order_set = true;
 100		return 0;
 101	}
 102	return -1;
 103}
 104
 105static int parse_callchain_sort_key(const char *value)
 106{
 107	if (!strncmp(value, "function", strlen(value))) {
 108		callchain_param.key = CCKEY_FUNCTION;
 109		return 0;
 110	}
 111	if (!strncmp(value, "address", strlen(value))) {
 112		callchain_param.key = CCKEY_ADDRESS;
 113		return 0;
 114	}
 115	if (!strncmp(value, "srcline", strlen(value))) {
 116		callchain_param.key = CCKEY_SRCLINE;
 117		return 0;
 118	}
 119	if (!strncmp(value, "branch", strlen(value))) {
 120		callchain_param.branch_callstack = 1;
 121		return 0;
 122	}
 123	return -1;
 124}
 125
 126static int parse_callchain_value(const char *value)
 127{
 128	if (!strncmp(value, "percent", strlen(value))) {
 129		callchain_param.value = CCVAL_PERCENT;
 130		return 0;
 131	}
 132	if (!strncmp(value, "period", strlen(value))) {
 133		callchain_param.value = CCVAL_PERIOD;
 134		return 0;
 135	}
 136	if (!strncmp(value, "count", strlen(value))) {
 137		callchain_param.value = CCVAL_COUNT;
 138		return 0;
 139	}
 140	return -1;
 141}
 142
 143static int get_stack_size(const char *str, unsigned long *_size)
 144{
 145	char *endptr;
 146	unsigned long size;
 147	unsigned long max_size = round_down(USHRT_MAX, sizeof(u64));
 148
 149	size = strtoul(str, &endptr, 0);
 150
 151	do {
 152		if (*endptr)
 153			break;
 154
 155		size = round_up(size, sizeof(u64));
 156		if (!size || size > max_size)
 157			break;
 158
 159		*_size = size;
 160		return 0;
 161
 162	} while (0);
 163
 164	pr_err("callchain: Incorrect stack dump size (max %ld): %s\n",
 165	       max_size, str);
 166	return -1;
 167}
 168
 169static int
 170__parse_callchain_report_opt(const char *arg, bool allow_record_opt)
 171{
 172	char *tok;
 173	char *endptr, *saveptr = NULL;
 174	bool minpcnt_set = false;
 175	bool record_opt_set = false;
 176	bool try_stack_size = false;
 177
 178	callchain_param.enabled = true;
 179	symbol_conf.use_callchain = true;
 180
 181	if (!arg)
 182		return 0;
 183
 184	while ((tok = strtok_r((char *)arg, ",", &saveptr)) != NULL) {
 185		if (!strncmp(tok, "none", strlen(tok))) {
 186			callchain_param.mode = CHAIN_NONE;
 187			callchain_param.enabled = false;
 188			symbol_conf.use_callchain = false;
 189			return 0;
 190		}
 191
 192		if (!parse_callchain_mode(tok) ||
 193		    !parse_callchain_order(tok) ||
 194		    !parse_callchain_sort_key(tok) ||
 195		    !parse_callchain_value(tok)) {
 196			/* parsing ok - move on to the next */
 197			try_stack_size = false;
 198			goto next;
 199		} else if (allow_record_opt && !record_opt_set) {
 200			if (parse_callchain_record(tok, &callchain_param))
 201				goto try_numbers;
 202
 203			/* assume that number followed by 'dwarf' is stack size */
 204			if (callchain_param.record_mode == CALLCHAIN_DWARF)
 205				try_stack_size = true;
 206
 207			record_opt_set = true;
 208			goto next;
 209		}
 210
 211try_numbers:
 212		if (try_stack_size) {
 213			unsigned long size = 0;
 214
 215			if (get_stack_size(tok, &size) < 0)
 216				return -1;
 217			callchain_param.dump_size = size;
 218			try_stack_size = false;
 219		} else if (!minpcnt_set) {
 220			/* try to get the min percent */
 221			callchain_param.min_percent = strtod(tok, &endptr);
 222			if (tok == endptr)
 223				return -1;
 224			minpcnt_set = true;
 225		} else {
 226			/* try print limit at last */
 227			callchain_param.print_limit = strtoul(tok, &endptr, 0);
 228			if (tok == endptr)
 229				return -1;
 230		}
 231next:
 232		arg = NULL;
 233	}
 234
 235	if (callchain_register_param(&callchain_param) < 0) {
 236		pr_err("Can't register callchain params\n");
 237		return -1;
 238	}
 239	return 0;
 240}
 241
 242int parse_callchain_report_opt(const char *arg)
 243{
 244	return __parse_callchain_report_opt(arg, false);
 245}
 246
 247int parse_callchain_top_opt(const char *arg)
 248{
 249	return __parse_callchain_report_opt(arg, true);
 250}
 251
 252int parse_callchain_record(const char *arg, struct callchain_param *param)
 253{
 254	char *tok, *name, *saveptr = NULL;
 255	char *buf;
 256	int ret = -1;
 257
 258	/* We need buffer that we know we can write to. */
 259	buf = malloc(strlen(arg) + 1);
 260	if (!buf)
 261		return -ENOMEM;
 262
 263	strcpy(buf, arg);
 264
 265	tok = strtok_r((char *)buf, ",", &saveptr);
 266	name = tok ? : (char *)buf;
 267
 268	do {
 269		/* Framepointer style */
 270		if (!strncmp(name, "fp", sizeof("fp"))) {
 271			ret = 0;
 272			param->record_mode = CALLCHAIN_FP;
 273
 274			tok = strtok_r(NULL, ",", &saveptr);
 275			if (tok) {
 276				unsigned long size;
 277
 278				size = strtoul(tok, &name, 0);
 279				if (size < (unsigned) sysctl__max_stack())
 280					param->max_stack = size;
 281			}
 282			break;
 283
 284		/* Dwarf style */
 285		} else if (!strncmp(name, "dwarf", sizeof("dwarf"))) {
 286			const unsigned long default_stack_dump_size = 8192;
 287
 288			ret = 0;
 289			param->record_mode = CALLCHAIN_DWARF;
 290			param->dump_size = default_stack_dump_size;
 291			dwarf_callchain_users = true;
 292
 293			tok = strtok_r(NULL, ",", &saveptr);
 294			if (tok) {
 295				unsigned long size = 0;
 296
 297				ret = get_stack_size(tok, &size);
 298				param->dump_size = size;
 299			}
 300		} else if (!strncmp(name, "lbr", sizeof("lbr"))) {
 301			if (!strtok_r(NULL, ",", &saveptr)) {
 302				param->record_mode = CALLCHAIN_LBR;
 303				ret = 0;
 304			} else
 305				pr_err("callchain: No more arguments "
 306					"needed for --call-graph lbr\n");
 307			break;
 308		} else {
 309			pr_err("callchain: Unknown --call-graph option "
 310			       "value: %s\n", arg);
 311			break;
 312		}
 313
 314	} while (0);
 315
 316	free(buf);
 317	return ret;
 318}
 319
 320int perf_callchain_config(const char *var, const char *value)
 321{
 322	char *endptr;
 323
 324	if (!strstarts(var, "call-graph."))
 325		return 0;
 326	var += sizeof("call-graph.") - 1;
 327
 328	if (!strcmp(var, "record-mode"))
 329		return parse_callchain_record_opt(value, &callchain_param);
 330	if (!strcmp(var, "dump-size")) {
 331		unsigned long size = 0;
 332		int ret;
 333
 334		ret = get_stack_size(value, &size);
 335		callchain_param.dump_size = size;
 336
 337		return ret;
 338	}
 339	if (!strcmp(var, "print-type")){
 340		int ret;
 341		ret = parse_callchain_mode(value);
 342		if (ret == -1)
 343			pr_err("Invalid callchain mode: %s\n", value);
 344		return ret;
 345	}
 346	if (!strcmp(var, "order")){
 347		int ret;
 348		ret = parse_callchain_order(value);
 349		if (ret == -1)
 350			pr_err("Invalid callchain order: %s\n", value);
 351		return ret;
 352	}
 353	if (!strcmp(var, "sort-key")){
 354		int ret;
 355		ret = parse_callchain_sort_key(value);
 356		if (ret == -1)
 357			pr_err("Invalid callchain sort key: %s\n", value);
 358		return ret;
 359	}
 360	if (!strcmp(var, "threshold")) {
 361		callchain_param.min_percent = strtod(value, &endptr);
 362		if (value == endptr) {
 363			pr_err("Invalid callchain threshold: %s\n", value);
 364			return -1;
 365		}
 366	}
 367	if (!strcmp(var, "print-limit")) {
 368		callchain_param.print_limit = strtod(value, &endptr);
 369		if (value == endptr) {
 370			pr_err("Invalid callchain print limit: %s\n", value);
 371			return -1;
 372		}
 373	}
 374
 375	return 0;
 376}
 377
 378static void
 379rb_insert_callchain(struct rb_root *root, struct callchain_node *chain,
 380		    enum chain_mode mode)
 381{
 382	struct rb_node **p = &root->rb_node;
 383	struct rb_node *parent = NULL;
 384	struct callchain_node *rnode;
 385	u64 chain_cumul = callchain_cumul_hits(chain);
 386
 387	while (*p) {
 388		u64 rnode_cumul;
 389
 390		parent = *p;
 391		rnode = rb_entry(parent, struct callchain_node, rb_node);
 392		rnode_cumul = callchain_cumul_hits(rnode);
 393
 394		switch (mode) {
 395		case CHAIN_FLAT:
 396		case CHAIN_FOLDED:
 397			if (rnode->hit < chain->hit)
 398				p = &(*p)->rb_left;
 399			else
 400				p = &(*p)->rb_right;
 401			break;
 402		case CHAIN_GRAPH_ABS: /* Falldown */
 403		case CHAIN_GRAPH_REL:
 404			if (rnode_cumul < chain_cumul)
 405				p = &(*p)->rb_left;
 406			else
 407				p = &(*p)->rb_right;
 408			break;
 409		case CHAIN_NONE:
 410		default:
 411			break;
 412		}
 413	}
 414
 415	rb_link_node(&chain->rb_node, parent, p);
 416	rb_insert_color(&chain->rb_node, root);
 417}
 418
 419static void
 420__sort_chain_flat(struct rb_root *rb_root, struct callchain_node *node,
 421		  u64 min_hit)
 422{
 423	struct rb_node *n;
 424	struct callchain_node *child;
 425
 426	n = rb_first(&node->rb_root_in);
 427	while (n) {
 428		child = rb_entry(n, struct callchain_node, rb_node_in);
 429		n = rb_next(n);
 430
 431		__sort_chain_flat(rb_root, child, min_hit);
 432	}
 433
 434	if (node->hit && node->hit >= min_hit)
 435		rb_insert_callchain(rb_root, node, CHAIN_FLAT);
 436}
 437
 438/*
 439 * Once we get every callchains from the stream, we can now
 440 * sort them by hit
 441 */
 442static void
 443sort_chain_flat(struct rb_root *rb_root, struct callchain_root *root,
 444		u64 min_hit, struct callchain_param *param __maybe_unused)
 445{
 446	*rb_root = RB_ROOT;
 447	__sort_chain_flat(rb_root, &root->node, min_hit);
 448}
 449
 450static void __sort_chain_graph_abs(struct callchain_node *node,
 451				   u64 min_hit)
 452{
 453	struct rb_node *n;
 454	struct callchain_node *child;
 455
 456	node->rb_root = RB_ROOT;
 457	n = rb_first(&node->rb_root_in);
 458
 459	while (n) {
 460		child = rb_entry(n, struct callchain_node, rb_node_in);
 461		n = rb_next(n);
 462
 463		__sort_chain_graph_abs(child, min_hit);
 464		if (callchain_cumul_hits(child) >= min_hit)
 465			rb_insert_callchain(&node->rb_root, child,
 466					    CHAIN_GRAPH_ABS);
 467	}
 468}
 469
 470static void
 471sort_chain_graph_abs(struct rb_root *rb_root, struct callchain_root *chain_root,
 472		     u64 min_hit, struct callchain_param *param __maybe_unused)
 473{
 474	__sort_chain_graph_abs(&chain_root->node, min_hit);
 475	rb_root->rb_node = chain_root->node.rb_root.rb_node;
 476}
 477
 478static void __sort_chain_graph_rel(struct callchain_node *node,
 479				   double min_percent)
 480{
 481	struct rb_node *n;
 482	struct callchain_node *child;
 483	u64 min_hit;
 484
 485	node->rb_root = RB_ROOT;
 486	min_hit = ceil(node->children_hit * min_percent);
 487
 488	n = rb_first(&node->rb_root_in);
 489	while (n) {
 490		child = rb_entry(n, struct callchain_node, rb_node_in);
 491		n = rb_next(n);
 492
 493		__sort_chain_graph_rel(child, min_percent);
 494		if (callchain_cumul_hits(child) >= min_hit)
 495			rb_insert_callchain(&node->rb_root, child,
 496					    CHAIN_GRAPH_REL);
 497	}
 498}
 499
 500static void
 501sort_chain_graph_rel(struct rb_root *rb_root, struct callchain_root *chain_root,
 502		     u64 min_hit __maybe_unused, struct callchain_param *param)
 503{
 504	__sort_chain_graph_rel(&chain_root->node, param->min_percent / 100.0);
 505	rb_root->rb_node = chain_root->node.rb_root.rb_node;
 506}
 507
 508int callchain_register_param(struct callchain_param *param)
 509{
 510	switch (param->mode) {
 511	case CHAIN_GRAPH_ABS:
 512		param->sort = sort_chain_graph_abs;
 513		break;
 514	case CHAIN_GRAPH_REL:
 515		param->sort = sort_chain_graph_rel;
 516		break;
 517	case CHAIN_FLAT:
 518	case CHAIN_FOLDED:
 519		param->sort = sort_chain_flat;
 520		break;
 521	case CHAIN_NONE:
 522	default:
 523		return -1;
 524	}
 525	return 0;
 526}
 527
 528/*
 529 * Create a child for a parent. If inherit_children, then the new child
 530 * will become the new parent of it's parent children
 531 */
 532static struct callchain_node *
 533create_child(struct callchain_node *parent, bool inherit_children)
 534{
 535	struct callchain_node *new;
 536
 537	new = zalloc(sizeof(*new));
 538	if (!new) {
 539		perror("not enough memory to create child for code path tree");
 540		return NULL;
 541	}
 542	new->parent = parent;
 543	INIT_LIST_HEAD(&new->val);
 544	INIT_LIST_HEAD(&new->parent_val);
 545
 546	if (inherit_children) {
 547		struct rb_node *n;
 548		struct callchain_node *child;
 549
 550		new->rb_root_in = parent->rb_root_in;
 551		parent->rb_root_in = RB_ROOT;
 552
 553		n = rb_first(&new->rb_root_in);
 554		while (n) {
 555			child = rb_entry(n, struct callchain_node, rb_node_in);
 556			child->parent = new;
 557			n = rb_next(n);
 558		}
 559
 560		/* make it the first child */
 561		rb_link_node(&new->rb_node_in, NULL, &parent->rb_root_in.rb_node);
 562		rb_insert_color(&new->rb_node_in, &parent->rb_root_in);
 563	}
 564
 565	return new;
 566}
 567
 568
 569/*
 570 * Fill the node with callchain values
 571 */
 572static int
 573fill_node(struct callchain_node *node, struct callchain_cursor *cursor)
 574{
 575	struct callchain_cursor_node *cursor_node;
 576
 577	node->val_nr = cursor->nr - cursor->pos;
 578	if (!node->val_nr)
 579		pr_warning("Warning: empty node in callchain tree\n");
 580
 581	cursor_node = callchain_cursor_current(cursor);
 582
 583	while (cursor_node) {
 584		struct callchain_list *call;
 585
 586		call = zalloc(sizeof(*call));
 587		if (!call) {
 588			perror("not enough memory for the code path tree");
 589			return -ENOMEM;
 590		}
 591		call->ip = cursor_node->ip;
 592		call->ms = cursor_node->ms;
 593		call->ms.map = map__get(call->ms.map);
 594		call->ms.maps = maps__get(call->ms.maps);
 595		call->srcline = cursor_node->srcline;
 596
 597		if (cursor_node->branch) {
 598			call->branch_count = 1;
 599
 600			if (cursor_node->branch_from) {
 601				/*
 602				 * branch_from is set with value somewhere else
 603				 * to imply it's "to" of a branch.
 604				 */
 605				if (!call->brtype_stat) {
 606					call->brtype_stat = zalloc(sizeof(*call->brtype_stat));
 607					if (!call->brtype_stat) {
 608						perror("not enough memory for the code path branch statistics");
 609						free(call->brtype_stat);
 610						return -ENOMEM;
 611					}
 612				}
 613				call->brtype_stat->branch_to = true;
 614
 615				if (cursor_node->branch_flags.predicted)
 616					call->predicted_count = 1;
 617
 618				if (cursor_node->branch_flags.abort)
 619					call->abort_count = 1;
 620
 621				branch_type_count(call->brtype_stat,
 622						  &cursor_node->branch_flags,
 623						  cursor_node->branch_from,
 624						  cursor_node->ip);
 625			} else {
 626				/*
 627				 * It's "from" of a branch
 628				 */
 629				if (call->brtype_stat && call->brtype_stat->branch_to)
 630					call->brtype_stat->branch_to = false;
 631				call->cycles_count =
 632					cursor_node->branch_flags.cycles;
 633				call->iter_count = cursor_node->nr_loop_iter;
 634				call->iter_cycles = cursor_node->iter_cycles;
 635			}
 636		}
 637
 638		list_add_tail(&call->list, &node->val);
 639
 640		callchain_cursor_advance(cursor);
 641		cursor_node = callchain_cursor_current(cursor);
 642	}
 643	return 0;
 644}
 645
 646static struct callchain_node *
 647add_child(struct callchain_node *parent,
 648	  struct callchain_cursor *cursor,
 649	  u64 period)
 650{
 651	struct callchain_node *new;
 652
 653	new = create_child(parent, false);
 654	if (new == NULL)
 655		return NULL;
 656
 657	if (fill_node(new, cursor) < 0) {
 658		struct callchain_list *call, *tmp;
 659
 660		list_for_each_entry_safe(call, tmp, &new->val, list) {
 661			list_del_init(&call->list);
 662			map_symbol__exit(&call->ms);
 663			zfree(&call->brtype_stat);
 664			free(call);
 665		}
 666		free(new);
 667		return NULL;
 668	}
 669
 670	new->children_hit = 0;
 671	new->hit = period;
 672	new->children_count = 0;
 673	new->count = 1;
 674	return new;
 675}
 676
 677enum match_result {
 678	MATCH_ERROR  = -1,
 679	MATCH_EQ,
 680	MATCH_LT,
 681	MATCH_GT,
 682};
 683
 684static enum match_result match_chain_strings(const char *left,
 685					     const char *right)
 686{
 687	enum match_result ret = MATCH_EQ;
 688	int cmp;
 689
 690	if (left && right)
 691		cmp = strcmp(left, right);
 692	else if (!left && right)
 693		cmp = 1;
 694	else if (left && !right)
 695		cmp = -1;
 696	else
 697		return MATCH_ERROR;
 698
 699	if (cmp != 0)
 700		ret = cmp < 0 ? MATCH_LT : MATCH_GT;
 701
 702	return ret;
 703}
 704
 705/*
 706 * We need to always use relative addresses because we're aggregating
 707 * callchains from multiple threads, i.e. different address spaces, so
 708 * comparing absolute addresses make no sense as a symbol in a DSO may end up
 709 * in a different address when used in a different binary or even the same
 710 * binary but with some sort of address randomization technique, thus we need
 711 * to compare just relative addresses. -acme
 712 */
 713static enum match_result match_chain_dso_addresses(struct map *left_map, u64 left_ip,
 714						   struct map *right_map, u64 right_ip)
 715{
 716	struct dso *left_dso = left_map ? map__dso(left_map) : NULL;
 717	struct dso *right_dso = right_map ? map__dso(right_map) : NULL;
 718
 719	if (left_dso != right_dso)
 720		return left_dso < right_dso ? MATCH_LT : MATCH_GT;
 721
 722	if (left_ip != right_ip)
 723 		return left_ip < right_ip ? MATCH_LT : MATCH_GT;
 724
 725	return MATCH_EQ;
 726}
 727
 728static enum match_result match_chain(struct callchain_cursor_node *node,
 729				     struct callchain_list *cnode)
 730{
 731	enum match_result match = MATCH_ERROR;
 732
 733	switch (callchain_param.key) {
 734	case CCKEY_SRCLINE:
 735		match = match_chain_strings(cnode->srcline, node->srcline);
 736		if (match != MATCH_ERROR)
 737			break;
 738		/* otherwise fall-back to symbol-based comparison below */
 739		fallthrough;
 740	case CCKEY_FUNCTION:
 741		if (node->ms.sym && cnode->ms.sym) {
 742			/*
 743			 * Compare inlined frames based on their symbol name
 744			 * because different inlined frames will have the same
 745			 * symbol start. Otherwise do a faster comparison based
 746			 * on the symbol start address.
 747			 */
 748			if (cnode->ms.sym->inlined || node->ms.sym->inlined) {
 749				match = match_chain_strings(cnode->ms.sym->name,
 750							    node->ms.sym->name);
 751				if (match != MATCH_ERROR)
 752					break;
 753			} else {
 754				match = match_chain_dso_addresses(cnode->ms.map, cnode->ms.sym->start,
 755								  node->ms.map, node->ms.sym->start);
 756				break;
 757			}
 758		}
 759		/* otherwise fall-back to IP-based comparison below */
 760		fallthrough;
 761	case CCKEY_ADDRESS:
 762	default:
 763		match = match_chain_dso_addresses(cnode->ms.map, cnode->ip, node->ms.map, node->ip);
 764		break;
 765	}
 766
 767	if (match == MATCH_EQ && node->branch) {
 768		cnode->branch_count++;
 769
 770		if (node->branch_from) {
 771			/*
 772			 * It's "to" of a branch
 773			 */
 774			if (!cnode->brtype_stat) {
 775				cnode->brtype_stat = zalloc(sizeof(*cnode->brtype_stat));
 776				if (!cnode->brtype_stat) {
 777					perror("not enough memory for the code path branch statistics");
 778					return MATCH_ERROR;
 779				}
 780			}
 781			cnode->brtype_stat->branch_to = true;
 782
 783			if (node->branch_flags.predicted)
 784				cnode->predicted_count++;
 785
 786			if (node->branch_flags.abort)
 787				cnode->abort_count++;
 788
 789			branch_type_count(cnode->brtype_stat,
 790					  &node->branch_flags,
 791					  node->branch_from,
 792					  node->ip);
 793		} else {
 794			/*
 795			 * It's "from" of a branch
 796			 */
 797			if (cnode->brtype_stat && cnode->brtype_stat->branch_to)
 798				cnode->brtype_stat->branch_to = false;
 799			cnode->cycles_count += node->branch_flags.cycles;
 800			cnode->iter_count += node->nr_loop_iter;
 801			cnode->iter_cycles += node->iter_cycles;
 802			cnode->from_count++;
 803		}
 804	}
 805
 806	return match;
 807}
 808
 809/*
 810 * Split the parent in two parts (a new child is created) and
 811 * give a part of its callchain to the created child.
 812 * Then create another child to host the given callchain of new branch
 813 */
 814static int
 815split_add_child(struct callchain_node *parent,
 816		struct callchain_cursor *cursor,
 817		struct callchain_list *to_split,
 818		u64 idx_parents, u64 idx_local, u64 period)
 819{
 820	struct callchain_node *new;
 821	struct list_head *old_tail;
 822	unsigned int idx_total = idx_parents + idx_local;
 823
 824	/* split */
 825	new = create_child(parent, true);
 826	if (new == NULL)
 827		return -1;
 828
 829	/* split the callchain and move a part to the new child */
 830	old_tail = parent->val.prev;
 831	list_del_range(&to_split->list, old_tail);
 832	new->val.next = &to_split->list;
 833	new->val.prev = old_tail;
 834	to_split->list.prev = &new->val;
 835	old_tail->next = &new->val;
 836
 837	/* split the hits */
 838	new->hit = parent->hit;
 839	new->children_hit = parent->children_hit;
 840	parent->children_hit = callchain_cumul_hits(new);
 841	new->val_nr = parent->val_nr - idx_local;
 842	parent->val_nr = idx_local;
 843	new->count = parent->count;
 844	new->children_count = parent->children_count;
 845	parent->children_count = callchain_cumul_counts(new);
 846
 847	/* create a new child for the new branch if any */
 848	if (idx_total < cursor->nr) {
 849		struct callchain_node *first;
 850		struct callchain_list *cnode;
 851		struct callchain_cursor_node *node;
 852		struct rb_node *p, **pp;
 853
 854		parent->hit = 0;
 855		parent->children_hit += period;
 856		parent->count = 0;
 857		parent->children_count += 1;
 858
 859		node = callchain_cursor_current(cursor);
 860		new = add_child(parent, cursor, period);
 861		if (new == NULL)
 862			return -1;
 863
 864		/*
 865		 * This is second child since we moved parent's children
 866		 * to new (first) child above.
 867		 */
 868		p = parent->rb_root_in.rb_node;
 869		first = rb_entry(p, struct callchain_node, rb_node_in);
 870		cnode = list_first_entry(&first->val, struct callchain_list,
 871					 list);
 872
 873		if (match_chain(node, cnode) == MATCH_LT)
 874			pp = &p->rb_left;
 875		else
 876			pp = &p->rb_right;
 877
 878		rb_link_node(&new->rb_node_in, p, pp);
 879		rb_insert_color(&new->rb_node_in, &parent->rb_root_in);
 880	} else {
 881		parent->hit = period;
 882		parent->count = 1;
 883	}
 884	return 0;
 885}
 886
 887static enum match_result
 888append_chain(struct callchain_node *root,
 889	     struct callchain_cursor *cursor,
 890	     u64 period);
 891
 892static int
 893append_chain_children(struct callchain_node *root,
 894		      struct callchain_cursor *cursor,
 895		      u64 period)
 896{
 897	struct callchain_node *rnode;
 898	struct callchain_cursor_node *node;
 899	struct rb_node **p = &root->rb_root_in.rb_node;
 900	struct rb_node *parent = NULL;
 901
 902	node = callchain_cursor_current(cursor);
 903	if (!node)
 904		return -1;
 905
 906	/* lookup in children */
 907	while (*p) {
 908		enum match_result ret;
 909
 910		parent = *p;
 911		rnode = rb_entry(parent, struct callchain_node, rb_node_in);
 912
 913		/* If at least first entry matches, rely to children */
 914		ret = append_chain(rnode, cursor, period);
 915		if (ret == MATCH_EQ)
 916			goto inc_children_hit;
 917		if (ret == MATCH_ERROR)
 918			return -1;
 919
 920		if (ret == MATCH_LT)
 921			p = &parent->rb_left;
 922		else
 923			p = &parent->rb_right;
 924	}
 925	/* nothing in children, add to the current node */
 926	rnode = add_child(root, cursor, period);
 927	if (rnode == NULL)
 928		return -1;
 929
 930	rb_link_node(&rnode->rb_node_in, parent, p);
 931	rb_insert_color(&rnode->rb_node_in, &root->rb_root_in);
 932
 933inc_children_hit:
 934	root->children_hit += period;
 935	root->children_count++;
 936	return 0;
 937}
 938
 939static enum match_result
 940append_chain(struct callchain_node *root,
 941	     struct callchain_cursor *cursor,
 942	     u64 period)
 943{
 944	struct callchain_list *cnode;
 945	u64 start = cursor->pos;
 946	bool found = false;
 947	u64 matches;
 948	enum match_result cmp = MATCH_ERROR;
 949
 950	/*
 951	 * Lookup in the current node
 952	 * If we have a symbol, then compare the start to match
 953	 * anywhere inside a function, unless function
 954	 * mode is disabled.
 955	 */
 956	list_for_each_entry(cnode, &root->val, list) {
 957		struct callchain_cursor_node *node;
 958
 959		node = callchain_cursor_current(cursor);
 960		if (!node)
 961			break;
 962
 963		cmp = match_chain(node, cnode);
 964		if (cmp != MATCH_EQ)
 965			break;
 966
 967		found = true;
 968
 969		callchain_cursor_advance(cursor);
 970	}
 971
 972	/* matches not, relay no the parent */
 973	if (!found) {
 974		WARN_ONCE(cmp == MATCH_ERROR, "Chain comparison error\n");
 975		return cmp;
 976	}
 977
 978	matches = cursor->pos - start;
 979
 980	/* we match only a part of the node. Split it and add the new chain */
 981	if (matches < root->val_nr) {
 982		if (split_add_child(root, cursor, cnode, start, matches,
 983				    period) < 0)
 984			return MATCH_ERROR;
 985
 986		return MATCH_EQ;
 987	}
 988
 989	/* we match 100% of the path, increment the hit */
 990	if (matches == root->val_nr && cursor->pos == cursor->nr) {
 991		root->hit += period;
 992		root->count++;
 993		return MATCH_EQ;
 994	}
 995
 996	/* We match the node and still have a part remaining */
 997	if (append_chain_children(root, cursor, period) < 0)
 998		return MATCH_ERROR;
 999
1000	return MATCH_EQ;
1001}
1002
1003int callchain_append(struct callchain_root *root,
1004		     struct callchain_cursor *cursor,
1005		     u64 period)
1006{
1007	if (cursor == NULL)
1008		return -1;
1009
1010	if (!cursor->nr)
1011		return 0;
1012
1013	callchain_cursor_commit(cursor);
1014
1015	if (append_chain_children(&root->node, cursor, period) < 0)
1016		return -1;
1017
1018	if (cursor->nr > root->max_depth)
1019		root->max_depth = cursor->nr;
1020
1021	return 0;
1022}
1023
1024static int
1025merge_chain_branch(struct callchain_cursor *cursor,
1026		   struct callchain_node *dst, struct callchain_node *src)
1027{
1028	struct callchain_cursor_node **old_last = cursor->last;
1029	struct callchain_node *child;
1030	struct callchain_list *list, *next_list;
1031	struct rb_node *n;
1032	int old_pos = cursor->nr;
1033	int err = 0;
1034
1035	list_for_each_entry_safe(list, next_list, &src->val, list) {
1036		struct map_symbol ms = {
1037			.maps = maps__get(list->ms.maps),
1038			.map = map__get(list->ms.map),
1039		};
1040		callchain_cursor_append(cursor, list->ip, &ms, false, NULL, 0, 0, 0, list->srcline);
1041		list_del_init(&list->list);
1042		map_symbol__exit(&ms);
1043		map_symbol__exit(&list->ms);
1044		zfree(&list->brtype_stat);
1045		free(list);
1046	}
1047
1048	if (src->hit) {
1049		callchain_cursor_commit(cursor);
1050		if (append_chain_children(dst, cursor, src->hit) < 0)
1051			return -1;
1052	}
1053
1054	n = rb_first(&src->rb_root_in);
1055	while (n) {
1056		child = container_of(n, struct callchain_node, rb_node_in);
1057		n = rb_next(n);
1058		rb_erase(&child->rb_node_in, &src->rb_root_in);
1059
1060		err = merge_chain_branch(cursor, dst, child);
1061		if (err)
1062			break;
1063
1064		free(child);
1065	}
1066
1067	cursor->nr = old_pos;
1068	cursor->last = old_last;
1069
1070	return err;
1071}
1072
1073int callchain_merge(struct callchain_cursor *cursor,
1074		    struct callchain_root *dst, struct callchain_root *src)
1075{
1076	return merge_chain_branch(cursor, &dst->node, &src->node);
1077}
1078
1079int callchain_cursor_append(struct callchain_cursor *cursor,
1080			    u64 ip, struct map_symbol *ms,
1081			    bool branch, struct branch_flags *flags,
1082			    int nr_loop_iter, u64 iter_cycles, u64 branch_from,
1083			    const char *srcline)
1084{
1085	struct callchain_cursor_node *node = *cursor->last;
1086
1087	if (!node) {
1088		node = calloc(1, sizeof(*node));
1089		if (!node)
1090			return -ENOMEM;
1091
1092		*cursor->last = node;
1093	}
1094
1095	node->ip = ip;
1096	map_symbol__exit(&node->ms);
1097	node->ms = *ms;
1098	node->ms.maps = maps__get(ms->maps);
1099	node->ms.map = map__get(ms->map);
1100	node->branch = branch;
1101	node->nr_loop_iter = nr_loop_iter;
1102	node->iter_cycles = iter_cycles;
1103	node->srcline = srcline;
1104
1105	if (flags)
1106		memcpy(&node->branch_flags, flags,
1107			sizeof(struct branch_flags));
1108
1109	node->branch_from = branch_from;
1110	cursor->nr++;
1111
1112	cursor->last = &node->next;
1113
1114	return 0;
1115}
1116
1117int sample__resolve_callchain(struct perf_sample *sample,
1118			      struct callchain_cursor *cursor, struct symbol **parent,
1119			      struct evsel *evsel, struct addr_location *al,
1120			      int max_stack)
1121{
1122	if (sample->callchain == NULL && !symbol_conf.show_branchflag_count)
1123		return 0;
1124
1125	if (symbol_conf.use_callchain || symbol_conf.cumulate_callchain ||
1126	    perf_hpp_list.parent || symbol_conf.show_branchflag_count) {
1127		return thread__resolve_callchain(al->thread, cursor, evsel, sample,
1128						 parent, al, max_stack);
1129	}
1130	return 0;
1131}
1132
1133int hist_entry__append_callchain(struct hist_entry *he, struct perf_sample *sample)
1134{
1135	if ((!symbol_conf.use_callchain || sample->callchain == NULL) &&
1136		!symbol_conf.show_branchflag_count)
1137		return 0;
1138	return callchain_append(he->callchain, get_tls_callchain_cursor(), sample->period);
1139}
1140
1141int fill_callchain_info(struct addr_location *al, struct callchain_cursor_node *node,
1142			bool hide_unresolved)
1143{
1144	struct machine *machine = maps__machine(node->ms.maps);
1145
1146	maps__put(al->maps);
1147	al->maps = maps__get(node->ms.maps);
1148	map__put(al->map);
1149	al->map = map__get(node->ms.map);
1150	al->sym = node->ms.sym;
1151	al->srcline = node->srcline;
1152	al->addr = node->ip;
1153
1154	if (al->sym == NULL) {
1155		if (hide_unresolved)
1156			return 0;
1157		if (al->map == NULL)
1158			goto out;
1159	}
1160	if (RC_CHK_EQUAL(al->maps, machine__kernel_maps(machine))) {
1161		if (machine__is_host(machine)) {
 
1162			al->cpumode = PERF_RECORD_MISC_KERNEL;
1163			al->level = 'k';
1164		} else {
1165			al->cpumode = PERF_RECORD_MISC_GUEST_KERNEL;
1166			al->level = 'g';
1167		}
1168	} else {
1169		if (machine__is_host(machine)) {
1170			al->cpumode = PERF_RECORD_MISC_USER;
1171			al->level = '.';
1172		} else if (perf_guest) {
1173			al->cpumode = PERF_RECORD_MISC_GUEST_USER;
1174			al->level = 'u';
1175		} else {
1176			al->cpumode = PERF_RECORD_MISC_HYPERVISOR;
1177			al->level = 'H';
1178		}
1179	}
1180
1181out:
1182	return 1;
1183}
1184
1185char *callchain_list__sym_name(struct callchain_list *cl,
1186			       char *bf, size_t bfsize, bool show_dso)
1187{
1188	bool show_addr = callchain_param.key == CCKEY_ADDRESS;
1189	bool show_srcline = show_addr || callchain_param.key == CCKEY_SRCLINE;
1190	int printed;
1191
1192	if (cl->ms.sym) {
1193		const char *inlined = cl->ms.sym->inlined ? " (inlined)" : "";
1194
1195		if (show_srcline && cl->srcline)
1196			printed = scnprintf(bf, bfsize, "%s %s%s",
1197					    cl->ms.sym->name, cl->srcline,
1198					    inlined);
1199		else
1200			printed = scnprintf(bf, bfsize, "%s%s",
1201					    cl->ms.sym->name, inlined);
1202	} else
1203		printed = scnprintf(bf, bfsize, "%#" PRIx64, cl->ip);
1204
1205	if (show_dso)
1206		scnprintf(bf + printed, bfsize - printed, " %s",
1207			  cl->ms.map ?
1208			  map__dso(cl->ms.map)->short_name :
1209			  "unknown");
1210
1211	return bf;
1212}
1213
1214char *callchain_node__scnprintf_value(struct callchain_node *node,
1215				      char *bf, size_t bfsize, u64 total)
1216{
1217	double percent = 0.0;
1218	u64 period = callchain_cumul_hits(node);
1219	unsigned count = callchain_cumul_counts(node);
1220
1221	if (callchain_param.mode == CHAIN_FOLDED) {
1222		period = node->hit;
1223		count = node->count;
1224	}
1225
1226	switch (callchain_param.value) {
1227	case CCVAL_PERIOD:
1228		scnprintf(bf, bfsize, "%"PRIu64, period);
1229		break;
1230	case CCVAL_COUNT:
1231		scnprintf(bf, bfsize, "%u", count);
1232		break;
1233	case CCVAL_PERCENT:
1234	default:
1235		if (total)
1236			percent = period * 100.0 / total;
1237		scnprintf(bf, bfsize, "%.2f%%", percent);
1238		break;
1239	}
1240	return bf;
1241}
1242
1243int callchain_node__fprintf_value(struct callchain_node *node,
1244				 FILE *fp, u64 total)
1245{
1246	double percent = 0.0;
1247	u64 period = callchain_cumul_hits(node);
1248	unsigned count = callchain_cumul_counts(node);
1249
1250	if (callchain_param.mode == CHAIN_FOLDED) {
1251		period = node->hit;
1252		count = node->count;
1253	}
1254
1255	switch (callchain_param.value) {
1256	case CCVAL_PERIOD:
1257		return fprintf(fp, "%"PRIu64, period);
1258	case CCVAL_COUNT:
1259		return fprintf(fp, "%u", count);
1260	case CCVAL_PERCENT:
1261	default:
1262		if (total)
1263			percent = period * 100.0 / total;
1264		return percent_color_fprintf(fp, "%.2f%%", percent);
1265	}
1266	return 0;
1267}
1268
1269static void callchain_counts_value(struct callchain_node *node,
1270				   u64 *branch_count, u64 *predicted_count,
1271				   u64 *abort_count, u64 *cycles_count)
1272{
1273	struct callchain_list *clist;
1274
1275	list_for_each_entry(clist, &node->val, list) {
1276		if (branch_count)
1277			*branch_count += clist->branch_count;
1278
1279		if (predicted_count)
1280			*predicted_count += clist->predicted_count;
1281
1282		if (abort_count)
1283			*abort_count += clist->abort_count;
1284
1285		if (cycles_count)
1286			*cycles_count += clist->cycles_count;
1287	}
1288}
1289
1290static int callchain_node_branch_counts_cumul(struct callchain_node *node,
1291					      u64 *branch_count,
1292					      u64 *predicted_count,
1293					      u64 *abort_count,
1294					      u64 *cycles_count)
1295{
1296	struct callchain_node *child;
1297	struct rb_node *n;
1298
1299	n = rb_first(&node->rb_root_in);
1300	while (n) {
1301		child = rb_entry(n, struct callchain_node, rb_node_in);
1302		n = rb_next(n);
1303
1304		callchain_node_branch_counts_cumul(child, branch_count,
1305						   predicted_count,
1306						   abort_count,
1307						   cycles_count);
1308
1309		callchain_counts_value(child, branch_count,
1310				       predicted_count, abort_count,
1311				       cycles_count);
1312	}
1313
1314	return 0;
1315}
1316
1317int callchain_branch_counts(struct callchain_root *root,
1318			    u64 *branch_count, u64 *predicted_count,
1319			    u64 *abort_count, u64 *cycles_count)
1320{
1321	if (branch_count)
1322		*branch_count = 0;
1323
1324	if (predicted_count)
1325		*predicted_count = 0;
1326
1327	if (abort_count)
1328		*abort_count = 0;
1329
1330	if (cycles_count)
1331		*cycles_count = 0;
1332
1333	return callchain_node_branch_counts_cumul(&root->node,
1334						  branch_count,
1335						  predicted_count,
1336						  abort_count,
1337						  cycles_count);
1338}
1339
1340static int count_pri64_printf(int idx, const char *str, u64 value, char *bf, int bfsize)
1341{
1342	return scnprintf(bf, bfsize, "%s%s:%" PRId64 "", (idx) ? " " : " (", str, value);
 
 
 
 
1343}
1344
1345static int count_float_printf(int idx, const char *str, float value,
1346			      char *bf, int bfsize, float threshold)
1347{
 
 
1348	if (threshold != 0.0 && value < threshold)
1349		return 0;
1350
1351	return scnprintf(bf, bfsize, "%s%s:%.1f%%", (idx) ? " " : " (", str, value);
 
 
1352}
1353
1354static int branch_to_str(char *bf, int bfsize,
1355			 u64 branch_count, u64 predicted_count,
1356			 u64 abort_count,
1357			 const struct branch_type_stat *brtype_stat)
1358{
1359	int printed, i = 0;
1360
1361	printed = branch_type_str(brtype_stat, bf, bfsize);
1362	if (printed)
1363		i++;
1364
1365	if (predicted_count < branch_count) {
1366		printed += count_float_printf(i++, "predicted",
1367				predicted_count * 100.0 / branch_count,
1368				bf + printed, bfsize - printed, 0.0);
1369	}
1370
1371	if (abort_count) {
1372		printed += count_float_printf(i++, "abort",
1373				abort_count * 100.0 / branch_count,
1374				bf + printed, bfsize - printed, 0.1);
1375	}
1376
1377	if (i)
1378		printed += scnprintf(bf + printed, bfsize - printed, ")");
1379
1380	return printed;
1381}
1382
1383static int branch_from_str(char *bf, int bfsize,
1384			   u64 branch_count,
1385			   u64 cycles_count, u64 iter_count,
1386			   u64 iter_cycles, u64 from_count)
1387{
1388	int printed = 0, i = 0;
1389	u64 cycles, v = 0;
1390
1391	cycles = cycles_count / branch_count;
1392	if (cycles) {
1393		printed += count_pri64_printf(i++, "cycles",
1394				cycles,
1395				bf + printed, bfsize - printed);
1396	}
1397
1398	if (iter_count && from_count) {
1399		v = iter_count / from_count;
1400		if (v) {
1401			printed += count_pri64_printf(i++, "iter",
1402					v, bf + printed, bfsize - printed);
1403
1404			printed += count_pri64_printf(i++, "avg_cycles",
1405					iter_cycles / iter_count,
1406					bf + printed, bfsize - printed);
1407		}
1408	}
1409
1410	if (i)
1411		printed += scnprintf(bf + printed, bfsize - printed, ")");
1412
1413	return printed;
1414}
1415
1416static int counts_str_build(char *bf, int bfsize,
1417			     u64 branch_count, u64 predicted_count,
1418			     u64 abort_count, u64 cycles_count,
1419			     u64 iter_count, u64 iter_cycles,
1420			     u64 from_count,
1421			     const struct branch_type_stat *brtype_stat)
1422{
1423	int printed;
1424
1425	if (branch_count == 0)
1426		return scnprintf(bf, bfsize, " (calltrace)");
1427
1428	if (brtype_stat->branch_to) {
1429		printed = branch_to_str(bf, bfsize, branch_count,
1430				predicted_count, abort_count, brtype_stat);
1431	} else {
1432		printed = branch_from_str(bf, bfsize, branch_count,
1433				cycles_count, iter_count, iter_cycles,
1434				from_count);
1435	}
1436
1437	if (!printed)
1438		bf[0] = 0;
1439
1440	return printed;
1441}
1442
1443static int callchain_counts_printf(FILE *fp, char *bf, int bfsize,
1444				   u64 branch_count, u64 predicted_count,
1445				   u64 abort_count, u64 cycles_count,
1446				   u64 iter_count, u64 iter_cycles,
1447				   u64 from_count,
1448				   const struct branch_type_stat *brtype_stat)
1449{
1450	char str[256];
1451
1452	counts_str_build(str, sizeof(str), branch_count,
1453			 predicted_count, abort_count, cycles_count,
1454			 iter_count, iter_cycles, from_count, brtype_stat);
1455
1456	if (fp)
1457		return fprintf(fp, "%s", str);
1458
1459	return scnprintf(bf, bfsize, "%s", str);
1460}
1461
1462int callchain_list_counts__printf_value(struct callchain_list *clist,
1463					FILE *fp, char *bf, int bfsize)
1464{
1465	static const struct branch_type_stat empty_brtype_stat = {};
1466	const struct branch_type_stat *brtype_stat;
1467	u64 branch_count, predicted_count;
1468	u64 abort_count, cycles_count;
1469	u64 iter_count, iter_cycles;
1470	u64 from_count;
1471
1472	brtype_stat = clist->brtype_stat ?: &empty_brtype_stat;
1473	branch_count = clist->branch_count;
1474	predicted_count = clist->predicted_count;
1475	abort_count = clist->abort_count;
1476	cycles_count = clist->cycles_count;
1477	iter_count = clist->iter_count;
1478	iter_cycles = clist->iter_cycles;
1479	from_count = clist->from_count;
1480
1481	return callchain_counts_printf(fp, bf, bfsize, branch_count,
1482				       predicted_count, abort_count,
1483				       cycles_count, iter_count, iter_cycles,
1484				       from_count, brtype_stat);
1485}
1486
1487static void free_callchain_node(struct callchain_node *node)
1488{
1489	struct callchain_list *list, *tmp;
1490	struct callchain_node *child;
1491	struct rb_node *n;
1492
1493	list_for_each_entry_safe(list, tmp, &node->parent_val, list) {
1494		list_del_init(&list->list);
1495		map_symbol__exit(&list->ms);
1496		zfree(&list->brtype_stat);
1497		free(list);
1498	}
1499
1500	list_for_each_entry_safe(list, tmp, &node->val, list) {
1501		list_del_init(&list->list);
1502		map_symbol__exit(&list->ms);
1503		zfree(&list->brtype_stat);
1504		free(list);
1505	}
1506
1507	n = rb_first(&node->rb_root_in);
1508	while (n) {
1509		child = container_of(n, struct callchain_node, rb_node_in);
1510		n = rb_next(n);
1511		rb_erase(&child->rb_node_in, &node->rb_root_in);
1512
1513		free_callchain_node(child);
1514		free(child);
1515	}
1516}
1517
1518void free_callchain(struct callchain_root *root)
1519{
1520	if (!symbol_conf.use_callchain)
1521		return;
1522
1523	free_callchain_node(&root->node);
1524}
1525
1526static u64 decay_callchain_node(struct callchain_node *node)
1527{
1528	struct callchain_node *child;
1529	struct rb_node *n;
1530	u64 child_hits = 0;
1531
1532	n = rb_first(&node->rb_root_in);
1533	while (n) {
1534		child = container_of(n, struct callchain_node, rb_node_in);
1535
1536		child_hits += decay_callchain_node(child);
1537		n = rb_next(n);
1538	}
1539
1540	node->hit = (node->hit * 7) / 8;
1541	node->children_hit = child_hits;
1542
1543	return node->hit;
1544}
1545
1546void decay_callchain(struct callchain_root *root)
1547{
1548	if (!symbol_conf.use_callchain)
1549		return;
1550
1551	decay_callchain_node(&root->node);
1552}
1553
1554int callchain_node__make_parent_list(struct callchain_node *node)
1555{
1556	struct callchain_node *parent = node->parent;
1557	struct callchain_list *chain, *new;
1558	LIST_HEAD(head);
1559
1560	while (parent) {
1561		list_for_each_entry_reverse(chain, &parent->val, list) {
1562			new = malloc(sizeof(*new));
1563			if (new == NULL)
1564				goto out;
1565			*new = *chain;
1566			new->has_children = false;
1567			new->ms.map = map__get(new->ms.map);
1568			list_add_tail(&new->list, &head);
1569		}
1570		parent = parent->parent;
1571	}
1572
1573	list_for_each_entry_safe_reverse(chain, new, &head, list)
1574		list_move_tail(&chain->list, &node->parent_val);
1575
1576	if (!list_empty(&node->parent_val)) {
1577		chain = list_first_entry(&node->parent_val, struct callchain_list, list);
1578		chain->has_children = rb_prev(&node->rb_node) || rb_next(&node->rb_node);
1579
1580		chain = list_first_entry(&node->val, struct callchain_list, list);
1581		chain->has_children = false;
1582	}
1583	return 0;
1584
1585out:
1586	list_for_each_entry_safe(chain, new, &head, list) {
1587		list_del_init(&chain->list);
1588		map_symbol__exit(&chain->ms);
1589		zfree(&chain->brtype_stat);
1590		free(chain);
1591	}
1592	return -ENOMEM;
1593}
1594
1595static void callchain_cursor__delete(void *vcursor)
1596{
1597	struct callchain_cursor *cursor = vcursor;
1598	struct callchain_cursor_node *node, *next;
1599
1600	callchain_cursor_reset(cursor);
1601	for (node = cursor->first; node != NULL; node = next) {
1602		next = node->next;
1603		free(node);
1604	}
1605	free(cursor);
1606}
1607
1608static void init_callchain_cursor_key(void)
1609{
1610	if (pthread_key_create(&callchain_cursor, callchain_cursor__delete)) {
1611		pr_err("callchain cursor creation failed");
1612		abort();
1613	}
1614}
1615
1616struct callchain_cursor *get_tls_callchain_cursor(void)
1617{
1618	static pthread_once_t once_control = PTHREAD_ONCE_INIT;
1619	struct callchain_cursor *cursor;
1620
1621	pthread_once(&once_control, init_callchain_cursor_key);
1622	cursor = pthread_getspecific(callchain_cursor);
1623	if (!cursor) {
1624		cursor = zalloc(sizeof(*cursor));
1625		if (!cursor)
1626			pr_debug3("%s: not enough memory\n", __func__);
1627		pthread_setspecific(callchain_cursor, cursor);
1628	}
1629	return cursor;
1630}
1631
1632int callchain_cursor__copy(struct callchain_cursor *dst,
1633			   struct callchain_cursor *src)
1634{
1635	int rc = 0;
1636
1637	callchain_cursor_reset(dst);
1638	callchain_cursor_commit(src);
1639
1640	while (true) {
1641		struct callchain_cursor_node *node;
1642
1643		node = callchain_cursor_current(src);
1644		if (node == NULL)
1645			break;
1646
1647		rc = callchain_cursor_append(dst, node->ip, &node->ms,
1648					     node->branch, &node->branch_flags,
1649					     node->nr_loop_iter,
1650					     node->iter_cycles,
1651					     node->branch_from, node->srcline);
1652		if (rc)
1653			break;
1654
1655		callchain_cursor_advance(src);
1656	}
1657
1658	return rc;
1659}
1660
1661/*
1662 * Initialize a cursor before adding entries inside, but keep
1663 * the previously allocated entries as a cache.
1664 */
1665void callchain_cursor_reset(struct callchain_cursor *cursor)
1666{
1667	struct callchain_cursor_node *node;
1668
1669	cursor->nr = 0;
1670	cursor->last = &cursor->first;
1671
1672	for (node = cursor->first; node != NULL; node = node->next)
1673		map_symbol__exit(&node->ms);
1674}
1675
1676void callchain_param_setup(u64 sample_type, const char *arch)
1677{
1678	if (symbol_conf.use_callchain || symbol_conf.cumulate_callchain) {
1679		if ((sample_type & PERF_SAMPLE_REGS_USER) &&
1680		    (sample_type & PERF_SAMPLE_STACK_USER)) {
1681			callchain_param.record_mode = CALLCHAIN_DWARF;
1682			dwarf_callchain_users = true;
1683		} else if (sample_type & PERF_SAMPLE_BRANCH_STACK)
1684			callchain_param.record_mode = CALLCHAIN_LBR;
1685		else
1686			callchain_param.record_mode = CALLCHAIN_FP;
1687	}
1688
1689	/*
1690	 * It's necessary to use libunwind to reliably determine the caller of
1691	 * a leaf function on aarch64, as otherwise we cannot know whether to
1692	 * start from the LR or FP.
1693	 *
1694	 * Always starting from the LR can result in duplicate or entirely
1695	 * erroneous entries. Always skipping the LR and starting from the FP
1696	 * can result in missing entries.
1697	 */
1698	if (callchain_param.record_mode == CALLCHAIN_FP && !strcmp(arch, "arm64"))
1699		dwarf_callchain_users = true;
1700}
1701
1702static bool chain_match(struct callchain_list *base_chain,
1703			struct callchain_list *pair_chain)
1704{
1705	enum match_result match;
1706
1707	match = match_chain_strings(base_chain->srcline,
1708				    pair_chain->srcline);
1709	if (match != MATCH_ERROR)
1710		return match == MATCH_EQ;
1711
1712	match = match_chain_dso_addresses(base_chain->ms.map,
1713					  base_chain->ip,
1714					  pair_chain->ms.map,
1715					  pair_chain->ip);
1716
1717	return match == MATCH_EQ;
1718}
1719
1720bool callchain_cnode_matched(struct callchain_node *base_cnode,
1721			     struct callchain_node *pair_cnode)
1722{
1723	struct callchain_list *base_chain, *pair_chain;
1724	bool match = false;
1725
1726	pair_chain = list_first_entry(&pair_cnode->val,
1727				      struct callchain_list,
1728				      list);
1729
1730	list_for_each_entry(base_chain, &base_cnode->val, list) {
1731		if (&pair_chain->list == &pair_cnode->val)
1732			return false;
1733
1734		if (!base_chain->srcline || !pair_chain->srcline) {
1735			pair_chain = list_next_entry(pair_chain, list);
1736			continue;
1737		}
1738
1739		match = chain_match(base_chain, pair_chain);
1740		if (!match)
1741			return false;
1742
1743		pair_chain = list_next_entry(pair_chain, list);
1744	}
1745
1746	/*
1747	 * Say chain1 is ABC, chain2 is ABCD, we consider they are
1748	 * not fully matched.
1749	 */
1750	if (pair_chain && (&pair_chain->list != &pair_cnode->val))
1751		return false;
1752
1753	return match;
1754}
1755
1756static u64 count_callchain_hits(struct hist_entry *he)
1757{
1758	struct rb_root *root = &he->sorted_chain;
1759	struct rb_node *rb_node = rb_first(root);
1760	struct callchain_node *node;
1761	u64 chain_hits = 0;
1762
1763	while (rb_node) {
1764		node = rb_entry(rb_node, struct callchain_node, rb_node);
1765		chain_hits += node->hit;
1766		rb_node = rb_next(rb_node);
1767	}
1768
1769	return chain_hits;
1770}
1771
1772u64 callchain_total_hits(struct hists *hists)
1773{
1774	struct rb_node *next = rb_first_cached(&hists->entries);
1775	u64 chain_hits = 0;
1776
1777	while (next) {
1778		struct hist_entry *he = rb_entry(next, struct hist_entry,
1779						 rb_node);
1780
1781		chain_hits += count_callchain_hits(he);
1782		next = rb_next(&he->rb_node);
1783	}
1784
1785	return chain_hits;
1786}
1787
1788s64 callchain_avg_cycles(struct callchain_node *cnode)
1789{
1790	struct callchain_list *chain;
1791	s64 cycles = 0;
1792
1793	list_for_each_entry(chain, &cnode->val, list) {
1794		if (chain->srcline && chain->branch_count)
1795			cycles += chain->cycles_count / chain->branch_count;
1796	}
1797
1798	return cycles;
1799}