Loading...
1# event_analyzing_sample.py: general event handler in python
2# SPDX-License-Identifier: GPL-2.0
3#
# Current perf report is already very powerful with the annotation integrated,
# and this script is not trying to be as powerful as perf report; it only
# aims to give end users/developers a flexible way to analyze events other
# than trace points.
8#
9# The 2 database related functions in this script just show how to gather
10# the basic information, and users can modify and write their own functions
11# according to their specific requirement.
12#
# The first function, "show_general_events", just does a basic grouping of all
# generic events with the help of sqlite, and the second one, "show_pebs_ll",
# is for an x86 HW PMU event: PEBS with load latency data.
16#
17
18from __future__ import print_function
19
20import os
21import sys
22import math
23import struct
24import sqlite3
25
# Add perf's Perf-Trace-Util library directory to the module search path
# before the imports that follow.  PERF_EXEC_PATH has to be present in the
# environment: os.environ[...] raises KeyError when it is not.
sys.path.append(os.environ['PERF_EXEC_PATH'] + \
        '/scripts/python/Perf-Trace-Util/lib/Perf/Trace')
28
29from perf_trace_context import *
30from EventClass import *
31
32#
# If the perf.data has a large number of samples, then the insert operation
# will be very time consuming (about 10+ minutes for 10000 samples) if the
# .db database is on disk. Move the .db file to a RAM-based FS to speed up
# the handling, which will cut the time down to several seconds.
37#
# Module-wide database connection shared by every handler in this script.
# isolation_level=None means the sqlite3 module opens no implicit
# transactions, so each statement takes effect without an explicit commit().
con = sqlite3.connect("/dev/shm/perf.db", isolation_level=None)
40
def trace_begin():
    """Announce the start of tracing and make sure both result tables exist.

    gen_events holds general events; pebs_ll holds PEBS samples with load
    latency info.  A table is only created when it does not exist yet.
    """
    print("In trace_begin:\n")

    gen_events_ddl = """
        create table if not exists gen_events (
            name text,
            symbol text,
            comm text,
            dso text
        );"""

    pebs_ll_ddl = """
        create table if not exists pebs_ll (
            name text,
            symbol text,
            comm text,
            dso text,
            flags integer,
            ip integer,
            status integer,
            dse integer,
            dla integer,
            lat integer
        );"""

    # Same creation order as the tables are listed above.
    for ddl in (gen_events_ddl, pebs_ll_ddl):
        con.execute(ddl)
68
69#
# Create an event object and insert it into the database so that users can
# do more analysis with simple database commands.
72#
def process_event(param_dict):
    """Build an event object from one sample's parameters and store it.

    param_dict must provide the keys "attr", "sample", "raw_buf", "comm" and
    "ev_name" (KeyError otherwise).  "dso" and "symbol" are optional and are
    replaced by placeholder strings when absent.
    """
    # Looked up but not used further in this handler; a missing key still
    # raises KeyError here.
    event_attr = param_dict["attr"]
    sample = param_dict["sample"]

    payload = param_dict["raw_buf"]
    thread_name = param_dict["comm"]
    ev_name = param_dict["ev_name"]

    # Symbol and dso info are not always resolved
    dso_name = param_dict.get("dso", "Unknown_dso")
    sym_name = param_dict.get("symbol", "Unknown_symbol")

    # Create the event object and insert it to the right table in database
    insert_db(create_event(ev_name, thread_name, dso_name, sym_name, payload))
94
def insert_db(event):
    """Insert event into the table that matches its ev_type.

    EVTYPE_GENERIC events go to gen_events and EVTYPE_PEBS_LL events go to
    pebs_ll; any other ev_type is ignored.  For PEBS events, event.ip and
    event.dla are masked in place before being stored.
    """
    if event.ev_type == EVTYPE_GENERIC:
        generic_row = (event.name, event.symbol, event.comm, event.dso)
        con.execute("insert into gen_events values(?, ?, ?, ?)", generic_row)
        return

    if event.ev_type != EVTYPE_PEBS_LL:
        return

    # Clear bit 63 of both addresses (presumably so the values fit SQLite's
    # signed 64-bit INTEGER -- TODO confirm).
    low_63_bits = 0x7fffffffffffffff
    event.ip &= low_63_bits
    event.dla &= low_63_bits

    pebs_row = (event.name, event.symbol, event.comm, event.dso, event.flags,
                event.ip, event.status, event.dse, event.dla, event.lat)
    con.execute("insert into pebs_ll values (?, ?, ?, ?, ?, ?, ?, ?, ?, ?)",
                pebs_row)
105
def trace_end():
    """Print the summary for both event tables, then close the database.

    The connection is closed even when one of the reports raises, so the
    database handle is never left open on an error path.
    """
    print("In trace_end:\n")
    try:
        # We show the basic info for the 2 types of event classes
        show_general_events()
        show_pebs_ll()
    finally:
        con.close()
111 con.close()
112
113#
# As the number of events may be very large, the histogram cannot be drawn
# on a linear scale with real numbers, so a log2 scale is used instead.
116#
117
def num2sym(num):
    """Return a log2-scaled histogram bar of '#' characters for num.

    The bar is floor(log2(num)) + 1 characters long, so every count of at
    least one gets at least one '#'.  Counts below one (including zero and
    negative values) give an empty bar instead of raising.
    """
    # For a positive integer n, n.bit_length() equals floor(log2(n)) + 1
    # exactly, which avoids both the math domain error at zero and the
    # floating-point rounding of math.log() just below large powers of two.
    return '#' * max(int(num), 0).bit_length()
122
def show_general_events():
    """Print the gen_events row count and, if non-empty, three histograms.

    Rows are grouped by comm, by symbol and by dso; each group is listed with
    its count and a num2sym() bar, largest count first.
    """
    # Check the total record number in the table
    total = con.execute("select count(*) from gen_events").fetchone()[0]
    print("There is %d records in gen_events table" % total)
    if total == 0:
        return

    print("Statistics about the general events grouped by thread/symbol/dso: \n")

    # One entry per report: (query, header format, title, rule width, row format)
    reports = (
        # Group by thread
        ("select comm, count(comm) from gen_events group by comm order by -count(comm)",
         "\n%16s %8s %16s\n%s", "comm", 42, "%16s %8d %s"),
        # Group by symbol
        ("select symbol, count(symbol) from gen_events group by symbol order by -count(symbol)",
         "\n%32s %8s %16s\n%s", "symbol", 58, "%32s %8d %s"),
        # Group by dso
        ("select dso, count(dso) from gen_events group by dso order by -count(dso)",
         "\n%40s %8s %16s\n%s", "dso", 74, "%40s %8d %s"),
    )

    for query, header_fmt, title, rule_width, row_fmt in reports:
        rows = con.execute(query)
        print(header_fmt % (title, "number", "histogram", "=" * rule_width))
        for key, hits in rows:
            print(row_fmt % (key, hits, num2sym(hits)))
151
152#
153# This function just shows the basic info, and we could do more with the
154# data in the tables, like checking the function parameters when some
155# big latency events happen.
156#
def show_pebs_ll():
    """Print the pebs_ll row count and, if non-empty, four histograms.

    Rows are grouped by comm, symbol and dse (largest count first) and by
    lat (ascending lat); each group is listed with its count and a
    num2sym() bar.
    """
    total = con.execute("select count(*) from pebs_ll").fetchone()[0]
    print("There is %d records in pebs_ll table" % total)
    if total == 0:
        return

    print("Statistics about the PEBS Load Latency events grouped by thread/symbol/dse/latency: \n")

    # One entry per report: (query, header format, title, rule width, row format)
    reports = (
        # Group by thread
        ("select comm, count(comm) from pebs_ll group by comm order by -count(comm)",
         "\n%16s %8s %16s\n%s", "comm", 42, "%16s %8d %s"),
        # Group by symbol
        ("select symbol, count(symbol) from pebs_ll group by symbol order by -count(symbol)",
         "\n%32s %8s %16s\n%s", "symbol", 58, "%32s %8d %s"),
        # Group by dse
        ("select dse, count(dse) from pebs_ll group by dse order by -count(dse)",
         "\n%32s %8s %16s\n%s", "dse", 58, "%32s %8d %s"),
        # Group by latency
        ("select lat, count(lat) from pebs_ll group by lat order by lat",
         "\n%32s %8s %16s\n%s", "latency", 58, "%32s %8d %s"),
    )

    for query, header_fmt, title, rule_width, row_fmt in reports:
        rows = con.execute(query)
        print(header_fmt % (title, "number", "histogram", "=" * rule_width))
        for key, hits in rows:
            print(row_fmt % (key, hits, num2sym(hits)))
190
def trace_unhandled(event_name, context, event_fields_dict):
    """Print the fields of an unhandled event as space-separated key=value pairs.

    Pairs are printed on one line in sorted item order; event_name and
    context are not used.
    """
    rendered = ('%s=%s' % (field, str(value))
                for field, value in sorted(event_fields_dict.items()))
    print(' '.join(rendered))