Loading...
1/*
2 * Copyright 2010 ARM Ltd.
3 *
4 * Perf-events backend for OProfile.
5 */
6#include <linux/perf_event.h>
7#include <linux/platform_device.h>
8#include <linux/oprofile.h>
9#include <linux/slab.h>
10
11/*
12 * Per performance monitor configuration as set via oprofilefs.
13 */
14struct op_counter_config {
15 unsigned long count;
16 unsigned long enabled;
17 unsigned long event;
18 unsigned long unit_mask;
19 unsigned long kernel;
20 unsigned long user;
21 struct perf_event_attr attr;
22};
23
24static int oprofile_perf_enabled;
25static DEFINE_MUTEX(oprofile_perf_mutex);
26
27static struct op_counter_config *counter_config;
28static struct perf_event **perf_events[nr_cpumask_bits];
29static int num_counters;
30
31/*
32 * Overflow callback for oprofile.
33 */
34static void op_overflow_handler(struct perf_event *event,
35 struct perf_sample_data *data, struct pt_regs *regs)
36{
37 int id;
38 u32 cpu = smp_processor_id();
39
40 for (id = 0; id < num_counters; ++id)
41 if (perf_events[cpu][id] == event)
42 break;
43
44 if (id != num_counters)
45 oprofile_add_sample(regs, id);
46 else
47 pr_warning("oprofile: ignoring spurious overflow "
48 "on cpu %u\n", cpu);
49}
50
51/*
52 * Called by oprofile_perf_setup to create perf attributes to mirror the oprofile
53 * settings in counter_config. Attributes are created as `pinned' events and
54 * so are permanently scheduled on the PMU.
55 */
56static void op_perf_setup(void)
57{
58 int i;
59 u32 size = sizeof(struct perf_event_attr);
60 struct perf_event_attr *attr;
61
62 for (i = 0; i < num_counters; ++i) {
63 attr = &counter_config[i].attr;
64 memset(attr, 0, size);
65 attr->type = PERF_TYPE_RAW;
66 attr->size = size;
67 attr->config = counter_config[i].event;
68 attr->sample_period = counter_config[i].count;
69 attr->pinned = 1;
70 }
71}
72
73static int op_create_counter(int cpu, int event)
74{
75 struct perf_event *pevent;
76
77 if (!counter_config[event].enabled || perf_events[cpu][event])
78 return 0;
79
80 pevent = perf_event_create_kernel_counter(&counter_config[event].attr,
81 cpu, NULL,
82 op_overflow_handler, NULL);
83
84 if (IS_ERR(pevent))
85 return PTR_ERR(pevent);
86
87 if (pevent->state != PERF_EVENT_STATE_ACTIVE) {
88 perf_event_release_kernel(pevent);
89 pr_warning("oprofile: failed to enable event %d "
90 "on CPU %d\n", event, cpu);
91 return -EBUSY;
92 }
93
94 perf_events[cpu][event] = pevent;
95
96 return 0;
97}
98
99static void op_destroy_counter(int cpu, int event)
100{
101 struct perf_event *pevent = perf_events[cpu][event];
102
103 if (pevent) {
104 perf_event_release_kernel(pevent);
105 perf_events[cpu][event] = NULL;
106 }
107}
108
109/*
110 * Called by oprofile_perf_start to create active perf events based on the
111 * perviously configured attributes.
112 */
113static int op_perf_start(void)
114{
115 int cpu, event, ret = 0;
116
117 for_each_online_cpu(cpu) {
118 for (event = 0; event < num_counters; ++event) {
119 ret = op_create_counter(cpu, event);
120 if (ret)
121 return ret;
122 }
123 }
124
125 return ret;
126}
127
128/*
129 * Called by oprofile_perf_stop at the end of a profiling run.
130 */
131static void op_perf_stop(void)
132{
133 int cpu, event;
134
135 for_each_online_cpu(cpu)
136 for (event = 0; event < num_counters; ++event)
137 op_destroy_counter(cpu, event);
138}
139
140static int oprofile_perf_create_files(struct super_block *sb, struct dentry *root)
141{
142 unsigned int i;
143
144 for (i = 0; i < num_counters; i++) {
145 struct dentry *dir;
146 char buf[4];
147
148 snprintf(buf, sizeof buf, "%d", i);
149 dir = oprofilefs_mkdir(sb, root, buf);
150 oprofilefs_create_ulong(sb, dir, "enabled", &counter_config[i].enabled);
151 oprofilefs_create_ulong(sb, dir, "event", &counter_config[i].event);
152 oprofilefs_create_ulong(sb, dir, "count", &counter_config[i].count);
153 oprofilefs_create_ulong(sb, dir, "unit_mask", &counter_config[i].unit_mask);
154 oprofilefs_create_ulong(sb, dir, "kernel", &counter_config[i].kernel);
155 oprofilefs_create_ulong(sb, dir, "user", &counter_config[i].user);
156 }
157
158 return 0;
159}
160
161static int oprofile_perf_setup(void)
162{
163 spin_lock(&oprofilefs_lock);
164 op_perf_setup();
165 spin_unlock(&oprofilefs_lock);
166 return 0;
167}
168
169static int oprofile_perf_start(void)
170{
171 int ret = -EBUSY;
172
173 mutex_lock(&oprofile_perf_mutex);
174 if (!oprofile_perf_enabled) {
175 ret = 0;
176 op_perf_start();
177 oprofile_perf_enabled = 1;
178 }
179 mutex_unlock(&oprofile_perf_mutex);
180 return ret;
181}
182
183static void oprofile_perf_stop(void)
184{
185 mutex_lock(&oprofile_perf_mutex);
186 if (oprofile_perf_enabled)
187 op_perf_stop();
188 oprofile_perf_enabled = 0;
189 mutex_unlock(&oprofile_perf_mutex);
190}
191
192#ifdef CONFIG_PM
193
194static int oprofile_perf_suspend(struct platform_device *dev, pm_message_t state)
195{
196 mutex_lock(&oprofile_perf_mutex);
197 if (oprofile_perf_enabled)
198 op_perf_stop();
199 mutex_unlock(&oprofile_perf_mutex);
200 return 0;
201}
202
203static int oprofile_perf_resume(struct platform_device *dev)
204{
205 mutex_lock(&oprofile_perf_mutex);
206 if (oprofile_perf_enabled && op_perf_start())
207 oprofile_perf_enabled = 0;
208 mutex_unlock(&oprofile_perf_mutex);
209 return 0;
210}
211
212static struct platform_driver oprofile_driver = {
213 .driver = {
214 .name = "oprofile-perf",
215 },
216 .resume = oprofile_perf_resume,
217 .suspend = oprofile_perf_suspend,
218};
219
220static struct platform_device *oprofile_pdev;
221
222static int __init init_driverfs(void)
223{
224 int ret;
225
226 ret = platform_driver_register(&oprofile_driver);
227 if (ret)
228 return ret;
229
230 oprofile_pdev = platform_device_register_simple(
231 oprofile_driver.driver.name, 0, NULL, 0);
232 if (IS_ERR(oprofile_pdev)) {
233 ret = PTR_ERR(oprofile_pdev);
234 platform_driver_unregister(&oprofile_driver);
235 }
236
237 return ret;
238}
239
240static void exit_driverfs(void)
241{
242 platform_device_unregister(oprofile_pdev);
243 platform_driver_unregister(&oprofile_driver);
244}
245
246#else
247
/* Without CONFIG_PM there is nothing to register or unregister. */
static inline int init_driverfs(void)
{
	return 0;
}

static inline void exit_driverfs(void)
{
}
250
251#endif /* CONFIG_PM */
252
253void oprofile_perf_exit(void)
254{
255 int cpu, id;
256 struct perf_event *event;
257
258 for_each_possible_cpu(cpu) {
259 for (id = 0; id < num_counters; ++id) {
260 event = perf_events[cpu][id];
261 if (event)
262 perf_event_release_kernel(event);
263 }
264
265 kfree(perf_events[cpu]);
266 }
267
268 kfree(counter_config);
269 exit_driverfs();
270}
271
272int __init oprofile_perf_init(struct oprofile_operations *ops)
273{
274 int cpu, ret = 0;
275
276 ret = init_driverfs();
277 if (ret)
278 return ret;
279
280 memset(&perf_events, 0, sizeof(perf_events));
281
282 num_counters = perf_num_counters();
283 if (num_counters <= 0) {
284 pr_info("oprofile: no performance counters\n");
285 ret = -ENODEV;
286 goto out;
287 }
288
289 counter_config = kcalloc(num_counters,
290 sizeof(struct op_counter_config), GFP_KERNEL);
291
292 if (!counter_config) {
293 pr_info("oprofile: failed to allocate %d "
294 "counters\n", num_counters);
295 ret = -ENOMEM;
296 num_counters = 0;
297 goto out;
298 }
299
300 for_each_possible_cpu(cpu) {
301 perf_events[cpu] = kcalloc(num_counters,
302 sizeof(struct perf_event *), GFP_KERNEL);
303 if (!perf_events[cpu]) {
304 pr_info("oprofile: failed to allocate %d perf events "
305 "for cpu %d\n", num_counters, cpu);
306 ret = -ENOMEM;
307 goto out;
308 }
309 }
310
311 ops->create_files = oprofile_perf_create_files;
312 ops->setup = oprofile_perf_setup;
313 ops->start = oprofile_perf_start;
314 ops->stop = oprofile_perf_stop;
315 ops->shutdown = oprofile_perf_stop;
316 ops->cpu_type = op_name_from_perf_id();
317
318 if (!ops->cpu_type)
319 ret = -ENODEV;
320 else
321 pr_info("oprofile: using %s\n", ops->cpu_type);
322
323out:
324 if (ret)
325 oprofile_perf_exit();
326
327 return ret;
328}
1/*
2 * Copyright 2010 ARM Ltd.
3 * Copyright 2012 Advanced Micro Devices, Inc., Robert Richter
4 *
5 * Perf-events backend for OProfile.
6 */
7#include <linux/perf_event.h>
8#include <linux/platform_device.h>
9#include <linux/oprofile.h>
10#include <linux/slab.h>
11
12/*
13 * Per performance monitor configuration as set via oprofilefs.
14 */
15struct op_counter_config {
16 unsigned long count;
17 unsigned long enabled;
18 unsigned long event;
19 unsigned long unit_mask;
20 unsigned long kernel;
21 unsigned long user;
22 struct perf_event_attr attr;
23};
24
25static int oprofile_perf_enabled;
26static DEFINE_MUTEX(oprofile_perf_mutex);
27
28static struct op_counter_config *counter_config;
29static DEFINE_PER_CPU(struct perf_event **, perf_events);
30static int num_counters;
31
32/*
33 * Overflow callback for oprofile.
34 */
35static void op_overflow_handler(struct perf_event *event,
36 struct perf_sample_data *data, struct pt_regs *regs)
37{
38 int id;
39 u32 cpu = smp_processor_id();
40
41 for (id = 0; id < num_counters; ++id)
42 if (per_cpu(perf_events, cpu)[id] == event)
43 break;
44
45 if (id != num_counters)
46 oprofile_add_sample(regs, id);
47 else
48 pr_warning("oprofile: ignoring spurious overflow "
49 "on cpu %u\n", cpu);
50}
51
52/*
53 * Called by oprofile_perf_setup to create perf attributes to mirror the oprofile
54 * settings in counter_config. Attributes are created as `pinned' events and
55 * so are permanently scheduled on the PMU.
56 */
57static void op_perf_setup(void)
58{
59 int i;
60 u32 size = sizeof(struct perf_event_attr);
61 struct perf_event_attr *attr;
62
63 for (i = 0; i < num_counters; ++i) {
64 attr = &counter_config[i].attr;
65 memset(attr, 0, size);
66 attr->type = PERF_TYPE_RAW;
67 attr->size = size;
68 attr->config = counter_config[i].event;
69 attr->sample_period = counter_config[i].count;
70 attr->pinned = 1;
71 }
72}
73
74static int op_create_counter(int cpu, int event)
75{
76 struct perf_event *pevent;
77
78 if (!counter_config[event].enabled || per_cpu(perf_events, cpu)[event])
79 return 0;
80
81 pevent = perf_event_create_kernel_counter(&counter_config[event].attr,
82 cpu, NULL,
83 op_overflow_handler, NULL);
84
85 if (IS_ERR(pevent))
86 return PTR_ERR(pevent);
87
88 if (pevent->state != PERF_EVENT_STATE_ACTIVE) {
89 perf_event_release_kernel(pevent);
90 pr_warning("oprofile: failed to enable event %d "
91 "on CPU %d\n", event, cpu);
92 return -EBUSY;
93 }
94
95 per_cpu(perf_events, cpu)[event] = pevent;
96
97 return 0;
98}
99
100static void op_destroy_counter(int cpu, int event)
101{
102 struct perf_event *pevent = per_cpu(perf_events, cpu)[event];
103
104 if (pevent) {
105 perf_event_release_kernel(pevent);
106 per_cpu(perf_events, cpu)[event] = NULL;
107 }
108}
109
110/*
111 * Called by oprofile_perf_start to create active perf events based on the
112 * perviously configured attributes.
113 */
114static int op_perf_start(void)
115{
116 int cpu, event, ret = 0;
117
118 for_each_online_cpu(cpu) {
119 for (event = 0; event < num_counters; ++event) {
120 ret = op_create_counter(cpu, event);
121 if (ret)
122 return ret;
123 }
124 }
125
126 return ret;
127}
128
129/*
130 * Called by oprofile_perf_stop at the end of a profiling run.
131 */
132static void op_perf_stop(void)
133{
134 int cpu, event;
135
136 for_each_online_cpu(cpu)
137 for (event = 0; event < num_counters; ++event)
138 op_destroy_counter(cpu, event);
139}
140
141static int oprofile_perf_create_files(struct dentry *root)
142{
143 unsigned int i;
144
145 for (i = 0; i < num_counters; i++) {
146 struct dentry *dir;
147 char buf[4];
148
149 snprintf(buf, sizeof buf, "%d", i);
150 dir = oprofilefs_mkdir(root, buf);
151 oprofilefs_create_ulong(dir, "enabled", &counter_config[i].enabled);
152 oprofilefs_create_ulong(dir, "event", &counter_config[i].event);
153 oprofilefs_create_ulong(dir, "count", &counter_config[i].count);
154 oprofilefs_create_ulong(dir, "unit_mask", &counter_config[i].unit_mask);
155 oprofilefs_create_ulong(dir, "kernel", &counter_config[i].kernel);
156 oprofilefs_create_ulong(dir, "user", &counter_config[i].user);
157 }
158
159 return 0;
160}
161
162static int oprofile_perf_setup(void)
163{
164 raw_spin_lock(&oprofilefs_lock);
165 op_perf_setup();
166 raw_spin_unlock(&oprofilefs_lock);
167 return 0;
168}
169
170static int oprofile_perf_start(void)
171{
172 int ret = -EBUSY;
173
174 mutex_lock(&oprofile_perf_mutex);
175 if (!oprofile_perf_enabled) {
176 ret = 0;
177 op_perf_start();
178 oprofile_perf_enabled = 1;
179 }
180 mutex_unlock(&oprofile_perf_mutex);
181 return ret;
182}
183
184static void oprofile_perf_stop(void)
185{
186 mutex_lock(&oprofile_perf_mutex);
187 if (oprofile_perf_enabled)
188 op_perf_stop();
189 oprofile_perf_enabled = 0;
190 mutex_unlock(&oprofile_perf_mutex);
191}
192
193#ifdef CONFIG_PM
194
195static int oprofile_perf_suspend(struct platform_device *dev, pm_message_t state)
196{
197 mutex_lock(&oprofile_perf_mutex);
198 if (oprofile_perf_enabled)
199 op_perf_stop();
200 mutex_unlock(&oprofile_perf_mutex);
201 return 0;
202}
203
204static int oprofile_perf_resume(struct platform_device *dev)
205{
206 mutex_lock(&oprofile_perf_mutex);
207 if (oprofile_perf_enabled && op_perf_start())
208 oprofile_perf_enabled = 0;
209 mutex_unlock(&oprofile_perf_mutex);
210 return 0;
211}
212
213static struct platform_driver oprofile_driver = {
214 .driver = {
215 .name = "oprofile-perf",
216 },
217 .resume = oprofile_perf_resume,
218 .suspend = oprofile_perf_suspend,
219};
220
221static struct platform_device *oprofile_pdev;
222
223static int __init init_driverfs(void)
224{
225 int ret;
226
227 ret = platform_driver_register(&oprofile_driver);
228 if (ret)
229 return ret;
230
231 oprofile_pdev = platform_device_register_simple(
232 oprofile_driver.driver.name, 0, NULL, 0);
233 if (IS_ERR(oprofile_pdev)) {
234 ret = PTR_ERR(oprofile_pdev);
235 platform_driver_unregister(&oprofile_driver);
236 }
237
238 return ret;
239}
240
241static void exit_driverfs(void)
242{
243 platform_device_unregister(oprofile_pdev);
244 platform_driver_unregister(&oprofile_driver);
245}
246
247#else
248
/* Without CONFIG_PM there is nothing to register or unregister. */
static inline int init_driverfs(void)
{
	return 0;
}

static inline void exit_driverfs(void)
{
}
251
252#endif /* CONFIG_PM */
253
254void oprofile_perf_exit(void)
255{
256 int cpu, id;
257 struct perf_event *event;
258
259 for_each_possible_cpu(cpu) {
260 for (id = 0; id < num_counters; ++id) {
261 event = per_cpu(perf_events, cpu)[id];
262 if (event)
263 perf_event_release_kernel(event);
264 }
265
266 kfree(per_cpu(perf_events, cpu));
267 }
268
269 kfree(counter_config);
270 exit_driverfs();
271}
272
273int __init oprofile_perf_init(struct oprofile_operations *ops)
274{
275 int cpu, ret = 0;
276
277 ret = init_driverfs();
278 if (ret)
279 return ret;
280
281 num_counters = perf_num_counters();
282 if (num_counters <= 0) {
283 pr_info("oprofile: no performance counters\n");
284 ret = -ENODEV;
285 goto out;
286 }
287
288 counter_config = kcalloc(num_counters,
289 sizeof(struct op_counter_config), GFP_KERNEL);
290
291 if (!counter_config) {
292 pr_info("oprofile: failed to allocate %d "
293 "counters\n", num_counters);
294 ret = -ENOMEM;
295 num_counters = 0;
296 goto out;
297 }
298
299 for_each_possible_cpu(cpu) {
300 per_cpu(perf_events, cpu) = kcalloc(num_counters,
301 sizeof(struct perf_event *), GFP_KERNEL);
302 if (!per_cpu(perf_events, cpu)) {
303 pr_info("oprofile: failed to allocate %d perf events "
304 "for cpu %d\n", num_counters, cpu);
305 ret = -ENOMEM;
306 goto out;
307 }
308 }
309
310 ops->create_files = oprofile_perf_create_files;
311 ops->setup = oprofile_perf_setup;
312 ops->start = oprofile_perf_start;
313 ops->stop = oprofile_perf_stop;
314 ops->shutdown = oprofile_perf_stop;
315 ops->cpu_type = op_name_from_perf_id();
316
317 if (!ops->cpu_type)
318 ret = -ENODEV;
319 else
320 pr_info("oprofile: using %s\n", ops->cpu_type);
321
322out:
323 if (ret)
324 oprofile_perf_exit();
325
326 return ret;
327}