// SPDX-License-Identifier: GPL-2.0
/*
 * trace irqs off critical timings
 *
 * Copyright (C) 2007-2008 Steven Rostedt <srostedt@redhat.com>
 * Copyright (C) 2008 Ingo Molnar <mingo@redhat.com>
 *
 * From code in the latency_tracer, that is:
 *
 * Copyright (C) 2004-2006 Ingo Molnar
 * Copyright (C) 2004 Nadia Yvette Chambers
 */
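/*
 * Usage sketch (not part of this file; paths assume the standard
 * tracefs mount at /sys/kernel/tracing and a kernel built with
 * CONFIG_IRQSOFF_TRACER=y):
 *
 *	# cd /sys/kernel/tracing
 *	# echo 0 > tracing_max_latency
 *	# echo irqsoff > current_tracer
 *	# echo 1 > tracing_on
 *	[... let the workload run ...]
 *	# echo 0 > tracing_on
 *	# cat trace
 *
 * tracing_max_latency then holds the worst-case irqs-off latency seen.
 */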
#include <linux/kallsyms.h>
#include <linux/uaccess.h>
#include <linux/module.h>
#include <linux/ftrace.h>
#include <linux/kprobes.h>

#include "trace.h"

#include <trace/events/preemptirq.h>

#if defined(CONFIG_IRQSOFF_TRACER) || defined(CONFIG_PREEMPT_TRACER)
static struct trace_array *irqsoff_trace __read_mostly;
static int tracer_enabled __read_mostly;

static DEFINE_PER_CPU(int, tracing_cpu);

static DEFINE_RAW_SPINLOCK(max_trace_lock);

enum {
	TRACER_IRQS_OFF		= (1 << 1),
	TRACER_PREEMPT_OFF	= (1 << 2),
};
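/*
 * The tracers below select combinations of these bits: irqsoff sets
 * TRACER_IRQS_OFF, preemptoff sets TRACER_PREEMPT_OFF, and
 * preemptirqsoff sets both (see the *_tracer_init() functions below).
 */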

static int trace_type __read_mostly;

static int save_flags;

static void stop_irqsoff_tracer(struct trace_array *tr, int graph);
static int start_irqsoff_tracer(struct trace_array *tr, int graph);

#ifdef CONFIG_PREEMPT_TRACER
static inline int
preempt_trace(int pc)
{
	return ((trace_type & TRACER_PREEMPT_OFF) && pc);
}
#else
# define preempt_trace(pc) (0)
#endif

#ifdef CONFIG_IRQSOFF_TRACER
static inline int
irq_trace(void)
{
	return ((trace_type & TRACER_IRQS_OFF) &&
		irqs_disabled());
}
#else
# define irq_trace() (0)
#endif

#ifdef CONFIG_FUNCTION_GRAPH_TRACER
static int irqsoff_display_graph(struct trace_array *tr, int set);
# define is_graph(tr) ((tr)->trace_flags & TRACE_ITER_DISPLAY_GRAPH)
#else
static inline int irqsoff_display_graph(struct trace_array *tr, int set)
{
	return -EINVAL;
}
# define is_graph(tr) false
#endif
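
/*
 * Graph mode renders the latency trace as a function call graph. It is
 * toggled at runtime through the tracefs option, e.g. (a sketch,
 * assuming the standard tracefs mount):
 *
 *	# echo 1 > /sys/kernel/tracing/options/display-graph
 */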

/*
 * Sequence count - we record it when starting a measurement and
 * skip the latency if the sequence has changed - some other section
 * did a maximum and could disturb our measurement with serial console
 * printouts, etc. Truly coinciding maximum latencies should be rare
 * and what happens together happens separately as well, so this doesn't
 * decrease the validity of the maximum found:
 */
static __cacheline_aligned_in_smp	unsigned long max_sequence;

#ifdef CONFIG_FUNCTION_TRACER
/*
 * Prologue for the preempt and irqs off function tracers.
 *
 * Returns 1 if it is OK to continue, with data->disabled incremented;
 * returns 0 if the trace is to be ignored, with data->disabled left
 * unchanged.
 *
 * Note, this function is also used outside this ifdef but
 * inside the #ifdef of the function graph tracer below.
 * This is OK, since the function graph tracer is
 * dependent on the function tracer.
 */
static int func_prolog_dec(struct trace_array *tr,
			   struct trace_array_cpu **data,
			   unsigned long *flags)
{
	long disabled;
	int cpu;

	/*
	 * Does not matter if we preempt. We test the flags
	 * afterward, to see if irqs are disabled or not.
	 * If we preempt and get a false positive, the flags
	 * test will fail.
	 */
	cpu = raw_smp_processor_id();
	if (likely(!per_cpu(tracing_cpu, cpu)))
		return 0;

	local_save_flags(*flags);
	/*
	 * Slight chance to get a false positive on tracing_cpu,
	 * although I'm starting to think there isn't a chance.
	 * Leave this for now just to be paranoid.
	 */
	if (!irqs_disabled_flags(*flags) && !preempt_count())
		return 0;

	*data = per_cpu_ptr(tr->array_buffer.data, cpu);
	disabled = atomic_inc_return(&(*data)->disabled);

	if (likely(disabled == 1))
		return 1;

	atomic_dec(&(*data)->disabled);

	return 0;
}
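
/*
 * Canonical caller pattern (a sketch; all three users in this file
 * follow it, cf. irqsoff_tracer_call() just below):
 *
 *	if (!func_prolog_dec(tr, &data, &flags))
 *		return;
 *	...record the event into tr...
 *	atomic_dec(&data->disabled);
 */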

/*
 * irqsoff uses its own tracer function to keep the overhead down:
 */
static void
irqsoff_tracer_call(unsigned long ip, unsigned long parent_ip,
		    struct ftrace_ops *op, struct ftrace_regs *fregs)
{
	struct trace_array *tr = irqsoff_trace;
	struct trace_array_cpu *data;
	unsigned long flags;
	unsigned int trace_ctx;

	if (!func_prolog_dec(tr, &data, &flags))
		return;

	trace_ctx = tracing_gen_ctx_flags(flags);

	trace_function(tr, ip, parent_ip, trace_ctx);

	atomic_dec(&data->disabled);
}
#endif /* CONFIG_FUNCTION_TRACER */

#ifdef CONFIG_FUNCTION_GRAPH_TRACER
static int irqsoff_display_graph(struct trace_array *tr, int set)
{
	int cpu;

	if (!(is_graph(tr) ^ set))
		return 0;

	stop_irqsoff_tracer(irqsoff_trace, !set);

	for_each_possible_cpu(cpu)
		per_cpu(tracing_cpu, cpu) = 0;

	tr->max_latency = 0;
	tracing_reset_online_cpus(&irqsoff_trace->array_buffer);

	return start_irqsoff_tracer(irqsoff_trace, set);
}

static int irqsoff_graph_entry(struct ftrace_graph_ent *trace)
{
	struct trace_array *tr = irqsoff_trace;
	struct trace_array_cpu *data;
	unsigned long flags;
	unsigned int trace_ctx;
	int ret;

	if (ftrace_graph_ignore_func(trace))
		return 0;
	/*
	 * Do not trace a function if it's filtered by set_graph_notrace.
	 * Make the index of ret stack negative to indicate that it should
	 * ignore further functions. But it needs its own ret stack entry
	 * to recover the original index in order to continue tracing after
	 * returning from the function.
	 */
	if (ftrace_graph_notrace_addr(trace->func))
		return 1;

	if (!func_prolog_dec(tr, &data, &flags))
		return 0;

	trace_ctx = tracing_gen_ctx_flags(flags);
	ret = __trace_graph_entry(tr, trace, trace_ctx);
	atomic_dec(&data->disabled);

	return ret;
}

static void irqsoff_graph_return(struct ftrace_graph_ret *trace)
{
	struct trace_array *tr = irqsoff_trace;
	struct trace_array_cpu *data;
	unsigned long flags;
	unsigned int trace_ctx;

	ftrace_graph_addr_finish(trace);

	if (!func_prolog_dec(tr, &data, &flags))
		return;

	trace_ctx = tracing_gen_ctx_flags(flags);
	__trace_graph_return(tr, trace, trace_ctx);
	atomic_dec(&data->disabled);
}

static struct fgraph_ops fgraph_ops = {
	.entryfunc		= &irqsoff_graph_entry,
	.retfunc		= &irqsoff_graph_return,
};

static void irqsoff_trace_open(struct trace_iterator *iter)
{
	if (is_graph(iter->tr))
		graph_trace_open(iter);
	else
		iter->private = NULL;
}

static void irqsoff_trace_close(struct trace_iterator *iter)
{
	if (iter->private)
		graph_trace_close(iter);
}

#define GRAPH_TRACER_FLAGS (TRACE_GRAPH_PRINT_CPU | \
			    TRACE_GRAPH_PRINT_PROC | \
			    TRACE_GRAPH_PRINT_REL_TIME | \
			    TRACE_GRAPH_PRINT_DURATION)

static enum print_line_t irqsoff_print_line(struct trace_iterator *iter)
{
	/*
	 * In graph mode call the graph tracer output function,
	 * otherwise go with the TRACE_FN event handler
	 */
	if (is_graph(iter->tr))
		return print_graph_function_flags(iter, GRAPH_TRACER_FLAGS);

	return TRACE_TYPE_UNHANDLED;
}

static void irqsoff_print_header(struct seq_file *s)
{
	struct trace_array *tr = irqsoff_trace;

	if (is_graph(tr))
		print_graph_headers_flags(s, GRAPH_TRACER_FLAGS);
	else
		trace_default_header(s);
}

static void
__trace_function(struct trace_array *tr,
		 unsigned long ip, unsigned long parent_ip,
		 unsigned int trace_ctx)
{
	if (is_graph(tr))
		trace_graph_function(tr, ip, parent_ip, trace_ctx);
	else
		trace_function(tr, ip, parent_ip, trace_ctx);
}

#else
#define __trace_function trace_function

static enum print_line_t irqsoff_print_line(struct trace_iterator *iter)
{
	return TRACE_TYPE_UNHANDLED;
}

static void irqsoff_trace_open(struct trace_iterator *iter) { }
static void irqsoff_trace_close(struct trace_iterator *iter) { }

#ifdef CONFIG_FUNCTION_TRACER
static void irqsoff_print_header(struct seq_file *s)
{
	trace_default_header(s);
}
#else
static void irqsoff_print_header(struct seq_file *s)
{
	trace_latency_header(s);
}
#endif /* CONFIG_FUNCTION_TRACER */
#endif /* CONFIG_FUNCTION_GRAPH_TRACER */

/*
 * Should this new latency be reported/recorded?
 */
static bool report_latency(struct trace_array *tr, u64 delta)
{
	if (tracing_thresh) {
		if (delta < tracing_thresh)
			return false;
	} else {
		if (delta <= tr->max_latency)
			return false;
	}
	return true;
}
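
/*
 * Worked example (values illustrative only): with tracing_thresh set
 * to 400 us via the tracefs "tracing_thresh" file, every critical
 * section lasting at least 400 us is reported, whether or not it is a
 * new maximum; with tracing_thresh left at 0, only a section exceeding
 * the current tr->max_latency is.
 */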

static void
check_critical_timing(struct trace_array *tr,
		      struct trace_array_cpu *data,
		      unsigned long parent_ip,
		      int cpu)
{
	u64 T0, T1, delta;
	unsigned long flags;
	unsigned int trace_ctx;

	T0 = data->preempt_timestamp;
	T1 = ftrace_now(cpu);
	delta = T1-T0;

	trace_ctx = tracing_gen_ctx();

	if (!report_latency(tr, delta))
		goto out;

	raw_spin_lock_irqsave(&max_trace_lock, flags);

	/* check if we are still the max latency */
	if (!report_latency(tr, delta))
		goto out_unlock;

	__trace_function(tr, CALLER_ADDR0, parent_ip, trace_ctx);
	/* Skip 5 functions to get to the irq/preempt enable function */
	__trace_stack(tr, trace_ctx, 5);

	if (data->critical_sequence != max_sequence)
		goto out_unlock;

	data->critical_end = parent_ip;

	if (likely(!is_tracing_stopped())) {
		tr->max_latency = delta;
		update_max_tr_single(tr, current, cpu);
	}

	max_sequence++;

out_unlock:
	raw_spin_unlock_irqrestore(&max_trace_lock, flags);

out:
	data->critical_sequence = max_sequence;
	data->preempt_timestamp = ftrace_now(cpu);
	__trace_function(tr, CALLER_ADDR0, parent_ip, trace_ctx);
}

static nokprobe_inline void
start_critical_timing(unsigned long ip, unsigned long parent_ip)
{
	int cpu;
	struct trace_array *tr = irqsoff_trace;
	struct trace_array_cpu *data;

	if (!tracer_enabled || !tracing_is_enabled())
		return;

	cpu = raw_smp_processor_id();

	if (per_cpu(tracing_cpu, cpu))
		return;

	data = per_cpu_ptr(tr->array_buffer.data, cpu);

	if (unlikely(!data) || atomic_read(&data->disabled))
		return;

	atomic_inc(&data->disabled);

	data->critical_sequence = max_sequence;
	data->preempt_timestamp = ftrace_now(cpu);
	data->critical_start = parent_ip ? : ip;

	__trace_function(tr, ip, parent_ip, tracing_gen_ctx());

	per_cpu(tracing_cpu, cpu) = 1;

	atomic_dec(&data->disabled);
}

static nokprobe_inline void
stop_critical_timing(unsigned long ip, unsigned long parent_ip)
{
	int cpu;
	struct trace_array *tr = irqsoff_trace;
	struct trace_array_cpu *data;
	unsigned int trace_ctx;

	cpu = raw_smp_processor_id();
	/* Always clear the tracing cpu on stopping the trace */
	if (unlikely(per_cpu(tracing_cpu, cpu)))
		per_cpu(tracing_cpu, cpu) = 0;
	else
		return;

	if (!tracer_enabled || !tracing_is_enabled())
		return;

	data = per_cpu_ptr(tr->array_buffer.data, cpu);

	if (unlikely(!data) ||
	    !data->critical_start || atomic_read(&data->disabled))
		return;

	atomic_inc(&data->disabled);

	trace_ctx = tracing_gen_ctx();
	__trace_function(tr, ip, parent_ip, trace_ctx);
	check_critical_timing(tr, data, parent_ip ? : ip, cpu);
	data->critical_start = 0;
	atomic_dec(&data->disabled);
}

/* start and stop critical timings used for stoppage (in idle) */
void start_critical_timings(void)
{
	if (preempt_trace(preempt_count()) || irq_trace())
		start_critical_timing(CALLER_ADDR0, CALLER_ADDR1);
}
EXPORT_SYMBOL_GPL(start_critical_timings);
NOKPROBE_SYMBOL(start_critical_timings);

void stop_critical_timings(void)
{
	if (preempt_trace(preempt_count()) || irq_trace())
		stop_critical_timing(CALLER_ADDR0, CALLER_ADDR1);
}
EXPORT_SYMBOL_GPL(stop_critical_timings);
NOKPROBE_SYMBOL(stop_critical_timings);
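
/*
 * Sketch of the intended bracketing in the idle path (cf. the idle
 * loop in kernel/sched/idle.c), which keeps time spent in the hardware
 * idle state out of the measured latency:
 *
 *	stop_critical_timings();
 *	...enter the idle state...
 *	start_critical_timings();
 */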

#ifdef CONFIG_FUNCTION_TRACER
static bool function_enabled;

static int register_irqsoff_function(struct trace_array *tr, int graph, int set)
{
	int ret;

	/* 'set' is set if TRACE_ITER_FUNCTION is about to be set */
	if (function_enabled || (!set && !(tr->trace_flags & TRACE_ITER_FUNCTION)))
		return 0;

	if (graph)
		ret = register_ftrace_graph(&fgraph_ops);
	else
		ret = register_ftrace_function(tr->ops);

	if (!ret)
		function_enabled = true;

	return ret;
}

static void unregister_irqsoff_function(struct trace_array *tr, int graph)
{
	if (!function_enabled)
		return;

	if (graph)
		unregister_ftrace_graph(&fgraph_ops);
	else
		unregister_ftrace_function(tr->ops);

	function_enabled = false;
}

static int irqsoff_function_set(struct trace_array *tr, u32 mask, int set)
{
	if (!(mask & TRACE_ITER_FUNCTION))
		return 0;

	if (set)
		register_irqsoff_function(tr, is_graph(tr), 1);
	else
		unregister_irqsoff_function(tr, is_graph(tr));
	return 1;
}
#else
static int register_irqsoff_function(struct trace_array *tr, int graph, int set)
{
	return 0;
}
static void unregister_irqsoff_function(struct trace_array *tr, int graph) { }
static inline int irqsoff_function_set(struct trace_array *tr, u32 mask, int set)
{
	return 0;
}
#endif /* CONFIG_FUNCTION_TRACER */

static int irqsoff_flag_changed(struct trace_array *tr, u32 mask, int set)
{
	struct tracer *tracer = tr->current_trace;

	if (irqsoff_function_set(tr, mask, set))
		return 0;

#ifdef CONFIG_FUNCTION_GRAPH_TRACER
	if (mask & TRACE_ITER_DISPLAY_GRAPH)
		return irqsoff_display_graph(tr, set);
#endif

	return trace_keep_overwrite(tracer, mask, set);
}

static int start_irqsoff_tracer(struct trace_array *tr, int graph)
{
	int ret;

	ret = register_irqsoff_function(tr, graph, 0);

	if (!ret && tracing_is_enabled())
		tracer_enabled = 1;
	else
		tracer_enabled = 0;

	return ret;
}

static void stop_irqsoff_tracer(struct trace_array *tr, int graph)
{
	tracer_enabled = 0;

	unregister_irqsoff_function(tr, graph);
}

static bool irqsoff_busy;

static int __irqsoff_tracer_init(struct trace_array *tr)
{
	if (irqsoff_busy)
		return -EBUSY;

	save_flags = tr->trace_flags;

	/* non overwrite screws up the latency tracers */
	set_tracer_flag(tr, TRACE_ITER_OVERWRITE, 1);
	set_tracer_flag(tr, TRACE_ITER_LATENCY_FMT, 1);
	/* without pause, we will produce garbage if another latency occurs */
	set_tracer_flag(tr, TRACE_ITER_PAUSE_ON_TRACE, 1);

	tr->max_latency = 0;
	irqsoff_trace = tr;
	/* make sure that the tracer is visible */
	smp_wmb();

	ftrace_init_array_ops(tr, irqsoff_tracer_call);

	/* Only toplevel instance supports graph tracing */
	if (start_irqsoff_tracer(tr, (tr->flags & TRACE_ARRAY_FL_GLOBAL &&
				      is_graph(tr))))
		printk(KERN_ERR "failed to start irqsoff tracer\n");

	irqsoff_busy = true;
	return 0;
}

static void __irqsoff_tracer_reset(struct trace_array *tr)
{
	int lat_flag = save_flags & TRACE_ITER_LATENCY_FMT;
	int overwrite_flag = save_flags & TRACE_ITER_OVERWRITE;
	int pause_flag = save_flags & TRACE_ITER_PAUSE_ON_TRACE;

	stop_irqsoff_tracer(tr, is_graph(tr));

	set_tracer_flag(tr, TRACE_ITER_LATENCY_FMT, lat_flag);
	set_tracer_flag(tr, TRACE_ITER_OVERWRITE, overwrite_flag);
	set_tracer_flag(tr, TRACE_ITER_PAUSE_ON_TRACE, pause_flag);
	ftrace_reset_array_ops(tr);

	irqsoff_busy = false;
}

static void irqsoff_tracer_start(struct trace_array *tr)
{
	tracer_enabled = 1;
}

static void irqsoff_tracer_stop(struct trace_array *tr)
{
	tracer_enabled = 0;
}

#ifdef CONFIG_IRQSOFF_TRACER
/*
 * We are only interested in hardirq on/off events:
 */
void tracer_hardirqs_on(unsigned long a0, unsigned long a1)
{
	if (!preempt_trace(preempt_count()) && irq_trace())
		stop_critical_timing(a0, a1);
}
NOKPROBE_SYMBOL(tracer_hardirqs_on);

void tracer_hardirqs_off(unsigned long a0, unsigned long a1)
{
	if (!preempt_trace(preempt_count()) && irq_trace())
		start_critical_timing(a0, a1);
}
NOKPROBE_SYMBOL(tracer_hardirqs_off);

static int irqsoff_tracer_init(struct trace_array *tr)
{
	trace_type = TRACER_IRQS_OFF;

	return __irqsoff_tracer_init(tr);
}

static void irqsoff_tracer_reset(struct trace_array *tr)
{
	__irqsoff_tracer_reset(tr);
}

static struct tracer irqsoff_tracer __read_mostly =
{
	.name		= "irqsoff",
	.init		= irqsoff_tracer_init,
	.reset		= irqsoff_tracer_reset,
	.start		= irqsoff_tracer_start,
	.stop		= irqsoff_tracer_stop,
	.print_max	= true,
	.print_header	= irqsoff_print_header,
	.print_line	= irqsoff_print_line,
	.flag_changed	= irqsoff_flag_changed,
#ifdef CONFIG_FTRACE_SELFTEST
	.selftest	= trace_selftest_startup_irqsoff,
#endif
	.open		= irqsoff_trace_open,
	.close		= irqsoff_trace_close,
	.allow_instances = true,
	.use_max_tr	= true,
};
#endif /* CONFIG_IRQSOFF_TRACER */

#ifdef CONFIG_PREEMPT_TRACER
void tracer_preempt_on(unsigned long a0, unsigned long a1)
{
	if (preempt_trace(preempt_count()) && !irq_trace())
		stop_critical_timing(a0, a1);
}

void tracer_preempt_off(unsigned long a0, unsigned long a1)
{
	if (preempt_trace(preempt_count()) && !irq_trace())
		start_critical_timing(a0, a1);
}

static int preemptoff_tracer_init(struct trace_array *tr)
{
	trace_type = TRACER_PREEMPT_OFF;

	return __irqsoff_tracer_init(tr);
}

static void preemptoff_tracer_reset(struct trace_array *tr)
{
	__irqsoff_tracer_reset(tr);
}

static struct tracer preemptoff_tracer __read_mostly =
{
	.name		= "preemptoff",
	.init		= preemptoff_tracer_init,
	.reset		= preemptoff_tracer_reset,
	.start		= irqsoff_tracer_start,
	.stop		= irqsoff_tracer_stop,
	.print_max	= true,
	.print_header	= irqsoff_print_header,
	.print_line	= irqsoff_print_line,
	.flag_changed	= irqsoff_flag_changed,
#ifdef CONFIG_FTRACE_SELFTEST
	.selftest	= trace_selftest_startup_preemptoff,
#endif
	.open		= irqsoff_trace_open,
	.close		= irqsoff_trace_close,
	.allow_instances = true,
	.use_max_tr	= true,
};
#endif /* CONFIG_PREEMPT_TRACER */

#if defined(CONFIG_IRQSOFF_TRACER) && defined(CONFIG_PREEMPT_TRACER)

static int preemptirqsoff_tracer_init(struct trace_array *tr)
{
	trace_type = TRACER_IRQS_OFF | TRACER_PREEMPT_OFF;

	return __irqsoff_tracer_init(tr);
}

static void preemptirqsoff_tracer_reset(struct trace_array *tr)
{
	__irqsoff_tracer_reset(tr);
}

static struct tracer preemptirqsoff_tracer __read_mostly =
{
	.name		= "preemptirqsoff",
	.init		= preemptirqsoff_tracer_init,
	.reset		= preemptirqsoff_tracer_reset,
	.start		= irqsoff_tracer_start,
	.stop		= irqsoff_tracer_stop,
	.print_max	= true,
	.print_header	= irqsoff_print_header,
	.print_line	= irqsoff_print_line,
	.flag_changed	= irqsoff_flag_changed,
#ifdef CONFIG_FTRACE_SELFTEST
	.selftest	= trace_selftest_startup_preemptirqsoff,
#endif
	.open		= irqsoff_trace_open,
	.close		= irqsoff_trace_close,
	.allow_instances = true,
	.use_max_tr	= true,
};
#endif

__init static int init_irqsoff_tracer(void)
{
#ifdef CONFIG_IRQSOFF_TRACER
	register_tracer(&irqsoff_tracer);
#endif
#ifdef CONFIG_PREEMPT_TRACER
	register_tracer(&preemptoff_tracer);
#endif
#if defined(CONFIG_IRQSOFF_TRACER) && defined(CONFIG_PREEMPT_TRACER)
	register_tracer(&preemptirqsoff_tracer);
#endif

	return 0;
}
core_initcall(init_irqsoff_tracer);
#endif /* CONFIG_IRQSOFF_TRACER || CONFIG_PREEMPT_TRACER */