blob: c04917cad1bfdc50fe4f00b08eaa58c9e7e7692e [file] [log] [blame]
/*
 * Performance events callchain code, extracted from core.c:
 *
 *  Copyright (C) 2008 Thomas Gleixner <tglx@linutronix.de>
 *  Copyright (C) 2008-2011 Red Hat, Inc., Ingo Molnar
 *  Copyright (C) 2008-2011 Red Hat, Inc., Peter Zijlstra
 *  Copyright © 2009 Paul Mackerras, IBM Corp. <paulus@au1.ibm.com>
 *
 * For licensing details see kernel-base/COPYING
 */
11
12#include <linux/perf_event.h>
13#include <linux/slab.h>
Ingo Molnar68db0cf2017-02-08 18:51:37 +010014#include <linux/sched/task_stack.h>
15
Borislav Petkov9251f902011-10-16 17:15:04 +020016#include "internal.h"
17
18struct callchain_cpus_entries {
19 struct rcu_head rcu_head;
20 struct perf_callchain_entry *cpu_entries[0];
21};
22
Arnaldo Carvalho de Meloc5dfd782016-04-21 12:28:50 -030023int sysctl_perf_event_max_stack __read_mostly = PERF_MAX_STACK_DEPTH;
Arnaldo Carvalho de Meloc85b0332016-05-12 13:06:21 -030024int sysctl_perf_event_max_contexts_per_stack __read_mostly = PERF_MAX_CONTEXTS_PER_STACK;
Arnaldo Carvalho de Meloc5dfd782016-04-21 12:28:50 -030025
26static inline size_t perf_callchain_entry__sizeof(void)
27{
28 return (sizeof(struct perf_callchain_entry) +
Arnaldo Carvalho de Meloc85b0332016-05-12 13:06:21 -030029 sizeof(__u64) * (sysctl_perf_event_max_stack +
30 sysctl_perf_event_max_contexts_per_stack));
Arnaldo Carvalho de Meloc5dfd782016-04-21 12:28:50 -030031}
32
Borislav Petkov9251f902011-10-16 17:15:04 +020033static DEFINE_PER_CPU(int, callchain_recursion[PERF_NR_CONTEXTS]);
34static atomic_t nr_callchain_events;
35static DEFINE_MUTEX(callchain_mutex);
36static struct callchain_cpus_entries *callchain_cpus_entries;
37
38
Arnaldo Carvalho de Melocfbcf462016-04-28 12:30:53 -030039__weak void perf_callchain_kernel(struct perf_callchain_entry_ctx *entry,
Borislav Petkov9251f902011-10-16 17:15:04 +020040 struct pt_regs *regs)
41{
42}
43
Arnaldo Carvalho de Melocfbcf462016-04-28 12:30:53 -030044__weak void perf_callchain_user(struct perf_callchain_entry_ctx *entry,
Borislav Petkov9251f902011-10-16 17:15:04 +020045 struct pt_regs *regs)
46{
47}
48
49static void release_callchain_buffers_rcu(struct rcu_head *head)
50{
51 struct callchain_cpus_entries *entries;
52 int cpu;
53
54 entries = container_of(head, struct callchain_cpus_entries, rcu_head);
55
56 for_each_possible_cpu(cpu)
57 kfree(entries->cpu_entries[cpu]);
58
59 kfree(entries);
60}
61
62static void release_callchain_buffers(void)
63{
64 struct callchain_cpus_entries *entries;
65
66 entries = callchain_cpus_entries;
Andreea-Cristina Bernate0455e12014-08-22 17:15:36 +030067 RCU_INIT_POINTER(callchain_cpus_entries, NULL);
Borislav Petkov9251f902011-10-16 17:15:04 +020068 call_rcu(&entries->rcu_head, release_callchain_buffers_rcu);
69}
70
71static int alloc_callchain_buffers(void)
72{
73 int cpu;
74 int size;
75 struct callchain_cpus_entries *entries;
76
77 /*
78 * We can't use the percpu allocation API for data that can be
79 * accessed from NMI. Use a temporary manual per cpu allocation
80 * until that gets sorted out.
81 */
82 size = offsetof(struct callchain_cpus_entries, cpu_entries[nr_cpu_ids]);
83
84 entries = kzalloc(size, GFP_KERNEL);
85 if (!entries)
86 return -ENOMEM;
87
Arnaldo Carvalho de Meloc5dfd782016-04-21 12:28:50 -030088 size = perf_callchain_entry__sizeof() * PERF_NR_CONTEXTS;
Borislav Petkov9251f902011-10-16 17:15:04 +020089
90 for_each_possible_cpu(cpu) {
91 entries->cpu_entries[cpu] = kmalloc_node(size, GFP_KERNEL,
92 cpu_to_node(cpu));
93 if (!entries->cpu_entries[cpu])
94 goto fail;
95 }
96
97 rcu_assign_pointer(callchain_cpus_entries, entries);
98
99 return 0;
100
101fail:
102 for_each_possible_cpu(cpu)
103 kfree(entries->cpu_entries[cpu]);
104 kfree(entries);
105
106 return -ENOMEM;
107}
108
Arnaldo Carvalho de Melo97c79a32016-04-28 13:16:33 -0300109int get_callchain_buffers(int event_max_stack)
Borislav Petkov9251f902011-10-16 17:15:04 +0200110{
111 int err = 0;
112 int count;
113
114 mutex_lock(&callchain_mutex);
115
116 count = atomic_inc_return(&nr_callchain_events);
117 if (WARN_ON_ONCE(count < 1)) {
118 err = -EINVAL;
119 goto exit;
120 }
121
122 if (count > 1) {
123 /* If the allocation failed, give up */
124 if (!callchain_cpus_entries)
125 err = -ENOMEM;
Arnaldo Carvalho de Melo97c79a32016-04-28 13:16:33 -0300126 /*
127 * If requesting per event more than the global cap,
128 * return a different error to help userspace figure
129 * this out.
130 *
131 * And also do it here so that we have &callchain_mutex held.
132 */
133 if (event_max_stack > sysctl_perf_event_max_stack)
134 err = -EOVERFLOW;
Borislav Petkov9251f902011-10-16 17:15:04 +0200135 goto exit;
136 }
137
138 err = alloc_callchain_buffers();
Borislav Petkov9251f902011-10-16 17:15:04 +0200139exit:
Frederic Weisbecker90983b12013-07-23 02:31:00 +0200140 if (err)
141 atomic_dec(&nr_callchain_events);
Borislav Petkov9251f902011-10-16 17:15:04 +0200142
Frederic Weisbeckerfc3b86d2013-08-02 18:29:54 +0200143 mutex_unlock(&callchain_mutex);
144
Borislav Petkov9251f902011-10-16 17:15:04 +0200145 return err;
146}
147
148void put_callchain_buffers(void)
149{
150 if (atomic_dec_and_mutex_lock(&nr_callchain_events, &callchain_mutex)) {
151 release_callchain_buffers();
152 mutex_unlock(&callchain_mutex);
153 }
154}
155
156static struct perf_callchain_entry *get_callchain_entry(int *rctx)
157{
158 int cpu;
159 struct callchain_cpus_entries *entries;
160
Christoph Lameter4a32fea2014-08-17 12:30:27 -0500161 *rctx = get_recursion_context(this_cpu_ptr(callchain_recursion));
Borislav Petkov9251f902011-10-16 17:15:04 +0200162 if (*rctx == -1)
163 return NULL;
164
165 entries = rcu_dereference(callchain_cpus_entries);
166 if (!entries)
167 return NULL;
168
169 cpu = smp_processor_id();
170
Arnaldo Carvalho de Meloc5dfd782016-04-21 12:28:50 -0300171 return (((void *)entries->cpu_entries[cpu]) +
172 (*rctx * perf_callchain_entry__sizeof()));
Borislav Petkov9251f902011-10-16 17:15:04 +0200173}
174
175static void
176put_callchain_entry(int rctx)
177{
Christoph Lameter4a32fea2014-08-17 12:30:27 -0500178 put_recursion_context(this_cpu_ptr(callchain_recursion), rctx);
Borislav Petkov9251f902011-10-16 17:15:04 +0200179}
180
Andrew Vagine6dab5f2012-07-11 18:14:58 +0400181struct perf_callchain_entry *
182perf_callchain(struct perf_event *event, struct pt_regs *regs)
Borislav Petkov9251f902011-10-16 17:15:04 +0200183{
Alexei Starovoitov568b3292016-02-17 19:58:57 -0800184 bool kernel = !event->attr.exclude_callchain_kernel;
185 bool user = !event->attr.exclude_callchain_user;
186 /* Disallow cross-task user callchains. */
187 bool crosstask = event->ctx->task && event->ctx->task != current;
Arnaldo Carvalho de Melo97c79a32016-04-28 13:16:33 -0300188 const u32 max_stack = event->attr.sample_max_stack;
Frederic Weisbeckerd0775262012-08-07 15:20:41 +0200189
190 if (!kernel && !user)
191 return NULL;
Borislav Petkov9251f902011-10-16 17:15:04 +0200192
Arnaldo Carvalho de Melo97c79a32016-04-28 13:16:33 -0300193 return get_perf_callchain(regs, 0, kernel, user, max_stack, crosstask, true);
Alexei Starovoitov568b3292016-02-17 19:58:57 -0800194}
195
196struct perf_callchain_entry *
197get_perf_callchain(struct pt_regs *regs, u32 init_nr, bool kernel, bool user,
Arnaldo Carvalho de Melocfbcf462016-04-28 12:30:53 -0300198 u32 max_stack, bool crosstask, bool add_mark)
Alexei Starovoitov568b3292016-02-17 19:58:57 -0800199{
200 struct perf_callchain_entry *entry;
Arnaldo Carvalho de Melocfbcf462016-04-28 12:30:53 -0300201 struct perf_callchain_entry_ctx ctx;
Alexei Starovoitov568b3292016-02-17 19:58:57 -0800202 int rctx;
203
Borislav Petkov9251f902011-10-16 17:15:04 +0200204 entry = get_callchain_entry(&rctx);
205 if (rctx == -1)
206 return NULL;
207
208 if (!entry)
209 goto exit_put;
210
Arnaldo Carvalho de Melocfbcf462016-04-28 12:30:53 -0300211 ctx.entry = entry;
212 ctx.max_stack = max_stack;
Arnaldo Carvalho de Melo3b1fff02016-05-10 18:08:32 -0300213 ctx.nr = entry->nr = init_nr;
Arnaldo Carvalho de Meloc85b0332016-05-12 13:06:21 -0300214 ctx.contexts = 0;
215 ctx.contexts_maxed = false;
Borislav Petkov9251f902011-10-16 17:15:04 +0200216
Frederic Weisbeckerd0775262012-08-07 15:20:41 +0200217 if (kernel && !user_mode(regs)) {
Alexei Starovoitov568b3292016-02-17 19:58:57 -0800218 if (add_mark)
Arnaldo Carvalho de Melo3e4de4e2016-05-12 13:01:50 -0300219 perf_callchain_store_context(&ctx, PERF_CONTEXT_KERNEL);
Arnaldo Carvalho de Melocfbcf462016-04-28 12:30:53 -0300220 perf_callchain_kernel(&ctx, regs);
Borislav Petkov9251f902011-10-16 17:15:04 +0200221 }
222
Frederic Weisbeckerd0775262012-08-07 15:20:41 +0200223 if (user) {
224 if (!user_mode(regs)) {
225 if (current->mm)
226 regs = task_pt_regs(current);
227 else
228 regs = NULL;
229 }
Andrew Vagine6dab5f2012-07-11 18:14:58 +0400230
Frederic Weisbeckerd0775262012-08-07 15:20:41 +0200231 if (regs) {
Alexei Starovoitov568b3292016-02-17 19:58:57 -0800232 if (crosstask)
Frederic Weisbeckerd0775262012-08-07 15:20:41 +0200233 goto exit_put;
234
Alexei Starovoitov568b3292016-02-17 19:58:57 -0800235 if (add_mark)
Arnaldo Carvalho de Melo3e4de4e2016-05-12 13:01:50 -0300236 perf_callchain_store_context(&ctx, PERF_CONTEXT_USER);
Arnaldo Carvalho de Melocfbcf462016-04-28 12:30:53 -0300237 perf_callchain_user(&ctx, regs);
Frederic Weisbeckerd0775262012-08-07 15:20:41 +0200238 }
Borislav Petkov9251f902011-10-16 17:15:04 +0200239 }
240
241exit_put:
242 put_callchain_entry(rctx);
243
244 return entry;
245}
Arnaldo Carvalho de Meloc5dfd782016-04-21 12:28:50 -0300246
Arnaldo Carvalho de Meloc85b0332016-05-12 13:06:21 -0300247/*
248 * Used for sysctl_perf_event_max_stack and
249 * sysctl_perf_event_max_contexts_per_stack.
250 */
Arnaldo Carvalho de Meloc5dfd782016-04-21 12:28:50 -0300251int perf_event_max_stack_handler(struct ctl_table *table, int write,
252 void __user *buffer, size_t *lenp, loff_t *ppos)
253{
Arnaldo Carvalho de Meloa8311002016-05-10 16:34:53 -0300254 int *value = table->data;
255 int new_value = *value, ret;
Arnaldo Carvalho de Meloc5dfd782016-04-21 12:28:50 -0300256 struct ctl_table new_table = *table;
257
258 new_table.data = &new_value;
259 ret = proc_dointvec_minmax(&new_table, write, buffer, lenp, ppos);
260 if (ret || !write)
261 return ret;
262
263 mutex_lock(&callchain_mutex);
264 if (atomic_read(&nr_callchain_events))
265 ret = -EBUSY;
266 else
Arnaldo Carvalho de Meloa8311002016-05-10 16:34:53 -0300267 *value = new_value;
Arnaldo Carvalho de Meloc5dfd782016-04-21 12:28:50 -0300268
269 mutex_unlock(&callchain_mutex);
270
271 return ret;
272}