Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 1 | /* |
| 2 | * Performance events callchain code, extracted from core.c: |
| 3 | * |
| 4 | * Copyright (C) 2008 Thomas Gleixner <tglx@linutronix.de> |
| 5 | * Copyright (C) 2008-2011 Red Hat, Inc., Ingo Molnar |
Peter Zijlstra | 90eec10 | 2015-11-16 11:08:45 +0100 | [diff] [blame] | 6 | * Copyright (C) 2008-2011 Red Hat, Inc., Peter Zijlstra |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 7 | * Copyright © 2009 Paul Mackerras, IBM Corp. <paulus@au1.ibm.com> |
| 8 | * |
| 9 | * For licensing details see kernel-base/COPYING |
| 10 | */ |
| 11 | |
| 12 | #include <linux/perf_event.h> |
| 13 | #include <linux/slab.h> |
| 14 | #include "internal.h" |
| 15 | |
| 16 | struct callchain_cpus_entries { |
| 17 | struct rcu_head rcu_head; |
| 18 | struct perf_callchain_entry *cpu_entries[0]; |
| 19 | }; |
| 20 | |
Arnaldo Carvalho de Melo | c5dfd78 | 2016-04-21 12:28:50 -0300 | [diff] [blame] | 21 | int sysctl_perf_event_max_stack __read_mostly = PERF_MAX_STACK_DEPTH; |
Arnaldo Carvalho de Melo | c85b033 | 2016-05-12 13:06:21 -0300 | [diff] [blame] | 22 | int sysctl_perf_event_max_contexts_per_stack __read_mostly = PERF_MAX_CONTEXTS_PER_STACK; |
Arnaldo Carvalho de Melo | c5dfd78 | 2016-04-21 12:28:50 -0300 | [diff] [blame] | 23 | |
| 24 | static inline size_t perf_callchain_entry__sizeof(void) |
| 25 | { |
| 26 | return (sizeof(struct perf_callchain_entry) + |
Arnaldo Carvalho de Melo | c85b033 | 2016-05-12 13:06:21 -0300 | [diff] [blame] | 27 | sizeof(__u64) * (sysctl_perf_event_max_stack + |
| 28 | sysctl_perf_event_max_contexts_per_stack)); |
Arnaldo Carvalho de Melo | c5dfd78 | 2016-04-21 12:28:50 -0300 | [diff] [blame] | 29 | } |
| 30 | |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 31 | static DEFINE_PER_CPU(int, callchain_recursion[PERF_NR_CONTEXTS]); |
| 32 | static atomic_t nr_callchain_events; |
| 33 | static DEFINE_MUTEX(callchain_mutex); |
| 34 | static struct callchain_cpus_entries *callchain_cpus_entries; |
| 35 | |
| 36 | |
Arnaldo Carvalho de Melo | cfbcf46 | 2016-04-28 12:30:53 -0300 | [diff] [blame] | 37 | __weak void perf_callchain_kernel(struct perf_callchain_entry_ctx *entry, |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 38 | struct pt_regs *regs) |
| 39 | { |
| 40 | } |
| 41 | |
Arnaldo Carvalho de Melo | cfbcf46 | 2016-04-28 12:30:53 -0300 | [diff] [blame] | 42 | __weak void perf_callchain_user(struct perf_callchain_entry_ctx *entry, |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 43 | struct pt_regs *regs) |
| 44 | { |
| 45 | } |
| 46 | |
| 47 | static void release_callchain_buffers_rcu(struct rcu_head *head) |
| 48 | { |
| 49 | struct callchain_cpus_entries *entries; |
| 50 | int cpu; |
| 51 | |
| 52 | entries = container_of(head, struct callchain_cpus_entries, rcu_head); |
| 53 | |
| 54 | for_each_possible_cpu(cpu) |
| 55 | kfree(entries->cpu_entries[cpu]); |
| 56 | |
| 57 | kfree(entries); |
| 58 | } |
| 59 | |
| 60 | static void release_callchain_buffers(void) |
| 61 | { |
| 62 | struct callchain_cpus_entries *entries; |
| 63 | |
| 64 | entries = callchain_cpus_entries; |
Andreea-Cristina Bernat | e0455e1 | 2014-08-22 17:15:36 +0300 | [diff] [blame] | 65 | RCU_INIT_POINTER(callchain_cpus_entries, NULL); |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 66 | call_rcu(&entries->rcu_head, release_callchain_buffers_rcu); |
| 67 | } |
| 68 | |
| 69 | static int alloc_callchain_buffers(void) |
| 70 | { |
| 71 | int cpu; |
| 72 | int size; |
| 73 | struct callchain_cpus_entries *entries; |
| 74 | |
| 75 | /* |
| 76 | * We can't use the percpu allocation API for data that can be |
| 77 | * accessed from NMI. Use a temporary manual per cpu allocation |
| 78 | * until that gets sorted out. |
| 79 | */ |
| 80 | size = offsetof(struct callchain_cpus_entries, cpu_entries[nr_cpu_ids]); |
| 81 | |
| 82 | entries = kzalloc(size, GFP_KERNEL); |
| 83 | if (!entries) |
| 84 | return -ENOMEM; |
| 85 | |
Arnaldo Carvalho de Melo | c5dfd78 | 2016-04-21 12:28:50 -0300 | [diff] [blame] | 86 | size = perf_callchain_entry__sizeof() * PERF_NR_CONTEXTS; |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 87 | |
| 88 | for_each_possible_cpu(cpu) { |
| 89 | entries->cpu_entries[cpu] = kmalloc_node(size, GFP_KERNEL, |
| 90 | cpu_to_node(cpu)); |
| 91 | if (!entries->cpu_entries[cpu]) |
| 92 | goto fail; |
| 93 | } |
| 94 | |
| 95 | rcu_assign_pointer(callchain_cpus_entries, entries); |
| 96 | |
| 97 | return 0; |
| 98 | |
| 99 | fail: |
| 100 | for_each_possible_cpu(cpu) |
| 101 | kfree(entries->cpu_entries[cpu]); |
| 102 | kfree(entries); |
| 103 | |
| 104 | return -ENOMEM; |
| 105 | } |
| 106 | |
Arnaldo Carvalho de Melo | 97c79a3 | 2016-04-28 13:16:33 -0300 | [diff] [blame^] | 107 | int get_callchain_buffers(int event_max_stack) |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 108 | { |
| 109 | int err = 0; |
| 110 | int count; |
| 111 | |
| 112 | mutex_lock(&callchain_mutex); |
| 113 | |
| 114 | count = atomic_inc_return(&nr_callchain_events); |
| 115 | if (WARN_ON_ONCE(count < 1)) { |
| 116 | err = -EINVAL; |
| 117 | goto exit; |
| 118 | } |
| 119 | |
| 120 | if (count > 1) { |
| 121 | /* If the allocation failed, give up */ |
| 122 | if (!callchain_cpus_entries) |
| 123 | err = -ENOMEM; |
Arnaldo Carvalho de Melo | 97c79a3 | 2016-04-28 13:16:33 -0300 | [diff] [blame^] | 124 | /* |
| 125 | * If requesting per event more than the global cap, |
| 126 | * return a different error to help userspace figure |
| 127 | * this out. |
| 128 | * |
| 129 | * And also do it here so that we have &callchain_mutex held. |
| 130 | */ |
| 131 | if (event_max_stack > sysctl_perf_event_max_stack) |
| 132 | err = -EOVERFLOW; |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 133 | goto exit; |
| 134 | } |
| 135 | |
| 136 | err = alloc_callchain_buffers(); |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 137 | exit: |
Frederic Weisbecker | 90983b1 | 2013-07-23 02:31:00 +0200 | [diff] [blame] | 138 | if (err) |
| 139 | atomic_dec(&nr_callchain_events); |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 140 | |
Frederic Weisbecker | fc3b86d | 2013-08-02 18:29:54 +0200 | [diff] [blame] | 141 | mutex_unlock(&callchain_mutex); |
| 142 | |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 143 | return err; |
| 144 | } |
| 145 | |
| 146 | void put_callchain_buffers(void) |
| 147 | { |
| 148 | if (atomic_dec_and_mutex_lock(&nr_callchain_events, &callchain_mutex)) { |
| 149 | release_callchain_buffers(); |
| 150 | mutex_unlock(&callchain_mutex); |
| 151 | } |
| 152 | } |
| 153 | |
| 154 | static struct perf_callchain_entry *get_callchain_entry(int *rctx) |
| 155 | { |
| 156 | int cpu; |
| 157 | struct callchain_cpus_entries *entries; |
| 158 | |
Christoph Lameter | 4a32fea | 2014-08-17 12:30:27 -0500 | [diff] [blame] | 159 | *rctx = get_recursion_context(this_cpu_ptr(callchain_recursion)); |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 160 | if (*rctx == -1) |
| 161 | return NULL; |
| 162 | |
| 163 | entries = rcu_dereference(callchain_cpus_entries); |
| 164 | if (!entries) |
| 165 | return NULL; |
| 166 | |
| 167 | cpu = smp_processor_id(); |
| 168 | |
Arnaldo Carvalho de Melo | c5dfd78 | 2016-04-21 12:28:50 -0300 | [diff] [blame] | 169 | return (((void *)entries->cpu_entries[cpu]) + |
| 170 | (*rctx * perf_callchain_entry__sizeof())); |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 171 | } |
| 172 | |
| 173 | static void |
| 174 | put_callchain_entry(int rctx) |
| 175 | { |
Christoph Lameter | 4a32fea | 2014-08-17 12:30:27 -0500 | [diff] [blame] | 176 | put_recursion_context(this_cpu_ptr(callchain_recursion), rctx); |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 177 | } |
| 178 | |
Andrew Vagin | e6dab5f | 2012-07-11 18:14:58 +0400 | [diff] [blame] | 179 | struct perf_callchain_entry * |
| 180 | perf_callchain(struct perf_event *event, struct pt_regs *regs) |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 181 | { |
Alexei Starovoitov | 568b329 | 2016-02-17 19:58:57 -0800 | [diff] [blame] | 182 | bool kernel = !event->attr.exclude_callchain_kernel; |
| 183 | bool user = !event->attr.exclude_callchain_user; |
| 184 | /* Disallow cross-task user callchains. */ |
| 185 | bool crosstask = event->ctx->task && event->ctx->task != current; |
Arnaldo Carvalho de Melo | 97c79a3 | 2016-04-28 13:16:33 -0300 | [diff] [blame^] | 186 | const u32 max_stack = event->attr.sample_max_stack; |
Frederic Weisbecker | d077526 | 2012-08-07 15:20:41 +0200 | [diff] [blame] | 187 | |
| 188 | if (!kernel && !user) |
| 189 | return NULL; |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 190 | |
Arnaldo Carvalho de Melo | 97c79a3 | 2016-04-28 13:16:33 -0300 | [diff] [blame^] | 191 | return get_perf_callchain(regs, 0, kernel, user, max_stack, crosstask, true); |
Alexei Starovoitov | 568b329 | 2016-02-17 19:58:57 -0800 | [diff] [blame] | 192 | } |
| 193 | |
| 194 | struct perf_callchain_entry * |
| 195 | get_perf_callchain(struct pt_regs *regs, u32 init_nr, bool kernel, bool user, |
Arnaldo Carvalho de Melo | cfbcf46 | 2016-04-28 12:30:53 -0300 | [diff] [blame] | 196 | u32 max_stack, bool crosstask, bool add_mark) |
Alexei Starovoitov | 568b329 | 2016-02-17 19:58:57 -0800 | [diff] [blame] | 197 | { |
| 198 | struct perf_callchain_entry *entry; |
Arnaldo Carvalho de Melo | cfbcf46 | 2016-04-28 12:30:53 -0300 | [diff] [blame] | 199 | struct perf_callchain_entry_ctx ctx; |
Alexei Starovoitov | 568b329 | 2016-02-17 19:58:57 -0800 | [diff] [blame] | 200 | int rctx; |
| 201 | |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 202 | entry = get_callchain_entry(&rctx); |
| 203 | if (rctx == -1) |
| 204 | return NULL; |
| 205 | |
| 206 | if (!entry) |
| 207 | goto exit_put; |
| 208 | |
Arnaldo Carvalho de Melo | cfbcf46 | 2016-04-28 12:30:53 -0300 | [diff] [blame] | 209 | ctx.entry = entry; |
| 210 | ctx.max_stack = max_stack; |
Arnaldo Carvalho de Melo | 3b1fff0 | 2016-05-10 18:08:32 -0300 | [diff] [blame] | 211 | ctx.nr = entry->nr = init_nr; |
Arnaldo Carvalho de Melo | c85b033 | 2016-05-12 13:06:21 -0300 | [diff] [blame] | 212 | ctx.contexts = 0; |
| 213 | ctx.contexts_maxed = false; |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 214 | |
Frederic Weisbecker | d077526 | 2012-08-07 15:20:41 +0200 | [diff] [blame] | 215 | if (kernel && !user_mode(regs)) { |
Alexei Starovoitov | 568b329 | 2016-02-17 19:58:57 -0800 | [diff] [blame] | 216 | if (add_mark) |
Arnaldo Carvalho de Melo | 3e4de4e | 2016-05-12 13:01:50 -0300 | [diff] [blame] | 217 | perf_callchain_store_context(&ctx, PERF_CONTEXT_KERNEL); |
Arnaldo Carvalho de Melo | cfbcf46 | 2016-04-28 12:30:53 -0300 | [diff] [blame] | 218 | perf_callchain_kernel(&ctx, regs); |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 219 | } |
| 220 | |
Frederic Weisbecker | d077526 | 2012-08-07 15:20:41 +0200 | [diff] [blame] | 221 | if (user) { |
| 222 | if (!user_mode(regs)) { |
| 223 | if (current->mm) |
| 224 | regs = task_pt_regs(current); |
| 225 | else |
| 226 | regs = NULL; |
| 227 | } |
Andrew Vagin | e6dab5f | 2012-07-11 18:14:58 +0400 | [diff] [blame] | 228 | |
Frederic Weisbecker | d077526 | 2012-08-07 15:20:41 +0200 | [diff] [blame] | 229 | if (regs) { |
Alexei Starovoitov | 568b329 | 2016-02-17 19:58:57 -0800 | [diff] [blame] | 230 | if (crosstask) |
Frederic Weisbecker | d077526 | 2012-08-07 15:20:41 +0200 | [diff] [blame] | 231 | goto exit_put; |
| 232 | |
Alexei Starovoitov | 568b329 | 2016-02-17 19:58:57 -0800 | [diff] [blame] | 233 | if (add_mark) |
Arnaldo Carvalho de Melo | 3e4de4e | 2016-05-12 13:01:50 -0300 | [diff] [blame] | 234 | perf_callchain_store_context(&ctx, PERF_CONTEXT_USER); |
Arnaldo Carvalho de Melo | cfbcf46 | 2016-04-28 12:30:53 -0300 | [diff] [blame] | 235 | perf_callchain_user(&ctx, regs); |
Frederic Weisbecker | d077526 | 2012-08-07 15:20:41 +0200 | [diff] [blame] | 236 | } |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 237 | } |
| 238 | |
| 239 | exit_put: |
| 240 | put_callchain_entry(rctx); |
| 241 | |
| 242 | return entry; |
| 243 | } |
Arnaldo Carvalho de Melo | c5dfd78 | 2016-04-21 12:28:50 -0300 | [diff] [blame] | 244 | |
Arnaldo Carvalho de Melo | c85b033 | 2016-05-12 13:06:21 -0300 | [diff] [blame] | 245 | /* |
| 246 | * Used for sysctl_perf_event_max_stack and |
| 247 | * sysctl_perf_event_max_contexts_per_stack. |
| 248 | */ |
Arnaldo Carvalho de Melo | c5dfd78 | 2016-04-21 12:28:50 -0300 | [diff] [blame] | 249 | int perf_event_max_stack_handler(struct ctl_table *table, int write, |
| 250 | void __user *buffer, size_t *lenp, loff_t *ppos) |
| 251 | { |
Arnaldo Carvalho de Melo | a831100 | 2016-05-10 16:34:53 -0300 | [diff] [blame] | 252 | int *value = table->data; |
| 253 | int new_value = *value, ret; |
Arnaldo Carvalho de Melo | c5dfd78 | 2016-04-21 12:28:50 -0300 | [diff] [blame] | 254 | struct ctl_table new_table = *table; |
| 255 | |
| 256 | new_table.data = &new_value; |
| 257 | ret = proc_dointvec_minmax(&new_table, write, buffer, lenp, ppos); |
| 258 | if (ret || !write) |
| 259 | return ret; |
| 260 | |
| 261 | mutex_lock(&callchain_mutex); |
| 262 | if (atomic_read(&nr_callchain_events)) |
| 263 | ret = -EBUSY; |
| 264 | else |
Arnaldo Carvalho de Melo | a831100 | 2016-05-10 16:34:53 -0300 | [diff] [blame] | 265 | *value = new_value; |
Arnaldo Carvalho de Melo | c5dfd78 | 2016-04-21 12:28:50 -0300 | [diff] [blame] | 266 | |
| 267 | mutex_unlock(&callchain_mutex); |
| 268 | |
| 269 | return ret; |
| 270 | } |