Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 1 | /* |
| 2 | * Performance events callchain code, extracted from core.c: |
| 3 | * |
| 4 | * Copyright (C) 2008 Thomas Gleixner <tglx@linutronix.de> |
| 5 | * Copyright (C) 2008-2011 Red Hat, Inc., Ingo Molnar |
Peter Zijlstra | 90eec10 | 2015-11-16 11:08:45 +0100 | [diff] [blame] | 6 | * Copyright (C) 2008-2011 Red Hat, Inc., Peter Zijlstra |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 7 | * Copyright © 2009 Paul Mackerras, IBM Corp. <paulus@au1.ibm.com> |
| 8 | * |
| 9 | * For licensing details see kernel-base/COPYING |
| 10 | */ |
| 11 | |
| 12 | #include <linux/perf_event.h> |
| 13 | #include <linux/slab.h> |
Ingo Molnar | 68db0cf | 2017-02-08 18:51:37 +0100 | [diff] [blame] | 14 | #include <linux/sched/task_stack.h> |
| 15 | |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 16 | #include "internal.h" |
| 17 | |
| 18 | struct callchain_cpus_entries { |
| 19 | struct rcu_head rcu_head; |
| 20 | struct perf_callchain_entry *cpu_entries[0]; |
| 21 | }; |
| 22 | |
/*
 * Global cap on the stack depth an event may request:
 * get_callchain_buffers() rejects larger per-event values with -EOVERFLOW.
 * Also feeds the per-buffer size computed by perf_callchain_entry__sizeof().
 */
int sysctl_perf_event_max_stack __read_mostly = PERF_MAX_STACK_DEPTH;
/*
 * Number of additional __u64 slots reserved in every buffer on top of
 * sysctl_perf_event_max_stack; see perf_callchain_entry__sizeof().
 */
int sysctl_perf_event_max_contexts_per_stack __read_mostly = PERF_MAX_CONTEXTS_PER_STACK;
Arnaldo Carvalho de Melo | c5dfd78 | 2016-04-21 12:28:50 -0300 | [diff] [blame] | 25 | |
| 26 | static inline size_t perf_callchain_entry__sizeof(void) |
| 27 | { |
| 28 | return (sizeof(struct perf_callchain_entry) + |
Arnaldo Carvalho de Melo | c85b033 | 2016-05-12 13:06:21 -0300 | [diff] [blame] | 29 | sizeof(__u64) * (sysctl_perf_event_max_stack + |
| 30 | sysctl_perf_event_max_contexts_per_stack)); |
Arnaldo Carvalho de Melo | c5dfd78 | 2016-04-21 12:28:50 -0300 | [diff] [blame] | 31 | } |
| 32 | |
/*
 * Per-CPU state handed to get_recursion_context()/put_recursion_context(),
 * with one slot per context (PERF_NR_CONTEXTS).
 */
static DEFINE_PER_CPU(int, callchain_recursion[PERF_NR_CONTEXTS]);
/* Count of references taken through get_callchain_buffers(). */
static atomic_t nr_callchain_events;
/* Held while allocating/releasing the buffers and while updating the sysctls. */
static DEFINE_MUTEX(callchain_mutex);
/*
 * Current buffer table; published with rcu_assign_pointer() and reset to
 * NULL when the buffers are released.
 */
static struct callchain_cpus_entries *callchain_cpus_entries;
| 37 | |
| 38 | |
/*
 * Weak default for the kernel-side unwinder: records nothing into @entry.
 * NOTE(review): presumably overridden by architecture code that can walk
 * kernel stacks — confirm against the arch implementations.
 */
__weak void perf_callchain_kernel(struct perf_callchain_entry_ctx *entry,
				  struct pt_regs *regs)
{
}
| 43 | |
/*
 * Weak default for the user-side unwinder: records nothing into @entry.
 * NOTE(review): presumably overridden by architecture code that can walk
 * user stacks — confirm against the arch implementations.
 */
__weak void perf_callchain_user(struct perf_callchain_entry_ctx *entry,
				struct pt_regs *regs)
{
}
| 48 | |
| 49 | static void release_callchain_buffers_rcu(struct rcu_head *head) |
| 50 | { |
| 51 | struct callchain_cpus_entries *entries; |
| 52 | int cpu; |
| 53 | |
| 54 | entries = container_of(head, struct callchain_cpus_entries, rcu_head); |
| 55 | |
| 56 | for_each_possible_cpu(cpu) |
| 57 | kfree(entries->cpu_entries[cpu]); |
| 58 | |
| 59 | kfree(entries); |
| 60 | } |
| 61 | |
| 62 | static void release_callchain_buffers(void) |
| 63 | { |
| 64 | struct callchain_cpus_entries *entries; |
| 65 | |
| 66 | entries = callchain_cpus_entries; |
Andreea-Cristina Bernat | e0455e1 | 2014-08-22 17:15:36 +0300 | [diff] [blame] | 67 | RCU_INIT_POINTER(callchain_cpus_entries, NULL); |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 68 | call_rcu(&entries->rcu_head, release_callchain_buffers_rcu); |
| 69 | } |
| 70 | |
| 71 | static int alloc_callchain_buffers(void) |
| 72 | { |
| 73 | int cpu; |
| 74 | int size; |
| 75 | struct callchain_cpus_entries *entries; |
| 76 | |
| 77 | /* |
| 78 | * We can't use the percpu allocation API for data that can be |
| 79 | * accessed from NMI. Use a temporary manual per cpu allocation |
| 80 | * until that gets sorted out. |
| 81 | */ |
| 82 | size = offsetof(struct callchain_cpus_entries, cpu_entries[nr_cpu_ids]); |
| 83 | |
| 84 | entries = kzalloc(size, GFP_KERNEL); |
| 85 | if (!entries) |
| 86 | return -ENOMEM; |
| 87 | |
Arnaldo Carvalho de Melo | c5dfd78 | 2016-04-21 12:28:50 -0300 | [diff] [blame] | 88 | size = perf_callchain_entry__sizeof() * PERF_NR_CONTEXTS; |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 89 | |
| 90 | for_each_possible_cpu(cpu) { |
| 91 | entries->cpu_entries[cpu] = kmalloc_node(size, GFP_KERNEL, |
| 92 | cpu_to_node(cpu)); |
| 93 | if (!entries->cpu_entries[cpu]) |
| 94 | goto fail; |
| 95 | } |
| 96 | |
| 97 | rcu_assign_pointer(callchain_cpus_entries, entries); |
| 98 | |
| 99 | return 0; |
| 100 | |
| 101 | fail: |
| 102 | for_each_possible_cpu(cpu) |
| 103 | kfree(entries->cpu_entries[cpu]); |
| 104 | kfree(entries); |
| 105 | |
| 106 | return -ENOMEM; |
| 107 | } |
| 108 | |
Arnaldo Carvalho de Melo | 97c79a3 | 2016-04-28 13:16:33 -0300 | [diff] [blame] | 109 | int get_callchain_buffers(int event_max_stack) |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 110 | { |
| 111 | int err = 0; |
| 112 | int count; |
| 113 | |
| 114 | mutex_lock(&callchain_mutex); |
| 115 | |
| 116 | count = atomic_inc_return(&nr_callchain_events); |
| 117 | if (WARN_ON_ONCE(count < 1)) { |
| 118 | err = -EINVAL; |
| 119 | goto exit; |
| 120 | } |
| 121 | |
Jiri Olsa | 5af44ca | 2018-04-15 11:23:51 +0200 | [diff] [blame^] | 122 | /* |
| 123 | * If requesting per event more than the global cap, |
| 124 | * return a different error to help userspace figure |
| 125 | * this out. |
| 126 | * |
| 127 | * And also do it here so that we have &callchain_mutex held. |
| 128 | */ |
| 129 | if (event_max_stack > sysctl_perf_event_max_stack) { |
| 130 | err = -EOVERFLOW; |
| 131 | goto exit; |
| 132 | } |
| 133 | |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 134 | if (count > 1) { |
| 135 | /* If the allocation failed, give up */ |
| 136 | if (!callchain_cpus_entries) |
| 137 | err = -ENOMEM; |
| 138 | goto exit; |
| 139 | } |
| 140 | |
| 141 | err = alloc_callchain_buffers(); |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 142 | exit: |
Frederic Weisbecker | 90983b1 | 2013-07-23 02:31:00 +0200 | [diff] [blame] | 143 | if (err) |
| 144 | atomic_dec(&nr_callchain_events); |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 145 | |
Frederic Weisbecker | fc3b86d | 2013-08-02 18:29:54 +0200 | [diff] [blame] | 146 | mutex_unlock(&callchain_mutex); |
| 147 | |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 148 | return err; |
| 149 | } |
| 150 | |
| 151 | void put_callchain_buffers(void) |
| 152 | { |
| 153 | if (atomic_dec_and_mutex_lock(&nr_callchain_events, &callchain_mutex)) { |
| 154 | release_callchain_buffers(); |
| 155 | mutex_unlock(&callchain_mutex); |
| 156 | } |
| 157 | } |
| 158 | |
| 159 | static struct perf_callchain_entry *get_callchain_entry(int *rctx) |
| 160 | { |
| 161 | int cpu; |
| 162 | struct callchain_cpus_entries *entries; |
| 163 | |
Christoph Lameter | 4a32fea | 2014-08-17 12:30:27 -0500 | [diff] [blame] | 164 | *rctx = get_recursion_context(this_cpu_ptr(callchain_recursion)); |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 165 | if (*rctx == -1) |
| 166 | return NULL; |
| 167 | |
| 168 | entries = rcu_dereference(callchain_cpus_entries); |
| 169 | if (!entries) |
| 170 | return NULL; |
| 171 | |
| 172 | cpu = smp_processor_id(); |
| 173 | |
Arnaldo Carvalho de Melo | c5dfd78 | 2016-04-21 12:28:50 -0300 | [diff] [blame] | 174 | return (((void *)entries->cpu_entries[cpu]) + |
| 175 | (*rctx * perf_callchain_entry__sizeof())); |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 176 | } |
| 177 | |
/*
 * Release the recursion context @rctx previously obtained by
 * get_callchain_entry() on this CPU.
 */
static void
put_callchain_entry(int rctx)
{
	put_recursion_context(this_cpu_ptr(callchain_recursion), rctx);
}
| 183 | |
Andrew Vagin | e6dab5f | 2012-07-11 18:14:58 +0400 | [diff] [blame] | 184 | struct perf_callchain_entry * |
Alexei Starovoitov | 568b329 | 2016-02-17 19:58:57 -0800 | [diff] [blame] | 185 | get_perf_callchain(struct pt_regs *regs, u32 init_nr, bool kernel, bool user, |
Arnaldo Carvalho de Melo | cfbcf46 | 2016-04-28 12:30:53 -0300 | [diff] [blame] | 186 | u32 max_stack, bool crosstask, bool add_mark) |
Alexei Starovoitov | 568b329 | 2016-02-17 19:58:57 -0800 | [diff] [blame] | 187 | { |
| 188 | struct perf_callchain_entry *entry; |
Arnaldo Carvalho de Melo | cfbcf46 | 2016-04-28 12:30:53 -0300 | [diff] [blame] | 189 | struct perf_callchain_entry_ctx ctx; |
Alexei Starovoitov | 568b329 | 2016-02-17 19:58:57 -0800 | [diff] [blame] | 190 | int rctx; |
| 191 | |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 192 | entry = get_callchain_entry(&rctx); |
| 193 | if (rctx == -1) |
| 194 | return NULL; |
| 195 | |
| 196 | if (!entry) |
| 197 | goto exit_put; |
| 198 | |
Arnaldo Carvalho de Melo | cfbcf46 | 2016-04-28 12:30:53 -0300 | [diff] [blame] | 199 | ctx.entry = entry; |
| 200 | ctx.max_stack = max_stack; |
Arnaldo Carvalho de Melo | 3b1fff0 | 2016-05-10 18:08:32 -0300 | [diff] [blame] | 201 | ctx.nr = entry->nr = init_nr; |
Arnaldo Carvalho de Melo | c85b033 | 2016-05-12 13:06:21 -0300 | [diff] [blame] | 202 | ctx.contexts = 0; |
| 203 | ctx.contexts_maxed = false; |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 204 | |
Frederic Weisbecker | d077526 | 2012-08-07 15:20:41 +0200 | [diff] [blame] | 205 | if (kernel && !user_mode(regs)) { |
Alexei Starovoitov | 568b329 | 2016-02-17 19:58:57 -0800 | [diff] [blame] | 206 | if (add_mark) |
Arnaldo Carvalho de Melo | 3e4de4e | 2016-05-12 13:01:50 -0300 | [diff] [blame] | 207 | perf_callchain_store_context(&ctx, PERF_CONTEXT_KERNEL); |
Arnaldo Carvalho de Melo | cfbcf46 | 2016-04-28 12:30:53 -0300 | [diff] [blame] | 208 | perf_callchain_kernel(&ctx, regs); |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 209 | } |
| 210 | |
Frederic Weisbecker | d077526 | 2012-08-07 15:20:41 +0200 | [diff] [blame] | 211 | if (user) { |
| 212 | if (!user_mode(regs)) { |
| 213 | if (current->mm) |
| 214 | regs = task_pt_regs(current); |
| 215 | else |
| 216 | regs = NULL; |
| 217 | } |
Andrew Vagin | e6dab5f | 2012-07-11 18:14:58 +0400 | [diff] [blame] | 218 | |
Frederic Weisbecker | d077526 | 2012-08-07 15:20:41 +0200 | [diff] [blame] | 219 | if (regs) { |
Will Deacon | 88b0193 | 2017-05-09 18:00:04 +0100 | [diff] [blame] | 220 | mm_segment_t fs; |
| 221 | |
Alexei Starovoitov | 568b329 | 2016-02-17 19:58:57 -0800 | [diff] [blame] | 222 | if (crosstask) |
Frederic Weisbecker | d077526 | 2012-08-07 15:20:41 +0200 | [diff] [blame] | 223 | goto exit_put; |
| 224 | |
Alexei Starovoitov | 568b329 | 2016-02-17 19:58:57 -0800 | [diff] [blame] | 225 | if (add_mark) |
Arnaldo Carvalho de Melo | 3e4de4e | 2016-05-12 13:01:50 -0300 | [diff] [blame] | 226 | perf_callchain_store_context(&ctx, PERF_CONTEXT_USER); |
Will Deacon | 88b0193 | 2017-05-09 18:00:04 +0100 | [diff] [blame] | 227 | |
| 228 | fs = get_fs(); |
| 229 | set_fs(USER_DS); |
Arnaldo Carvalho de Melo | cfbcf46 | 2016-04-28 12:30:53 -0300 | [diff] [blame] | 230 | perf_callchain_user(&ctx, regs); |
Will Deacon | 88b0193 | 2017-05-09 18:00:04 +0100 | [diff] [blame] | 231 | set_fs(fs); |
Frederic Weisbecker | d077526 | 2012-08-07 15:20:41 +0200 | [diff] [blame] | 232 | } |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 233 | } |
| 234 | |
| 235 | exit_put: |
| 236 | put_callchain_entry(rctx); |
| 237 | |
| 238 | return entry; |
| 239 | } |
Arnaldo Carvalho de Melo | c5dfd78 | 2016-04-21 12:28:50 -0300 | [diff] [blame] | 240 | |
Arnaldo Carvalho de Melo | c85b033 | 2016-05-12 13:06:21 -0300 | [diff] [blame] | 241 | /* |
| 242 | * Used for sysctl_perf_event_max_stack and |
| 243 | * sysctl_perf_event_max_contexts_per_stack. |
| 244 | */ |
Arnaldo Carvalho de Melo | c5dfd78 | 2016-04-21 12:28:50 -0300 | [diff] [blame] | 245 | int perf_event_max_stack_handler(struct ctl_table *table, int write, |
| 246 | void __user *buffer, size_t *lenp, loff_t *ppos) |
| 247 | { |
Arnaldo Carvalho de Melo | a831100 | 2016-05-10 16:34:53 -0300 | [diff] [blame] | 248 | int *value = table->data; |
| 249 | int new_value = *value, ret; |
Arnaldo Carvalho de Melo | c5dfd78 | 2016-04-21 12:28:50 -0300 | [diff] [blame] | 250 | struct ctl_table new_table = *table; |
| 251 | |
| 252 | new_table.data = &new_value; |
| 253 | ret = proc_dointvec_minmax(&new_table, write, buffer, lenp, ppos); |
| 254 | if (ret || !write) |
| 255 | return ret; |
| 256 | |
| 257 | mutex_lock(&callchain_mutex); |
| 258 | if (atomic_read(&nr_callchain_events)) |
| 259 | ret = -EBUSY; |
| 260 | else |
Arnaldo Carvalho de Melo | a831100 | 2016-05-10 16:34:53 -0300 | [diff] [blame] | 261 | *value = new_value; |
Arnaldo Carvalho de Melo | c5dfd78 | 2016-04-21 12:28:50 -0300 | [diff] [blame] | 262 | |
| 263 | mutex_unlock(&callchain_mutex); |
| 264 | |
| 265 | return ret; |
| 266 | } |