Thomas Gleixner | 8e86e01 | 2019-01-16 12:10:59 +0100 | [diff] [blame] | 1 | // SPDX-License-Identifier: GPL-2.0 |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 2 | /* |
| 3 | * Performance events callchain code, extracted from core.c: |
| 4 | * |
| 5 | * Copyright (C) 2008 Thomas Gleixner <tglx@linutronix.de> |
| 6 | * Copyright (C) 2008-2011 Red Hat, Inc., Ingo Molnar |
Peter Zijlstra | 90eec10 | 2015-11-16 11:08:45 +0100 | [diff] [blame] | 7 | * Copyright (C) 2008-2011 Red Hat, Inc., Peter Zijlstra |
Arnd Bergmann | 3723c63 | 2018-08-23 17:01:26 -0700 | [diff] [blame] | 8 | * Copyright © 2009 Paul Mackerras, IBM Corp. <paulus@au1.ibm.com> |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 9 | */ |
| 10 | |
| 11 | #include <linux/perf_event.h> |
| 12 | #include <linux/slab.h> |
Ingo Molnar | 68db0cf | 2017-02-08 18:51:37 +0100 | [diff] [blame] | 13 | #include <linux/sched/task_stack.h> |
| 14 | |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 15 | #include "internal.h" |
| 16 | |
| 17 | struct callchain_cpus_entries { |
| 18 | struct rcu_head rcu_head; |
| 19 | struct perf_callchain_entry *cpu_entries[0]; |
| 20 | }; |
| 21 | |
/*
 * Limits that determine how large one callchain entry is (see
 * perf_callchain_entry__sizeof()). They start out at the compile-time
 * defaults below.
 */
int sysctl_perf_event_max_stack __read_mostly = PERF_MAX_STACK_DEPTH;
int sysctl_perf_event_max_contexts_per_stack __read_mostly = PERF_MAX_CONTEXTS_PER_STACK;
Arnaldo Carvalho de Melo | c5dfd78 | 2016-04-21 12:28:50 -0300 | [diff] [blame] | 24 | |
| 25 | static inline size_t perf_callchain_entry__sizeof(void) |
| 26 | { |
| 27 | return (sizeof(struct perf_callchain_entry) + |
Arnaldo Carvalho de Melo | c85b033 | 2016-05-12 13:06:21 -0300 | [diff] [blame] | 28 | sizeof(__u64) * (sysctl_perf_event_max_stack + |
| 29 | sysctl_perf_event_max_contexts_per_stack)); |
Arnaldo Carvalho de Melo | c5dfd78 | 2016-04-21 12:28:50 -0300 | [diff] [blame] | 30 | } |
| 31 | |
/* Per-CPU recursion counters, one slot per context (see get_callchain_entry()). */
static DEFINE_PER_CPU(int, callchain_recursion[PERF_NR_CONTEXTS]);
/* Number of outstanding get_callchain_buffers() references. */
static atomic_t nr_callchain_events;
/* Held while allocating/releasing the buffers and while updating the sysctls. */
static DEFINE_MUTEX(callchain_mutex);
/* RCU-published buffer table; NULL while no buffers are allocated. */
static struct callchain_cpus_entries *callchain_cpus_entries;
| 36 | |
| 37 | |
/*
 * Default, do-nothing implementation of the kernel-side callchain walk
 * invoked from get_perf_callchain(). It is declared __weak so that a
 * non-weak definition of the same symbol takes precedence at link time.
 */
__weak void perf_callchain_kernel(struct perf_callchain_entry_ctx *entry,
				  struct pt_regs *regs)
{
}
| 42 | |
/*
 * Default, do-nothing implementation of the user-side callchain walk
 * invoked from get_perf_callchain(). It is declared __weak so that a
 * non-weak definition of the same symbol takes precedence at link time.
 */
__weak void perf_callchain_user(struct perf_callchain_entry_ctx *entry,
				struct pt_regs *regs)
{
}
| 47 | |
| 48 | static void release_callchain_buffers_rcu(struct rcu_head *head) |
| 49 | { |
| 50 | struct callchain_cpus_entries *entries; |
| 51 | int cpu; |
| 52 | |
| 53 | entries = container_of(head, struct callchain_cpus_entries, rcu_head); |
| 54 | |
| 55 | for_each_possible_cpu(cpu) |
| 56 | kfree(entries->cpu_entries[cpu]); |
| 57 | |
| 58 | kfree(entries); |
| 59 | } |
| 60 | |
| 61 | static void release_callchain_buffers(void) |
| 62 | { |
| 63 | struct callchain_cpus_entries *entries; |
| 64 | |
| 65 | entries = callchain_cpus_entries; |
Andreea-Cristina Bernat | e0455e1 | 2014-08-22 17:15:36 +0300 | [diff] [blame] | 66 | RCU_INIT_POINTER(callchain_cpus_entries, NULL); |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 67 | call_rcu(&entries->rcu_head, release_callchain_buffers_rcu); |
| 68 | } |
| 69 | |
| 70 | static int alloc_callchain_buffers(void) |
| 71 | { |
| 72 | int cpu; |
| 73 | int size; |
| 74 | struct callchain_cpus_entries *entries; |
| 75 | |
| 76 | /* |
| 77 | * We can't use the percpu allocation API for data that can be |
| 78 | * accessed from NMI. Use a temporary manual per cpu allocation |
| 79 | * until that gets sorted out. |
| 80 | */ |
| 81 | size = offsetof(struct callchain_cpus_entries, cpu_entries[nr_cpu_ids]); |
| 82 | |
| 83 | entries = kzalloc(size, GFP_KERNEL); |
| 84 | if (!entries) |
| 85 | return -ENOMEM; |
| 86 | |
Arnaldo Carvalho de Melo | c5dfd78 | 2016-04-21 12:28:50 -0300 | [diff] [blame] | 87 | size = perf_callchain_entry__sizeof() * PERF_NR_CONTEXTS; |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 88 | |
| 89 | for_each_possible_cpu(cpu) { |
| 90 | entries->cpu_entries[cpu] = kmalloc_node(size, GFP_KERNEL, |
| 91 | cpu_to_node(cpu)); |
| 92 | if (!entries->cpu_entries[cpu]) |
| 93 | goto fail; |
| 94 | } |
| 95 | |
| 96 | rcu_assign_pointer(callchain_cpus_entries, entries); |
| 97 | |
| 98 | return 0; |
| 99 | |
| 100 | fail: |
| 101 | for_each_possible_cpu(cpu) |
| 102 | kfree(entries->cpu_entries[cpu]); |
| 103 | kfree(entries); |
| 104 | |
| 105 | return -ENOMEM; |
| 106 | } |
| 107 | |
Arnaldo Carvalho de Melo | 97c79a3 | 2016-04-28 13:16:33 -0300 | [diff] [blame] | 108 | int get_callchain_buffers(int event_max_stack) |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 109 | { |
| 110 | int err = 0; |
| 111 | int count; |
| 112 | |
| 113 | mutex_lock(&callchain_mutex); |
| 114 | |
| 115 | count = atomic_inc_return(&nr_callchain_events); |
| 116 | if (WARN_ON_ONCE(count < 1)) { |
| 117 | err = -EINVAL; |
| 118 | goto exit; |
| 119 | } |
| 120 | |
Jiri Olsa | 5af44ca | 2018-04-15 11:23:51 +0200 | [diff] [blame] | 121 | /* |
| 122 | * If requesting per event more than the global cap, |
| 123 | * return a different error to help userspace figure |
| 124 | * this out. |
| 125 | * |
| 126 | * And also do it here so that we have &callchain_mutex held. |
| 127 | */ |
| 128 | if (event_max_stack > sysctl_perf_event_max_stack) { |
| 129 | err = -EOVERFLOW; |
| 130 | goto exit; |
| 131 | } |
| 132 | |
Jiri Olsa | bfb3d7b | 2018-04-15 11:23:52 +0200 | [diff] [blame] | 133 | if (count == 1) |
| 134 | err = alloc_callchain_buffers(); |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 135 | exit: |
Frederic Weisbecker | 90983b1 | 2013-07-23 02:31:00 +0200 | [diff] [blame] | 136 | if (err) |
| 137 | atomic_dec(&nr_callchain_events); |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 138 | |
Frederic Weisbecker | fc3b86d | 2013-08-02 18:29:54 +0200 | [diff] [blame] | 139 | mutex_unlock(&callchain_mutex); |
| 140 | |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 141 | return err; |
| 142 | } |
| 143 | |
| 144 | void put_callchain_buffers(void) |
| 145 | { |
| 146 | if (atomic_dec_and_mutex_lock(&nr_callchain_events, &callchain_mutex)) { |
| 147 | release_callchain_buffers(); |
| 148 | mutex_unlock(&callchain_mutex); |
| 149 | } |
| 150 | } |
| 151 | |
| 152 | static struct perf_callchain_entry *get_callchain_entry(int *rctx) |
| 153 | { |
| 154 | int cpu; |
| 155 | struct callchain_cpus_entries *entries; |
| 156 | |
Christoph Lameter | 4a32fea | 2014-08-17 12:30:27 -0500 | [diff] [blame] | 157 | *rctx = get_recursion_context(this_cpu_ptr(callchain_recursion)); |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 158 | if (*rctx == -1) |
| 159 | return NULL; |
| 160 | |
| 161 | entries = rcu_dereference(callchain_cpus_entries); |
| 162 | if (!entries) |
| 163 | return NULL; |
| 164 | |
| 165 | cpu = smp_processor_id(); |
| 166 | |
Arnaldo Carvalho de Melo | c5dfd78 | 2016-04-21 12:28:50 -0300 | [diff] [blame] | 167 | return (((void *)entries->cpu_entries[cpu]) + |
| 168 | (*rctx * perf_callchain_entry__sizeof())); |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 169 | } |
| 170 | |
| 171 | static void |
| 172 | put_callchain_entry(int rctx) |
| 173 | { |
Christoph Lameter | 4a32fea | 2014-08-17 12:30:27 -0500 | [diff] [blame] | 174 | put_recursion_context(this_cpu_ptr(callchain_recursion), rctx); |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 175 | } |
| 176 | |
Andrew Vagin | e6dab5f | 2012-07-11 18:14:58 +0400 | [diff] [blame] | 177 | struct perf_callchain_entry * |
Alexei Starovoitov | 568b329 | 2016-02-17 19:58:57 -0800 | [diff] [blame] | 178 | get_perf_callchain(struct pt_regs *regs, u32 init_nr, bool kernel, bool user, |
Arnaldo Carvalho de Melo | cfbcf46 | 2016-04-28 12:30:53 -0300 | [diff] [blame] | 179 | u32 max_stack, bool crosstask, bool add_mark) |
Alexei Starovoitov | 568b329 | 2016-02-17 19:58:57 -0800 | [diff] [blame] | 180 | { |
| 181 | struct perf_callchain_entry *entry; |
Arnaldo Carvalho de Melo | cfbcf46 | 2016-04-28 12:30:53 -0300 | [diff] [blame] | 182 | struct perf_callchain_entry_ctx ctx; |
Alexei Starovoitov | 568b329 | 2016-02-17 19:58:57 -0800 | [diff] [blame] | 183 | int rctx; |
| 184 | |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 185 | entry = get_callchain_entry(&rctx); |
| 186 | if (rctx == -1) |
| 187 | return NULL; |
| 188 | |
| 189 | if (!entry) |
| 190 | goto exit_put; |
| 191 | |
Arnaldo Carvalho de Melo | cfbcf46 | 2016-04-28 12:30:53 -0300 | [diff] [blame] | 192 | ctx.entry = entry; |
| 193 | ctx.max_stack = max_stack; |
Arnaldo Carvalho de Melo | 3b1fff0 | 2016-05-10 18:08:32 -0300 | [diff] [blame] | 194 | ctx.nr = entry->nr = init_nr; |
Arnaldo Carvalho de Melo | c85b033 | 2016-05-12 13:06:21 -0300 | [diff] [blame] | 195 | ctx.contexts = 0; |
| 196 | ctx.contexts_maxed = false; |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 197 | |
Frederic Weisbecker | d077526 | 2012-08-07 15:20:41 +0200 | [diff] [blame] | 198 | if (kernel && !user_mode(regs)) { |
Alexei Starovoitov | 568b329 | 2016-02-17 19:58:57 -0800 | [diff] [blame] | 199 | if (add_mark) |
Arnaldo Carvalho de Melo | 3e4de4e | 2016-05-12 13:01:50 -0300 | [diff] [blame] | 200 | perf_callchain_store_context(&ctx, PERF_CONTEXT_KERNEL); |
Arnaldo Carvalho de Melo | cfbcf46 | 2016-04-28 12:30:53 -0300 | [diff] [blame] | 201 | perf_callchain_kernel(&ctx, regs); |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 202 | } |
| 203 | |
Frederic Weisbecker | d077526 | 2012-08-07 15:20:41 +0200 | [diff] [blame] | 204 | if (user) { |
| 205 | if (!user_mode(regs)) { |
| 206 | if (current->mm) |
| 207 | regs = task_pt_regs(current); |
| 208 | else |
| 209 | regs = NULL; |
| 210 | } |
Andrew Vagin | e6dab5f | 2012-07-11 18:14:58 +0400 | [diff] [blame] | 211 | |
Frederic Weisbecker | d077526 | 2012-08-07 15:20:41 +0200 | [diff] [blame] | 212 | if (regs) { |
Will Deacon | 88b0193 | 2017-05-09 18:00:04 +0100 | [diff] [blame] | 213 | mm_segment_t fs; |
| 214 | |
Alexei Starovoitov | 568b329 | 2016-02-17 19:58:57 -0800 | [diff] [blame] | 215 | if (crosstask) |
Frederic Weisbecker | d077526 | 2012-08-07 15:20:41 +0200 | [diff] [blame] | 216 | goto exit_put; |
| 217 | |
Alexei Starovoitov | 568b329 | 2016-02-17 19:58:57 -0800 | [diff] [blame] | 218 | if (add_mark) |
Arnaldo Carvalho de Melo | 3e4de4e | 2016-05-12 13:01:50 -0300 | [diff] [blame] | 219 | perf_callchain_store_context(&ctx, PERF_CONTEXT_USER); |
Will Deacon | 88b0193 | 2017-05-09 18:00:04 +0100 | [diff] [blame] | 220 | |
| 221 | fs = get_fs(); |
| 222 | set_fs(USER_DS); |
Arnaldo Carvalho de Melo | cfbcf46 | 2016-04-28 12:30:53 -0300 | [diff] [blame] | 223 | perf_callchain_user(&ctx, regs); |
Will Deacon | 88b0193 | 2017-05-09 18:00:04 +0100 | [diff] [blame] | 224 | set_fs(fs); |
Frederic Weisbecker | d077526 | 2012-08-07 15:20:41 +0200 | [diff] [blame] | 225 | } |
Borislav Petkov | 9251f90 | 2011-10-16 17:15:04 +0200 | [diff] [blame] | 226 | } |
| 227 | |
| 228 | exit_put: |
| 229 | put_callchain_entry(rctx); |
| 230 | |
| 231 | return entry; |
| 232 | } |
Arnaldo Carvalho de Melo | c5dfd78 | 2016-04-21 12:28:50 -0300 | [diff] [blame] | 233 | |
Arnaldo Carvalho de Melo | c85b033 | 2016-05-12 13:06:21 -0300 | [diff] [blame] | 234 | /* |
| 235 | * Used for sysctl_perf_event_max_stack and |
| 236 | * sysctl_perf_event_max_contexts_per_stack. |
| 237 | */ |
Arnaldo Carvalho de Melo | c5dfd78 | 2016-04-21 12:28:50 -0300 | [diff] [blame] | 238 | int perf_event_max_stack_handler(struct ctl_table *table, int write, |
| 239 | void __user *buffer, size_t *lenp, loff_t *ppos) |
| 240 | { |
Arnaldo Carvalho de Melo | a831100 | 2016-05-10 16:34:53 -0300 | [diff] [blame] | 241 | int *value = table->data; |
| 242 | int new_value = *value, ret; |
Arnaldo Carvalho de Melo | c5dfd78 | 2016-04-21 12:28:50 -0300 | [diff] [blame] | 243 | struct ctl_table new_table = *table; |
| 244 | |
| 245 | new_table.data = &new_value; |
| 246 | ret = proc_dointvec_minmax(&new_table, write, buffer, lenp, ppos); |
| 247 | if (ret || !write) |
| 248 | return ret; |
| 249 | |
| 250 | mutex_lock(&callchain_mutex); |
| 251 | if (atomic_read(&nr_callchain_events)) |
| 252 | ret = -EBUSY; |
| 253 | else |
Arnaldo Carvalho de Melo | a831100 | 2016-05-10 16:34:53 -0300 | [diff] [blame] | 254 | *value = new_value; |
Arnaldo Carvalho de Melo | c5dfd78 | 2016-04-21 12:28:50 -0300 | [diff] [blame] | 255 | |
| 256 | mutex_unlock(&callchain_mutex); |
| 257 | |
| 258 | return ret; |
| 259 | } |