blob: fc15077991c47992b8b50367e80792f8a77589be [file] [log] [blame]
Marco Elverdfd402a2019-11-14 19:02:54 +01001// SPDX-License-Identifier: GPL-2.0
Marco Elverbd0ccc42021-01-15 18:09:53 +01002/*
3 * KCSAN reporting.
4 *
5 * Copyright (C) 2019, Google LLC.
6 */
Marco Elverdfd402a2019-11-14 19:02:54 +01007
Marco Elver2402d0e2020-02-22 00:10:27 +01008#include <linux/debug_locks.h>
9#include <linux/delay.h>
Marco Elver05f9a402020-01-10 19:48:34 +010010#include <linux/jiffies.h>
Marco Elver6c65eb72021-08-09 13:25:14 +020011#include <linux/kallsyms.h>
Marco Elverdfd402a2019-11-14 19:02:54 +010012#include <linux/kernel.h>
Marco Elverf1bc9622020-01-15 17:25:12 +010013#include <linux/lockdep.h>
Marco Elverdfd402a2019-11-14 19:02:54 +010014#include <linux/preempt.h>
15#include <linux/printk.h>
16#include <linux/sched.h>
17#include <linux/spinlock.h>
18#include <linux/stacktrace.h>
19
20#include "kcsan.h"
21#include "encoding.h"
22
23/*
24 * Max. number of stack entries to show in the report.
25 */
26#define NUM_STACK_ENTRIES 64
27
Marco Elver135c0872020-03-18 18:38:44 +010028/* Common access info. */
29struct access_info {
30 const volatile void *ptr;
31 size_t size;
32 int access_type;
33 int task_pid;
34 int cpu_id;
Marco Elver55a55fe2021-08-09 13:25:12 +020035 unsigned long ip;
Marco Elver135c0872020-03-18 18:38:44 +010036};
37
Marco Elverdfd402a2019-11-14 19:02:54 +010038/*
39 * Other thread info: communicated from other racing thread to thread that set
Marco Elver61194182020-03-18 18:38:45 +010040 * up the watchpoint, which then prints the complete report atomically.
Marco Elverdfd402a2019-11-14 19:02:54 +010041 */
Marco Elver135c0872020-03-18 18:38:44 +010042struct other_info {
43 struct access_info ai;
Ingo Molnar5cbaefe2019-11-20 10:41:43 +010044 unsigned long stack_entries[NUM_STACK_ENTRIES];
45 int num_stack_entries;
Marco Elver2402d0e2020-02-22 00:10:27 +010046
47 /*
48 * Optionally pass @current. Typically we do not need to pass @current
49 * via @other_info since just @task_pid is sufficient. Passing @current
50 * has additional overhead.
51 *
52 * To safely pass @current, we must either use get_task_struct/
53 * put_task_struct, or stall the thread that populated @other_info.
54 *
55 * We cannot rely on get_task_struct/put_task_struct in case
56 * release_report() races with a task being released, and would have to
57 * free it in release_report(). This may result in deadlock if we want
58 * to use KCSAN on the allocators.
59 *
60 * Since we also want to reliably print held locks for
61 * CONFIG_KCSAN_VERBOSE, the current implementation stalls the thread
62 * that populated @other_info until it has been consumed.
63 */
64 struct task_struct *task;
Marco Elver135c0872020-03-18 18:38:44 +010065};
66
Marco Elver61194182020-03-18 18:38:45 +010067/*
68 * To never block any producers of struct other_info, we need as many elements
69 * as we have watchpoints (upper bound on concurrent races to report).
70 */
71static struct other_info other_infos[CONFIG_KCSAN_NUM_WATCHPOINTS + NUM_SLOTS-1];
Marco Elverdfd402a2019-11-14 19:02:54 +010072
73/*
Marco Elverd591ec32020-02-06 16:46:24 +010074 * Information about reported races; used to rate limit reporting.
Marco Elver05f9a402020-01-10 19:48:34 +010075 */
76struct report_time {
77 /*
Marco Elverd591ec32020-02-06 16:46:24 +010078 * The last time the race was reported.
Marco Elver05f9a402020-01-10 19:48:34 +010079 */
80 unsigned long time;
81
82 /*
83 * The frames of the 2 threads; if only 1 thread is known, one frame
84 * will be 0.
85 */
86 unsigned long frame1;
87 unsigned long frame2;
88};
89
90/*
91 * Since we also want to be able to debug allocators with KCSAN, to avoid
92 * deadlock, report_times cannot be dynamically resized with krealloc in
93 * rate_limit_report.
94 *
95 * Therefore, we use a fixed-size array, which at most will occupy a page. This
96 * still adequately rate limits reports, assuming that a) number of unique data
Marco Elverd591ec32020-02-06 16:46:24 +010097 * races is not excessive, and b) occurrence of unique races within the
Marco Elver05f9a402020-01-10 19:48:34 +010098 * same time window is limited.
99 */
100#define REPORT_TIMES_MAX (PAGE_SIZE / sizeof(struct report_time))
101#define REPORT_TIMES_SIZE \
102 (CONFIG_KCSAN_REPORT_ONCE_IN_MS > REPORT_TIMES_MAX ? \
103 REPORT_TIMES_MAX : \
104 CONFIG_KCSAN_REPORT_ONCE_IN_MS)
105static struct report_time report_times[REPORT_TIMES_SIZE];
106
107/*
Marco Elver61194182020-03-18 18:38:45 +0100108 * Spinlock serializing report generation, and access to @other_infos. Although
109 * it could make sense to have a finer-grained locking story for @other_infos,
110 * report generation needs to be serialized either way, so not much is gained.
Marco Elverdfd402a2019-11-14 19:02:54 +0100111 */
Marco Elver61194182020-03-18 18:38:45 +0100112static DEFINE_RAW_SPINLOCK(report_lock);
Marco Elverdfd402a2019-11-14 19:02:54 +0100113
114/*
Marco Elverd591ec32020-02-06 16:46:24 +0100115 * Checks if the race identified by thread frames frame1 and frame2 has
Marco Elver05f9a402020-01-10 19:48:34 +0100116 * been reported since (now - KCSAN_REPORT_ONCE_IN_MS).
117 */
118static bool rate_limit_report(unsigned long frame1, unsigned long frame2)
119{
120 struct report_time *use_entry = &report_times[0];
121 unsigned long invalid_before;
122 int i;
123
124 BUILD_BUG_ON(CONFIG_KCSAN_REPORT_ONCE_IN_MS != 0 && REPORT_TIMES_SIZE == 0);
125
126 if (CONFIG_KCSAN_REPORT_ONCE_IN_MS == 0)
127 return false;
128
129 invalid_before = jiffies - msecs_to_jiffies(CONFIG_KCSAN_REPORT_ONCE_IN_MS);
130
Marco Elverd591ec32020-02-06 16:46:24 +0100131 /* Check if a matching race report exists. */
Marco Elver05f9a402020-01-10 19:48:34 +0100132 for (i = 0; i < REPORT_TIMES_SIZE; ++i) {
133 struct report_time *rt = &report_times[i];
134
135 /*
136 * Must always select an entry for use to store info as we
137 * cannot resize report_times; at the end of the scan, use_entry
138 * will be the oldest entry, which ideally also happened before
139 * KCSAN_REPORT_ONCE_IN_MS ago.
140 */
141 if (time_before(rt->time, use_entry->time))
142 use_entry = rt;
143
144 /*
145 * Initially, no need to check any further as this entry as well
146 * as following entries have never been used.
147 */
148 if (rt->time == 0)
149 break;
150
151 /* Check if entry expired. */
152 if (time_before(rt->time, invalid_before))
153 continue; /* before KCSAN_REPORT_ONCE_IN_MS ago */
154
Marco Elverd591ec32020-02-06 16:46:24 +0100155 /* Reported recently, check if race matches. */
Marco Elver05f9a402020-01-10 19:48:34 +0100156 if ((rt->frame1 == frame1 && rt->frame2 == frame2) ||
157 (rt->frame1 == frame2 && rt->frame2 == frame1))
158 return true;
159 }
160
161 use_entry->time = jiffies;
162 use_entry->frame1 = frame1;
163 use_entry->frame2 = frame2;
164 return false;
165}
166
167/*
Marco Elverdfd402a2019-11-14 19:02:54 +0100168 * Special rules to skip reporting.
169 */
Ingo Molnar5cbaefe2019-11-20 10:41:43 +0100170static bool
Marco Elverb738f612020-02-11 17:04:21 +0100171skip_report(enum kcsan_value_change value_change, unsigned long top_frame)
Marco Elverdfd402a2019-11-14 19:02:54 +0100172{
Marco Elver81af89e2020-02-11 17:04:22 +0100173 /* Should never get here if value_change==FALSE. */
174 WARN_ON_ONCE(value_change == KCSAN_VALUE_CHANGE_FALSE);
175
Marco Elverad4f8ee2020-01-29 16:01:02 +0100176 /*
Marco Elverb738f612020-02-11 17:04:21 +0100177 * The first call to skip_report always has value_change==TRUE, since we
Marco Elverad4f8ee2020-01-29 16:01:02 +0100178 * cannot know the value written of an instrumented access. For the 2nd
179 * call there are 6 cases with CONFIG_KCSAN_REPORT_VALUE_CHANGE_ONLY:
180 *
Marco Elverb738f612020-02-11 17:04:21 +0100181 * 1. read watchpoint, conflicting write (value_change==TRUE): report;
182 * 2. read watchpoint, conflicting write (value_change==MAYBE): skip;
183 * 3. write watchpoint, conflicting write (value_change==TRUE): report;
184 * 4. write watchpoint, conflicting write (value_change==MAYBE): skip;
185 * 5. write watchpoint, conflicting read (value_change==MAYBE): skip;
186 * 6. write watchpoint, conflicting read (value_change==TRUE): report;
Marco Elverad4f8ee2020-01-29 16:01:02 +0100187 *
188 * Cases 1-4 are intuitive and expected; case 5 ensures we do not report
Marco Elverd591ec32020-02-06 16:46:24 +0100189 * data races where the write may have rewritten the same value; case 6
190 * is possible either if the size is larger than what we check value
191 * changes for or the access type is KCSAN_ACCESS_ASSERT.
Marco Elverad4f8ee2020-01-29 16:01:02 +0100192 */
Marco Elverb738f612020-02-11 17:04:21 +0100193 if (IS_ENABLED(CONFIG_KCSAN_REPORT_VALUE_CHANGE_ONLY) &&
194 value_change == KCSAN_VALUE_CHANGE_MAYBE) {
Marco Elverdfd402a2019-11-14 19:02:54 +0100195 /*
196 * The access is a write, but the data value did not change.
197 *
198 * We opt-out of this filter for certain functions at request of
199 * maintainers.
200 */
201 char buf[64];
Marco Elverf770ed12020-04-10 18:44:17 +0200202 int len = scnprintf(buf, sizeof(buf), "%ps", (void *)top_frame);
Marco Elverdfd402a2019-11-14 19:02:54 +0100203
Marco Elverf770ed12020-04-10 18:44:17 +0200204 if (!strnstr(buf, "rcu_", len) &&
205 !strnstr(buf, "_rcu", len) &&
206 !strnstr(buf, "_srcu", len))
Marco Elverdfd402a2019-11-14 19:02:54 +0100207 return true;
208 }
209
210 return kcsan_skip_report_debugfs(top_frame);
211}
212
Marco Elver47144ec2020-01-10 19:48:33 +0100213static const char *get_access_type(int type)
Marco Elverdfd402a2019-11-14 19:02:54 +0100214{
Marco Elver757a4ce2020-03-25 17:41:56 +0100215 if (type & KCSAN_ACCESS_ASSERT) {
216 if (type & KCSAN_ACCESS_SCOPED) {
217 if (type & KCSAN_ACCESS_WRITE)
218 return "assert no accesses (scoped)";
219 else
220 return "assert no writes (scoped)";
221 } else {
222 if (type & KCSAN_ACCESS_WRITE)
223 return "assert no accesses";
224 else
225 return "assert no writes";
226 }
227 }
228
Marco Elver47144ec2020-01-10 19:48:33 +0100229 switch (type) {
230 case 0:
231 return "read";
232 case KCSAN_ACCESS_ATOMIC:
233 return "read (marked)";
234 case KCSAN_ACCESS_WRITE:
235 return "write";
236 case KCSAN_ACCESS_WRITE | KCSAN_ACCESS_ATOMIC:
237 return "write (marked)";
Marco Elver14e2ac82020-07-24 09:00:01 +0200238 case KCSAN_ACCESS_COMPOUND | KCSAN_ACCESS_WRITE:
239 return "read-write";
240 case KCSAN_ACCESS_COMPOUND | KCSAN_ACCESS_WRITE | KCSAN_ACCESS_ATOMIC:
241 return "read-write (marked)";
Marco Elver757a4ce2020-03-25 17:41:56 +0100242 case KCSAN_ACCESS_SCOPED:
243 return "read (scoped)";
244 case KCSAN_ACCESS_SCOPED | KCSAN_ACCESS_ATOMIC:
245 return "read (marked, scoped)";
246 case KCSAN_ACCESS_SCOPED | KCSAN_ACCESS_WRITE:
247 return "write (scoped)";
248 case KCSAN_ACCESS_SCOPED | KCSAN_ACCESS_WRITE | KCSAN_ACCESS_ATOMIC:
249 return "write (marked, scoped)";
Marco Elverd627c532021-08-09 13:25:15 +0200250 case KCSAN_ACCESS_SCOPED | KCSAN_ACCESS_COMPOUND | KCSAN_ACCESS_WRITE:
251 return "read-write (scoped)";
252 case KCSAN_ACCESS_SCOPED | KCSAN_ACCESS_COMPOUND | KCSAN_ACCESS_WRITE | KCSAN_ACCESS_ATOMIC:
253 return "read-write (marked, scoped)";
Marco Elver47144ec2020-01-10 19:48:33 +0100254 default:
255 BUG();
256 }
Marco Elverdfd402a2019-11-14 19:02:54 +0100257}
258
Marco Elverd591ec32020-02-06 16:46:24 +0100259static const char *get_bug_type(int type)
260{
261 return (type & KCSAN_ACCESS_ASSERT) != 0 ? "assert: race" : "data-race";
262}
263
Marco Elverdfd402a2019-11-14 19:02:54 +0100264/* Return thread description: in task or interrupt. */
265static const char *get_thread_desc(int task_id)
266{
267 if (task_id != -1) {
268 static char buf[32]; /* safe: protected by report_lock */
269
270 snprintf(buf, sizeof(buf), "task %i", task_id);
271 return buf;
272 }
273 return "interrupt";
274}
275
276/* Helper to skip KCSAN-related functions in stack-trace. */
Marco Elver135c0872020-03-18 18:38:44 +0100277static int get_stack_skipnr(const unsigned long stack_entries[], int num_entries)
Marco Elverdfd402a2019-11-14 19:02:54 +0100278{
279 char buf[64];
Marco Elvercdb9b072020-04-10 18:44:18 +0200280 char *cur;
281 int len, skip;
Marco Elverdfd402a2019-11-14 19:02:54 +0100282
Marco Elvercdb9b072020-04-10 18:44:18 +0200283 for (skip = 0; skip < num_entries; ++skip) {
Marco Elverf770ed12020-04-10 18:44:17 +0200284 len = scnprintf(buf, sizeof(buf), "%ps", (void *)stack_entries[skip]);
Marco Elvercdb9b072020-04-10 18:44:18 +0200285
286 /* Never show tsan_* or {read,write}_once_size. */
287 if (strnstr(buf, "tsan_", len) ||
288 strnstr(buf, "_once_size", len))
289 continue;
290
291 cur = strnstr(buf, "kcsan_", len);
292 if (cur) {
Marco Elvera4e74fa2020-07-31 10:17:20 +0200293 cur += strlen("kcsan_");
294 if (!str_has_prefix(cur, "test"))
Marco Elvercdb9b072020-04-10 18:44:18 +0200295 continue; /* KCSAN runtime function. */
296 /* KCSAN related test. */
297 }
298
299 /*
300 * No match for runtime functions -- @skip entries to skip to
301 * get to first frame of interest.
302 */
303 break;
Marco Elverdfd402a2019-11-14 19:02:54 +0100304 }
Marco Elvercdb9b072020-04-10 18:44:18 +0200305
Marco Elverdfd402a2019-11-14 19:02:54 +0100306 return skip;
307}
308
Marco Elver6c65eb72021-08-09 13:25:14 +0200309/*
310 * Skips to the first entry that matches the function of @ip, and then replaces
311 * that entry with @ip, returning the entries to skip.
312 */
313static int
314replace_stack_entry(unsigned long stack_entries[], int num_entries, unsigned long ip)
315{
316 unsigned long symbolsize, offset;
317 unsigned long target_func;
318 int skip;
319
320 if (kallsyms_lookup_size_offset(ip, &symbolsize, &offset))
321 target_func = ip - offset;
322 else
323 goto fallback;
324
325 for (skip = 0; skip < num_entries; ++skip) {
326 unsigned long func = stack_entries[skip];
327
328 if (!kallsyms_lookup_size_offset(func, &symbolsize, &offset))
329 goto fallback;
330 func -= offset;
331
332 if (func == target_func) {
333 stack_entries[skip] = ip;
334 return skip;
335 }
336 }
337
338fallback:
339 /* Should not happen; the resulting stack trace is likely misleading. */
340 WARN_ONCE(1, "Cannot find frame for %pS in stack trace", (void *)ip);
341 return get_stack_skipnr(stack_entries, num_entries);
342}
343
344static int
345sanitize_stack_entries(unsigned long stack_entries[], int num_entries, unsigned long ip)
346{
347 return ip ? replace_stack_entry(stack_entries, num_entries, ip) :
348 get_stack_skipnr(stack_entries, num_entries);
349}
350
Marco Elverdfd402a2019-11-14 19:02:54 +0100351/* Compares symbolized strings of addr1 and addr2. */
352static int sym_strcmp(void *addr1, void *addr2)
353{
354 char buf1[64];
355 char buf2[64];
356
357 snprintf(buf1, sizeof(buf1), "%pS", addr1);
358 snprintf(buf2, sizeof(buf2), "%pS", addr2);
Ingo Molnar5cbaefe2019-11-20 10:41:43 +0100359
Marco Elverdfd402a2019-11-14 19:02:54 +0100360 return strncmp(buf1, buf2, sizeof(buf1));
361}
362
Marco Elver2402d0e2020-02-22 00:10:27 +0100363static void print_verbose_info(struct task_struct *task)
364{
365 if (!task)
366 return;
367
Marco Elver92c209a2020-07-29 13:09:16 +0200368 /* Restore IRQ state trace for printing. */
369 kcsan_restore_irqtrace(task);
370
Marco Elver2402d0e2020-02-22 00:10:27 +0100371 pr_err("\n");
372 debug_show_held_locks(task);
373 print_irqtrace_events(task);
374}
375
Mark Rutland97aa6132021-04-14 13:28:20 +0200376static void print_report(enum kcsan_value_change value_change,
Marco Elver135c0872020-03-18 18:38:44 +0100377 const struct access_info *ai,
Marco Elver6c65eb72021-08-09 13:25:14 +0200378 struct other_info *other_info,
Mark Rutland7bbe6dc2021-04-14 13:28:24 +0200379 u64 old, u64 new, u64 mask)
Marco Elverdfd402a2019-11-14 19:02:54 +0100380{
381 unsigned long stack_entries[NUM_STACK_ENTRIES] = { 0 };
Ingo Molnar5cbaefe2019-11-20 10:41:43 +0100382 int num_stack_entries = stack_trace_save(stack_entries, NUM_STACK_ENTRIES, 1);
Marco Elver6c65eb72021-08-09 13:25:14 +0200383 int skipnr = sanitize_stack_entries(stack_entries, num_stack_entries, ai->ip);
Marco Elver05f9a402020-01-10 19:48:34 +0100384 unsigned long this_frame = stack_entries[skipnr];
385 unsigned long other_frame = 0;
386 int other_skipnr = 0; /* silence uninit warnings */
Marco Elverdfd402a2019-11-14 19:02:54 +0100387
388 /*
389 * Must check report filter rules before starting to print.
390 */
Marco Elverb738f612020-02-11 17:04:21 +0100391 if (skip_report(KCSAN_VALUE_CHANGE_TRUE, stack_entries[skipnr]))
Mark Rutland97aa6132021-04-14 13:28:20 +0200392 return;
Marco Elverdfd402a2019-11-14 19:02:54 +0100393
Mark Rutland609f8092021-04-14 13:28:23 +0200394 if (other_info) {
Marco Elver6c65eb72021-08-09 13:25:14 +0200395 other_skipnr = sanitize_stack_entries(other_info->stack_entries,
396 other_info->num_stack_entries,
397 other_info->ai.ip);
Marco Elver135c0872020-03-18 18:38:44 +0100398 other_frame = other_info->stack_entries[other_skipnr];
Marco Elverdfd402a2019-11-14 19:02:54 +0100399
Ingo Molnar5cbaefe2019-11-20 10:41:43 +0100400 /* @value_change is only known for the other thread */
Marco Elverad4f8ee2020-01-29 16:01:02 +0100401 if (skip_report(value_change, other_frame))
Mark Rutland97aa6132021-04-14 13:28:20 +0200402 return;
Marco Elverdfd402a2019-11-14 19:02:54 +0100403 }
404
Marco Elver05f9a402020-01-10 19:48:34 +0100405 if (rate_limit_report(this_frame, other_frame))
Mark Rutland97aa6132021-04-14 13:28:20 +0200406 return;
Marco Elver05f9a402020-01-10 19:48:34 +0100407
Marco Elverdfd402a2019-11-14 19:02:54 +0100408 /* Print report header. */
409 pr_err("==================================================================\n");
Mark Rutland609f8092021-04-14 13:28:23 +0200410 if (other_info) {
Marco Elverdfd402a2019-11-14 19:02:54 +0100411 int cmp;
412
413 /*
414 * Order functions lexographically for consistent bug titles.
415 * Do not print offset of functions to keep title short.
416 */
Marco Elver05f9a402020-01-10 19:48:34 +0100417 cmp = sym_strcmp((void *)other_frame, (void *)this_frame);
Marco Elverd591ec32020-02-06 16:46:24 +0100418 pr_err("BUG: KCSAN: %s in %ps / %ps\n",
Marco Elver135c0872020-03-18 18:38:44 +0100419 get_bug_type(ai->access_type | other_info->ai.access_type),
Marco Elver05f9a402020-01-10 19:48:34 +0100420 (void *)(cmp < 0 ? other_frame : this_frame),
421 (void *)(cmp < 0 ? this_frame : other_frame));
Mark Rutland609f8092021-04-14 13:28:23 +0200422 } else {
Marco Elver135c0872020-03-18 18:38:44 +0100423 pr_err("BUG: KCSAN: %s in %pS\n", get_bug_type(ai->access_type),
Marco Elverd591ec32020-02-06 16:46:24 +0100424 (void *)this_frame);
Marco Elverdfd402a2019-11-14 19:02:54 +0100425 }
426
427 pr_err("\n");
428
429 /* Print information about the racing accesses. */
Mark Rutland609f8092021-04-14 13:28:23 +0200430 if (other_info) {
Marco Elverdfd402a2019-11-14 19:02:54 +0100431 pr_err("%s to 0x%px of %zu bytes by %s on cpu %i:\n",
Marco Elver135c0872020-03-18 18:38:44 +0100432 get_access_type(other_info->ai.access_type), other_info->ai.ptr,
433 other_info->ai.size, get_thread_desc(other_info->ai.task_pid),
434 other_info->ai.cpu_id);
Marco Elverdfd402a2019-11-14 19:02:54 +0100435
436 /* Print the other thread's stack trace. */
Marco Elver135c0872020-03-18 18:38:44 +0100437 stack_trace_print(other_info->stack_entries + other_skipnr,
438 other_info->num_stack_entries - other_skipnr,
Marco Elverdfd402a2019-11-14 19:02:54 +0100439 0);
440
Marco Elver2402d0e2020-02-22 00:10:27 +0100441 if (IS_ENABLED(CONFIG_KCSAN_VERBOSE))
Marco Elver135c0872020-03-18 18:38:44 +0100442 print_verbose_info(other_info->task);
Marco Elver2402d0e2020-02-22 00:10:27 +0100443
Marco Elverdfd402a2019-11-14 19:02:54 +0100444 pr_err("\n");
445 pr_err("%s to 0x%px of %zu bytes by %s on cpu %i:\n",
Marco Elver135c0872020-03-18 18:38:44 +0100446 get_access_type(ai->access_type), ai->ptr, ai->size,
447 get_thread_desc(ai->task_pid), ai->cpu_id);
Mark Rutland609f8092021-04-14 13:28:23 +0200448 } else {
Marco Elverdfd402a2019-11-14 19:02:54 +0100449 pr_err("race at unknown origin, with %s to 0x%px of %zu bytes by %s on cpu %i:\n",
Marco Elver135c0872020-03-18 18:38:44 +0100450 get_access_type(ai->access_type), ai->ptr, ai->size,
451 get_thread_desc(ai->task_pid), ai->cpu_id);
Marco Elverdfd402a2019-11-14 19:02:54 +0100452 }
453 /* Print stack trace of this thread. */
454 stack_trace_print(stack_entries + skipnr, num_stack_entries - skipnr,
455 0);
456
Marco Elver2402d0e2020-02-22 00:10:27 +0100457 if (IS_ENABLED(CONFIG_KCSAN_VERBOSE))
458 print_verbose_info(current);
459
Mark Rutland7bbe6dc2021-04-14 13:28:24 +0200460 /* Print observed value change. */
461 if (ai->size <= 8) {
462 int hex_len = ai->size * 2;
463 u64 diff = old ^ new;
464
465 if (mask)
466 diff &= mask;
467 if (diff) {
468 pr_err("\n");
469 pr_err("value changed: 0x%0*llx -> 0x%0*llx\n",
470 hex_len, old, hex_len, new);
471 if (mask) {
472 pr_err(" bits changed: 0x%0*llx with mask 0x%0*llx\n",
473 hex_len, diff, hex_len, mask);
474 }
475 }
476 }
477
Marco Elverdfd402a2019-11-14 19:02:54 +0100478 /* Print report footer. */
479 pr_err("\n");
480 pr_err("Reported by Kernel Concurrency Sanitizer on:\n");
481 dump_stack_print_info(KERN_DEFAULT);
482 pr_err("==================================================================\n");
483
Mark Rutland97aa6132021-04-14 13:28:20 +0200484 if (panic_on_warn)
485 panic("panic_on_warn set ...\n");
Marco Elverdfd402a2019-11-14 19:02:54 +0100486}
487
Marco Elver135c0872020-03-18 18:38:44 +0100488static void release_report(unsigned long *flags, struct other_info *other_info)
Marco Elverdfd402a2019-11-14 19:02:54 +0100489{
Mark Rutland19dfdc02021-04-14 13:28:22 +0200490 /*
491 * Use size to denote valid/invalid, since KCSAN entirely ignores
492 * 0-sized accesses.
493 */
494 other_info->ai.size = 0;
Marco Elver61194182020-03-18 18:38:45 +0100495 raw_spin_unlock_irqrestore(&report_lock, *flags);
Marco Elverdfd402a2019-11-14 19:02:54 +0100496}
497
498/*
Marco Elver135c0872020-03-18 18:38:44 +0100499 * Sets @other_info->task and awaits consumption of @other_info.
Marco Elver2402d0e2020-02-22 00:10:27 +0100500 *
501 * Precondition: report_lock is held.
502 * Postcondition: report_lock is held.
503 */
Marco Elver135c0872020-03-18 18:38:44 +0100504static void set_other_info_task_blocking(unsigned long *flags,
505 const struct access_info *ai,
506 struct other_info *other_info)
Marco Elver2402d0e2020-02-22 00:10:27 +0100507{
508 /*
509 * We may be instrumenting a code-path where current->state is already
510 * something other than TASK_RUNNING.
511 */
Peter Zijlstrab03fbd42021-06-11 10:28:12 +0200512 const bool is_running = task_is_running(current);
Marco Elver2402d0e2020-02-22 00:10:27 +0100513 /*
514 * To avoid deadlock in case we are in an interrupt here and this is a
515 * race with a task on the same CPU (KCSAN_INTERRUPT_WATCHER), provide a
516 * timeout to ensure this works in all contexts.
517 *
518 * Await approximately the worst case delay of the reporting thread (if
519 * we are not interrupted).
520 */
521 int timeout = max(kcsan_udelay_task, kcsan_udelay_interrupt);
522
Marco Elver135c0872020-03-18 18:38:44 +0100523 other_info->task = current;
Marco Elver2402d0e2020-02-22 00:10:27 +0100524 do {
525 if (is_running) {
526 /*
527 * Let lockdep know the real task is sleeping, to print
528 * the held locks (recall we turned lockdep off, so
529 * locking/unlocking @report_lock won't be recorded).
530 */
531 set_current_state(TASK_UNINTERRUPTIBLE);
532 }
Marco Elver61194182020-03-18 18:38:45 +0100533 raw_spin_unlock_irqrestore(&report_lock, *flags);
Marco Elver2402d0e2020-02-22 00:10:27 +0100534 /*
535 * We cannot call schedule() since we also cannot reliably
536 * determine if sleeping here is permitted -- see in_atomic().
537 */
538
539 udelay(1);
Marco Elver61194182020-03-18 18:38:45 +0100540 raw_spin_lock_irqsave(&report_lock, *flags);
Marco Elver2402d0e2020-02-22 00:10:27 +0100541 if (timeout-- < 0) {
542 /*
Marco Elver135c0872020-03-18 18:38:44 +0100543 * Abort. Reset @other_info->task to NULL, since it
Marco Elver2402d0e2020-02-22 00:10:27 +0100544 * appears the other thread is still going to consume
545 * it. It will result in no verbose info printed for
546 * this task.
547 */
Marco Elver135c0872020-03-18 18:38:44 +0100548 other_info->task = NULL;
Marco Elver2402d0e2020-02-22 00:10:27 +0100549 break;
550 }
551 /*
Marco Elver61194182020-03-18 18:38:45 +0100552 * If invalid, or @ptr nor @current matches, then @other_info
553 * has been consumed and we may continue. If not, retry.
Marco Elver2402d0e2020-02-22 00:10:27 +0100554 */
Marco Elver61194182020-03-18 18:38:45 +0100555 } while (other_info->ai.size && other_info->ai.ptr == ai->ptr &&
556 other_info->task == current);
Marco Elver2402d0e2020-02-22 00:10:27 +0100557 if (is_running)
558 set_current_state(TASK_RUNNING);
559}
560
Marco Elver61194182020-03-18 18:38:45 +0100561/* Populate @other_info; requires that the provided @other_info not in use. */
562static void prepare_report_producer(unsigned long *flags,
563 const struct access_info *ai,
564 struct other_info *other_info)
Marco Elverdfd402a2019-11-14 19:02:54 +0100565{
Marco Elver61194182020-03-18 18:38:45 +0100566 raw_spin_lock_irqsave(&report_lock, *flags);
567
568 /*
569 * The same @other_infos entry cannot be used concurrently, because
570 * there is a one-to-one mapping to watchpoint slots (@watchpoints in
571 * core.c), and a watchpoint is only released for reuse after reporting
572 * is done by the consumer of @other_info. Therefore, it is impossible
573 * for another concurrent prepare_report_producer() to set the same
574 * @other_info, and are guaranteed exclusivity for the @other_infos
575 * entry pointed to by @other_info.
576 *
577 * To check this property holds, size should never be non-zero here,
578 * because every consumer of struct other_info resets size to 0 in
579 * release_report().
580 */
581 WARN_ON(other_info->ai.size);
582
583 other_info->ai = *ai;
584 other_info->num_stack_entries = stack_trace_save(other_info->stack_entries, NUM_STACK_ENTRIES, 2);
585
586 if (IS_ENABLED(CONFIG_KCSAN_VERBOSE))
587 set_other_info_task_blocking(flags, ai, other_info);
588
589 raw_spin_unlock_irqrestore(&report_lock, *flags);
590}
591
592/* Awaits producer to fill @other_info and then returns. */
593static bool prepare_report_consumer(unsigned long *flags,
594 const struct access_info *ai,
595 struct other_info *other_info)
596{
597
598 raw_spin_lock_irqsave(&report_lock, *flags);
599 while (!other_info->ai.size) { /* Await valid @other_info. */
600 raw_spin_unlock_irqrestore(&report_lock, *flags);
601 cpu_relax();
602 raw_spin_lock_irqsave(&report_lock, *flags);
Marco Elverdfd402a2019-11-14 19:02:54 +0100603 }
604
Marco Elver61194182020-03-18 18:38:45 +0100605 /* Should always have a matching access based on watchpoint encoding. */
606 if (WARN_ON(!matching_access((unsigned long)other_info->ai.ptr & WATCHPOINT_ADDR_MASK, other_info->ai.size,
607 (unsigned long)ai->ptr & WATCHPOINT_ADDR_MASK, ai->size)))
608 goto discard;
Marco Elverdfd402a2019-11-14 19:02:54 +0100609
Marco Elver61194182020-03-18 18:38:45 +0100610 if (!matching_access((unsigned long)other_info->ai.ptr, other_info->ai.size,
611 (unsigned long)ai->ptr, ai->size)) {
612 /*
613 * If the actual accesses to not match, this was a false
614 * positive due to watchpoint encoding.
615 */
Marco Elver2e986b82020-08-10 10:06:25 +0200616 atomic_long_inc(&kcsan_counters[KCSAN_COUNTER_ENCODING_FALSE_POSITIVES]);
Marco Elver61194182020-03-18 18:38:45 +0100617 goto discard;
618 }
619
620 return true;
621
622discard:
623 release_report(flags, other_info);
624 return false;
625}
626
Mark Rutland39b2e762021-04-14 13:28:21 +0200627static struct access_info prepare_access_info(const volatile void *ptr, size_t size,
Marco Elver55a55fe2021-08-09 13:25:12 +0200628 int access_type, unsigned long ip)
Marco Elver61194182020-03-18 18:38:45 +0100629{
Mark Rutland39b2e762021-04-14 13:28:21 +0200630 return (struct access_info) {
Marco Elver135c0872020-03-18 18:38:44 +0100631 .ptr = ptr,
632 .size = size,
633 .access_type = access_type,
634 .task_pid = in_task() ? task_pid_nr(current) : -1,
Marco Elver55a55fe2021-08-09 13:25:12 +0200635 .cpu_id = raw_smp_processor_id(),
Marco Elver6c65eb72021-08-09 13:25:14 +0200636 /* Only replace stack entry with @ip if scoped access. */
637 .ip = (access_type & KCSAN_ACCESS_SCOPED) ? ip : 0,
Marco Elver135c0872020-03-18 18:38:44 +0100638 };
Mark Rutland39b2e762021-04-14 13:28:21 +0200639}
640
Mark Rutland793c2572021-04-14 13:28:18 +0200641void kcsan_report_set_info(const volatile void *ptr, size_t size, int access_type,
Marco Elver55a55fe2021-08-09 13:25:12 +0200642 unsigned long ip, int watchpoint_idx)
Mark Rutland793c2572021-04-14 13:28:18 +0200643{
Marco Elver55a55fe2021-08-09 13:25:12 +0200644 const struct access_info ai = prepare_access_info(ptr, size, access_type, ip);
Mark Rutland19dfdc02021-04-14 13:28:22 +0200645 unsigned long flags;
Marco Elver61194182020-03-18 18:38:45 +0100646
647 kcsan_disable_current();
Mark Rutland19dfdc02021-04-14 13:28:22 +0200648 lockdep_off(); /* See kcsan_report_known_origin(). */
Marco Elverdfd402a2019-11-14 19:02:54 +0100649
Mark Rutland19dfdc02021-04-14 13:28:22 +0200650 prepare_report_producer(&flags, &ai, &other_infos[watchpoint_idx]);
651
652 lockdep_on();
653 kcsan_enable_current();
Mark Rutland793c2572021-04-14 13:28:18 +0200654}
655
656void kcsan_report_known_origin(const volatile void *ptr, size_t size, int access_type,
Marco Elver55a55fe2021-08-09 13:25:12 +0200657 unsigned long ip, enum kcsan_value_change value_change,
658 int watchpoint_idx, u64 old, u64 new, u64 mask)
Mark Rutland793c2572021-04-14 13:28:18 +0200659{
Marco Elver55a55fe2021-08-09 13:25:12 +0200660 const struct access_info ai = prepare_access_info(ptr, size, access_type, ip);
Mark Rutland19dfdc02021-04-14 13:28:22 +0200661 struct other_info *other_info = &other_infos[watchpoint_idx];
662 unsigned long flags = 0;
Mark Rutland39b2e762021-04-14 13:28:21 +0200663
Mark Rutland19dfdc02021-04-14 13:28:22 +0200664 kcsan_disable_current();
Marco Elverf1bc9622020-01-15 17:25:12 +0100665 /*
Marco Elver248591f2020-06-24 13:32:46 +0200666 * Because we may generate reports when we're in scheduler code, the use
667 * of printk() could deadlock. Until such time that all printing code
668 * called in print_report() is scheduler-safe, accept the risk, and just
669 * get our message out. As such, also disable lockdep to hide the
670 * warning, and avoid disabling lockdep for the rest of the kernel.
Marco Elverf1bc9622020-01-15 17:25:12 +0100671 */
672 lockdep_off();
673
Mark Rutland19dfdc02021-04-14 13:28:22 +0200674 if (!prepare_report_consumer(&flags, &ai, other_info))
675 goto out;
676 /*
677 * Never report if value_change is FALSE, only when it is
678 * either TRUE or MAYBE. In case of MAYBE, further filtering may
679 * be done once we know the full stack trace in print_report().
680 */
681 if (value_change != KCSAN_VALUE_CHANGE_FALSE)
Mark Rutland7bbe6dc2021-04-14 13:28:24 +0200682 print_report(value_change, &ai, other_info, old, new, mask);
Marco Elver81af89e2020-02-11 17:04:22 +0100683
Mark Rutland19dfdc02021-04-14 13:28:22 +0200684 release_report(&flags, other_info);
685out:
686 lockdep_on();
687 kcsan_enable_current();
Mark Rutland793c2572021-04-14 13:28:18 +0200688}
Marco Elverdfd402a2019-11-14 19:02:54 +0100689
Mark Rutland7bbe6dc2021-04-14 13:28:24 +0200690void kcsan_report_unknown_origin(const volatile void *ptr, size_t size, int access_type,
Marco Elver55a55fe2021-08-09 13:25:12 +0200691 unsigned long ip, u64 old, u64 new, u64 mask)
Mark Rutland793c2572021-04-14 13:28:18 +0200692{
Marco Elver55a55fe2021-08-09 13:25:12 +0200693 const struct access_info ai = prepare_access_info(ptr, size, access_type, ip);
Mark Rutland19dfdc02021-04-14 13:28:22 +0200694 unsigned long flags;
Mark Rutland39b2e762021-04-14 13:28:21 +0200695
Mark Rutland19dfdc02021-04-14 13:28:22 +0200696 kcsan_disable_current();
697 lockdep_off(); /* See kcsan_report_known_origin(). */
698
699 raw_spin_lock_irqsave(&report_lock, flags);
Mark Rutland7bbe6dc2021-04-14 13:28:24 +0200700 print_report(KCSAN_VALUE_CHANGE_TRUE, &ai, NULL, old, new, mask);
Mark Rutland19dfdc02021-04-14 13:28:22 +0200701 raw_spin_unlock_irqrestore(&report_lock, flags);
Marco Elverf1bc9622020-01-15 17:25:12 +0100702
703 lockdep_on();
Marco Elver61194182020-03-18 18:38:45 +0100704 kcsan_enable_current();
Marco Elverdfd402a2019-11-14 19:02:54 +0100705}