blob: b8d7a663497f9e9ea65507469a25fd5f252330bc [file] [log] [blame]
Thomas Gleixnerb886d83c2019-06-01 10:08:55 +02001// SPDX-License-Identifier: GPL-2.0-only
Arjan van de Ven22a9d642009-01-07 08:45:46 -08002/*
3 * async.c: Asynchronous function calls for boot performance
4 *
5 * (C) Copyright 2009 Intel Corporation
6 * Author: Arjan van de Ven <arjan@linux.intel.com>
Arjan van de Ven22a9d642009-01-07 08:45:46 -08007 */
8
9
10/*
11
12Goals and Theory of Operation
13
14The primary goal of this feature is to reduce the kernel boot time,
15by doing various independent hardware delays and discovery operations
16decoupled and not strictly serialized.
17
18More specifically, the asynchronous function call concept allows
19certain operations (primarily during system boot) to happen
20asynchronously, out of order, while these operations still
21have their externally visible parts happen sequentially and in-order.
22(not unlike how out-of-order CPUs retire their instructions in order)
23
24Key to the asynchronous function call implementation is the concept of
25a "sequence cookie" (which, although it has an abstracted type, can be
26thought of as a monotonically incrementing number).
27
28The async core will assign each scheduled event such a sequence cookie and
29pass this to the called functions.
30
Before doing a globally visible operation, such as registering device
numbers, the asynchronously called function should call the
async_synchronize_cookie() function and pass in its own cookie. The
async_synchronize_cookie() function will make sure that all asynchronous
operations that were scheduled prior to the operation corresponding with the
cookie have completed.
37
Subsystem/driver initialization code that scheduled asynchronous probe
functions, but which shares global resources with other drivers/subsystems
that do not use the asynchronous call feature, needs to do a full
synchronization with the async_synchronize_full() function before returning
from its init function. This is to maintain strict ordering between the
asynchronous and synchronous parts of the kernel.
44
45*/
46
47#include <linux/async.h>
Paul McQuade84c15022011-05-31 20:51:55 +010048#include <linux/atomic.h>
49#include <linux/ktime.h>
Paul Gortmaker9984de12011-05-23 14:51:41 -040050#include <linux/export.h>
Arjan van de Ven22a9d642009-01-07 08:45:46 -080051#include <linux/wait.h>
52#include <linux/sched.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090053#include <linux/slab.h>
Tejun Heo083b8042010-07-02 10:03:52 +020054#include <linux/workqueue.h>
Arjan van de Ven22a9d642009-01-07 08:45:46 -080055
Tejun Heo84b233a2013-01-18 14:05:56 -080056#include "workqueue_internal.h"
57
/* Next cookie to hand out; read and incremented while holding async_lock. */
static async_cookie_t next_cookie = 1;

/* entry_count value above which new work is run synchronously instead. */
#define MAX_WORK 32768
#define ASYNC_COOKIE_MAX ULLONG_MAX /* infinity cookie */

static LIST_HEAD(async_global_pending); /* pending from all registered doms */
/* Domain used by the entry points in this file that take no domain argument. */
static ASYNC_DOMAIN(async_dfl_domain);
/* Held around every pending-list and next_cookie access in this file. */
static DEFINE_SPINLOCK(async_lock);
66
/*
 * One scheduled asynchronous call. Allocated when the call is scheduled
 * and freed by async_run_entry_fn() once the callback has returned.
 */
struct async_entry {
	struct list_head domain_list;	/* link in the owning domain's ->pending list */
	struct list_head global_list;	/* link in async_global_pending (registered domains only) */
	struct work_struct work;	/* work item handed to the workqueue */
	async_cookie_t cookie;		/* sequence cookie assigned at schedule time */
	async_func_t func;		/* callback to invoke */
	void *data;			/* opaque argument passed to func */
	struct async_domain *domain;	/* domain the entry was scheduled in */
};
76
/* Synchronizing callers wait here; woken each time an entry finishes. */
static DECLARE_WAIT_QUEUE_HEAD(async_done);

/* Number of entries currently queued or running; compared against MAX_WORK. */
static atomic_t entry_count;
Arjan van de Ven22a9d642009-01-07 08:45:46 -080080
Rasmus Villemoes07416af2021-05-06 18:05:36 -070081static long long microseconds_since(ktime_t start)
82{
83 ktime_t now = ktime_get();
84 return ktime_to_ns(ktime_sub(now, start)) >> 10;
85}
86
Tejun Heo8723d5032013-01-23 09:32:30 -080087static async_cookie_t lowest_in_progress(struct async_domain *domain)
Arjan van de Ven37a76bd2009-01-11 15:35:01 +000088{
Rasmus Villemoes4f7e9882018-02-06 15:37:55 -080089 struct async_entry *first = NULL;
Tejun Heo52722792013-01-23 09:32:30 -080090 async_cookie_t ret = ASYNC_COOKIE_MAX;
Arjan van de Ven37a76bd2009-01-11 15:35:01 +000091 unsigned long flags;
Arjan van de Ven37a76bd2009-01-11 15:35:01 +000092
93 spin_lock_irqsave(&async_lock, flags);
Tejun Heo9fdb04c2013-01-23 09:32:30 -080094
Rasmus Villemoes4f7e9882018-02-06 15:37:55 -080095 if (domain) {
96 if (!list_empty(&domain->pending))
97 first = list_first_entry(&domain->pending,
98 struct async_entry, domain_list);
99 } else {
100 if (!list_empty(&async_global_pending))
101 first = list_first_entry(&async_global_pending,
102 struct async_entry, global_list);
103 }
Tejun Heo9fdb04c2013-01-23 09:32:30 -0800104
Rasmus Villemoes4f7e9882018-02-06 15:37:55 -0800105 if (first)
106 ret = first->cookie;
Tejun Heo9fdb04c2013-01-23 09:32:30 -0800107
Arjan van de Ven37a76bd2009-01-11 15:35:01 +0000108 spin_unlock_irqrestore(&async_lock, flags);
109 return ret;
110}
Tejun Heo083b8042010-07-02 10:03:52 +0200111
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800112/*
113 * pick the first pending entry and run it
114 */
Tejun Heo083b8042010-07-02 10:03:52 +0200115static void async_run_entry_fn(struct work_struct *work)
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800116{
Tejun Heo083b8042010-07-02 10:03:52 +0200117 struct async_entry *entry =
118 container_of(work, struct async_entry, work);
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800119 unsigned long flags;
Rasmus Villemoes07416af2021-05-06 18:05:36 -0700120 ktime_t calltime;
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800121
Tejun Heo52722792013-01-23 09:32:30 -0800122 /* 1) run (and print duration) */
Rasmus Villemoes07416af2021-05-06 18:05:36 -0700123 pr_debug("calling %lli_%pS @ %i\n", (long long)entry->cookie,
124 entry->func, task_pid_nr(current));
125 calltime = ktime_get();
126
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800127 entry->func(entry->data, entry->cookie);
Rasmus Villemoes07416af2021-05-06 18:05:36 -0700128
129 pr_debug("initcall %lli_%pS returned after %lld usecs\n",
130 (long long)entry->cookie, entry->func,
131 microseconds_since(calltime));
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800132
Tejun Heo52722792013-01-23 09:32:30 -0800133 /* 2) remove self from the pending queues */
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800134 spin_lock_irqsave(&async_lock, flags);
Tejun Heo9fdb04c2013-01-23 09:32:30 -0800135 list_del_init(&entry->domain_list);
136 list_del_init(&entry->global_list);
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800137
Tejun Heo52722792013-01-23 09:32:30 -0800138 /* 3) free the entry */
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800139 kfree(entry);
140 atomic_dec(&entry_count);
141
142 spin_unlock_irqrestore(&async_lock, flags);
143
Tejun Heo52722792013-01-23 09:32:30 -0800144 /* 4) wake up any waiters */
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800145 wake_up(&async_done);
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800146}
147
Alexander Duyck6be92382019-01-22 10:39:31 -0800148/**
149 * async_schedule_node_domain - NUMA specific version of async_schedule_domain
150 * @func: function to execute asynchronously
151 * @data: data pointer to pass to the function
152 * @node: NUMA node that we want to schedule this on or close to
153 * @domain: the domain
154 *
155 * Returns an async_cookie_t that may be used for checkpointing later.
156 * @domain may be used in the async_synchronize_*_domain() functions to
157 * wait within a certain synchronization domain rather than globally.
158 *
159 * Note: This function may be called from atomic or non-atomic contexts.
160 *
161 * The node requested will be honored on a best effort basis. If the node
162 * has no CPUs associated with it then the work is distributed among all
163 * available CPUs.
164 */
165async_cookie_t async_schedule_node_domain(async_func_t func, void *data,
166 int node, struct async_domain *domain)
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800167{
168 struct async_entry *entry;
169 unsigned long flags;
170 async_cookie_t newcookie;
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800171
172 /* allow irq-off callers */
173 entry = kzalloc(sizeof(struct async_entry), GFP_ATOMIC);
174
175 /*
176 * If we're out of memory or if there's too much work
177 * pending already, we execute synchronously.
178 */
Tejun Heo083b8042010-07-02 10:03:52 +0200179 if (!entry || atomic_read(&entry_count) > MAX_WORK) {
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800180 kfree(entry);
181 spin_lock_irqsave(&async_lock, flags);
182 newcookie = next_cookie++;
183 spin_unlock_irqrestore(&async_lock, flags);
184
185 /* low on memory.. run synchronously */
Lai Jiangshan362f2b02013-03-12 13:59:14 -0700186 func(data, newcookie);
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800187 return newcookie;
188 }
James Hogana0327ff2013-01-25 10:13:59 +0000189 INIT_LIST_HEAD(&entry->domain_list);
190 INIT_LIST_HEAD(&entry->global_list);
Tejun Heo083b8042010-07-02 10:03:52 +0200191 INIT_WORK(&entry->work, async_run_entry_fn);
Lai Jiangshan362f2b02013-03-12 13:59:14 -0700192 entry->func = func;
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800193 entry->data = data;
Tejun Heo8723d5032013-01-23 09:32:30 -0800194 entry->domain = domain;
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800195
196 spin_lock_irqsave(&async_lock, flags);
Tejun Heo9fdb04c2013-01-23 09:32:30 -0800197
198 /* allocate cookie and queue */
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800199 newcookie = entry->cookie = next_cookie++;
Tejun Heo9fdb04c2013-01-23 09:32:30 -0800200
201 list_add_tail(&entry->domain_list, &domain->pending);
202 if (domain->registered)
203 list_add_tail(&entry->global_list, &async_global_pending);
204
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800205 atomic_inc(&entry_count);
206 spin_unlock_irqrestore(&async_lock, flags);
Tejun Heo083b8042010-07-02 10:03:52 +0200207
Tejun Heo774a1222013-01-15 18:52:51 -0800208 /* mark that this task has queued an async job, used by module init */
209 current->flags |= PF_USED_ASYNC;
210
Tejun Heo083b8042010-07-02 10:03:52 +0200211 /* schedule for execution */
Alexander Duyck6be92382019-01-22 10:39:31 -0800212 queue_work_node(node, system_unbound_wq, &entry->work);
Tejun Heo083b8042010-07-02 10:03:52 +0200213
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800214 return newcookie;
215}
Alexander Duyck6be92382019-01-22 10:39:31 -0800216EXPORT_SYMBOL_GPL(async_schedule_node_domain);
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800217
Cornelia Huckf30d5b32009-01-19 13:45:33 +0100218/**
Alexander Duyck6be92382019-01-22 10:39:31 -0800219 * async_schedule_node - NUMA specific version of async_schedule
Lai Jiangshan362f2b02013-03-12 13:59:14 -0700220 * @func: function to execute asynchronously
Cornelia Huckf30d5b32009-01-19 13:45:33 +0100221 * @data: data pointer to pass to the function
Alexander Duyck6be92382019-01-22 10:39:31 -0800222 * @node: NUMA node that we want to schedule this on or close to
Cornelia Huckf30d5b32009-01-19 13:45:33 +0100223 *
224 * Returns an async_cookie_t that may be used for checkpointing later.
225 * Note: This function may be called from atomic or non-atomic contexts.
Cornelia Huckf30d5b32009-01-19 13:45:33 +0100226 *
Alexander Duyck6be92382019-01-22 10:39:31 -0800227 * The node requested will be honored on a best effort basis. If the node
228 * has no CPUs associated with it then the work is distributed among all
229 * available CPUs.
Cornelia Huckf30d5b32009-01-19 13:45:33 +0100230 */
Alexander Duyck6be92382019-01-22 10:39:31 -0800231async_cookie_t async_schedule_node(async_func_t func, void *data, int node)
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800232{
Alexander Duyck6be92382019-01-22 10:39:31 -0800233 return async_schedule_node_domain(func, data, node, &async_dfl_domain);
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800234}
Alexander Duyck6be92382019-01-22 10:39:31 -0800235EXPORT_SYMBOL_GPL(async_schedule_node);
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800236
Cornelia Huckf30d5b32009-01-19 13:45:33 +0100237/**
238 * async_synchronize_full - synchronize all asynchronous function calls
239 *
240 * This function waits until all asynchronous function calls have been done.
241 */
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800242void async_synchronize_full(void)
243{
Tejun Heo9fdb04c2013-01-23 09:32:30 -0800244 async_synchronize_full_domain(NULL);
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800245}
246EXPORT_SYMBOL_GPL(async_synchronize_full);
247
Cornelia Huckf30d5b32009-01-19 13:45:33 +0100248/**
Cornelia Huck766ccb92009-01-20 15:31:31 +0100249 * async_synchronize_full_domain - synchronize all asynchronous function within a certain domain
Tejun Heo8723d5032013-01-23 09:32:30 -0800250 * @domain: the domain to synchronize
Cornelia Huckf30d5b32009-01-19 13:45:33 +0100251 *
Cornelia Huck766ccb92009-01-20 15:31:31 +0100252 * This function waits until all asynchronous function calls for the
Tejun Heo8723d5032013-01-23 09:32:30 -0800253 * synchronization domain specified by @domain have been done.
Cornelia Huckf30d5b32009-01-19 13:45:33 +0100254 */
Dan Williams2955b472012-07-09 19:33:25 -0700255void async_synchronize_full_domain(struct async_domain *domain)
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800256{
Tejun Heoc68eee12013-01-23 09:32:30 -0800257 async_synchronize_cookie_domain(ASYNC_COOKIE_MAX, domain);
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800258}
Cornelia Huck766ccb92009-01-20 15:31:31 +0100259EXPORT_SYMBOL_GPL(async_synchronize_full_domain);
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800260
Cornelia Huckf30d5b32009-01-19 13:45:33 +0100261/**
Cornelia Huck766ccb92009-01-20 15:31:31 +0100262 * async_synchronize_cookie_domain - synchronize asynchronous function calls within a certain domain with cookie checkpointing
Cornelia Huckf30d5b32009-01-19 13:45:33 +0100263 * @cookie: async_cookie_t to use as checkpoint
Tejun Heo9fdb04c2013-01-23 09:32:30 -0800264 * @domain: the domain to synchronize (%NULL for all registered domains)
Cornelia Huckf30d5b32009-01-19 13:45:33 +0100265 *
Cornelia Huck766ccb92009-01-20 15:31:31 +0100266 * This function waits until all asynchronous function calls for the
Tejun Heo8723d5032013-01-23 09:32:30 -0800267 * synchronization domain specified by @domain submitted prior to @cookie
268 * have been done.
Cornelia Huckf30d5b32009-01-19 13:45:33 +0100269 */
Tejun Heo8723d5032013-01-23 09:32:30 -0800270void async_synchronize_cookie_domain(async_cookie_t cookie, struct async_domain *domain)
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800271{
Rasmus Villemoes07416af2021-05-06 18:05:36 -0700272 ktime_t starttime;
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800273
Rasmus Villemoes07416af2021-05-06 18:05:36 -0700274 pr_debug("async_waiting @ %i\n", task_pid_nr(current));
275 starttime = ktime_get();
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800276
Tejun Heo8723d5032013-01-23 09:32:30 -0800277 wait_event(async_done, lowest_in_progress(domain) >= cookie);
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800278
Rasmus Villemoes07416af2021-05-06 18:05:36 -0700279 pr_debug("async_continuing @ %i after %lli usec\n", task_pid_nr(current),
280 microseconds_since(starttime));
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800281}
Cornelia Huck766ccb92009-01-20 15:31:31 +0100282EXPORT_SYMBOL_GPL(async_synchronize_cookie_domain);
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800283
Cornelia Huckf30d5b32009-01-19 13:45:33 +0100284/**
285 * async_synchronize_cookie - synchronize asynchronous function calls with cookie checkpointing
286 * @cookie: async_cookie_t to use as checkpoint
287 *
288 * This function waits until all asynchronous function calls prior to @cookie
289 * have been done.
290 */
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800291void async_synchronize_cookie(async_cookie_t cookie)
292{
Tejun Heo8723d5032013-01-23 09:32:30 -0800293 async_synchronize_cookie_domain(cookie, &async_dfl_domain);
Arjan van de Ven22a9d642009-01-07 08:45:46 -0800294}
295EXPORT_SYMBOL_GPL(async_synchronize_cookie);
Tejun Heo84b233a2013-01-18 14:05:56 -0800296
297/**
298 * current_is_async - is %current an async worker task?
299 *
300 * Returns %true if %current is an async worker task.
301 */
302bool current_is_async(void)
303{
304 struct worker *worker = current_wq_worker();
305
306 return worker && worker->current_func == async_run_entry_fn;
307}
Lukas Wunner581da2c2015-11-19 16:31:11 +0100308EXPORT_SYMBOL_GPL(current_is_async);