blob: 0101aeef7ed79fbd62aba8d1043976a110cf1f6e [file] [log] [blame]
Rusty Russelle5582ca2006-09-29 02:01:35 -07001/* Copyright 2005 Rusty Russell rusty@rustcorp.com.au IBM Corporation.
2 * GPL v2 and any later version.
3 */
Linus Torvalds1da177e2005-04-16 15:20:36 -07004#include <linux/cpu.h>
5#include <linux/err.h>
Prarit Bhargavaee527cd2007-05-08 00:25:08 -07006#include <linux/kthread.h>
7#include <linux/module.h>
8#include <linux/sched.h>
9#include <linux/stop_machine.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070010#include <linux/syscalls.h>
Benjamin Herrenschmidta12bb442007-05-10 22:22:47 -070011#include <linux/interrupt.h>
12
Linus Torvalds1da177e2005-04-16 15:20:36 -070013#include <asm/atomic.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070014#include <asm/uaccess.h>
15
/* Since we affect priority and affinity (both of which are visible
 * to, and settable by, outside processes) we do indirection via a
 * kthread. */
19
20/* Thread to stop each CPU in user context. */
/*
 * Phases the coordinating thread requests from the per-CPU stopper
 * threads.  The enumerators keep their default values (0..3, in
 * declaration order).
 */
enum stopmachine_state {
	STOPMACHINE_WAIT = 0,		/* initial phase set by stop_machine() */
	STOPMACHINE_PREPARE,		/* stoppers disable preemption */
	STOPMACHINE_DISABLE_IRQ,	/* stoppers disable interrupts */
	STOPMACHINE_EXIT,		/* stoppers leave their loop and return */
};
27
28static enum stopmachine_state stopmachine_state;
29static unsigned int stopmachine_num_threads;
30static atomic_t stopmachine_thread_ack;
Linus Torvalds1da177e2005-04-16 15:20:36 -070031
Andrew Mortond8cb7c12006-07-03 17:32:22 -070032static int stopmachine(void *cpu)
Linus Torvalds1da177e2005-04-16 15:20:36 -070033{
34 int irqs_disabled = 0;
35 int prepared = 0;
36
Mike Travisf70316d2008-04-04 18:11:06 -070037 set_cpus_allowed_ptr(current, &cpumask_of_cpu((int)(long)cpu));
Andrew Mortond8cb7c12006-07-03 17:32:22 -070038
Linus Torvalds1da177e2005-04-16 15:20:36 -070039 /* Ack: we are alive */
akpm@osdl.orgd59dd462005-05-01 08:58:47 -070040 smp_mb(); /* Theoretically the ack = 0 might not be on this CPU yet. */
Linus Torvalds1da177e2005-04-16 15:20:36 -070041 atomic_inc(&stopmachine_thread_ack);
42
43 /* Simple state machine */
44 while (stopmachine_state != STOPMACHINE_EXIT) {
45 if (stopmachine_state == STOPMACHINE_DISABLE_IRQ
46 && !irqs_disabled) {
47 local_irq_disable();
Benjamin Herrenschmidta12bb442007-05-10 22:22:47 -070048 hard_irq_disable();
Linus Torvalds1da177e2005-04-16 15:20:36 -070049 irqs_disabled = 1;
50 /* Ack: irqs disabled. */
akpm@osdl.orgd59dd462005-05-01 08:58:47 -070051 smp_mb(); /* Must read state first. */
Linus Torvalds1da177e2005-04-16 15:20:36 -070052 atomic_inc(&stopmachine_thread_ack);
53 } else if (stopmachine_state == STOPMACHINE_PREPARE
54 && !prepared) {
55 /* Everyone is in place, hold CPU. */
56 preempt_disable();
57 prepared = 1;
akpm@osdl.orgd59dd462005-05-01 08:58:47 -070058 smp_mb(); /* Must read state first. */
Linus Torvalds1da177e2005-04-16 15:20:36 -070059 atomic_inc(&stopmachine_thread_ack);
60 }
61 /* Yield in first stage: migration threads need to
62 * help our sisters onto their CPUs. */
63 if (!prepared && !irqs_disabled)
64 yield();
65 else
66 cpu_relax();
67 }
68
69 /* Ack: we are exiting. */
akpm@osdl.orgd59dd462005-05-01 08:58:47 -070070 smp_mb(); /* Must read state first. */
Linus Torvalds1da177e2005-04-16 15:20:36 -070071 atomic_inc(&stopmachine_thread_ack);
72
73 if (irqs_disabled)
74 local_irq_enable();
75 if (prepared)
76 preempt_enable();
77
78 return 0;
79}
80
81/* Change the thread state */
82static void stopmachine_set_state(enum stopmachine_state state)
83{
84 atomic_set(&stopmachine_thread_ack, 0);
akpm@osdl.orgd59dd462005-05-01 08:58:47 -070085 smp_wmb();
Linus Torvalds1da177e2005-04-16 15:20:36 -070086 stopmachine_state = state;
87 while (atomic_read(&stopmachine_thread_ack) != stopmachine_num_threads)
88 cpu_relax();
89}
90
91static int stop_machine(void)
92{
Andrew Mortond8cb7c12006-07-03 17:32:22 -070093 int i, ret = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -070094
95 atomic_set(&stopmachine_thread_ack, 0);
96 stopmachine_num_threads = 0;
97 stopmachine_state = STOPMACHINE_WAIT;
98
99 for_each_online_cpu(i) {
Ingo Molnar39c715b2005-06-21 17:14:34 -0700100 if (i == raw_smp_processor_id())
Linus Torvalds1da177e2005-04-16 15:20:36 -0700101 continue;
Andrew Mortond8cb7c12006-07-03 17:32:22 -0700102 ret = kernel_thread(stopmachine, (void *)(long)i,CLONE_KERNEL);
103 if (ret < 0)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700104 break;
105 stopmachine_num_threads++;
106 }
107
108 /* Wait for them all to come to life. */
109 while (atomic_read(&stopmachine_thread_ack) != stopmachine_num_threads)
110 yield();
111
112 /* If some failed, kill them all. */
113 if (ret < 0) {
114 stopmachine_set_state(STOPMACHINE_EXIT);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700115 return ret;
116 }
117
Linus Torvalds1da177e2005-04-16 15:20:36 -0700118 /* Now they are all started, make them hold the CPUs, ready. */
Kirill Korotaev45573982005-11-13 16:07:30 -0800119 preempt_disable();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700120 stopmachine_set_state(STOPMACHINE_PREPARE);
121
122 /* Make them disable irqs. */
Kirill Korotaev45573982005-11-13 16:07:30 -0800123 local_irq_disable();
Benjamin Herrenschmidta12bb442007-05-10 22:22:47 -0700124 hard_irq_disable();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700125 stopmachine_set_state(STOPMACHINE_DISABLE_IRQ);
126
127 return 0;
128}
129
130static void restart_machine(void)
131{
132 stopmachine_set_state(STOPMACHINE_EXIT);
133 local_irq_enable();
Kirill Korotaev45573982005-11-13 16:07:30 -0800134 preempt_enable_no_resched();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700135}
136
Pavel Machekf5264482008-04-21 22:15:06 +0000137struct stop_machine_data {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700138 int (*fn)(void *);
139 void *data;
140 struct completion done;
141};
142
143static int do_stop(void *_smdata)
144{
145 struct stop_machine_data *smdata = _smdata;
146 int ret;
147
148 ret = stop_machine();
149 if (ret == 0) {
150 ret = smdata->fn(smdata->data);
151 restart_machine();
152 }
153
154 /* We're done: you can kthread_stop us now */
155 complete(&smdata->done);
156
157 /* Wait for kthread_stop */
158 set_current_state(TASK_INTERRUPTIBLE);
159 while (!kthread_should_stop()) {
160 schedule();
161 set_current_state(TASK_INTERRUPTIBLE);
162 }
163 __set_current_state(TASK_RUNNING);
164 return ret;
165}
166
167struct task_struct *__stop_machine_run(int (*fn)(void *), void *data,
168 unsigned int cpu)
169{
Daniel Walker6c6080f2008-02-06 01:37:41 -0800170 static DEFINE_MUTEX(stopmachine_mutex);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700171 struct stop_machine_data smdata;
172 struct task_struct *p;
173
174 smdata.fn = fn;
175 smdata.data = data;
176 init_completion(&smdata.done);
177
Daniel Walker6c6080f2008-02-06 01:37:41 -0800178 mutex_lock(&stopmachine_mutex);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700179
180 /* If they don't care which CPU fn runs on, bind to any online one. */
181 if (cpu == NR_CPUS)
Ingo Molnar39c715b2005-06-21 17:14:34 -0700182 cpu = raw_smp_processor_id();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700183
184 p = kthread_create(do_stop, &smdata, "kstopmachine");
185 if (!IS_ERR(p)) {
Satoru Takeuchi85653af2007-07-15 23:39:47 -0700186 struct sched_param param = { .sched_priority = MAX_RT_PRIO-1 };
187
188 /* One high-prio thread per cpu. We'll do this one. */
189 sched_setscheduler(p, SCHED_FIFO, &param);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700190 kthread_bind(p, cpu);
191 wake_up_process(p);
192 wait_for_completion(&smdata.done);
193 }
Daniel Walker6c6080f2008-02-06 01:37:41 -0800194 mutex_unlock(&stopmachine_mutex);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700195 return p;
196}
197
/*
 * Run @fn(@data) with the machine stopped and collect the result.
 *
 * @fn:   callback to run while the machine is stopped.
 * @data: argument passed to @fn.
 * @cpu:  CPU to run on, or NR_CPUS for no preference.
 *
 * Returns PTR_ERR() of the task pointer if __stop_machine_run()
 * returned an error pointer, otherwise whatever kthread_stop()
 * returns for the worker thread.
 */
int stop_machine_run(int (*fn)(void *), void *data, unsigned int cpu)
{
	struct task_struct *stopper;
	int result;

	/* No CPUs can come up or down during this. */
	get_online_cpus();

	stopper = __stop_machine_run(fn, data, cpu);
	if (IS_ERR(stopper))
		result = PTR_ERR(stopper);
	else
		result = kthread_stop(stopper);

	put_online_cpus();

	return result;
}
EXPORT_SYMBOL_GPL(stop_machine_run);