1
2
3
4
5
6
7
8
9
10
11#include <linux/completion.h>
12#include <linux/cpu.h>
13#include <linux/init.h>
14#include <linux/kthread.h>
15#include <linux/export.h>
16#include <linux/percpu.h>
17#include <linux/sched.h>
18#include <linux/stop_machine.h>
19#include <linux/interrupt.h>
20#include <linux/kallsyms.h>
21#include <linux/smpboot.h>
22#include <linux/atomic.h>
23#include <linux/lglock.h>
24
25
26
27
28
29struct cpu_stop_done {
30 atomic_t nr_todo;
31 bool executed;
32 int ret;
33 struct completion completion;
34};
35
36
37struct cpu_stopper {
38 spinlock_t lock;
39 bool enabled;
40 struct list_head works;
41};
42
43static DEFINE_PER_CPU(struct cpu_stopper, cpu_stopper);
44static DEFINE_PER_CPU(struct task_struct *, cpu_stopper_task);
45static bool stop_machine_initialized = false;
46
47
48
49
50
51
52
53DEFINE_STATIC_LGLOCK(stop_cpus_lock);
54
55static void cpu_stop_init_done(struct cpu_stop_done *done, unsigned int nr_todo)
56{
57 memset(done, 0, sizeof(*done));
58 atomic_set(&done->nr_todo, nr_todo);
59 init_completion(&done->completion);
60}
61
62
63static void cpu_stop_signal_done(struct cpu_stop_done *done, bool executed)
64{
65 if (done) {
66 if (executed)
67 done->executed = true;
68 if (atomic_dec_and_test(&done->nr_todo))
69 complete(&done->completion);
70 }
71}
72
73
74static void cpu_stop_queue_work(unsigned int cpu, struct cpu_stop_work *work)
75{
76 struct cpu_stopper *stopper = &per_cpu(cpu_stopper, cpu);
77 struct task_struct *p = per_cpu(cpu_stopper_task, cpu);
78
79 unsigned long flags;
80
81 spin_lock_irqsave(&stopper->lock, flags);
82
83 if (stopper->enabled) {
84 list_add_tail(&work->list, &stopper->works);
85 wake_up_process(p);
86 } else
87 cpu_stop_signal_done(work->done, false);
88
89 spin_unlock_irqrestore(&stopper->lock, flags);
90}
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116int stop_one_cpu(unsigned int cpu, cpu_stop_fn_t fn, void *arg)
117{
118 struct cpu_stop_done done;
119 struct cpu_stop_work work = { .fn = fn, .arg = arg, .done = &done };
120
121 cpu_stop_init_done(&done, 1);
122 cpu_stop_queue_work(cpu, &work);
123 wait_for_completion(&done.completion);
124 return done.executed ? done.ret : -ENOENT;
125}
126
127
128enum multi_stop_state {
129
130 MULTI_STOP_NONE,
131
132 MULTI_STOP_PREPARE,
133
134 MULTI_STOP_DISABLE_IRQ,
135
136 MULTI_STOP_RUN,
137
138 MULTI_STOP_EXIT,
139};
140
141struct multi_stop_data {
142 int (*fn)(void *);
143 void *data;
144
145 unsigned int num_threads;
146 const struct cpumask *active_cpus;
147
148 enum multi_stop_state state;
149 atomic_t thread_ack;
150};
151
152static void set_state(struct multi_stop_data *msdata,
153 enum multi_stop_state newstate)
154{
155
156 atomic_set(&msdata->thread_ack, msdata->num_threads);
157 smp_wmb();
158 msdata->state = newstate;
159}
160
161
162static void ack_state(struct multi_stop_data *msdata)
163{
164 if (atomic_dec_and_test(&msdata->thread_ack))
165 set_state(msdata, msdata->state + 1);
166}
167
168
169static int multi_cpu_stop(void *data)
170{
171 struct multi_stop_data *msdata = data;
172 enum multi_stop_state curstate = MULTI_STOP_NONE;
173 int cpu = smp_processor_id(), err = 0;
174 unsigned long flags;
175 bool is_active;
176
177
178
179
180
181 local_save_flags(flags);
182
183 if (!msdata->active_cpus)
184 is_active = cpu == cpumask_first(cpu_online_mask);
185 else
186 is_active = cpumask_test_cpu(cpu, msdata->active_cpus);
187
188
189 do {
190
191 cpu_relax();
192 if (msdata->state != curstate) {
193 curstate = msdata->state;
194 switch (curstate) {
195 case MULTI_STOP_DISABLE_IRQ:
196 local_irq_disable();
197 hard_irq_disable();
198 break;
199 case MULTI_STOP_RUN:
200 if (is_active)
201 err = msdata->fn(msdata->data);
202 break;
203 default:
204 break;
205 }
206 ack_state(msdata);
207 }
208 } while (curstate != MULTI_STOP_EXIT);
209
210 local_irq_restore(flags);
211 return err;
212}
213
214struct irq_cpu_stop_queue_work_info {
215 int cpu1;
216 int cpu2;
217 struct cpu_stop_work *work1;
218 struct cpu_stop_work *work2;
219};
220
221
222
223
224
225
226static void irq_cpu_stop_queue_work(void *arg)
227{
228 struct irq_cpu_stop_queue_work_info *info = arg;
229 cpu_stop_queue_work(info->cpu1, info->work1);
230 cpu_stop_queue_work(info->cpu2, info->work2);
231}
232
233
234
235
236
237
238
239
240
241
242
243
244int stop_two_cpus(unsigned int cpu1, unsigned int cpu2, cpu_stop_fn_t fn, void *arg)
245{
246 struct cpu_stop_done done;
247 struct cpu_stop_work work1, work2;
248 struct irq_cpu_stop_queue_work_info call_args;
249 struct multi_stop_data msdata;
250
251 preempt_disable();
252 msdata = (struct multi_stop_data){
253 .fn = fn,
254 .data = arg,
255 .num_threads = 2,
256 .active_cpus = cpumask_of(cpu1),
257 };
258
259 work1 = work2 = (struct cpu_stop_work){
260 .fn = multi_cpu_stop,
261 .arg = &msdata,
262 .done = &done
263 };
264
265 call_args = (struct irq_cpu_stop_queue_work_info){
266 .cpu1 = cpu1,
267 .cpu2 = cpu2,
268 .work1 = &work1,
269 .work2 = &work2,
270 };
271
272 cpu_stop_init_done(&done, 2);
273 set_state(&msdata, MULTI_STOP_PREPARE);
274
275
276
277
278
279
280
281
282
283 if (!cpu_active(cpu1) || !cpu_active(cpu2)) {
284 preempt_enable();
285 return -ENOENT;
286 }
287
288 lg_local_lock(&stop_cpus_lock);
289
290
291
292
293
294 smp_call_function_single(min(cpu1, cpu2),
295 &irq_cpu_stop_queue_work,
296 &call_args, 1);
297 lg_local_unlock(&stop_cpus_lock);
298 preempt_enable();
299
300 wait_for_completion(&done.completion);
301
302 return done.executed ? done.ret : -ENOENT;
303}
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318void stop_one_cpu_nowait(unsigned int cpu, cpu_stop_fn_t fn, void *arg,
319 struct cpu_stop_work *work_buf)
320{
321 *work_buf = (struct cpu_stop_work){ .fn = fn, .arg = arg, };
322 cpu_stop_queue_work(cpu, work_buf);
323}
324
325
326static DEFINE_MUTEX(stop_cpus_mutex);
327static DEFINE_PER_CPU(struct cpu_stop_work, stop_cpus_work);
328
329static void queue_stop_cpus_work(const struct cpumask *cpumask,
330 cpu_stop_fn_t fn, void *arg,
331 struct cpu_stop_done *done)
332{
333 struct cpu_stop_work *work;
334 unsigned int cpu;
335
336
337 for_each_cpu(cpu, cpumask) {
338 work = &per_cpu(stop_cpus_work, cpu);
339 work->fn = fn;
340 work->arg = arg;
341 work->done = done;
342 }
343
344
345
346
347
348
349 lg_global_lock(&stop_cpus_lock);
350 for_each_cpu(cpu, cpumask)
351 cpu_stop_queue_work(cpu, &per_cpu(stop_cpus_work, cpu));
352 lg_global_unlock(&stop_cpus_lock);
353}
354
355static int __stop_cpus(const struct cpumask *cpumask,
356 cpu_stop_fn_t fn, void *arg)
357{
358 struct cpu_stop_done done;
359
360 cpu_stop_init_done(&done, cpumask_weight(cpumask));
361 queue_stop_cpus_work(cpumask, fn, arg, &done);
362 wait_for_completion(&done.completion);
363 return done.executed ? done.ret : -ENOENT;
364}
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394int stop_cpus(const struct cpumask *cpumask, cpu_stop_fn_t fn, void *arg)
395{
396 int ret;
397
398
399 mutex_lock(&stop_cpus_mutex);
400 ret = __stop_cpus(cpumask, fn, arg);
401 mutex_unlock(&stop_cpus_mutex);
402 return ret;
403}
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423int try_stop_cpus(const struct cpumask *cpumask, cpu_stop_fn_t fn, void *arg)
424{
425 int ret;
426
427
428 if (!mutex_trylock(&stop_cpus_mutex))
429 return -EAGAIN;
430 ret = __stop_cpus(cpumask, fn, arg);
431 mutex_unlock(&stop_cpus_mutex);
432 return ret;
433}
434
435static int cpu_stop_should_run(unsigned int cpu)
436{
437 struct cpu_stopper *stopper = &per_cpu(cpu_stopper, cpu);
438 unsigned long flags;
439 int run;
440
441 spin_lock_irqsave(&stopper->lock, flags);
442 run = !list_empty(&stopper->works);
443 spin_unlock_irqrestore(&stopper->lock, flags);
444 return run;
445}
446
447static void cpu_stopper_thread(unsigned int cpu)
448{
449 struct cpu_stopper *stopper = &per_cpu(cpu_stopper, cpu);
450 struct cpu_stop_work *work;
451 int ret;
452
453repeat:
454 work = NULL;
455 spin_lock_irq(&stopper->lock);
456 if (!list_empty(&stopper->works)) {
457 work = list_first_entry(&stopper->works,
458 struct cpu_stop_work, list);
459 list_del_init(&work->list);
460 }
461 spin_unlock_irq(&stopper->lock);
462
463 if (work) {
464 cpu_stop_fn_t fn = work->fn;
465 void *arg = work->arg;
466 struct cpu_stop_done *done = work->done;
467 char ksym_buf[KSYM_NAME_LEN] __maybe_unused;
468
469
470 preempt_disable();
471
472 ret = fn(arg);
473 if (ret)
474 done->ret = ret;
475
476
477 preempt_enable();
478 WARN_ONCE(preempt_count(),
479 "cpu_stop: %s(%p) leaked preempt count\n",
480 kallsyms_lookup((unsigned long)fn, NULL, NULL, NULL,
481 ksym_buf), arg);
482
483 cpu_stop_signal_done(done, true);
484 goto repeat;
485 }
486}
487
488extern void sched_set_stop_task(int cpu, struct task_struct *stop);
489
490static void cpu_stop_create(unsigned int cpu)
491{
492 sched_set_stop_task(cpu, per_cpu(cpu_stopper_task, cpu));
493}
494
495static void cpu_stop_park(unsigned int cpu)
496{
497 struct cpu_stopper *stopper = &per_cpu(cpu_stopper, cpu);
498 struct cpu_stop_work *work;
499 unsigned long flags;
500
501
502 spin_lock_irqsave(&stopper->lock, flags);
503 list_for_each_entry(work, &stopper->works, list)
504 cpu_stop_signal_done(work->done, false);
505 stopper->enabled = false;
506 spin_unlock_irqrestore(&stopper->lock, flags);
507}
508
509static void cpu_stop_unpark(unsigned int cpu)
510{
511 struct cpu_stopper *stopper = &per_cpu(cpu_stopper, cpu);
512
513 spin_lock_irq(&stopper->lock);
514 stopper->enabled = true;
515 spin_unlock_irq(&stopper->lock);
516}
517
518static struct smp_hotplug_thread cpu_stop_threads = {
519 .store = &cpu_stopper_task,
520 .thread_should_run = cpu_stop_should_run,
521 .thread_fn = cpu_stopper_thread,
522 .thread_comm = "migration/%u",
523 .create = cpu_stop_create,
524 .setup = cpu_stop_unpark,
525 .park = cpu_stop_park,
526 .pre_unpark = cpu_stop_unpark,
527 .selfparking = true,
528};
529
530static int __init cpu_stop_init(void)
531{
532 unsigned int cpu;
533
534 for_each_possible_cpu(cpu) {
535 struct cpu_stopper *stopper = &per_cpu(cpu_stopper, cpu);
536
537 spin_lock_init(&stopper->lock);
538 INIT_LIST_HEAD(&stopper->works);
539 }
540
541 BUG_ON(smpboot_register_percpu_thread(&cpu_stop_threads));
542 stop_machine_initialized = true;
543 return 0;
544}
545early_initcall(cpu_stop_init);
546
547#ifdef CONFIG_STOP_MACHINE
548
549int __stop_machine(int (*fn)(void *), void *data, const struct cpumask *cpus)
550{
551 struct multi_stop_data msdata = {
552 .fn = fn,
553 .data = data,
554 .num_threads = num_online_cpus(),
555 .active_cpus = cpus,
556 };
557
558 if (!stop_machine_initialized) {
559
560
561
562
563
564 unsigned long flags;
565 int ret;
566
567 WARN_ON_ONCE(msdata.num_threads != 1);
568
569 local_irq_save(flags);
570 hard_irq_disable();
571 ret = (*fn)(data);
572 local_irq_restore(flags);
573
574 return ret;
575 }
576
577
578 set_state(&msdata, MULTI_STOP_PREPARE);
579 return stop_cpus(cpu_online_mask, multi_cpu_stop, &msdata);
580}
581
582int stop_machine(int (*fn)(void *), void *data, const struct cpumask *cpus)
583{
584 int ret;
585
586
587 get_online_cpus();
588 ret = __stop_machine(fn, data, cpus);
589 put_online_cpus();
590 return ret;
591}
592EXPORT_SYMBOL_GPL(stop_machine);
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616int stop_machine_from_inactive_cpu(int (*fn)(void *), void *data,
617 const struct cpumask *cpus)
618{
619 struct multi_stop_data msdata = { .fn = fn, .data = data,
620 .active_cpus = cpus };
621 struct cpu_stop_done done;
622 int ret;
623
624
625 BUG_ON(cpu_active(raw_smp_processor_id()));
626 msdata.num_threads = num_active_cpus() + 1;
627
628
629 while (!mutex_trylock(&stop_cpus_mutex))
630 cpu_relax();
631
632
633 set_state(&msdata, MULTI_STOP_PREPARE);
634 cpu_stop_init_done(&done, num_active_cpus());
635 queue_stop_cpus_work(cpu_active_mask, multi_cpu_stop, &msdata,
636 &done);
637 ret = multi_cpu_stop(&msdata);
638
639
640 while (!completion_done(&done.completion))
641 cpu_relax();
642
643 mutex_unlock(&stop_cpus_mutex);
644 return ret ?: done.ret;
645}
646
647#endif
648