1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735173617371738173917401741174217431744174517461747174817491750175117521753175417551756175717581759176017611762176317641765176617671768176917701771177217731774177517761777177817791780178117821783178417851786178717881789179017911792179317941795179617971798179918001801180218031804180518061807180818091810181118121813181418151816181718181819182018211822182318241825182618271828182918301831183218331834183518361837183818391840184118421843184418451846184718481849185018511852185318541855185618571858185918601861186218631864186518661867186818691870187118721873187418751876187718781879188018811882188318841885188618871888188918901891189218931894189518961897189818991900190119021903190419051906190719081909191019111912191319141915191619171918191919201921192219231924192519261927192819291930193119321933193419351936193719381939194019411942194319441945194619471948194919501951 |
- /* CPU control.
- * (C) 2001, 2002, 2003, 2004 Rusty Russell
- *
- * This code is licenced under the GPL.
- */
- #include <linux/proc_fs.h>
- #include <linux/smp.h>
- #include <linux/init.h>
- #include <linux/notifier.h>
- #include <linux/sched.h>
- #include <linux/unistd.h>
- #include <linux/cpu.h>
- #include <linux/oom.h>
- #include <linux/rcupdate.h>
- #include <linux/export.h>
- #include <linux/bug.h>
- #include <linux/kthread.h>
- #include <linux/stop_machine.h>
- #include <linux/mutex.h>
- #include <linux/gfp.h>
- #include <linux/suspend.h>
- #include <linux/lockdep.h>
- #include <linux/tick.h>
- #include <linux/irq.h>
- #include <linux/smpboot.h>
- #include <linux/relay.h>
- #include <linux/slab.h>
- #include <trace/events/power.h>
- #define CREATE_TRACE_POINTS
- #include <trace/events/cpuhp.h>
- #include "smpboot.h"
- /**
- * cpuhp_cpu_state - Per cpu hotplug state storage
- * @state: The current cpu state
- * @target: The target state
- * @thread: Pointer to the hotplug thread
- * @should_run: Thread should execute
- * @rollback: Perform a rollback
- * @single: Single callback invocation
- * @bringup: Single callback bringup or teardown selector
- * @cb_state: The state for a single callback (install/uninstall)
- * @result: Result of the operation
- * @done: Signal completion to the issuer of the task
- */
- struct cpuhp_cpu_state {
- enum cpuhp_state state;
- enum cpuhp_state target;
- #ifdef CONFIG_SMP
- struct task_struct *thread;
- bool should_run;
- bool rollback;
- bool single;
- bool bringup;
- struct hlist_node *node;
- enum cpuhp_state cb_state;
- int result;
- struct completion done;
- #endif
- };
- static DEFINE_PER_CPU(struct cpuhp_cpu_state, cpuhp_state);
- #if defined(CONFIG_LOCKDEP) && defined(CONFIG_SMP)
- static struct lock_class_key cpuhp_state_key;
- static struct lockdep_map cpuhp_state_lock_map =
- STATIC_LOCKDEP_MAP_INIT("cpuhp_state", &cpuhp_state_key);
- #endif
- /**
- * cpuhp_step - Hotplug state machine step
- * @name: Name of the step
- * @startup: Startup function of the step
- * @teardown: Teardown function of the step
- * @skip_onerr: Do not invoke the functions on error rollback
- * Will go away once the notifiers are gone
- * @cant_stop: Bringup/teardown can't be stopped at this step
- */
- struct cpuhp_step {
- const char *name;
- union {
- int (*single)(unsigned int cpu);
- int (*multi)(unsigned int cpu,
- struct hlist_node *node);
- } startup;
- union {
- int (*single)(unsigned int cpu);
- int (*multi)(unsigned int cpu,
- struct hlist_node *node);
- } teardown;
- struct hlist_head list;
- bool skip_onerr;
- bool cant_stop;
- bool multi_instance;
- };
- static DEFINE_MUTEX(cpuhp_state_mutex);
- static struct cpuhp_step cpuhp_bp_states[];
- static struct cpuhp_step cpuhp_ap_states[];
- static bool cpuhp_is_ap_state(enum cpuhp_state state)
- {
- /*
- * The extra check for CPUHP_TEARDOWN_CPU is only for documentation
- * purposes as that state is handled explicitly in cpu_down.
- */
- return state > CPUHP_BRINGUP_CPU && state != CPUHP_TEARDOWN_CPU;
- }
- static struct cpuhp_step *cpuhp_get_step(enum cpuhp_state state)
- {
- struct cpuhp_step *sp;
- sp = cpuhp_is_ap_state(state) ? cpuhp_ap_states : cpuhp_bp_states;
- return sp + state;
- }
- /**
- * cpuhp_invoke_callback _ Invoke the callbacks for a given state
- * @cpu: The cpu for which the callback should be invoked
- * @step: The step in the state machine
- * @bringup: True if the bringup callback should be invoked
- *
- * Called from cpu hotplug and from the state register machinery.
- */
- static int cpuhp_invoke_callback(unsigned int cpu, enum cpuhp_state state,
- bool bringup, struct hlist_node *node)
- {
- struct cpuhp_cpu_state *st = per_cpu_ptr(&cpuhp_state, cpu);
- struct cpuhp_step *step = cpuhp_get_step(state);
- int (*cbm)(unsigned int cpu, struct hlist_node *node);
- int (*cb)(unsigned int cpu);
- int ret, cnt;
- if (!step->multi_instance) {
- cb = bringup ? step->startup.single : step->teardown.single;
- if (!cb)
- return 0;
- trace_cpuhp_enter(cpu, st->target, state, cb);
- ret = cb(cpu);
- trace_cpuhp_exit(cpu, st->state, state, ret);
- return ret;
- }
- cbm = bringup ? step->startup.multi : step->teardown.multi;
- if (!cbm)
- return 0;
- /* Single invocation for instance add/remove */
- if (node) {
- trace_cpuhp_multi_enter(cpu, st->target, state, cbm, node);
- ret = cbm(cpu, node);
- trace_cpuhp_exit(cpu, st->state, state, ret);
- return ret;
- }
- /* State transition. Invoke on all instances */
- cnt = 0;
- hlist_for_each(node, &step->list) {
- trace_cpuhp_multi_enter(cpu, st->target, state, cbm, node);
- ret = cbm(cpu, node);
- trace_cpuhp_exit(cpu, st->state, state, ret);
- if (ret)
- goto err;
- cnt++;
- }
- return 0;
- err:
- /* Rollback the instances if one failed */
- cbm = !bringup ? step->startup.multi : step->teardown.multi;
- if (!cbm)
- return ret;
- hlist_for_each(node, &step->list) {
- if (!cnt--)
- break;
- cbm(cpu, node);
- }
- return ret;
- }
- #ifdef CONFIG_SMP
- /* Serializes the updates to cpu_online_mask, cpu_present_mask */
- static DEFINE_MUTEX(cpu_add_remove_lock);
- bool cpuhp_tasks_frozen;
- EXPORT_SYMBOL_GPL(cpuhp_tasks_frozen);
- /*
- * The following two APIs (cpu_maps_update_begin/done) must be used when
- * attempting to serialize the updates to cpu_online_mask & cpu_present_mask.
- * The APIs cpu_notifier_register_begin/done() must be used to protect CPU
- * hotplug callback (un)registration performed using __register_cpu_notifier()
- * or __unregister_cpu_notifier().
- */
- void cpu_maps_update_begin(void)
- {
- mutex_lock(&cpu_add_remove_lock);
- }
- EXPORT_SYMBOL(cpu_notifier_register_begin);
- void cpu_maps_update_done(void)
- {
- mutex_unlock(&cpu_add_remove_lock);
- }
- EXPORT_SYMBOL(cpu_notifier_register_done);
- static RAW_NOTIFIER_HEAD(cpu_chain);
- /* If set, cpu_up and cpu_down will return -EBUSY and do nothing.
- * Should always be manipulated under cpu_add_remove_lock
- */
- static int cpu_hotplug_disabled;
- #ifdef CONFIG_HOTPLUG_CPU
- static struct {
- struct task_struct *active_writer;
- /* wait queue to wake up the active_writer */
- wait_queue_head_t wq;
- /* verifies that no writer will get active while readers are active */
- struct mutex lock;
- /*
- * Also blocks the new readers during
- * an ongoing cpu hotplug operation.
- */
- atomic_t refcount;
- #ifdef CONFIG_DEBUG_LOCK_ALLOC
- struct lockdep_map dep_map;
- #endif
- } cpu_hotplug = {
- .active_writer = NULL,
- .wq = __WAIT_QUEUE_HEAD_INITIALIZER(cpu_hotplug.wq),
- .lock = __MUTEX_INITIALIZER(cpu_hotplug.lock),
- #ifdef CONFIG_DEBUG_LOCK_ALLOC
- .dep_map = STATIC_LOCKDEP_MAP_INIT("cpu_hotplug.dep_map", &cpu_hotplug.dep_map),
- #endif
- };
- /* Lockdep annotations for get/put_online_cpus() and cpu_hotplug_begin/end() */
- #define cpuhp_lock_acquire_read() lock_map_acquire_read(&cpu_hotplug.dep_map)
- #define cpuhp_lock_acquire_tryread() \
- lock_map_acquire_tryread(&cpu_hotplug.dep_map)
- #define cpuhp_lock_acquire() lock_map_acquire(&cpu_hotplug.dep_map)
- #define cpuhp_lock_release() lock_map_release(&cpu_hotplug.dep_map)
- void get_online_cpus(void)
- {
- might_sleep();
- if (cpu_hotplug.active_writer == current)
- return;
- cpuhp_lock_acquire_read();
- mutex_lock(&cpu_hotplug.lock);
- atomic_inc(&cpu_hotplug.refcount);
- mutex_unlock(&cpu_hotplug.lock);
- }
- EXPORT_SYMBOL_GPL(get_online_cpus);
- void put_online_cpus(void)
- {
- int refcount;
- if (cpu_hotplug.active_writer == current)
- return;
- refcount = atomic_dec_return(&cpu_hotplug.refcount);
- if (WARN_ON(refcount < 0)) /* try to fix things up */
- atomic_inc(&cpu_hotplug.refcount);
- if (refcount <= 0 && waitqueue_active(&cpu_hotplug.wq))
- wake_up(&cpu_hotplug.wq);
- cpuhp_lock_release();
- }
- EXPORT_SYMBOL_GPL(put_online_cpus);
- /*
- * This ensures that the hotplug operation can begin only when the
- * refcount goes to zero.
- *
- * Note that during a cpu-hotplug operation, the new readers, if any,
- * will be blocked by the cpu_hotplug.lock
- *
- * Since cpu_hotplug_begin() is always called after invoking
- * cpu_maps_update_begin(), we can be sure that only one writer is active.
- *
- * Note that theoretically, there is a possibility of a livelock:
- * - Refcount goes to zero, last reader wakes up the sleeping
- * writer.
- * - Last reader unlocks the cpu_hotplug.lock.
- * - A new reader arrives at this moment, bumps up the refcount.
- * - The writer acquires the cpu_hotplug.lock finds the refcount
- * non zero and goes to sleep again.
- *
- * However, this is very difficult to achieve in practice since
- * get_online_cpus() not an api which is called all that often.
- *
- */
- void cpu_hotplug_begin(void)
- {
- DEFINE_WAIT(wait);
- cpu_hotplug.active_writer = current;
- cpuhp_lock_acquire();
- for (;;) {
- mutex_lock(&cpu_hotplug.lock);
- prepare_to_wait(&cpu_hotplug.wq, &wait, TASK_UNINTERRUPTIBLE);
- if (likely(!atomic_read(&cpu_hotplug.refcount)))
- break;
- mutex_unlock(&cpu_hotplug.lock);
- schedule();
- }
- finish_wait(&cpu_hotplug.wq, &wait);
- }
- void cpu_hotplug_done(void)
- {
- cpu_hotplug.active_writer = NULL;
- mutex_unlock(&cpu_hotplug.lock);
- cpuhp_lock_release();
- }
- /*
- * Wait for currently running CPU hotplug operations to complete (if any) and
- * disable future CPU hotplug (from sysfs). The 'cpu_add_remove_lock' protects
- * the 'cpu_hotplug_disabled' flag. The same lock is also acquired by the
- * hotplug path before performing hotplug operations. So acquiring that lock
- * guarantees mutual exclusion from any currently running hotplug operations.
- */
- void cpu_hotplug_disable(void)
- {
- cpu_maps_update_begin();
- cpu_hotplug_disabled++;
- cpu_maps_update_done();
- }
- EXPORT_SYMBOL_GPL(cpu_hotplug_disable);
- static void __cpu_hotplug_enable(void)
- {
- if (WARN_ONCE(!cpu_hotplug_disabled, "Unbalanced cpu hotplug enable\n"))
- return;
- cpu_hotplug_disabled--;
- }
- void cpu_hotplug_enable(void)
- {
- cpu_maps_update_begin();
- __cpu_hotplug_enable();
- cpu_maps_update_done();
- }
- EXPORT_SYMBOL_GPL(cpu_hotplug_enable);
- #endif /* CONFIG_HOTPLUG_CPU */
- /* Need to know about CPUs going up/down? */
- int register_cpu_notifier(struct notifier_block *nb)
- {
- int ret;
- cpu_maps_update_begin();
- ret = raw_notifier_chain_register(&cpu_chain, nb);
- cpu_maps_update_done();
- return ret;
- }
- int __register_cpu_notifier(struct notifier_block *nb)
- {
- return raw_notifier_chain_register(&cpu_chain, nb);
- }
- static int __cpu_notify(unsigned long val, unsigned int cpu, int nr_to_call,
- int *nr_calls)
- {
- unsigned long mod = cpuhp_tasks_frozen ? CPU_TASKS_FROZEN : 0;
- void *hcpu = (void *)(long)cpu;
- int ret;
- ret = __raw_notifier_call_chain(&cpu_chain, val | mod, hcpu, nr_to_call,
- nr_calls);
- return notifier_to_errno(ret);
- }
- static int cpu_notify(unsigned long val, unsigned int cpu)
- {
- return __cpu_notify(val, cpu, -1, NULL);
- }
- static void cpu_notify_nofail(unsigned long val, unsigned int cpu)
- {
- BUG_ON(cpu_notify(val, cpu));
- }
- /* Notifier wrappers for transitioning to state machine */
- static int notify_prepare(unsigned int cpu)
- {
- int nr_calls = 0;
- int ret;
- ret = __cpu_notify(CPU_UP_PREPARE, cpu, -1, &nr_calls);
- if (ret) {
- nr_calls--;
- printk(KERN_WARNING "%s: attempt to bring up CPU %u failed\n",
- __func__, cpu);
- __cpu_notify(CPU_UP_CANCELED, cpu, nr_calls, NULL);
- }
- return ret;
- }
- static int notify_online(unsigned int cpu)
- {
- cpu_notify(CPU_ONLINE, cpu);
- return 0;
- }
- static void __cpuhp_kick_ap_work(struct cpuhp_cpu_state *st);
- static int bringup_wait_for_ap(unsigned int cpu)
- {
- struct cpuhp_cpu_state *st = per_cpu_ptr(&cpuhp_state, cpu);
- /* Wait for the CPU to reach CPUHP_AP_ONLINE_IDLE */
- wait_for_completion(&st->done);
- if (WARN_ON_ONCE((!cpu_online(cpu))))
- return -ECANCELED;
- /* Unpark the stopper thread and the hotplug thread of the target cpu */
- stop_machine_unpark(cpu);
- kthread_unpark(st->thread);
- /* Should we go further up ? */
- if (st->target > CPUHP_AP_ONLINE_IDLE) {
- __cpuhp_kick_ap_work(st);
- wait_for_completion(&st->done);
- }
- return st->result;
- }
- static int bringup_cpu(unsigned int cpu)
- {
- struct task_struct *idle = idle_thread_get(cpu);
- int ret;
- /*
- * Some architectures have to walk the irq descriptors to
- * setup the vector space for the cpu which comes online.
- * Prevent irq alloc/free across the bringup.
- */
- irq_lock_sparse();
- /* Arch-specific enabling code. */
- ret = __cpu_up(cpu, idle);
- irq_unlock_sparse();
- if (ret) {
- cpu_notify(CPU_UP_CANCELED, cpu);
- return ret;
- }
- return bringup_wait_for_ap(cpu);
- }
- /*
- * Hotplug state machine related functions
- */
- static void undo_cpu_down(unsigned int cpu, struct cpuhp_cpu_state *st)
- {
- for (st->state++; st->state < st->target; st->state++) {
- struct cpuhp_step *step = cpuhp_get_step(st->state);
- if (!step->skip_onerr)
- cpuhp_invoke_callback(cpu, st->state, true, NULL);
- }
- }
- static int cpuhp_down_callbacks(unsigned int cpu, struct cpuhp_cpu_state *st,
- enum cpuhp_state target)
- {
- enum cpuhp_state prev_state = st->state;
- int ret = 0;
- for (; st->state > target; st->state--) {
- ret = cpuhp_invoke_callback(cpu, st->state, false, NULL);
- if (ret) {
- st->target = prev_state;
- undo_cpu_down(cpu, st);
- break;
- }
- }
- return ret;
- }
- static void undo_cpu_up(unsigned int cpu, struct cpuhp_cpu_state *st)
- {
- for (st->state--; st->state > st->target; st->state--) {
- struct cpuhp_step *step = cpuhp_get_step(st->state);
- if (!step->skip_onerr)
- cpuhp_invoke_callback(cpu, st->state, false, NULL);
- }
- }
- static int cpuhp_up_callbacks(unsigned int cpu, struct cpuhp_cpu_state *st,
- enum cpuhp_state target)
- {
- enum cpuhp_state prev_state = st->state;
- int ret = 0;
- while (st->state < target) {
- st->state++;
- ret = cpuhp_invoke_callback(cpu, st->state, true, NULL);
- if (ret) {
- st->target = prev_state;
- undo_cpu_up(cpu, st);
- break;
- }
- }
- return ret;
- }
- /*
- * The cpu hotplug threads manage the bringup and teardown of the cpus
- */
- static void cpuhp_create(unsigned int cpu)
- {
- struct cpuhp_cpu_state *st = per_cpu_ptr(&cpuhp_state, cpu);
- init_completion(&st->done);
- }
- static int cpuhp_should_run(unsigned int cpu)
- {
- struct cpuhp_cpu_state *st = this_cpu_ptr(&cpuhp_state);
- return st->should_run;
- }
- /* Execute the teardown callbacks. Used to be CPU_DOWN_PREPARE */
- static int cpuhp_ap_offline(unsigned int cpu, struct cpuhp_cpu_state *st)
- {
- enum cpuhp_state target = max((int)st->target, CPUHP_TEARDOWN_CPU);
- return cpuhp_down_callbacks(cpu, st, target);
- }
- /* Execute the online startup callbacks. Used to be CPU_ONLINE */
- static int cpuhp_ap_online(unsigned int cpu, struct cpuhp_cpu_state *st)
- {
- return cpuhp_up_callbacks(cpu, st, st->target);
- }
- /*
- * Execute teardown/startup callbacks on the plugged cpu. Also used to invoke
- * callbacks when a state gets [un]installed at runtime.
- */
- static void cpuhp_thread_fun(unsigned int cpu)
- {
- struct cpuhp_cpu_state *st = this_cpu_ptr(&cpuhp_state);
- int ret = 0;
- /*
- * Paired with the mb() in cpuhp_kick_ap_work and
- * cpuhp_invoke_ap_callback, so the work set is consistent visible.
- */
- smp_mb();
- if (!st->should_run)
- return;
- st->should_run = false;
- lock_map_acquire(&cpuhp_state_lock_map);
- /* Single callback invocation for [un]install ? */
- if (st->single) {
- if (st->cb_state < CPUHP_AP_ONLINE) {
- local_irq_disable();
- ret = cpuhp_invoke_callback(cpu, st->cb_state,
- st->bringup, st->node);
- local_irq_enable();
- } else {
- ret = cpuhp_invoke_callback(cpu, st->cb_state,
- st->bringup, st->node);
- }
- } else if (st->rollback) {
- BUG_ON(st->state < CPUHP_AP_ONLINE_IDLE);
- undo_cpu_down(cpu, st);
- /*
- * This is a momentary workaround to keep the notifier users
- * happy. Will go away once we got rid of the notifiers.
- */
- cpu_notify_nofail(CPU_DOWN_FAILED, cpu);
- st->rollback = false;
- } else {
- /* Cannot happen .... */
- BUG_ON(st->state < CPUHP_AP_ONLINE_IDLE);
- /* Regular hotplug work */
- if (st->state < st->target)
- ret = cpuhp_ap_online(cpu, st);
- else if (st->state > st->target)
- ret = cpuhp_ap_offline(cpu, st);
- }
- lock_map_release(&cpuhp_state_lock_map);
- st->result = ret;
- complete(&st->done);
- }
- /* Invoke a single callback on a remote cpu */
- static int
- cpuhp_invoke_ap_callback(int cpu, enum cpuhp_state state, bool bringup,
- struct hlist_node *node)
- {
- struct cpuhp_cpu_state *st = per_cpu_ptr(&cpuhp_state, cpu);
- if (!cpu_online(cpu))
- return 0;
- lock_map_acquire(&cpuhp_state_lock_map);
- lock_map_release(&cpuhp_state_lock_map);
- /*
- * If we are up and running, use the hotplug thread. For early calls
- * we invoke the thread function directly.
- */
- if (!st->thread)
- return cpuhp_invoke_callback(cpu, state, bringup, node);
- st->cb_state = state;
- st->single = true;
- st->bringup = bringup;
- st->node = node;
- /*
- * Make sure the above stores are visible before should_run becomes
- * true. Paired with the mb() above in cpuhp_thread_fun()
- */
- smp_mb();
- st->should_run = true;
- wake_up_process(st->thread);
- wait_for_completion(&st->done);
- return st->result;
- }
- /* Regular hotplug invocation of the AP hotplug thread */
- static void __cpuhp_kick_ap_work(struct cpuhp_cpu_state *st)
- {
- st->result = 0;
- st->single = false;
- /*
- * Make sure the above stores are visible before should_run becomes
- * true. Paired with the mb() above in cpuhp_thread_fun()
- */
- smp_mb();
- st->should_run = true;
- wake_up_process(st->thread);
- }
- static int cpuhp_kick_ap_work(unsigned int cpu)
- {
- struct cpuhp_cpu_state *st = per_cpu_ptr(&cpuhp_state, cpu);
- enum cpuhp_state state = st->state;
- trace_cpuhp_enter(cpu, st->target, state, cpuhp_kick_ap_work);
- lock_map_acquire(&cpuhp_state_lock_map);
- lock_map_release(&cpuhp_state_lock_map);
- __cpuhp_kick_ap_work(st);
- wait_for_completion(&st->done);
- trace_cpuhp_exit(cpu, st->state, state, st->result);
- return st->result;
- }
- static struct smp_hotplug_thread cpuhp_threads = {
- .store = &cpuhp_state.thread,
- .create = &cpuhp_create,
- .thread_should_run = cpuhp_should_run,
- .thread_fn = cpuhp_thread_fun,
- .thread_comm = "cpuhp/%u",
- .selfparking = true,
- };
- void __init cpuhp_threads_init(void)
- {
- BUG_ON(smpboot_register_percpu_thread(&cpuhp_threads));
- kthread_unpark(this_cpu_read(cpuhp_state.thread));
- }
- EXPORT_SYMBOL(register_cpu_notifier);
- EXPORT_SYMBOL(__register_cpu_notifier);
- void unregister_cpu_notifier(struct notifier_block *nb)
- {
- cpu_maps_update_begin();
- raw_notifier_chain_unregister(&cpu_chain, nb);
- cpu_maps_update_done();
- }
- EXPORT_SYMBOL(unregister_cpu_notifier);
- void __unregister_cpu_notifier(struct notifier_block *nb)
- {
- raw_notifier_chain_unregister(&cpu_chain, nb);
- }
- EXPORT_SYMBOL(__unregister_cpu_notifier);
- #ifdef CONFIG_HOTPLUG_CPU
- /**
- * clear_tasks_mm_cpumask - Safely clear tasks' mm_cpumask for a CPU
- * @cpu: a CPU id
- *
- * This function walks all processes, finds a valid mm struct for each one and
- * then clears a corresponding bit in mm's cpumask. While this all sounds
- * trivial, there are various non-obvious corner cases, which this function
- * tries to solve in a safe manner.
- *
- * Also note that the function uses a somewhat relaxed locking scheme, so it may
- * be called only for an already offlined CPU.
- */
- void clear_tasks_mm_cpumask(int cpu)
- {
- struct task_struct *p;
- /*
- * This function is called after the cpu is taken down and marked
- * offline, so its not like new tasks will ever get this cpu set in
- * their mm mask. -- Peter Zijlstra
- * Thus, we may use rcu_read_lock() here, instead of grabbing
- * full-fledged tasklist_lock.
- */
- WARN_ON(cpu_online(cpu));
- rcu_read_lock();
- for_each_process(p) {
- struct task_struct *t;
- /*
- * Main thread might exit, but other threads may still have
- * a valid mm. Find one.
- */
- t = find_lock_task_mm(p);
- if (!t)
- continue;
- cpumask_clear_cpu(cpu, mm_cpumask(t->mm));
- task_unlock(t);
- }
- rcu_read_unlock();
- }
- static inline void check_for_tasks(int dead_cpu)
- {
- struct task_struct *g, *p;
- read_lock(&tasklist_lock);
- for_each_process_thread(g, p) {
- if (!p->on_rq)
- continue;
- /*
- * We do the check with unlocked task_rq(p)->lock.
- * Order the reading to do not warn about a task,
- * which was running on this cpu in the past, and
- * it's just been woken on another cpu.
- */
- rmb();
- if (task_cpu(p) != dead_cpu)
- continue;
- pr_warn("Task %s (pid=%d) is on cpu %d (state=%ld, flags=%x)\n",
- p->comm, task_pid_nr(p), dead_cpu, p->state, p->flags);
- }
- read_unlock(&tasklist_lock);
- }
- static int notify_down_prepare(unsigned int cpu)
- {
- int err, nr_calls = 0;
- err = __cpu_notify(CPU_DOWN_PREPARE, cpu, -1, &nr_calls);
- if (err) {
- nr_calls--;
- __cpu_notify(CPU_DOWN_FAILED, cpu, nr_calls, NULL);
- pr_warn("%s: attempt to take down CPU %u failed\n",
- __func__, cpu);
- }
- return err;
- }
- /* Take this CPU down. */
- static int take_cpu_down(void *_param)
- {
- struct cpuhp_cpu_state *st = this_cpu_ptr(&cpuhp_state);
- enum cpuhp_state target = max((int)st->target, CPUHP_AP_OFFLINE);
- int err, cpu = smp_processor_id();
- /* Ensure this CPU doesn't handle any more interrupts. */
- err = __cpu_disable();
- if (err < 0)
- return err;
- /*
- * We get here while we are in CPUHP_TEARDOWN_CPU state and we must not
- * do this step again.
- */
- WARN_ON(st->state != CPUHP_TEARDOWN_CPU);
- st->state--;
- /* Invoke the former CPU_DYING callbacks */
- for (; st->state > target; st->state--)
- cpuhp_invoke_callback(cpu, st->state, false, NULL);
- /* Give up timekeeping duties */
- tick_handover_do_timer();
- /* Park the stopper thread */
- stop_machine_park(cpu);
- return 0;
- }
- static int takedown_cpu(unsigned int cpu)
- {
- struct cpuhp_cpu_state *st = per_cpu_ptr(&cpuhp_state, cpu);
- int err;
- /* Park the smpboot threads */
- kthread_park(per_cpu_ptr(&cpuhp_state, cpu)->thread);
- smpboot_park_threads(cpu);
- /*
- * Prevent irq alloc/free while the dying cpu reorganizes the
- * interrupt affinities.
- */
- irq_lock_sparse();
- /*
- * So now all preempt/rcu users must observe !cpu_active().
- */
- err = stop_machine(take_cpu_down, NULL, cpumask_of(cpu));
- if (err) {
- /* CPU refused to die */
- irq_unlock_sparse();
- /* Unpark the hotplug thread so we can rollback there */
- kthread_unpark(per_cpu_ptr(&cpuhp_state, cpu)->thread);
- return err;
- }
- BUG_ON(cpu_online(cpu));
- /*
- * The CPUHP_AP_SCHED_MIGRATE_DYING callback will have removed all
- * runnable tasks from the cpu, there's only the idle task left now
- * that the migration thread is done doing the stop_machine thing.
- *
- * Wait for the stop thread to go away.
- */
- wait_for_completion(&st->done);
- BUG_ON(st->state != CPUHP_AP_IDLE_DEAD);
- /* Interrupts are moved away from the dying cpu, reenable alloc/free */
- irq_unlock_sparse();
- hotplug_cpu__broadcast_tick_pull(cpu);
- /* This actually kills the CPU. */
- __cpu_die(cpu);
- tick_cleanup_dead_cpu(cpu);
- return 0;
- }
- static int notify_dead(unsigned int cpu)
- {
- cpu_notify_nofail(CPU_DEAD, cpu);
- check_for_tasks(cpu);
- return 0;
- }
- static void cpuhp_complete_idle_dead(void *arg)
- {
- struct cpuhp_cpu_state *st = arg;
- complete(&st->done);
- }
- void cpuhp_report_idle_dead(void)
- {
- struct cpuhp_cpu_state *st = this_cpu_ptr(&cpuhp_state);
- BUG_ON(st->state != CPUHP_AP_OFFLINE);
- rcu_report_dead(smp_processor_id());
- st->state = CPUHP_AP_IDLE_DEAD;
- /*
- * We cannot call complete after rcu_report_dead() so we delegate it
- * to an online cpu.
- */
- smp_call_function_single(cpumask_first(cpu_online_mask),
- cpuhp_complete_idle_dead, st, 0);
- }
- #else
- #define notify_down_prepare NULL
- #define takedown_cpu NULL
- #define notify_dead NULL
- #endif
- #ifdef CONFIG_HOTPLUG_CPU
- /* Requires cpu_add_remove_lock to be held */
- static int __ref _cpu_down(unsigned int cpu, int tasks_frozen,
- enum cpuhp_state target)
- {
- struct cpuhp_cpu_state *st = per_cpu_ptr(&cpuhp_state, cpu);
- int prev_state, ret = 0;
- bool hasdied = false;
- if (num_online_cpus() == 1)
- return -EBUSY;
- if (!cpu_present(cpu))
- return -EINVAL;
- cpu_hotplug_begin();
- cpuhp_tasks_frozen = tasks_frozen;
- prev_state = st->state;
- st->target = target;
- /*
- * If the current CPU state is in the range of the AP hotplug thread,
- * then we need to kick the thread.
- */
- if (st->state > CPUHP_TEARDOWN_CPU) {
- ret = cpuhp_kick_ap_work(cpu);
- /*
- * The AP side has done the error rollback already. Just
- * return the error code..
- */
- if (ret)
- goto out;
- /*
- * We might have stopped still in the range of the AP hotplug
- * thread. Nothing to do anymore.
- */
- if (st->state > CPUHP_TEARDOWN_CPU)
- goto out;
- }
- /*
- * The AP brought itself down to CPUHP_TEARDOWN_CPU. So we need
- * to do the further cleanups.
- */
- ret = cpuhp_down_callbacks(cpu, st, target);
- if (ret && st->state > CPUHP_TEARDOWN_CPU && st->state < prev_state) {
- st->target = prev_state;
- st->rollback = true;
- cpuhp_kick_ap_work(cpu);
- }
- hasdied = prev_state != st->state && st->state == CPUHP_OFFLINE;
- out:
- cpu_hotplug_done();
- /* This post dead nonsense must die */
- if (!ret && hasdied)
- cpu_notify_nofail(CPU_POST_DEAD, cpu);
- return ret;
- }
- static int do_cpu_down(unsigned int cpu, enum cpuhp_state target)
- {
- int err;
- cpu_maps_update_begin();
- if (cpu_hotplug_disabled) {
- err = -EBUSY;
- goto out;
- }
- err = _cpu_down(cpu, 0, target);
- out:
- cpu_maps_update_done();
- return err;
- }
- int cpu_down(unsigned int cpu)
- {
- return do_cpu_down(cpu, CPUHP_OFFLINE);
- }
- EXPORT_SYMBOL(cpu_down);
- #endif /*CONFIG_HOTPLUG_CPU*/
- /**
- * notify_cpu_starting(cpu) - Invoke the callbacks on the starting CPU
- * @cpu: cpu that just started
- *
- * It must be called by the arch code on the new cpu, before the new cpu
- * enables interrupts and before the "boot" cpu returns from __cpu_up().
- */
- void notify_cpu_starting(unsigned int cpu)
- {
- struct cpuhp_cpu_state *st = per_cpu_ptr(&cpuhp_state, cpu);
- enum cpuhp_state target = min((int)st->target, CPUHP_AP_ONLINE);
- rcu_cpu_starting(cpu); /* Enables RCU usage on this CPU. */
- while (st->state < target) {
- st->state++;
- cpuhp_invoke_callback(cpu, st->state, true, NULL);
- }
- }
- /*
- * Called from the idle task. Wake up the controlling task which brings the
- * stopper and the hotplug thread of the upcoming CPU up and then delegates
- * the rest of the online bringup to the hotplug thread.
- */
- void cpuhp_online_idle(enum cpuhp_state state)
- {
- struct cpuhp_cpu_state *st = this_cpu_ptr(&cpuhp_state);
- /* Happens for the boot cpu */
- if (state != CPUHP_AP_ONLINE_IDLE)
- return;
- st->state = CPUHP_AP_ONLINE_IDLE;
- complete(&st->done);
- }
- /* Requires cpu_add_remove_lock to be held */
- static int _cpu_up(unsigned int cpu, int tasks_frozen, enum cpuhp_state target)
- {
- struct cpuhp_cpu_state *st = per_cpu_ptr(&cpuhp_state, cpu);
- struct task_struct *idle;
- int ret = 0;
- cpu_hotplug_begin();
- if (!cpu_present(cpu)) {
- ret = -EINVAL;
- goto out;
- }
- /*
- * The caller of do_cpu_up might have raced with another
- * caller. Ignore it for now.
- */
- if (st->state >= target)
- goto out;
- if (st->state == CPUHP_OFFLINE) {
- /* Let it fail before we try to bring the cpu up */
- idle = idle_thread_get(cpu);
- if (IS_ERR(idle)) {
- ret = PTR_ERR(idle);
- goto out;
- }
- }
- cpuhp_tasks_frozen = tasks_frozen;
- st->target = target;
- /*
- * If the current CPU state is in the range of the AP hotplug thread,
- * then we need to kick the thread once more.
- */
- if (st->state > CPUHP_BRINGUP_CPU) {
- ret = cpuhp_kick_ap_work(cpu);
- /*
- * The AP side has done the error rollback already. Just
- * return the error code..
- */
- if (ret)
- goto out;
- }
- /*
- * Try to reach the target state. We max out on the BP at
- * CPUHP_BRINGUP_CPU. After that the AP hotplug thread is
- * responsible for bringing it up to the target state.
- */
- target = min((int)target, CPUHP_BRINGUP_CPU);
- ret = cpuhp_up_callbacks(cpu, st, target);
- out:
- cpu_hotplug_done();
- return ret;
- }
- static int do_cpu_up(unsigned int cpu, enum cpuhp_state target)
- {
- int err = 0;
- if (!cpu_possible(cpu)) {
- pr_err("can't online cpu %d because it is not configured as may-hotadd at boot time\n",
- cpu);
- #if defined(CONFIG_IA64)
- pr_err("please check additional_cpus= boot parameter\n");
- #endif
- return -EINVAL;
- }
- err = try_online_node(cpu_to_node(cpu));
- if (err)
- return err;
- cpu_maps_update_begin();
- if (cpu_hotplug_disabled) {
- err = -EBUSY;
- goto out;
- }
- err = _cpu_up(cpu, 0, target);
- out:
- cpu_maps_update_done();
- return err;
- }
- int cpu_up(unsigned int cpu)
- {
- return do_cpu_up(cpu, CPUHP_ONLINE);
- }
- EXPORT_SYMBOL_GPL(cpu_up);
- #ifdef CONFIG_PM_SLEEP_SMP
- static cpumask_var_t frozen_cpus;
- int freeze_secondary_cpus(int primary)
- {
- int cpu, error = 0;
- cpu_maps_update_begin();
- if (!cpu_online(primary))
- primary = cpumask_first(cpu_online_mask);
- /*
- * We take down all of the non-boot CPUs in one shot to avoid races
- * with the userspace trying to use the CPU hotplug at the same time
- */
- cpumask_clear(frozen_cpus);
- pr_info("Disabling non-boot CPUs ...\n");
- for_each_online_cpu(cpu) {
- if (cpu == primary)
- continue;
- trace_suspend_resume(TPS("CPU_OFF"), cpu, true);
- error = _cpu_down(cpu, 1, CPUHP_OFFLINE);
- trace_suspend_resume(TPS("CPU_OFF"), cpu, false);
- if (!error)
- cpumask_set_cpu(cpu, frozen_cpus);
- else {
- pr_err("Error taking CPU%d down: %d\n", cpu, error);
- break;
- }
- }
- if (!error)
- BUG_ON(num_online_cpus() > 1);
- else
- pr_err("Non-boot CPUs are not disabled\n");
- /*
- * Make sure the CPUs won't be enabled by someone else. We need to do
- * this even in case of failure as all disable_nonboot_cpus() users are
- * supposed to do enable_nonboot_cpus() on the failure path.
- */
- cpu_hotplug_disabled++;
- cpu_maps_update_done();
- return error;
- }
- void __weak arch_enable_nonboot_cpus_begin(void)
- {
- }
- void __weak arch_enable_nonboot_cpus_end(void)
- {
- }
- void enable_nonboot_cpus(void)
- {
- int cpu, error;
- /* Allow everyone to use the CPU hotplug again */
- cpu_maps_update_begin();
- __cpu_hotplug_enable();
- if (cpumask_empty(frozen_cpus))
- goto out;
- pr_info("Enabling non-boot CPUs ...\n");
- arch_enable_nonboot_cpus_begin();
- for_each_cpu(cpu, frozen_cpus) {
- trace_suspend_resume(TPS("CPU_ON"), cpu, true);
- error = _cpu_up(cpu, 1, CPUHP_ONLINE);
- trace_suspend_resume(TPS("CPU_ON"), cpu, false);
- if (!error) {
- pr_info("CPU%d is up\n", cpu);
- continue;
- }
- pr_warn("Error taking CPU%d up: %d\n", cpu, error);
- }
- arch_enable_nonboot_cpus_end();
- cpumask_clear(frozen_cpus);
- out:
- cpu_maps_update_done();
- }
- static int __init alloc_frozen_cpus(void)
- {
- if (!alloc_cpumask_var(&frozen_cpus, GFP_KERNEL|__GFP_ZERO))
- return -ENOMEM;
- return 0;
- }
- core_initcall(alloc_frozen_cpus);
- /*
- * When callbacks for CPU hotplug notifications are being executed, we must
- * ensure that the state of the system with respect to the tasks being frozen
- * or not, as reported by the notification, remains unchanged *throughout the
- * duration* of the execution of the callbacks.
- * Hence we need to prevent the freezer from racing with regular CPU hotplug.
- *
- * This synchronization is implemented by mutually excluding regular CPU
- * hotplug and Suspend/Hibernate call paths by hooking onto the Suspend/
- * Hibernate notifications.
- */
- static int
- cpu_hotplug_pm_callback(struct notifier_block *nb,
- unsigned long action, void *ptr)
- {
- switch (action) {
- case PM_SUSPEND_PREPARE:
- case PM_HIBERNATION_PREPARE:
- cpu_hotplug_disable();
- break;
- case PM_POST_SUSPEND:
- case PM_POST_HIBERNATION:
- cpu_hotplug_enable();
- break;
- default:
- return NOTIFY_DONE;
- }
- return NOTIFY_OK;
- }
- static int __init cpu_hotplug_pm_sync_init(void)
- {
- /*
- * cpu_hotplug_pm_callback has higher priority than x86
- * bsp_pm_callback which depends on cpu_hotplug_pm_callback
- * to disable cpu hotplug to avoid cpu hotplug race.
- */
- pm_notifier(cpu_hotplug_pm_callback, 0);
- return 0;
- }
- core_initcall(cpu_hotplug_pm_sync_init);
- #endif /* CONFIG_PM_SLEEP_SMP */
- #endif /* CONFIG_SMP */
- /* Boot processor state steps */
- static struct cpuhp_step cpuhp_bp_states[] = {
- [CPUHP_OFFLINE] = {
- .name = "offline",
- .startup.single = NULL,
- .teardown.single = NULL,
- },
- #ifdef CONFIG_SMP
- [CPUHP_CREATE_THREADS]= {
- .name = "threads:prepare",
- .startup.single = smpboot_create_threads,
- .teardown.single = NULL,
- .cant_stop = true,
- },
- [CPUHP_PERF_PREPARE] = {
- .name = "perf:prepare",
- .startup.single = perf_event_init_cpu,
- .teardown.single = perf_event_exit_cpu,
- },
- [CPUHP_WORKQUEUE_PREP] = {
- .name = "workqueue:prepare",
- .startup.single = workqueue_prepare_cpu,
- .teardown.single = NULL,
- },
- [CPUHP_HRTIMERS_PREPARE] = {
- .name = "hrtimers:prepare",
- .startup.single = hrtimers_prepare_cpu,
- .teardown.single = hrtimers_dead_cpu,
- },
- [CPUHP_SMPCFD_PREPARE] = {
- .name = "smpcfd:prepare",
- .startup.single = smpcfd_prepare_cpu,
- .teardown.single = smpcfd_dead_cpu,
- },
- [CPUHP_RELAY_PREPARE] = {
- .name = "relay:prepare",
- .startup.single = relay_prepare_cpu,
- .teardown.single = NULL,
- },
- [CPUHP_SLAB_PREPARE] = {
- .name = "slab:prepare",
- .startup.single = slab_prepare_cpu,
- .teardown.single = slab_dead_cpu,
- },
- [CPUHP_RCUTREE_PREP] = {
- .name = "RCU/tree:prepare",
- .startup.single = rcutree_prepare_cpu,
- .teardown.single = rcutree_dead_cpu,
- },
- /*
- * Preparatory and dead notifiers. Will be replaced once the notifiers
- * are converted to states.
- */
- [CPUHP_NOTIFY_PREPARE] = {
- .name = "notify:prepare",
- .startup.single = notify_prepare,
- .teardown.single = notify_dead,
- .skip_onerr = true,
- .cant_stop = true,
- },
- /*
- * On the tear-down path, timers_dead_cpu() must be invoked
- * before blk_mq_queue_reinit_notify() from notify_dead(),
- * otherwise a RCU stall occurs.
- */
- [CPUHP_TIMERS_PREPARE] = {
- .name = "timers:dead",
- .startup.single = timers_prepare_cpu,
- .teardown.single = timers_dead_cpu,
- },
- /* Kicks the plugged cpu into life */
- [CPUHP_BRINGUP_CPU] = {
- .name = "cpu:bringup",
- .startup.single = bringup_cpu,
- .teardown.single = NULL,
- .cant_stop = true,
- },
- /*
- * Handled on controll processor until the plugged processor manages
- * this itself.
- */
- [CPUHP_TEARDOWN_CPU] = {
- .name = "cpu:teardown",
- .startup.single = NULL,
- .teardown.single = takedown_cpu,
- .cant_stop = true,
- },
- #else
- [CPUHP_BRINGUP_CPU] = { },
- #endif
- };
- /* Application processor state steps */
- static struct cpuhp_step cpuhp_ap_states[] = {
- #ifdef CONFIG_SMP
- /* Final state before CPU kills itself */
- [CPUHP_AP_IDLE_DEAD] = {
- .name = "idle:dead",
- },
- /*
- * Last state before CPU enters the idle loop to die. Transient state
- * for synchronization.
- */
- [CPUHP_AP_OFFLINE] = {
- .name = "ap:offline",
- .cant_stop = true,
- },
- /* First state is scheduler control. Interrupts are disabled */
- [CPUHP_AP_SCHED_STARTING] = {
- .name = "sched:starting",
- .startup.single = sched_cpu_starting,
- .teardown.single = sched_cpu_dying,
- },
- [CPUHP_AP_RCUTREE_DYING] = {
- .name = "RCU/tree:dying",
- .startup.single = NULL,
- .teardown.single = rcutree_dying_cpu,
- },
- [CPUHP_AP_SMPCFD_DYING] = {
- .name = "smpcfd:dying",
- .startup.single = NULL,
- .teardown.single = smpcfd_dying_cpu,
- },
- /* Entry state on starting. Interrupts enabled from here on. Transient
- * state for synchronsization */
- [CPUHP_AP_ONLINE] = {
- .name = "ap:online",
- },
- /* Handle smpboot threads park/unpark */
- [CPUHP_AP_SMPBOOT_THREADS] = {
- .name = "smpboot/threads:online",
- .startup.single = smpboot_unpark_threads,
- .teardown.single = NULL,
- },
- [CPUHP_AP_PERF_ONLINE] = {
- .name = "perf:online",
- .startup.single = perf_event_init_cpu,
- .teardown.single = perf_event_exit_cpu,
- },
- [CPUHP_AP_WORKQUEUE_ONLINE] = {
- .name = "workqueue:online",
- .startup.single = workqueue_online_cpu,
- .teardown.single = workqueue_offline_cpu,
- },
- [CPUHP_AP_RCUTREE_ONLINE] = {
- .name = "RCU/tree:online",
- .startup.single = rcutree_online_cpu,
- .teardown.single = rcutree_offline_cpu,
- },
- /*
- * Online/down_prepare notifiers. Will be removed once the notifiers
- * are converted to states.
- */
- [CPUHP_AP_NOTIFY_ONLINE] = {
- .name = "notify:online",
- .startup.single = notify_online,
- .teardown.single = notify_down_prepare,
- .skip_onerr = true,
- },
- #endif
- /*
- * The dynamically registered state space is here
- */
- #ifdef CONFIG_SMP
- /* Last state is scheduler control setting the cpu active */
- [CPUHP_AP_ACTIVE] = {
- .name = "sched:active",
- .startup.single = sched_cpu_activate,
- .teardown.single = sched_cpu_deactivate,
- },
- #endif
- /* CPU is fully up and running. */
- [CPUHP_ONLINE] = {
- .name = "online",
- .startup.single = NULL,
- .teardown.single = NULL,
- },
- };
- /* Sanity check for callbacks */
- static int cpuhp_cb_check(enum cpuhp_state state)
- {
- if (state <= CPUHP_OFFLINE || state >= CPUHP_ONLINE)
- return -EINVAL;
- return 0;
- }
- static void cpuhp_store_callbacks(enum cpuhp_state state,
- const char *name,
- int (*startup)(unsigned int cpu),
- int (*teardown)(unsigned int cpu),
- bool multi_instance)
- {
- /* (Un)Install the callbacks for further cpu hotplug operations */
- struct cpuhp_step *sp;
- sp = cpuhp_get_step(state);
- sp->startup.single = startup;
- sp->teardown.single = teardown;
- sp->name = name;
- sp->multi_instance = multi_instance;
- INIT_HLIST_HEAD(&sp->list);
- }
- static void *cpuhp_get_teardown_cb(enum cpuhp_state state)
- {
- return cpuhp_get_step(state)->teardown.single;
- }
- /*
- * Call the startup/teardown function for a step either on the AP or
- * on the current CPU.
- */
- static int cpuhp_issue_call(int cpu, enum cpuhp_state state, bool bringup,
- struct hlist_node *node)
- {
- struct cpuhp_step *sp = cpuhp_get_step(state);
- int ret;
- if ((bringup && !sp->startup.single) ||
- (!bringup && !sp->teardown.single))
- return 0;
- /*
- * The non AP bound callbacks can fail on bringup. On teardown
- * e.g. module removal we crash for now.
- */
- #ifdef CONFIG_SMP
- if (cpuhp_is_ap_state(state))
- ret = cpuhp_invoke_ap_callback(cpu, state, bringup, node);
- else
- ret = cpuhp_invoke_callback(cpu, state, bringup, node);
- #else
- ret = cpuhp_invoke_callback(cpu, state, bringup, node);
- #endif
- BUG_ON(ret && !bringup);
- return ret;
- }
- /*
- * Called from __cpuhp_setup_state on a recoverable failure.
- *
- * Note: The teardown callbacks for rollback are not allowed to fail!
- */
- static void cpuhp_rollback_install(int failedcpu, enum cpuhp_state state,
- struct hlist_node *node)
- {
- int cpu;
- /* Roll back the already executed steps on the other cpus */
- for_each_present_cpu(cpu) {
- struct cpuhp_cpu_state *st = per_cpu_ptr(&cpuhp_state, cpu);
- int cpustate = st->state;
- if (cpu >= failedcpu)
- break;
- /* Did we invoke the startup call on that cpu ? */
- if (cpustate >= state)
- cpuhp_issue_call(cpu, state, false, node);
- }
- }
- /*
- * Returns a free for dynamic slot assignment of the Online state. The states
- * are protected by the cpuhp_slot_states mutex and an empty slot is identified
- * by having no name assigned.
- */
- static int cpuhp_reserve_state(enum cpuhp_state state)
- {
- enum cpuhp_state i;
- for (i = CPUHP_AP_ONLINE_DYN; i <= CPUHP_AP_ONLINE_DYN_END; i++) {
- if (cpuhp_ap_states[i].name)
- continue;
- cpuhp_ap_states[i].name = "Reserved";
- return i;
- }
- WARN(1, "No more dynamic states available for CPU hotplug\n");
- return -ENOSPC;
- }
- int __cpuhp_state_add_instance(enum cpuhp_state state, struct hlist_node *node,
- bool invoke)
- {
- struct cpuhp_step *sp;
- int cpu;
- int ret;
- sp = cpuhp_get_step(state);
- if (sp->multi_instance == false)
- return -EINVAL;
- get_online_cpus();
- mutex_lock(&cpuhp_state_mutex);
- if (!invoke || !sp->startup.multi)
- goto add_node;
- /*
- * Try to call the startup callback for each present cpu
- * depending on the hotplug state of the cpu.
- */
- for_each_present_cpu(cpu) {
- struct cpuhp_cpu_state *st = per_cpu_ptr(&cpuhp_state, cpu);
- int cpustate = st->state;
- if (cpustate < state)
- continue;
- ret = cpuhp_issue_call(cpu, state, true, node);
- if (ret) {
- if (sp->teardown.multi)
- cpuhp_rollback_install(cpu, state, node);
- goto err;
- }
- }
- add_node:
- ret = 0;
- hlist_add_head(node, &sp->list);
- err:
- mutex_unlock(&cpuhp_state_mutex);
- put_online_cpus();
- return ret;
- }
- EXPORT_SYMBOL_GPL(__cpuhp_state_add_instance);
- /**
- * __cpuhp_setup_state - Setup the callbacks for an hotplug machine state
- * @state: The state to setup
- * @invoke: If true, the startup function is invoked for cpus where
- * cpu state >= @state
- * @startup: startup callback function
- * @teardown: teardown callback function
- *
- * Returns 0 if successful, otherwise a proper error code
- */
- int __cpuhp_setup_state(enum cpuhp_state state,
- const char *name, bool invoke,
- int (*startup)(unsigned int cpu),
- int (*teardown)(unsigned int cpu),
- bool multi_instance)
- {
- int cpu, ret = 0;
- int dyn_state = 0;
- if (cpuhp_cb_check(state) || !name)
- return -EINVAL;
- get_online_cpus();
- mutex_lock(&cpuhp_state_mutex);
- /* currently assignments for the ONLINE state are possible */
- if (state == CPUHP_AP_ONLINE_DYN) {
- dyn_state = 1;
- ret = cpuhp_reserve_state(state);
- if (ret < 0)
- goto out;
- state = ret;
- }
- cpuhp_store_callbacks(state, name, startup, teardown, multi_instance);
- if (!invoke || !startup)
- goto out;
- /*
- * Try to call the startup callback for each present cpu
- * depending on the hotplug state of the cpu.
- */
- for_each_present_cpu(cpu) {
- struct cpuhp_cpu_state *st = per_cpu_ptr(&cpuhp_state, cpu);
- int cpustate = st->state;
- if (cpustate < state)
- continue;
- ret = cpuhp_issue_call(cpu, state, true, NULL);
- if (ret) {
- if (teardown)
- cpuhp_rollback_install(cpu, state, NULL);
- cpuhp_store_callbacks(state, NULL, NULL, NULL, false);
- goto out;
- }
- }
- out:
- mutex_unlock(&cpuhp_state_mutex);
- put_online_cpus();
- if (!ret && dyn_state)
- return state;
- return ret;
- }
- EXPORT_SYMBOL(__cpuhp_setup_state);
- int __cpuhp_state_remove_instance(enum cpuhp_state state,
- struct hlist_node *node, bool invoke)
- {
- struct cpuhp_step *sp = cpuhp_get_step(state);
- int cpu;
- BUG_ON(cpuhp_cb_check(state));
- if (!sp->multi_instance)
- return -EINVAL;
- get_online_cpus();
- mutex_lock(&cpuhp_state_mutex);
- if (!invoke || !cpuhp_get_teardown_cb(state))
- goto remove;
- /*
- * Call the teardown callback for each present cpu depending
- * on the hotplug state of the cpu. This function is not
- * allowed to fail currently!
- */
- for_each_present_cpu(cpu) {
- struct cpuhp_cpu_state *st = per_cpu_ptr(&cpuhp_state, cpu);
- int cpustate = st->state;
- if (cpustate >= state)
- cpuhp_issue_call(cpu, state, false, node);
- }
- remove:
- hlist_del(node);
- mutex_unlock(&cpuhp_state_mutex);
- put_online_cpus();
- return 0;
- }
- EXPORT_SYMBOL_GPL(__cpuhp_state_remove_instance);
- /**
- * __cpuhp_remove_state - Remove the callbacks for an hotplug machine state
- * @state: The state to remove
- * @invoke: If true, the teardown function is invoked for cpus where
- * cpu state >= @state
- *
- * The teardown callback is currently not allowed to fail. Think
- * about module removal!
- */
- void __cpuhp_remove_state(enum cpuhp_state state, bool invoke)
- {
- struct cpuhp_step *sp = cpuhp_get_step(state);
- int cpu;
- BUG_ON(cpuhp_cb_check(state));
- get_online_cpus();
- mutex_lock(&cpuhp_state_mutex);
- if (sp->multi_instance) {
- WARN(!hlist_empty(&sp->list),
- "Error: Removing state %d which has instances left.\n",
- state);
- goto remove;
- }
- if (!invoke || !cpuhp_get_teardown_cb(state))
- goto remove;
- /*
- * Call the teardown callback for each present cpu depending
- * on the hotplug state of the cpu. This function is not
- * allowed to fail currently!
- */
- for_each_present_cpu(cpu) {
- struct cpuhp_cpu_state *st = per_cpu_ptr(&cpuhp_state, cpu);
- int cpustate = st->state;
- if (cpustate >= state)
- cpuhp_issue_call(cpu, state, false, NULL);
- }
- remove:
- cpuhp_store_callbacks(state, NULL, NULL, NULL, false);
- mutex_unlock(&cpuhp_state_mutex);
- put_online_cpus();
- }
- EXPORT_SYMBOL(__cpuhp_remove_state);
- #if defined(CONFIG_SYSFS) && defined(CONFIG_HOTPLUG_CPU)
- static ssize_t show_cpuhp_state(struct device *dev,
- struct device_attribute *attr, char *buf)
- {
- struct cpuhp_cpu_state *st = per_cpu_ptr(&cpuhp_state, dev->id);
- return sprintf(buf, "%d\n", st->state);
- }
- static DEVICE_ATTR(state, 0444, show_cpuhp_state, NULL);
- static ssize_t write_cpuhp_target(struct device *dev,
- struct device_attribute *attr,
- const char *buf, size_t count)
- {
- struct cpuhp_cpu_state *st = per_cpu_ptr(&cpuhp_state, dev->id);
- struct cpuhp_step *sp;
- int target, ret;
- ret = kstrtoint(buf, 10, &target);
- if (ret)
- return ret;
- #ifdef CONFIG_CPU_HOTPLUG_STATE_CONTROL
- if (target < CPUHP_OFFLINE || target > CPUHP_ONLINE)
- return -EINVAL;
- #else
- if (target != CPUHP_OFFLINE && target != CPUHP_ONLINE)
- return -EINVAL;
- #endif
- ret = lock_device_hotplug_sysfs();
- if (ret)
- return ret;
- mutex_lock(&cpuhp_state_mutex);
- sp = cpuhp_get_step(target);
- ret = !sp->name || sp->cant_stop ? -EINVAL : 0;
- mutex_unlock(&cpuhp_state_mutex);
- if (ret)
- goto out;
- if (st->state < target)
- ret = do_cpu_up(dev->id, target);
- else
- ret = do_cpu_down(dev->id, target);
- out:
- unlock_device_hotplug();
- return ret ? ret : count;
- }
- static ssize_t show_cpuhp_target(struct device *dev,
- struct device_attribute *attr, char *buf)
- {
- struct cpuhp_cpu_state *st = per_cpu_ptr(&cpuhp_state, dev->id);
- return sprintf(buf, "%d\n", st->target);
- }
- static DEVICE_ATTR(target, 0644, show_cpuhp_target, write_cpuhp_target);
- static struct attribute *cpuhp_cpu_attrs[] = {
- &dev_attr_state.attr,
- &dev_attr_target.attr,
- NULL
- };
- static struct attribute_group cpuhp_cpu_attr_group = {
- .attrs = cpuhp_cpu_attrs,
- .name = "hotplug",
- NULL
- };
- static ssize_t show_cpuhp_states(struct device *dev,
- struct device_attribute *attr, char *buf)
- {
- ssize_t cur, res = 0;
- int i;
- mutex_lock(&cpuhp_state_mutex);
- for (i = CPUHP_OFFLINE; i <= CPUHP_ONLINE; i++) {
- struct cpuhp_step *sp = cpuhp_get_step(i);
- if (sp->name) {
- cur = sprintf(buf, "%3d: %s\n", i, sp->name);
- buf += cur;
- res += cur;
- }
- }
- mutex_unlock(&cpuhp_state_mutex);
- return res;
- }
- static DEVICE_ATTR(states, 0444, show_cpuhp_states, NULL);
- static struct attribute *cpuhp_cpu_root_attrs[] = {
- &dev_attr_states.attr,
- NULL
- };
- static struct attribute_group cpuhp_cpu_root_attr_group = {
- .attrs = cpuhp_cpu_root_attrs,
- .name = "hotplug",
- NULL
- };
- static int __init cpuhp_sysfs_init(void)
- {
- int cpu, ret;
- ret = sysfs_create_group(&cpu_subsys.dev_root->kobj,
- &cpuhp_cpu_root_attr_group);
- if (ret)
- return ret;
- for_each_possible_cpu(cpu) {
- struct device *dev = get_cpu_device(cpu);
- if (!dev)
- continue;
- ret = sysfs_create_group(&dev->kobj, &cpuhp_cpu_attr_group);
- if (ret)
- return ret;
- }
- return 0;
- }
- device_initcall(cpuhp_sysfs_init);
- #endif
- /*
- * cpu_bit_bitmap[] is a special, "compressed" data structure that
- * represents all NR_CPUS bits binary values of 1<<nr.
- *
- * It is used by cpumask_of() to get a constant address to a CPU
- * mask value that has a single bit set only.
- */
- /* cpu_bit_bitmap[0] is empty - so we can back into it */
- #define MASK_DECLARE_1(x) [x+1][0] = (1UL << (x))
- #define MASK_DECLARE_2(x) MASK_DECLARE_1(x), MASK_DECLARE_1(x+1)
- #define MASK_DECLARE_4(x) MASK_DECLARE_2(x), MASK_DECLARE_2(x+2)
- #define MASK_DECLARE_8(x) MASK_DECLARE_4(x), MASK_DECLARE_4(x+4)
- const unsigned long cpu_bit_bitmap[BITS_PER_LONG+1][BITS_TO_LONGS(NR_CPUS)] = {
- MASK_DECLARE_8(0), MASK_DECLARE_8(8),
- MASK_DECLARE_8(16), MASK_DECLARE_8(24),
- #if BITS_PER_LONG > 32
- MASK_DECLARE_8(32), MASK_DECLARE_8(40),
- MASK_DECLARE_8(48), MASK_DECLARE_8(56),
- #endif
- };
- EXPORT_SYMBOL_GPL(cpu_bit_bitmap);
- const DECLARE_BITMAP(cpu_all_bits, NR_CPUS) = CPU_BITS_ALL;
- EXPORT_SYMBOL(cpu_all_bits);
- #ifdef CONFIG_INIT_ALL_POSSIBLE
- struct cpumask __cpu_possible_mask __read_mostly
- = {CPU_BITS_ALL};
- #else
- struct cpumask __cpu_possible_mask __read_mostly;
- #endif
- EXPORT_SYMBOL(__cpu_possible_mask);
- struct cpumask __cpu_online_mask __read_mostly;
- EXPORT_SYMBOL(__cpu_online_mask);
- struct cpumask __cpu_present_mask __read_mostly;
- EXPORT_SYMBOL(__cpu_present_mask);
- struct cpumask __cpu_active_mask __read_mostly;
- EXPORT_SYMBOL(__cpu_active_mask);
- void init_cpu_present(const struct cpumask *src)
- {
- cpumask_copy(&__cpu_present_mask, src);
- }
- void init_cpu_possible(const struct cpumask *src)
- {
- cpumask_copy(&__cpu_possible_mask, src);
- }
- void init_cpu_online(const struct cpumask *src)
- {
- cpumask_copy(&__cpu_online_mask, src);
- }
- /*
- * Activate the first processor.
- */
- void __init boot_cpu_init(void)
- {
- int cpu = smp_processor_id();
- /* Mark the boot cpu "present", "online" etc for SMP and UP case */
- set_cpu_online(cpu, true);
- set_cpu_active(cpu, true);
- set_cpu_present(cpu, true);
- set_cpu_possible(cpu, true);
- }
- /*
- * Must be called _AFTER_ setting up the per_cpu areas
- */
- void __init boot_cpu_state_init(void)
- {
- per_cpu_ptr(&cpuhp_state, smp_processor_id())->state = CPUHP_ONLINE;
- }
|