coupled.c 26 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794
  1. /*
  2. * coupled.c - helper functions to enter the same idle state on multiple cpus
  3. *
  4. * Copyright (c) 2011 Google, Inc.
  5. *
  6. * Author: Colin Cross <ccross@android.com>
  7. *
  8. * This program is free software; you can redistribute it and/or modify
  9. * it under the terms of the GNU General Public License as published by
  10. * the Free Software Foundation; either version 2 of the License, or
  11. * (at your option) any later version.
  12. *
  13. * This program is distributed in the hope that it will be useful, but WITHOUT
  14. * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  15. * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
  16. * more details.
  17. */
  18. #include <linux/kernel.h>
  19. #include <linux/cpu.h>
  20. #include <linux/cpuidle.h>
  21. #include <linux/mutex.h>
  22. #include <linux/sched.h>
  23. #include <linux/slab.h>
  24. #include <linux/spinlock.h>
  25. #include "cpuidle.h"
  26. /**
  27. * DOC: Coupled cpuidle states
  28. *
  29. * On some ARM SMP SoCs (OMAP4460, Tegra 2, and probably more), the
  30. * cpus cannot be independently powered down, either due to
  31. * sequencing restrictions (on Tegra 2, cpu 0 must be the last to
  32. * power down), or due to HW bugs (on OMAP4460, a cpu powering up
  33. * will corrupt the gic state unless the other cpu runs a work
  34. * around). Each cpu has a power state that it can enter without
  35. * coordinating with the other cpu (usually Wait For Interrupt, or
  36. * WFI), and one or more "coupled" power states that affect blocks
  37. * shared between the cpus (L2 cache, interrupt controller, and
  38. * sometimes the whole SoC). Entering a coupled power state must
  39. * be tightly controlled on both cpus.
  40. *
  41. * This file implements a solution, where each cpu will wait in the
  42. * WFI state until all cpus are ready to enter a coupled state, at
  43. * which point the coupled state function will be called on all
  44. * cpus at approximately the same time.
  45. *
  46. * Once all cpus are ready to enter idle, they are woken by an smp
  47. * cross call. At this point, there is a chance that one of the
  48. * cpus will find work to do, and choose not to enter idle. A
  49. * final pass is needed to guarantee that all cpus will call the
  50. * power state enter function at the same time. During this pass,
  51. * each cpu will increment the ready counter, and continue once the
  52. * ready counter matches the number of online coupled cpus. If any
  53. * cpu exits idle, the other cpus will decrement their counter and
  54. * retry.
  55. *
  56. * requested_state stores the deepest coupled idle state each cpu
  57. * is ready for. It is assumed that the states are indexed from
  58. * shallowest (highest power, lowest exit latency) to deepest
  59. * (lowest power, highest exit latency). The requested_state
  60. * variable is not locked. It is only written from the cpu that
  61. * it stores (or by the on/offlining cpu if that cpu is offline),
  62. * and only read after all the cpus are ready for the coupled idle
  63. * state are are no longer updating it.
  64. *
  65. * Three atomic counters are used. alive_count tracks the number
  66. * of cpus in the coupled set that are currently or soon will be
  67. * online. waiting_count tracks the number of cpus that are in
  68. * the waiting loop, in the ready loop, or in the coupled idle state.
  69. * ready_count tracks the number of cpus that are in the ready loop
  70. * or in the coupled idle state.
  71. *
  72. * To use coupled cpuidle states, a cpuidle driver must:
  73. *
  74. * Set struct cpuidle_device.coupled_cpus to the mask of all
  75. * coupled cpus, usually the same as cpu_possible_mask if all cpus
  76. * are part of the same cluster. The coupled_cpus mask must be
  77. * set in the struct cpuidle_device for each cpu.
  78. *
  79. * Set struct cpuidle_device.safe_state to a state that is not a
  80. * coupled state. This is usually WFI.
  81. *
  82. * Set CPUIDLE_FLAG_COUPLED in struct cpuidle_state.flags for each
  83. * state that affects multiple cpus.
  84. *
  85. * Provide a struct cpuidle_state.enter function for each state
  86. * that affects multiple cpus. This function is guaranteed to be
  87. * called on all cpus at approximately the same time. The driver
  88. * should ensure that the cpus all abort together if any cpu tries
  89. * to abort once the function is called. The function should return
  90. * with interrupts still disabled.
  91. */
  92. /**
  93. * struct cpuidle_coupled - data for set of cpus that share a coupled idle state
  94. * @coupled_cpus: mask of cpus that are part of the coupled set
  95. * @requested_state: array of requested states for cpus in the coupled set
  96. * @ready_waiting_counts: combined count of cpus in ready or waiting loops
  97. * @online_count: count of cpus that are online
  98. * @refcnt: reference count of cpuidle devices that are using this struct
  99. * @prevent: flag to prevent coupled idle while a cpu is hotplugging
  100. */
  101. struct cpuidle_coupled {
  102. cpumask_t coupled_cpus;
  103. int requested_state[NR_CPUS];
  104. atomic_t ready_waiting_counts;
  105. atomic_t abort_barrier;
  106. int online_count;
  107. int refcnt;
  108. int prevent;
  109. };
  110. #define WAITING_BITS 16
  111. #define MAX_WAITING_CPUS (1 << WAITING_BITS)
  112. #define WAITING_MASK (MAX_WAITING_CPUS - 1)
  113. #define READY_MASK (~WAITING_MASK)
  114. #define CPUIDLE_COUPLED_NOT_IDLE (-1)
  115. static DEFINE_MUTEX(cpuidle_coupled_lock);
  116. static DEFINE_PER_CPU(struct call_single_data, cpuidle_coupled_poke_cb);
  117. /*
  118. * The cpuidle_coupled_poke_pending mask is used to avoid calling
  119. * __smp_call_function_single with the per cpu call_single_data struct already
  120. * in use. This prevents a deadlock where two cpus are waiting for each others
  121. * call_single_data struct to be available
  122. */
  123. static cpumask_t cpuidle_coupled_poke_pending;
  124. /*
  125. * The cpuidle_coupled_poked mask is used to ensure that each cpu has been poked
  126. * once to minimize entering the ready loop with a poke pending, which would
  127. * require aborting and retrying.
  128. */
  129. static cpumask_t cpuidle_coupled_poked;
  130. /**
  131. * cpuidle_coupled_parallel_barrier - synchronize all online coupled cpus
  132. * @dev: cpuidle_device of the calling cpu
  133. * @a: atomic variable to hold the barrier
  134. *
  135. * No caller to this function will return from this function until all online
  136. * cpus in the same coupled group have called this function. Once any caller
  137. * has returned from this function, the barrier is immediately available for
  138. * reuse.
  139. *
  140. * The atomic variable a must be initialized to 0 before any cpu calls
  141. * this function, will be reset to 0 before any cpu returns from this function.
  142. *
  143. * Must only be called from within a coupled idle state handler
  144. * (state.enter when state.flags has CPUIDLE_FLAG_COUPLED set).
  145. *
  146. * Provides full smp barrier semantics before and after calling.
  147. */
  148. void cpuidle_coupled_parallel_barrier(struct cpuidle_device *dev, atomic_t *a)
  149. {
  150. int n = dev->coupled->online_count;
  151. smp_mb__before_atomic_inc();
  152. atomic_inc(a);
  153. while (atomic_read(a) < n)
  154. cpu_relax();
  155. if (atomic_inc_return(a) == n * 2) {
  156. atomic_set(a, 0);
  157. return;
  158. }
  159. while (atomic_read(a) > n)
  160. cpu_relax();
  161. }
  162. /**
  163. * cpuidle_state_is_coupled - check if a state is part of a coupled set
  164. * @dev: struct cpuidle_device for the current cpu
  165. * @drv: struct cpuidle_driver for the platform
  166. * @state: index of the target state in drv->states
  167. *
  168. * Returns true if the target state is coupled with cpus besides this one
  169. */
  170. bool cpuidle_state_is_coupled(struct cpuidle_device *dev,
  171. struct cpuidle_driver *drv, int state)
  172. {
  173. return drv->states[state].flags & CPUIDLE_FLAG_COUPLED;
  174. }
  175. /**
  176. * cpuidle_coupled_set_ready - mark a cpu as ready
  177. * @coupled: the struct coupled that contains the current cpu
  178. */
  179. static inline void cpuidle_coupled_set_ready(struct cpuidle_coupled *coupled)
  180. {
  181. atomic_add(MAX_WAITING_CPUS, &coupled->ready_waiting_counts);
  182. }
  183. /**
  184. * cpuidle_coupled_set_not_ready - mark a cpu as not ready
  185. * @coupled: the struct coupled that contains the current cpu
  186. *
  187. * Decrements the ready counter, unless the ready (and thus the waiting) counter
  188. * is equal to the number of online cpus. Prevents a race where one cpu
  189. * decrements the waiting counter and then re-increments it just before another
  190. * cpu has decremented its ready counter, leading to the ready counter going
  191. * down from the number of online cpus without going through the coupled idle
  192. * state.
  193. *
  194. * Returns 0 if the counter was decremented successfully, -EINVAL if the ready
  195. * counter was equal to the number of online cpus.
  196. */
  197. static
  198. inline int cpuidle_coupled_set_not_ready(struct cpuidle_coupled *coupled)
  199. {
  200. int all;
  201. int ret;
  202. all = coupled->online_count | (coupled->online_count << WAITING_BITS);
  203. ret = atomic_add_unless(&coupled->ready_waiting_counts,
  204. -MAX_WAITING_CPUS, all);
  205. return ret ? 0 : -EINVAL;
  206. }
  207. /**
  208. * cpuidle_coupled_no_cpus_ready - check if no cpus in a coupled set are ready
  209. * @coupled: the struct coupled that contains the current cpu
  210. *
  211. * Returns true if all of the cpus in a coupled set are out of the ready loop.
  212. */
  213. static inline int cpuidle_coupled_no_cpus_ready(struct cpuidle_coupled *coupled)
  214. {
  215. int r = atomic_read(&coupled->ready_waiting_counts) >> WAITING_BITS;
  216. return r == 0;
  217. }
  218. /**
  219. * cpuidle_coupled_cpus_ready - check if all cpus in a coupled set are ready
  220. * @coupled: the struct coupled that contains the current cpu
  221. *
  222. * Returns true if all cpus coupled to this target state are in the ready loop
  223. */
  224. static inline bool cpuidle_coupled_cpus_ready(struct cpuidle_coupled *coupled)
  225. {
  226. int r = atomic_read(&coupled->ready_waiting_counts) >> WAITING_BITS;
  227. return r == coupled->online_count;
  228. }
  229. /**
  230. * cpuidle_coupled_cpus_waiting - check if all cpus in a coupled set are waiting
  231. * @coupled: the struct coupled that contains the current cpu
  232. *
  233. * Returns true if all cpus coupled to this target state are in the wait loop
  234. */
  235. static inline bool cpuidle_coupled_cpus_waiting(struct cpuidle_coupled *coupled)
  236. {
  237. int w = atomic_read(&coupled->ready_waiting_counts) & WAITING_MASK;
  238. return w == coupled->online_count;
  239. }
  240. /**
  241. * cpuidle_coupled_no_cpus_waiting - check if no cpus in coupled set are waiting
  242. * @coupled: the struct coupled that contains the current cpu
  243. *
  244. * Returns true if all of the cpus in a coupled set are out of the waiting loop.
  245. */
  246. static inline int cpuidle_coupled_no_cpus_waiting(struct cpuidle_coupled *coupled)
  247. {
  248. int w = atomic_read(&coupled->ready_waiting_counts) & WAITING_MASK;
  249. return w == 0;
  250. }
  251. /**
  252. * cpuidle_coupled_get_state - determine the deepest idle state
  253. * @dev: struct cpuidle_device for this cpu
  254. * @coupled: the struct coupled that contains the current cpu
  255. *
  256. * Returns the deepest idle state that all coupled cpus can enter
  257. */
  258. static inline int cpuidle_coupled_get_state(struct cpuidle_device *dev,
  259. struct cpuidle_coupled *coupled)
  260. {
  261. int i;
  262. int state = INT_MAX;
  263. /*
  264. * Read barrier ensures that read of requested_state is ordered after
  265. * reads of ready_count. Matches the write barriers
  266. * cpuidle_set_state_waiting.
  267. */
  268. smp_rmb();
  269. for_each_cpu_mask(i, coupled->coupled_cpus)
  270. if (cpu_online(i) && coupled->requested_state[i] < state)
  271. state = coupled->requested_state[i];
  272. return state;
  273. }
  274. static void cpuidle_coupled_handle_poke(void *info)
  275. {
  276. int cpu = (unsigned long)info;
  277. cpumask_set_cpu(cpu, &cpuidle_coupled_poked);
  278. cpumask_clear_cpu(cpu, &cpuidle_coupled_poke_pending);
  279. }
  280. /**
  281. * cpuidle_coupled_poke - wake up a cpu that may be waiting
  282. * @cpu: target cpu
  283. *
  284. * Ensures that the target cpu exits it's waiting idle state (if it is in it)
  285. * and will see updates to waiting_count before it re-enters it's waiting idle
  286. * state.
  287. *
  288. * If cpuidle_coupled_poked_mask is already set for the target cpu, that cpu
  289. * either has or will soon have a pending IPI that will wake it out of idle,
  290. * or it is currently processing the IPI and is not in idle.
  291. */
  292. static void cpuidle_coupled_poke(int cpu)
  293. {
  294. struct call_single_data *csd = &per_cpu(cpuidle_coupled_poke_cb, cpu);
  295. if (!cpumask_test_and_set_cpu(cpu, &cpuidle_coupled_poke_pending))
  296. __smp_call_function_single(cpu, csd, 0);
  297. }
  298. /**
  299. * cpuidle_coupled_poke_others - wake up all other cpus that may be waiting
  300. * @dev: struct cpuidle_device for this cpu
  301. * @coupled: the struct coupled that contains the current cpu
  302. *
  303. * Calls cpuidle_coupled_poke on all other online cpus.
  304. */
  305. static void cpuidle_coupled_poke_others(int this_cpu,
  306. struct cpuidle_coupled *coupled)
  307. {
  308. int cpu;
  309. for_each_cpu_mask(cpu, coupled->coupled_cpus)
  310. if (cpu != this_cpu && cpu_online(cpu))
  311. cpuidle_coupled_poke(cpu);
  312. }
  313. /**
  314. * cpuidle_coupled_set_waiting - mark this cpu as in the wait loop
  315. * @dev: struct cpuidle_device for this cpu
  316. * @coupled: the struct coupled that contains the current cpu
  317. * @next_state: the index in drv->states of the requested state for this cpu
  318. *
  319. * Updates the requested idle state for the specified cpuidle device.
  320. * Returns the number of waiting cpus.
  321. */
  322. static int cpuidle_coupled_set_waiting(int cpu,
  323. struct cpuidle_coupled *coupled, int next_state)
  324. {
  325. coupled->requested_state[cpu] = next_state;
  326. /*
  327. * The atomic_inc_return provides a write barrier to order the write
  328. * to requested_state with the later write that increments ready_count.
  329. */
  330. return atomic_inc_return(&coupled->ready_waiting_counts) & WAITING_MASK;
  331. }
  332. /**
  333. * cpuidle_coupled_set_not_waiting - mark this cpu as leaving the wait loop
  334. * @dev: struct cpuidle_device for this cpu
  335. * @coupled: the struct coupled that contains the current cpu
  336. *
  337. * Removes the requested idle state for the specified cpuidle device.
  338. */
  339. static void cpuidle_coupled_set_not_waiting(int cpu,
  340. struct cpuidle_coupled *coupled)
  341. {
  342. /*
  343. * Decrementing waiting count can race with incrementing it in
  344. * cpuidle_coupled_set_waiting, but that's OK. Worst case, some
  345. * cpus will increment ready_count and then spin until they
  346. * notice that this cpu has cleared it's requested_state.
  347. */
  348. atomic_dec(&coupled->ready_waiting_counts);
  349. coupled->requested_state[cpu] = CPUIDLE_COUPLED_NOT_IDLE;
  350. }
  351. /**
  352. * cpuidle_coupled_set_done - mark this cpu as leaving the ready loop
  353. * @cpu: the current cpu
  354. * @coupled: the struct coupled that contains the current cpu
  355. *
  356. * Marks this cpu as no longer in the ready and waiting loops. Decrements
  357. * the waiting count first to prevent another cpu looping back in and seeing
  358. * this cpu as waiting just before it exits idle.
  359. */
  360. static void cpuidle_coupled_set_done(int cpu, struct cpuidle_coupled *coupled)
  361. {
  362. cpuidle_coupled_set_not_waiting(cpu, coupled);
  363. atomic_sub(MAX_WAITING_CPUS, &coupled->ready_waiting_counts);
  364. }
  365. /**
  366. * cpuidle_coupled_clear_pokes - spin until the poke interrupt is processed
  367. * @cpu - this cpu
  368. *
  369. * Turns on interrupts and spins until any outstanding poke interrupts have
  370. * been processed and the poke bit has been cleared.
  371. *
  372. * Other interrupts may also be processed while interrupts are enabled, so
  373. * need_resched() must be tested after this function returns to make sure
  374. * the interrupt didn't schedule work that should take the cpu out of idle.
  375. *
  376. * Returns 0 if no poke was pending, 1 if a poke was cleared.
  377. */
  378. static int cpuidle_coupled_clear_pokes(int cpu)
  379. {
  380. if (!cpumask_test_cpu(cpu, &cpuidle_coupled_poke_pending))
  381. return 0;
  382. local_irq_enable();
  383. while (cpumask_test_cpu(cpu, &cpuidle_coupled_poke_pending))
  384. cpu_relax();
  385. local_irq_disable();
  386. return 1;
  387. }
  388. static bool cpuidle_coupled_any_pokes_pending(struct cpuidle_coupled *coupled)
  389. {
  390. cpumask_t cpus;
  391. int ret;
  392. cpumask_and(&cpus, cpu_online_mask, &coupled->coupled_cpus);
  393. ret = cpumask_and(&cpus, &cpuidle_coupled_poke_pending, &cpus);
  394. return ret;
  395. }
  396. /**
  397. * cpuidle_enter_state_coupled - attempt to enter a state with coupled cpus
  398. * @dev: struct cpuidle_device for the current cpu
  399. * @drv: struct cpuidle_driver for the platform
  400. * @next_state: index of the requested state in drv->states
  401. *
  402. * Coordinate with coupled cpus to enter the target state. This is a two
  403. * stage process. In the first stage, the cpus are operating independently,
  404. * and may call into cpuidle_enter_state_coupled at completely different times.
  405. * To save as much power as possible, the first cpus to call this function will
  406. * go to an intermediate state (the cpuidle_device's safe state), and wait for
  407. * all the other cpus to call this function. Once all coupled cpus are idle,
  408. * the second stage will start. Each coupled cpu will spin until all cpus have
  409. * guaranteed that they will call the target_state.
  410. *
  411. * This function must be called with interrupts disabled. It may enable
  412. * interrupts while preparing for idle, and it will always return with
  413. * interrupts enabled.
  414. */
  415. int cpuidle_enter_state_coupled(struct cpuidle_device *dev,
  416. struct cpuidle_driver *drv, int next_state)
  417. {
  418. int entered_state = -1;
  419. struct cpuidle_coupled *coupled = dev->coupled;
  420. int w;
  421. if (!coupled)
  422. return -EINVAL;
  423. while (coupled->prevent) {
  424. cpuidle_coupled_clear_pokes(dev->cpu);
  425. if (need_resched()) {
  426. local_irq_enable();
  427. return entered_state;
  428. }
  429. entered_state = cpuidle_enter_state(dev, drv,
  430. dev->safe_state_index);
  431. local_irq_disable();
  432. }
  433. /* Read barrier ensures online_count is read after prevent is cleared */
  434. smp_rmb();
  435. reset:
  436. cpumask_clear_cpu(dev->cpu, &cpuidle_coupled_poked);
  437. w = cpuidle_coupled_set_waiting(dev->cpu, coupled, next_state);
  438. /*
  439. * If this is the last cpu to enter the waiting state, poke
  440. * all the other cpus out of their waiting state so they can
  441. * enter a deeper state. This can race with one of the cpus
  442. * exiting the waiting state due to an interrupt and
  443. * decrementing waiting_count, see comment below.
  444. */
  445. if (w == coupled->online_count) {
  446. cpumask_set_cpu(dev->cpu, &cpuidle_coupled_poked);
  447. cpuidle_coupled_poke_others(dev->cpu, coupled);
  448. }
  449. retry:
  450. /*
  451. * Wait for all coupled cpus to be idle, using the deepest state
  452. * allowed for a single cpu. If this was not the poking cpu, wait
  453. * for at least one poke before leaving to avoid a race where
  454. * two cpus could arrive at the waiting loop at the same time,
  455. * but the first of the two to arrive could skip the loop without
  456. * processing the pokes from the last to arrive.
  457. */
  458. while (!cpuidle_coupled_cpus_waiting(coupled) ||
  459. !cpumask_test_cpu(dev->cpu, &cpuidle_coupled_poked)) {
  460. if (cpuidle_coupled_clear_pokes(dev->cpu))
  461. continue;
  462. if (need_resched()) {
  463. cpuidle_coupled_set_not_waiting(dev->cpu, coupled);
  464. goto out;
  465. }
  466. if (coupled->prevent) {
  467. cpuidle_coupled_set_not_waiting(dev->cpu, coupled);
  468. goto out;
  469. }
  470. entered_state = cpuidle_enter_state(dev, drv,
  471. dev->safe_state_index);
  472. local_irq_disable();
  473. }
  474. cpuidle_coupled_clear_pokes(dev->cpu);
  475. if (need_resched()) {
  476. cpuidle_coupled_set_not_waiting(dev->cpu, coupled);
  477. goto out;
  478. }
  479. /*
  480. * Make sure final poke status for this cpu is visible before setting
  481. * cpu as ready.
  482. */
  483. smp_wmb();
  484. /*
  485. * All coupled cpus are probably idle. There is a small chance that
  486. * one of the other cpus just became active. Increment the ready count,
  487. * and spin until all coupled cpus have incremented the counter. Once a
  488. * cpu has incremented the ready counter, it cannot abort idle and must
  489. * spin until either all cpus have incremented the ready counter, or
  490. * another cpu leaves idle and decrements the waiting counter.
  491. */
  492. cpuidle_coupled_set_ready(coupled);
  493. while (!cpuidle_coupled_cpus_ready(coupled)) {
  494. /* Check if any other cpus bailed out of idle. */
  495. if (!cpuidle_coupled_cpus_waiting(coupled))
  496. if (!cpuidle_coupled_set_not_ready(coupled))
  497. goto retry;
  498. cpu_relax();
  499. }
  500. /*
  501. * Make sure read of all cpus ready is done before reading pending pokes
  502. */
  503. smp_rmb();
  504. /*
  505. * There is a small chance that a cpu left and reentered idle after this
  506. * cpu saw that all cpus were waiting. The cpu that reentered idle will
  507. * have sent this cpu a poke, which will still be pending after the
  508. * ready loop. The pending interrupt may be lost by the interrupt
  509. * controller when entering the deep idle state. It's not possible to
  510. * clear a pending interrupt without turning interrupts on and handling
  511. * it, and it's too late to turn on interrupts here, so reset the
  512. * coupled idle state of all cpus and retry.
  513. */
  514. if (cpuidle_coupled_any_pokes_pending(coupled)) {
  515. cpuidle_coupled_set_done(dev->cpu, coupled);
  516. /* Wait for all cpus to see the pending pokes */
  517. cpuidle_coupled_parallel_barrier(dev, &coupled->abort_barrier);
  518. goto reset;
  519. }
  520. /* all cpus have acked the coupled state */
  521. next_state = cpuidle_coupled_get_state(dev, coupled);
  522. entered_state = cpuidle_enter_state(dev, drv, next_state);
  523. cpuidle_coupled_set_done(dev->cpu, coupled);
  524. out:
  525. /*
  526. * Normal cpuidle states are expected to return with irqs enabled.
  527. * That leads to an inefficiency where a cpu receiving an interrupt
  528. * that brings it out of idle will process that interrupt before
  529. * exiting the idle enter function and decrementing ready_count. All
  530. * other cpus will need to spin waiting for the cpu that is processing
  531. * the interrupt. If the driver returns with interrupts disabled,
  532. * all other cpus will loop back into the safe idle state instead of
  533. * spinning, saving power.
  534. *
  535. * Calling local_irq_enable here allows coupled states to return with
  536. * interrupts disabled, but won't cause problems for drivers that
  537. * exit with interrupts enabled.
  538. */
  539. local_irq_enable();
  540. /*
  541. * Wait until all coupled cpus have exited idle. There is no risk that
  542. * a cpu exits and re-enters the ready state because this cpu has
  543. * already decremented its waiting_count.
  544. */
  545. while (!cpuidle_coupled_no_cpus_ready(coupled))
  546. cpu_relax();
  547. return entered_state;
  548. }
  549. static void cpuidle_coupled_update_online_cpus(struct cpuidle_coupled *coupled)
  550. {
  551. cpumask_t cpus;
  552. cpumask_and(&cpus, cpu_online_mask, &coupled->coupled_cpus);
  553. coupled->online_count = cpumask_weight(&cpus);
  554. }
  555. /**
  556. * cpuidle_coupled_register_device - register a coupled cpuidle device
  557. * @dev: struct cpuidle_device for the current cpu
  558. *
  559. * Called from cpuidle_register_device to handle coupled idle init. Finds the
  560. * cpuidle_coupled struct for this set of coupled cpus, or creates one if none
  561. * exists yet.
  562. */
  563. int cpuidle_coupled_register_device(struct cpuidle_device *dev)
  564. {
  565. int cpu;
  566. struct cpuidle_device *other_dev;
  567. struct call_single_data *csd;
  568. struct cpuidle_coupled *coupled;
  569. if (cpumask_empty(&dev->coupled_cpus))
  570. return 0;
  571. for_each_cpu_mask(cpu, dev->coupled_cpus) {
  572. other_dev = per_cpu(cpuidle_devices, cpu);
  573. if (other_dev && other_dev->coupled) {
  574. coupled = other_dev->coupled;
  575. goto have_coupled;
  576. }
  577. }
  578. /* No existing coupled info found, create a new one */
  579. coupled = kzalloc(sizeof(struct cpuidle_coupled), GFP_KERNEL);
  580. if (!coupled)
  581. return -ENOMEM;
  582. coupled->coupled_cpus = dev->coupled_cpus;
  583. have_coupled:
  584. dev->coupled = coupled;
  585. if (WARN_ON(!cpumask_equal(&dev->coupled_cpus, &coupled->coupled_cpus)))
  586. coupled->prevent++;
  587. cpuidle_coupled_update_online_cpus(coupled);
  588. coupled->refcnt++;
  589. csd = &per_cpu(cpuidle_coupled_poke_cb, dev->cpu);
  590. csd->func = cpuidle_coupled_handle_poke;
  591. csd->info = (void *)(unsigned long)dev->cpu;
  592. return 0;
  593. }
  594. /**
  595. * cpuidle_coupled_unregister_device - unregister a coupled cpuidle device
  596. * @dev: struct cpuidle_device for the current cpu
  597. *
  598. * Called from cpuidle_unregister_device to tear down coupled idle. Removes the
  599. * cpu from the coupled idle set, and frees the cpuidle_coupled_info struct if
  600. * this was the last cpu in the set.
  601. */
  602. void cpuidle_coupled_unregister_device(struct cpuidle_device *dev)
  603. {
  604. struct cpuidle_coupled *coupled = dev->coupled;
  605. if (cpumask_empty(&dev->coupled_cpus))
  606. return;
  607. if (--coupled->refcnt)
  608. kfree(coupled);
  609. dev->coupled = NULL;
  610. }
  611. /**
  612. * cpuidle_coupled_prevent_idle - prevent cpus from entering a coupled state
  613. * @coupled: the struct coupled that contains the cpu that is changing state
  614. *
  615. * Disables coupled cpuidle on a coupled set of cpus. Used to ensure that
  616. * cpu_online_mask doesn't change while cpus are coordinating coupled idle.
  617. */
  618. static void cpuidle_coupled_prevent_idle(struct cpuidle_coupled *coupled)
  619. {
  620. int cpu = get_cpu();
  621. /* Force all cpus out of the waiting loop. */
  622. coupled->prevent++;
  623. cpuidle_coupled_poke_others(cpu, coupled);
  624. put_cpu();
  625. while (!cpuidle_coupled_no_cpus_waiting(coupled))
  626. cpu_relax();
  627. }
  628. /**
  629. * cpuidle_coupled_allow_idle - allows cpus to enter a coupled state
  630. * @coupled: the struct coupled that contains the cpu that is changing state
  631. *
  632. * Enables coupled cpuidle on a coupled set of cpus. Used to ensure that
  633. * cpu_online_mask doesn't change while cpus are coordinating coupled idle.
  634. */
  635. static void cpuidle_coupled_allow_idle(struct cpuidle_coupled *coupled)
  636. {
  637. int cpu = get_cpu();
  638. /*
  639. * Write barrier ensures readers see the new online_count when they
  640. * see prevent == 0.
  641. */
  642. smp_wmb();
  643. coupled->prevent--;
  644. /* Force cpus out of the prevent loop. */
  645. cpuidle_coupled_poke_others(cpu, coupled);
  646. put_cpu();
  647. }
  648. /**
  649. * cpuidle_coupled_cpu_notify - notifier called during hotplug transitions
  650. * @nb: notifier block
  651. * @action: hotplug transition
  652. * @hcpu: target cpu number
  653. *
  654. * Called when a cpu is brought on or offline using hotplug. Updates the
  655. * coupled cpu set appropriately
  656. */
  657. static int cpuidle_coupled_cpu_notify(struct notifier_block *nb,
  658. unsigned long action, void *hcpu)
  659. {
  660. int cpu = (unsigned long)hcpu;
  661. struct cpuidle_device *dev;
  662. switch (action & ~CPU_TASKS_FROZEN) {
  663. case CPU_UP_PREPARE:
  664. case CPU_DOWN_PREPARE:
  665. case CPU_ONLINE:
  666. case CPU_DEAD:
  667. case CPU_UP_CANCELED:
  668. case CPU_DOWN_FAILED:
  669. break;
  670. default:
  671. return NOTIFY_OK;
  672. }
  673. mutex_lock(&cpuidle_lock);
  674. dev = per_cpu(cpuidle_devices, cpu);
  675. if (!dev || !dev->coupled)
  676. goto out;
  677. switch (action & ~CPU_TASKS_FROZEN) {
  678. case CPU_UP_PREPARE:
  679. case CPU_DOWN_PREPARE:
  680. cpuidle_coupled_prevent_idle(dev->coupled);
  681. break;
  682. case CPU_ONLINE:
  683. case CPU_DEAD:
  684. cpuidle_coupled_update_online_cpus(dev->coupled);
  685. /* Fall through */
  686. case CPU_UP_CANCELED:
  687. case CPU_DOWN_FAILED:
  688. cpuidle_coupled_allow_idle(dev->coupled);
  689. break;
  690. }
  691. out:
  692. mutex_unlock(&cpuidle_lock);
  693. return NOTIFY_OK;
  694. }
  695. static struct notifier_block cpuidle_coupled_cpu_notifier = {
  696. .notifier_call = cpuidle_coupled_cpu_notify,
  697. };
  698. static int __init cpuidle_coupled_init(void)
  699. {
  700. return register_cpu_notifier(&cpuidle_coupled_cpu_notifier);
  701. }
  702. core_initcall(cpuidle_coupled_init);