coupled.c 25 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786
  1. /*
  2. * coupled.c - helper functions to enter the same idle state on multiple cpus
  3. *
  4. * Copyright (c) 2011 Google, Inc.
  5. *
  6. * Author: Colin Cross <ccross@android.com>
  7. *
  8. * This program is free software; you can redistribute it and/or modify
  9. * it under the terms of the GNU General Public License as published by
  10. * the Free Software Foundation; either version 2 of the License, or
  11. * (at your option) any later version.
  12. *
  13. * This program is distributed in the hope that it will be useful, but WITHOUT
  14. * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  15. * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
  16. * more details.
  17. */
  18. #include <linux/kernel.h>
  19. #include <linux/cpu.h>
  20. #include <linux/cpuidle.h>
  21. #include <linux/mutex.h>
  22. #include <linux/sched.h>
  23. #include <linux/slab.h>
  24. #include <linux/spinlock.h>
  25. #include "cpuidle.h"
  26. /**
  27. * DOC: Coupled cpuidle states
  28. *
  29. * On some ARM SMP SoCs (OMAP4460, Tegra 2, and probably more), the
  30. * cpus cannot be independently powered down, either due to
  31. * sequencing restrictions (on Tegra 2, cpu 0 must be the last to
  32. * power down), or due to HW bugs (on OMAP4460, a cpu powering up
  33. * will corrupt the gic state unless the other cpu runs a work
  34. * around). Each cpu has a power state that it can enter without
  35. * coordinating with the other cpu (usually Wait For Interrupt, or
  36. * WFI), and one or more "coupled" power states that affect blocks
  37. * shared between the cpus (L2 cache, interrupt controller, and
  38. * sometimes the whole SoC). Entering a coupled power state must
  39. * be tightly controlled on both cpus.
  40. *
  41. * This file implements a solution, where each cpu will wait in the
  42. * WFI state until all cpus are ready to enter a coupled state, at
  43. * which point the coupled state function will be called on all
  44. * cpus at approximately the same time.
  45. *
  46. * Once all cpus are ready to enter idle, they are woken by an smp
  47. * cross call. At this point, there is a chance that one of the
  48. * cpus will find work to do, and choose not to enter idle. A
  49. * final pass is needed to guarantee that all cpus will call the
  50. * power state enter function at the same time. During this pass,
  51. * each cpu will increment the ready counter, and continue once the
  52. * ready counter matches the number of online coupled cpus. If any
  53. * cpu exits idle, the other cpus will decrement their counter and
  54. * retry.
  55. *
  56. * requested_state stores the deepest coupled idle state each cpu
  57. * is ready for. It is assumed that the states are indexed from
  58. * shallowest (highest power, lowest exit latency) to deepest
  59. * (lowest power, highest exit latency). The requested_state
  60. * variable is not locked. It is only written from the cpu that
  61. * it stores (or by the on/offlining cpu if that cpu is offline),
  62. * and only read after all the cpus are ready for the coupled idle
  63. * state are are no longer updating it.
  64. *
  65. * Three atomic counters are used. alive_count tracks the number
  66. * of cpus in the coupled set that are currently or soon will be
  67. * online. waiting_count tracks the number of cpus that are in
  68. * the waiting loop, in the ready loop, or in the coupled idle state.
  69. * ready_count tracks the number of cpus that are in the ready loop
  70. * or in the coupled idle state.
  71. *
  72. * To use coupled cpuidle states, a cpuidle driver must:
  73. *
  74. * Set struct cpuidle_device.coupled_cpus to the mask of all
  75. * coupled cpus, usually the same as cpu_possible_mask if all cpus
  76. * are part of the same cluster. The coupled_cpus mask must be
  77. * set in the struct cpuidle_device for each cpu.
  78. *
  79. * Set struct cpuidle_device.safe_state to a state that is not a
  80. * coupled state. This is usually WFI.
  81. *
  82. * Set CPUIDLE_FLAG_COUPLED in struct cpuidle_state.flags for each
  83. * state that affects multiple cpus.
  84. *
  85. * Provide a struct cpuidle_state.enter function for each state
  86. * that affects multiple cpus. This function is guaranteed to be
  87. * called on all cpus at approximately the same time. The driver
  88. * should ensure that the cpus all abort together if any cpu tries
  89. * to abort once the function is called. The function should return
  90. * with interrupts still disabled.
  91. */
  92. /**
  93. * struct cpuidle_coupled - data for set of cpus that share a coupled idle state
  94. * @coupled_cpus: mask of cpus that are part of the coupled set
  95. * @requested_state: array of requested states for cpus in the coupled set
  96. * @ready_waiting_counts: combined count of cpus in ready or waiting loops
  97. * @online_count: count of cpus that are online
  98. * @refcnt: reference count of cpuidle devices that are using this struct
  99. * @prevent: flag to prevent coupled idle while a cpu is hotplugging
  100. */
  101. struct cpuidle_coupled {
  102. cpumask_t coupled_cpus;
  103. int requested_state[NR_CPUS];
  104. atomic_t ready_waiting_counts;
  105. atomic_t abort_barrier;
  106. int online_count;
  107. int refcnt;
  108. int prevent;
  109. };
  110. #define WAITING_BITS 16
  111. #define MAX_WAITING_CPUS (1 << WAITING_BITS)
  112. #define WAITING_MASK (MAX_WAITING_CPUS - 1)
  113. #define READY_MASK (~WAITING_MASK)
  114. #define CPUIDLE_COUPLED_NOT_IDLE (-1)
  115. static DEFINE_MUTEX(cpuidle_coupled_lock);
  116. static DEFINE_PER_CPU(struct call_single_data, cpuidle_coupled_poke_cb);
  117. /*
  118. * The cpuidle_coupled_poke_pending mask is used to avoid calling
  119. * __smp_call_function_single with the per cpu call_single_data struct already
  120. * in use. This prevents a deadlock where two cpus are waiting for each others
  121. * call_single_data struct to be available
  122. */
  123. static cpumask_t cpuidle_coupled_poke_pending;
  124. /*
  125. * The cpuidle_coupled_poked mask is used to ensure that each cpu has been poked
  126. * once to minimize entering the ready loop with a poke pending, which would
  127. * require aborting and retrying.
  128. */
  129. static cpumask_t cpuidle_coupled_poked;
  130. /**
  131. * cpuidle_coupled_parallel_barrier - synchronize all online coupled cpus
  132. * @dev: cpuidle_device of the calling cpu
  133. * @a: atomic variable to hold the barrier
  134. *
  135. * No caller to this function will return from this function until all online
  136. * cpus in the same coupled group have called this function. Once any caller
  137. * has returned from this function, the barrier is immediately available for
  138. * reuse.
  139. *
  140. * The atomic variable a must be initialized to 0 before any cpu calls
  141. * this function, will be reset to 0 before any cpu returns from this function.
  142. *
  143. * Must only be called from within a coupled idle state handler
  144. * (state.enter when state.flags has CPUIDLE_FLAG_COUPLED set).
  145. *
  146. * Provides full smp barrier semantics before and after calling.
  147. */
  148. void cpuidle_coupled_parallel_barrier(struct cpuidle_device *dev, atomic_t *a)
  149. {
  150. int n = dev->coupled->online_count;
  151. smp_mb__before_atomic_inc();
  152. atomic_inc(a);
  153. while (atomic_read(a) < n)
  154. cpu_relax();
  155. if (atomic_inc_return(a) == n * 2) {
  156. atomic_set(a, 0);
  157. return;
  158. }
  159. while (atomic_read(a) > n)
  160. cpu_relax();
  161. }
  162. /**
  163. * cpuidle_state_is_coupled - check if a state is part of a coupled set
  164. * @dev: struct cpuidle_device for the current cpu
  165. * @drv: struct cpuidle_driver for the platform
  166. * @state: index of the target state in drv->states
  167. *
  168. * Returns true if the target state is coupled with cpus besides this one
  169. */
  170. bool cpuidle_state_is_coupled(struct cpuidle_device *dev,
  171. struct cpuidle_driver *drv, int state)
  172. {
  173. return drv->states[state].flags & CPUIDLE_FLAG_COUPLED;
  174. }
  175. /**
  176. * cpuidle_coupled_set_ready - mark a cpu as ready
  177. * @coupled: the struct coupled that contains the current cpu
  178. */
  179. static inline void cpuidle_coupled_set_ready(struct cpuidle_coupled *coupled)
  180. {
  181. atomic_add(MAX_WAITING_CPUS, &coupled->ready_waiting_counts);
  182. }
  183. /**
  184. * cpuidle_coupled_set_not_ready - mark a cpu as not ready
  185. * @coupled: the struct coupled that contains the current cpu
  186. *
  187. * Decrements the ready counter, unless the ready (and thus the waiting) counter
  188. * is equal to the number of online cpus. Prevents a race where one cpu
  189. * decrements the waiting counter and then re-increments it just before another
  190. * cpu has decremented its ready counter, leading to the ready counter going
  191. * down from the number of online cpus without going through the coupled idle
  192. * state.
  193. *
  194. * Returns 0 if the counter was decremented successfully, -EINVAL if the ready
  195. * counter was equal to the number of online cpus.
  196. */
  197. static
  198. inline int cpuidle_coupled_set_not_ready(struct cpuidle_coupled *coupled)
  199. {
  200. int all;
  201. int ret;
  202. all = coupled->online_count | (coupled->online_count << WAITING_BITS);
  203. ret = atomic_add_unless(&coupled->ready_waiting_counts,
  204. -MAX_WAITING_CPUS, all);
  205. return ret ? 0 : -EINVAL;
  206. }
  207. /**
  208. * cpuidle_coupled_no_cpus_ready - check if no cpus in a coupled set are ready
  209. * @coupled: the struct coupled that contains the current cpu
  210. *
  211. * Returns true if all of the cpus in a coupled set are out of the ready loop.
  212. */
  213. static inline int cpuidle_coupled_no_cpus_ready(struct cpuidle_coupled *coupled)
  214. {
  215. int r = atomic_read(&coupled->ready_waiting_counts) >> WAITING_BITS;
  216. return r == 0;
  217. }
  218. /**
  219. * cpuidle_coupled_cpus_ready - check if all cpus in a coupled set are ready
  220. * @coupled: the struct coupled that contains the current cpu
  221. *
  222. * Returns true if all cpus coupled to this target state are in the ready loop
  223. */
  224. static inline bool cpuidle_coupled_cpus_ready(struct cpuidle_coupled *coupled)
  225. {
  226. int r = atomic_read(&coupled->ready_waiting_counts) >> WAITING_BITS;
  227. return r == coupled->online_count;
  228. }
  229. /**
  230. * cpuidle_coupled_cpus_waiting - check if all cpus in a coupled set are waiting
  231. * @coupled: the struct coupled that contains the current cpu
  232. *
  233. * Returns true if all cpus coupled to this target state are in the wait loop
  234. */
  235. static inline bool cpuidle_coupled_cpus_waiting(struct cpuidle_coupled *coupled)
  236. {
  237. int w = atomic_read(&coupled->ready_waiting_counts) & WAITING_MASK;
  238. return w == coupled->online_count;
  239. }
  240. /**
  241. * cpuidle_coupled_no_cpus_waiting - check if no cpus in coupled set are waiting
  242. * @coupled: the struct coupled that contains the current cpu
  243. *
  244. * Returns true if all of the cpus in a coupled set are out of the waiting loop.
  245. */
  246. static inline int cpuidle_coupled_no_cpus_waiting(struct cpuidle_coupled *coupled)
  247. {
  248. int w = atomic_read(&coupled->ready_waiting_counts) & WAITING_MASK;
  249. return w == 0;
  250. }
  251. /**
  252. * cpuidle_coupled_get_state - determine the deepest idle state
  253. * @dev: struct cpuidle_device for this cpu
  254. * @coupled: the struct coupled that contains the current cpu
  255. *
  256. * Returns the deepest idle state that all coupled cpus can enter
  257. */
  258. static inline int cpuidle_coupled_get_state(struct cpuidle_device *dev,
  259. struct cpuidle_coupled *coupled)
  260. {
  261. int i;
  262. int state = INT_MAX;
  263. /*
  264. * Read barrier ensures that read of requested_state is ordered after
  265. * reads of ready_count. Matches the write barriers
  266. * cpuidle_set_state_waiting.
  267. */
  268. smp_rmb();
  269. for_each_cpu_mask(i, coupled->coupled_cpus)
  270. if (cpu_online(i) && coupled->requested_state[i] < state)
  271. state = coupled->requested_state[i];
  272. return state;
  273. }
  274. static void cpuidle_coupled_handle_poke(void *info)
  275. {
  276. int cpu = (unsigned long)info;
  277. cpumask_set_cpu(cpu, &cpuidle_coupled_poked);
  278. cpumask_clear_cpu(cpu, &cpuidle_coupled_poke_pending);
  279. }
  280. /**
  281. * cpuidle_coupled_poke - wake up a cpu that may be waiting
  282. * @cpu: target cpu
  283. *
  284. * Ensures that the target cpu exits it's waiting idle state (if it is in it)
  285. * and will see updates to waiting_count before it re-enters it's waiting idle
  286. * state.
  287. *
  288. * If cpuidle_coupled_poked_mask is already set for the target cpu, that cpu
  289. * either has or will soon have a pending IPI that will wake it out of idle,
  290. * or it is currently processing the IPI and is not in idle.
  291. */
  292. static void cpuidle_coupled_poke(int cpu)
  293. {
  294. struct call_single_data *csd = &per_cpu(cpuidle_coupled_poke_cb, cpu);
  295. if (!cpumask_test_and_set_cpu(cpu, &cpuidle_coupled_poke_pending))
  296. __smp_call_function_single(cpu, csd, 0);
  297. }
  298. /**
  299. * cpuidle_coupled_poke_others - wake up all other cpus that may be waiting
  300. * @dev: struct cpuidle_device for this cpu
  301. * @coupled: the struct coupled that contains the current cpu
  302. *
  303. * Calls cpuidle_coupled_poke on all other online cpus.
  304. */
  305. static void cpuidle_coupled_poke_others(int this_cpu,
  306. struct cpuidle_coupled *coupled)
  307. {
  308. int cpu;
  309. for_each_cpu_mask(cpu, coupled->coupled_cpus)
  310. if (cpu != this_cpu && cpu_online(cpu))
  311. cpuidle_coupled_poke(cpu);
  312. }
  313. /**
  314. * cpuidle_coupled_set_waiting - mark this cpu as in the wait loop
  315. * @dev: struct cpuidle_device for this cpu
  316. * @coupled: the struct coupled that contains the current cpu
  317. * @next_state: the index in drv->states of the requested state for this cpu
  318. *
  319. * Updates the requested idle state for the specified cpuidle device.
  320. * Returns the number of waiting cpus.
  321. */
  322. static int cpuidle_coupled_set_waiting(int cpu,
  323. struct cpuidle_coupled *coupled, int next_state)
  324. {
  325. coupled->requested_state[cpu] = next_state;
  326. /*
  327. * The atomic_inc_return provides a write barrier to order the write
  328. * to requested_state with the later write that increments ready_count.
  329. */
  330. return atomic_inc_return(&coupled->ready_waiting_counts) & WAITING_MASK;
  331. }
  332. /**
  333. * cpuidle_coupled_set_not_waiting - mark this cpu as leaving the wait loop
  334. * @dev: struct cpuidle_device for this cpu
  335. * @coupled: the struct coupled that contains the current cpu
  336. *
  337. * Removes the requested idle state for the specified cpuidle device.
  338. */
  339. static void cpuidle_coupled_set_not_waiting(int cpu,
  340. struct cpuidle_coupled *coupled)
  341. {
  342. /*
  343. * Decrementing waiting count can race with incrementing it in
  344. * cpuidle_coupled_set_waiting, but that's OK. Worst case, some
  345. * cpus will increment ready_count and then spin until they
  346. * notice that this cpu has cleared it's requested_state.
  347. */
  348. atomic_dec(&coupled->ready_waiting_counts);
  349. coupled->requested_state[cpu] = CPUIDLE_COUPLED_NOT_IDLE;
  350. }
  351. /**
  352. * cpuidle_coupled_set_done - mark this cpu as leaving the ready loop
  353. * @cpu: the current cpu
  354. * @coupled: the struct coupled that contains the current cpu
  355. *
  356. * Marks this cpu as no longer in the ready and waiting loops. Decrements
  357. * the waiting count first to prevent another cpu looping back in and seeing
  358. * this cpu as waiting just before it exits idle.
  359. */
  360. static void cpuidle_coupled_set_done(int cpu, struct cpuidle_coupled *coupled)
  361. {
  362. cpuidle_coupled_set_not_waiting(cpu, coupled);
  363. atomic_sub(MAX_WAITING_CPUS, &coupled->ready_waiting_counts);
  364. }
  365. /**
  366. * cpuidle_coupled_clear_pokes - spin until the poke interrupt is processed
  367. * @cpu - this cpu
  368. *
  369. * Turns on interrupts and spins until any outstanding poke interrupts have
  370. * been processed and the poke bit has been cleared.
  371. *
  372. * Other interrupts may also be processed while interrupts are enabled, so
  373. * need_resched() must be tested after turning interrupts off again to make sure
  374. * the interrupt didn't schedule work that should take the cpu out of idle.
  375. *
  376. * Returns 0 if need_resched was false, -EINTR if need_resched was true.
  377. */
  378. static int cpuidle_coupled_clear_pokes(int cpu)
  379. {
  380. local_irq_enable();
  381. while (cpumask_test_cpu(cpu, &cpuidle_coupled_poke_pending))
  382. cpu_relax();
  383. local_irq_disable();
  384. return need_resched() ? -EINTR : 0;
  385. }
  386. static bool cpuidle_coupled_any_pokes_pending(struct cpuidle_coupled *coupled)
  387. {
  388. cpumask_t cpus;
  389. int ret;
  390. cpumask_and(&cpus, cpu_online_mask, &coupled->coupled_cpus);
  391. ret = cpumask_and(&cpus, &cpuidle_coupled_poke_pending, &cpus);
  392. return ret;
  393. }
  394. /**
  395. * cpuidle_enter_state_coupled - attempt to enter a state with coupled cpus
  396. * @dev: struct cpuidle_device for the current cpu
  397. * @drv: struct cpuidle_driver for the platform
  398. * @next_state: index of the requested state in drv->states
  399. *
  400. * Coordinate with coupled cpus to enter the target state. This is a two
  401. * stage process. In the first stage, the cpus are operating independently,
  402. * and may call into cpuidle_enter_state_coupled at completely different times.
  403. * To save as much power as possible, the first cpus to call this function will
  404. * go to an intermediate state (the cpuidle_device's safe state), and wait for
  405. * all the other cpus to call this function. Once all coupled cpus are idle,
  406. * the second stage will start. Each coupled cpu will spin until all cpus have
  407. * guaranteed that they will call the target_state.
  408. *
  409. * This function must be called with interrupts disabled. It may enable
  410. * interrupts while preparing for idle, and it will always return with
  411. * interrupts enabled.
  412. */
  413. int cpuidle_enter_state_coupled(struct cpuidle_device *dev,
  414. struct cpuidle_driver *drv, int next_state)
  415. {
  416. int entered_state = -1;
  417. struct cpuidle_coupled *coupled = dev->coupled;
  418. int w;
  419. if (!coupled)
  420. return -EINVAL;
  421. while (coupled->prevent) {
  422. if (cpuidle_coupled_clear_pokes(dev->cpu)) {
  423. local_irq_enable();
  424. return entered_state;
  425. }
  426. entered_state = cpuidle_enter_state(dev, drv,
  427. dev->safe_state_index);
  428. local_irq_disable();
  429. }
  430. /* Read barrier ensures online_count is read after prevent is cleared */
  431. smp_rmb();
  432. reset:
  433. cpumask_clear_cpu(dev->cpu, &cpuidle_coupled_poked);
  434. w = cpuidle_coupled_set_waiting(dev->cpu, coupled, next_state);
  435. /*
  436. * If this is the last cpu to enter the waiting state, poke
  437. * all the other cpus out of their waiting state so they can
  438. * enter a deeper state. This can race with one of the cpus
  439. * exiting the waiting state due to an interrupt and
  440. * decrementing waiting_count, see comment below.
  441. */
  442. if (w == coupled->online_count) {
  443. cpumask_set_cpu(dev->cpu, &cpuidle_coupled_poked);
  444. cpuidle_coupled_poke_others(dev->cpu, coupled);
  445. }
  446. retry:
  447. /*
  448. * Wait for all coupled cpus to be idle, using the deepest state
  449. * allowed for a single cpu. If this was not the poking cpu, wait
  450. * for at least one poke before leaving to avoid a race where
  451. * two cpus could arrive at the waiting loop at the same time,
  452. * but the first of the two to arrive could skip the loop without
  453. * processing the pokes from the last to arrive.
  454. */
  455. while (!cpuidle_coupled_cpus_waiting(coupled) ||
  456. !cpumask_test_cpu(dev->cpu, &cpuidle_coupled_poked)) {
  457. if (cpuidle_coupled_clear_pokes(dev->cpu)) {
  458. cpuidle_coupled_set_not_waiting(dev->cpu, coupled);
  459. goto out;
  460. }
  461. if (coupled->prevent) {
  462. cpuidle_coupled_set_not_waiting(dev->cpu, coupled);
  463. goto out;
  464. }
  465. entered_state = cpuidle_enter_state(dev, drv,
  466. dev->safe_state_index);
  467. local_irq_disable();
  468. }
  469. if (cpuidle_coupled_clear_pokes(dev->cpu)) {
  470. cpuidle_coupled_set_not_waiting(dev->cpu, coupled);
  471. goto out;
  472. }
  473. /*
  474. * Make sure final poke status for this cpu is visible before setting
  475. * cpu as ready.
  476. */
  477. smp_wmb();
  478. /*
  479. * All coupled cpus are probably idle. There is a small chance that
  480. * one of the other cpus just became active. Increment the ready count,
  481. * and spin until all coupled cpus have incremented the counter. Once a
  482. * cpu has incremented the ready counter, it cannot abort idle and must
  483. * spin until either all cpus have incremented the ready counter, or
  484. * another cpu leaves idle and decrements the waiting counter.
  485. */
  486. cpuidle_coupled_set_ready(coupled);
  487. while (!cpuidle_coupled_cpus_ready(coupled)) {
  488. /* Check if any other cpus bailed out of idle. */
  489. if (!cpuidle_coupled_cpus_waiting(coupled))
  490. if (!cpuidle_coupled_set_not_ready(coupled))
  491. goto retry;
  492. cpu_relax();
  493. }
  494. /*
  495. * Make sure read of all cpus ready is done before reading pending pokes
  496. */
  497. smp_rmb();
  498. /*
  499. * There is a small chance that a cpu left and reentered idle after this
  500. * cpu saw that all cpus were waiting. The cpu that reentered idle will
  501. * have sent this cpu a poke, which will still be pending after the
  502. * ready loop. The pending interrupt may be lost by the interrupt
  503. * controller when entering the deep idle state. It's not possible to
  504. * clear a pending interrupt without turning interrupts on and handling
  505. * it, and it's too late to turn on interrupts here, so reset the
  506. * coupled idle state of all cpus and retry.
  507. */
  508. if (cpuidle_coupled_any_pokes_pending(coupled)) {
  509. cpuidle_coupled_set_done(dev->cpu, coupled);
  510. /* Wait for all cpus to see the pending pokes */
  511. cpuidle_coupled_parallel_barrier(dev, &coupled->abort_barrier);
  512. goto reset;
  513. }
  514. /* all cpus have acked the coupled state */
  515. next_state = cpuidle_coupled_get_state(dev, coupled);
  516. entered_state = cpuidle_enter_state(dev, drv, next_state);
  517. cpuidle_coupled_set_done(dev->cpu, coupled);
  518. out:
  519. /*
  520. * Normal cpuidle states are expected to return with irqs enabled.
  521. * That leads to an inefficiency where a cpu receiving an interrupt
  522. * that brings it out of idle will process that interrupt before
  523. * exiting the idle enter function and decrementing ready_count. All
  524. * other cpus will need to spin waiting for the cpu that is processing
  525. * the interrupt. If the driver returns with interrupts disabled,
  526. * all other cpus will loop back into the safe idle state instead of
  527. * spinning, saving power.
  528. *
  529. * Calling local_irq_enable here allows coupled states to return with
  530. * interrupts disabled, but won't cause problems for drivers that
  531. * exit with interrupts enabled.
  532. */
  533. local_irq_enable();
  534. /*
  535. * Wait until all coupled cpus have exited idle. There is no risk that
  536. * a cpu exits and re-enters the ready state because this cpu has
  537. * already decremented its waiting_count.
  538. */
  539. while (!cpuidle_coupled_no_cpus_ready(coupled))
  540. cpu_relax();
  541. return entered_state;
  542. }
  543. static void cpuidle_coupled_update_online_cpus(struct cpuidle_coupled *coupled)
  544. {
  545. cpumask_t cpus;
  546. cpumask_and(&cpus, cpu_online_mask, &coupled->coupled_cpus);
  547. coupled->online_count = cpumask_weight(&cpus);
  548. }
  549. /**
  550. * cpuidle_coupled_register_device - register a coupled cpuidle device
  551. * @dev: struct cpuidle_device for the current cpu
  552. *
  553. * Called from cpuidle_register_device to handle coupled idle init. Finds the
  554. * cpuidle_coupled struct for this set of coupled cpus, or creates one if none
  555. * exists yet.
  556. */
  557. int cpuidle_coupled_register_device(struct cpuidle_device *dev)
  558. {
  559. int cpu;
  560. struct cpuidle_device *other_dev;
  561. struct call_single_data *csd;
  562. struct cpuidle_coupled *coupled;
  563. if (cpumask_empty(&dev->coupled_cpus))
  564. return 0;
  565. for_each_cpu_mask(cpu, dev->coupled_cpus) {
  566. other_dev = per_cpu(cpuidle_devices, cpu);
  567. if (other_dev && other_dev->coupled) {
  568. coupled = other_dev->coupled;
  569. goto have_coupled;
  570. }
  571. }
  572. /* No existing coupled info found, create a new one */
  573. coupled = kzalloc(sizeof(struct cpuidle_coupled), GFP_KERNEL);
  574. if (!coupled)
  575. return -ENOMEM;
  576. coupled->coupled_cpus = dev->coupled_cpus;
  577. have_coupled:
  578. dev->coupled = coupled;
  579. if (WARN_ON(!cpumask_equal(&dev->coupled_cpus, &coupled->coupled_cpus)))
  580. coupled->prevent++;
  581. cpuidle_coupled_update_online_cpus(coupled);
  582. coupled->refcnt++;
  583. csd = &per_cpu(cpuidle_coupled_poke_cb, dev->cpu);
  584. csd->func = cpuidle_coupled_handle_poke;
  585. csd->info = (void *)(unsigned long)dev->cpu;
  586. return 0;
  587. }
  588. /**
  589. * cpuidle_coupled_unregister_device - unregister a coupled cpuidle device
  590. * @dev: struct cpuidle_device for the current cpu
  591. *
  592. * Called from cpuidle_unregister_device to tear down coupled idle. Removes the
  593. * cpu from the coupled idle set, and frees the cpuidle_coupled_info struct if
  594. * this was the last cpu in the set.
  595. */
  596. void cpuidle_coupled_unregister_device(struct cpuidle_device *dev)
  597. {
  598. struct cpuidle_coupled *coupled = dev->coupled;
  599. if (cpumask_empty(&dev->coupled_cpus))
  600. return;
  601. if (--coupled->refcnt)
  602. kfree(coupled);
  603. dev->coupled = NULL;
  604. }
  605. /**
  606. * cpuidle_coupled_prevent_idle - prevent cpus from entering a coupled state
  607. * @coupled: the struct coupled that contains the cpu that is changing state
  608. *
  609. * Disables coupled cpuidle on a coupled set of cpus. Used to ensure that
  610. * cpu_online_mask doesn't change while cpus are coordinating coupled idle.
  611. */
  612. static void cpuidle_coupled_prevent_idle(struct cpuidle_coupled *coupled)
  613. {
  614. int cpu = get_cpu();
  615. /* Force all cpus out of the waiting loop. */
  616. coupled->prevent++;
  617. cpuidle_coupled_poke_others(cpu, coupled);
  618. put_cpu();
  619. while (!cpuidle_coupled_no_cpus_waiting(coupled))
  620. cpu_relax();
  621. }
  622. /**
  623. * cpuidle_coupled_allow_idle - allows cpus to enter a coupled state
  624. * @coupled: the struct coupled that contains the cpu that is changing state
  625. *
  626. * Enables coupled cpuidle on a coupled set of cpus. Used to ensure that
  627. * cpu_online_mask doesn't change while cpus are coordinating coupled idle.
  628. */
  629. static void cpuidle_coupled_allow_idle(struct cpuidle_coupled *coupled)
  630. {
  631. int cpu = get_cpu();
  632. /*
  633. * Write barrier ensures readers see the new online_count when they
  634. * see prevent == 0.
  635. */
  636. smp_wmb();
  637. coupled->prevent--;
  638. /* Force cpus out of the prevent loop. */
  639. cpuidle_coupled_poke_others(cpu, coupled);
  640. put_cpu();
  641. }
  642. /**
  643. * cpuidle_coupled_cpu_notify - notifier called during hotplug transitions
  644. * @nb: notifier block
  645. * @action: hotplug transition
  646. * @hcpu: target cpu number
  647. *
  648. * Called when a cpu is brought on or offline using hotplug. Updates the
  649. * coupled cpu set appropriately
  650. */
  651. static int cpuidle_coupled_cpu_notify(struct notifier_block *nb,
  652. unsigned long action, void *hcpu)
  653. {
  654. int cpu = (unsigned long)hcpu;
  655. struct cpuidle_device *dev;
  656. switch (action & ~CPU_TASKS_FROZEN) {
  657. case CPU_UP_PREPARE:
  658. case CPU_DOWN_PREPARE:
  659. case CPU_ONLINE:
  660. case CPU_DEAD:
  661. case CPU_UP_CANCELED:
  662. case CPU_DOWN_FAILED:
  663. break;
  664. default:
  665. return NOTIFY_OK;
  666. }
  667. mutex_lock(&cpuidle_lock);
  668. dev = per_cpu(cpuidle_devices, cpu);
  669. if (!dev || !dev->coupled)
  670. goto out;
  671. switch (action & ~CPU_TASKS_FROZEN) {
  672. case CPU_UP_PREPARE:
  673. case CPU_DOWN_PREPARE:
  674. cpuidle_coupled_prevent_idle(dev->coupled);
  675. break;
  676. case CPU_ONLINE:
  677. case CPU_DEAD:
  678. cpuidle_coupled_update_online_cpus(dev->coupled);
  679. /* Fall through */
  680. case CPU_UP_CANCELED:
  681. case CPU_DOWN_FAILED:
  682. cpuidle_coupled_allow_idle(dev->coupled);
  683. break;
  684. }
  685. out:
  686. mutex_unlock(&cpuidle_lock);
  687. return NOTIFY_OK;
  688. }
  689. static struct notifier_block cpuidle_coupled_cpu_notifier = {
  690. .notifier_call = cpuidle_coupled_cpu_notify,
  691. };
  692. static int __init cpuidle_coupled_init(void)
  693. {
  694. return register_cpu_notifier(&cpuidle_coupled_cpu_notifier);
  695. }
  696. core_initcall(cpuidle_coupled_init);