coupled.c 26 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814
  1. /*
  2. * coupled.c - helper functions to enter the same idle state on multiple cpus
  3. *
  4. * Copyright (c) 2011 Google, Inc.
  5. *
  6. * Author: Colin Cross <ccross@android.com>
  7. *
  8. * This program is free software; you can redistribute it and/or modify
  9. * it under the terms of the GNU General Public License as published by
  10. * the Free Software Foundation; either version 2 of the License, or
  11. * (at your option) any later version.
  12. *
  13. * This program is distributed in the hope that it will be useful, but WITHOUT
  14. * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  15. * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
  16. * more details.
  17. */
  18. #include <linux/kernel.h>
  19. #include <linux/cpu.h>
  20. #include <linux/cpuidle.h>
  21. #include <linux/mutex.h>
  22. #include <linux/sched.h>
  23. #include <linux/slab.h>
  24. #include <linux/spinlock.h>
  25. #include "cpuidle.h"
  26. /**
  27. * DOC: Coupled cpuidle states
  28. *
  29. * On some ARM SMP SoCs (OMAP4460, Tegra 2, and probably more), the
  30. * cpus cannot be independently powered down, either due to
  31. * sequencing restrictions (on Tegra 2, cpu 0 must be the last to
  32. * power down), or due to HW bugs (on OMAP4460, a cpu powering up
  33. * will corrupt the gic state unless the other cpu runs a work
  34. * around). Each cpu has a power state that it can enter without
  35. * coordinating with the other cpu (usually Wait For Interrupt, or
  36. * WFI), and one or more "coupled" power states that affect blocks
  37. * shared between the cpus (L2 cache, interrupt controller, and
  38. * sometimes the whole SoC). Entering a coupled power state must
  39. * be tightly controlled on both cpus.
  40. *
  41. * This file implements a solution, where each cpu will wait in the
  42. * WFI state until all cpus are ready to enter a coupled state, at
  43. * which point the coupled state function will be called on all
  44. * cpus at approximately the same time.
  45. *
  46. * Once all cpus are ready to enter idle, they are woken by an smp
  47. * cross call. At this point, there is a chance that one of the
  48. * cpus will find work to do, and choose not to enter idle. A
  49. * final pass is needed to guarantee that all cpus will call the
  50. * power state enter function at the same time. During this pass,
  51. * each cpu will increment the ready counter, and continue once the
  52. * ready counter matches the number of online coupled cpus. If any
  53. * cpu exits idle, the other cpus will decrement their counter and
  54. * retry.
  55. *
  56. * requested_state stores the deepest coupled idle state each cpu
  57. * is ready for. It is assumed that the states are indexed from
  58. * shallowest (highest power, lowest exit latency) to deepest
  59. * (lowest power, highest exit latency). The requested_state
  60. * variable is not locked. It is only written from the cpu that
  61. * it stores (or by the on/offlining cpu if that cpu is offline),
  62. * and only read after all the cpus are ready for the coupled idle
  63. * state and are no longer updating it.
  64. *
  65. * Two counters are packed into the atomic ready_waiting_counts, and
  66. * online_count is a plain int holding the number of online cpus in the
  67. * coupled set. waiting_count (the low WAITING_BITS bits) tracks cpus in
  68. * the waiting loop, in the ready loop, or in the coupled idle state.
  69. * ready_count (the remaining high bits) tracks cpus in the ready loop
  70. * or in the coupled idle state.
  71. *
  72. * To use coupled cpuidle states, a cpuidle driver must:
  73. *
  74. * Set struct cpuidle_device.coupled_cpus to the mask of all
  75. * coupled cpus, usually the same as cpu_possible_mask if all cpus
  76. * are part of the same cluster. The coupled_cpus mask must be
  77. * set in the struct cpuidle_device for each cpu.
  78. *
  79. * Set struct cpuidle_driver.safe_state_index to the index of a state
  80. * that is not a coupled state. This is usually WFI.
  81. *
  82. * Set CPUIDLE_FLAG_COUPLED in struct cpuidle_state.flags for each
  83. * state that affects multiple cpus.
  84. *
  85. * Provide a struct cpuidle_state.enter function for each state
  86. * that affects multiple cpus. This function is guaranteed to be
  87. * called on all cpus at approximately the same time. The driver
  88. * should ensure that the cpus all abort together if any cpu tries
  89. * to abort once the function is called. The function should return
  90. * with interrupts still disabled.
  91. */
  92. /**
  93. * struct cpuidle_coupled - data for set of cpus that share a coupled idle state
  94. * @coupled_cpus: mask of cpus that are part of the coupled set
  95. * @requested_state: array of requested states for cpus in the coupled set
  96. * @ready_waiting_counts: combined count of cpus in ready or waiting loops
  97. * @online_count: count of cpus that are online
  98. * @refcnt: reference count of cpuidle devices that are using this struct
  99. * @prevent: flag to prevent coupled idle while a cpu is hotplugging
  100. */
  101. struct cpuidle_coupled {
  102. cpumask_t coupled_cpus;
  103. int requested_state[NR_CPUS];
  104. atomic_t ready_waiting_counts;
  105. atomic_t abort_barrier;
  106. int online_count;
  107. int refcnt;
  108. int prevent;
  109. };
  /*
   * ready_waiting_counts packs two counters into one atomic_t: the waiting
   * count occupies the low WAITING_BITS bits and the ready count the bits
   * above them, so adding MAX_WAITING_CPUS raises the ready count by one.
   */
  #define WAITING_BITS        16
  #define MAX_WAITING_CPUS    (1 << WAITING_BITS)
  #define WAITING_MASK        (MAX_WAITING_CPUS - 1)
  #define READY_MASK          (~WAITING_MASK)

  /* requested_state value stored for a cpu that has left the waiting loop */
  #define CPUIDLE_COUPLED_NOT_IDLE    (-1)
  115. static DEFINE_MUTEX(cpuidle_coupled_lock);
  116. static DEFINE_PER_CPU(struct call_single_data, cpuidle_coupled_poke_cb);
  117. /*
  118. * The cpuidle_coupled_poke_pending mask is used to avoid calling
  119. * __smp_call_function_single with the per cpu call_single_data struct already
  120. * in use. This prevents a deadlock where two cpus are waiting for each others
  121. * call_single_data struct to be available
  122. */
  123. static cpumask_t cpuidle_coupled_poke_pending;
  124. /*
  125. * The cpuidle_coupled_poked mask is used to ensure that each cpu has been poked
  126. * once to minimize entering the ready loop with a poke pending, which would
  127. * require aborting and retrying.
  128. */
  129. static cpumask_t cpuidle_coupled_poked;
  130. /**
  131. * cpuidle_coupled_parallel_barrier - synchronize all online coupled cpus
  132. * @dev: cpuidle_device of the calling cpu
  133. * @a: atomic variable to hold the barrier
  134. *
  135. * No caller to this function will return from this function until all online
  136. * cpus in the same coupled group have called this function. Once any caller
  137. * has returned from this function, the barrier is immediately available for
  138. * reuse.
  139. *
  140. * The atomic variable must be initialized to 0 before any cpu calls
  141. * this function, will be reset to 0 before any cpu returns from this function.
  142. *
  143. * Must only be called from within a coupled idle state handler
  144. * (state.enter when state.flags has CPUIDLE_FLAG_COUPLED set).
  145. *
  146. * Provides full smp barrier semantics before and after calling.
  147. */
  148. void cpuidle_coupled_parallel_barrier(struct cpuidle_device *dev, atomic_t *a)
  149. {
  150. int n = dev->coupled->online_count;
  151. smp_mb__before_atomic();
  152. atomic_inc(a);
  153. while (atomic_read(a) < n)
  154. cpu_relax();
  155. if (atomic_inc_return(a) == n * 2) {
  156. atomic_set(a, 0);
  157. return;
  158. }
  159. while (atomic_read(a) > n)
  160. cpu_relax();
  161. }
  162. /**
  163. * cpuidle_state_is_coupled - check if a state is part of a coupled set
  164. * @drv: struct cpuidle_driver for the platform
  165. * @state: index of the target state in drv->states
  166. *
  167. * Returns true if the target state is coupled with cpus besides this one
  168. */
  169. bool cpuidle_state_is_coupled(struct cpuidle_driver *drv, int state)
  170. {
  171. return drv->states[state].flags & CPUIDLE_FLAG_COUPLED;
  172. }
  173. /**
  174. * cpuidle_coupled_state_verify - check if the coupled states are correctly set.
  175. * @drv: struct cpuidle_driver for the platform
  176. *
  177. * Returns 0 for valid state values, a negative error code otherwise:
  178. * * -EINVAL if any coupled state(safe_state_index) is wrongly set.
  179. */
  180. int cpuidle_coupled_state_verify(struct cpuidle_driver *drv)
  181. {
  182. int i;
  183. for (i = drv->state_count - 1; i >= 0; i--) {
  184. if (cpuidle_state_is_coupled(drv, i) &&
  185. (drv->safe_state_index == i ||
  186. drv->safe_state_index < 0 ||
  187. drv->safe_state_index >= drv->state_count))
  188. return -EINVAL;
  189. }
  190. return 0;
  191. }
  192. /**
  193. * cpuidle_coupled_set_ready - mark a cpu as ready
  194. * @coupled: the struct coupled that contains the current cpu
  195. */
  196. static inline void cpuidle_coupled_set_ready(struct cpuidle_coupled *coupled)
  197. {
  198. atomic_add(MAX_WAITING_CPUS, &coupled->ready_waiting_counts);
  199. }
  200. /**
  201. * cpuidle_coupled_set_not_ready - mark a cpu as not ready
  202. * @coupled: the struct coupled that contains the current cpu
  203. *
  204. * Decrements the ready counter, unless the ready (and thus the waiting) counter
  205. * is equal to the number of online cpus. Prevents a race where one cpu
  206. * decrements the waiting counter and then re-increments it just before another
  207. * cpu has decremented its ready counter, leading to the ready counter going
  208. * down from the number of online cpus without going through the coupled idle
  209. * state.
  210. *
  211. * Returns 0 if the counter was decremented successfully, -EINVAL if the ready
  212. * counter was equal to the number of online cpus.
  213. */
  214. static
  215. inline int cpuidle_coupled_set_not_ready(struct cpuidle_coupled *coupled)
  216. {
  217. int all;
  218. int ret;
  219. all = coupled->online_count | (coupled->online_count << WAITING_BITS);
  220. ret = atomic_add_unless(&coupled->ready_waiting_counts,
  221. -MAX_WAITING_CPUS, all);
  222. return ret ? 0 : -EINVAL;
  223. }
  224. /**
  225. * cpuidle_coupled_no_cpus_ready - check if no cpus in a coupled set are ready
  226. * @coupled: the struct coupled that contains the current cpu
  227. *
  228. * Returns true if all of the cpus in a coupled set are out of the ready loop.
  229. */
  230. static inline int cpuidle_coupled_no_cpus_ready(struct cpuidle_coupled *coupled)
  231. {
  232. int r = atomic_read(&coupled->ready_waiting_counts) >> WAITING_BITS;
  233. return r == 0;
  234. }
  235. /**
  236. * cpuidle_coupled_cpus_ready - check if all cpus in a coupled set are ready
  237. * @coupled: the struct coupled that contains the current cpu
  238. *
  239. * Returns true if all cpus coupled to this target state are in the ready loop
  240. */
  241. static inline bool cpuidle_coupled_cpus_ready(struct cpuidle_coupled *coupled)
  242. {
  243. int r = atomic_read(&coupled->ready_waiting_counts) >> WAITING_BITS;
  244. return r == coupled->online_count;
  245. }
  246. /**
  247. * cpuidle_coupled_cpus_waiting - check if all cpus in a coupled set are waiting
  248. * @coupled: the struct coupled that contains the current cpu
  249. *
  250. * Returns true if all cpus coupled to this target state are in the wait loop
  251. */
  252. static inline bool cpuidle_coupled_cpus_waiting(struct cpuidle_coupled *coupled)
  253. {
  254. int w = atomic_read(&coupled->ready_waiting_counts) & WAITING_MASK;
  255. return w == coupled->online_count;
  256. }
  257. /**
  258. * cpuidle_coupled_no_cpus_waiting - check if no cpus in coupled set are waiting
  259. * @coupled: the struct coupled that contains the current cpu
  260. *
  261. * Returns true if all of the cpus in a coupled set are out of the waiting loop.
  262. */
  263. static inline int cpuidle_coupled_no_cpus_waiting(struct cpuidle_coupled *coupled)
  264. {
  265. int w = atomic_read(&coupled->ready_waiting_counts) & WAITING_MASK;
  266. return w == 0;
  267. }
  268. /**
  269. * cpuidle_coupled_get_state - determine the deepest idle state
  270. * @dev: struct cpuidle_device for this cpu
  271. * @coupled: the struct coupled that contains the current cpu
  272. *
  273. * Returns the deepest idle state that all coupled cpus can enter
  274. */
  275. static inline int cpuidle_coupled_get_state(struct cpuidle_device *dev,
  276. struct cpuidle_coupled *coupled)
  277. {
  278. int i;
  279. int state = INT_MAX;
  280. /*
  281. * Read barrier ensures that read of requested_state is ordered after
  282. * reads of ready_count. Matches the write barriers
  283. * cpuidle_set_state_waiting.
  284. */
  285. smp_rmb();
  286. for_each_cpu(i, &coupled->coupled_cpus)
  287. if (cpu_online(i) && coupled->requested_state[i] < state)
  288. state = coupled->requested_state[i];
  289. return state;
  290. }
  291. static void cpuidle_coupled_handle_poke(void *info)
  292. {
  293. int cpu = (unsigned long)info;
  294. cpumask_set_cpu(cpu, &cpuidle_coupled_poked);
  295. cpumask_clear_cpu(cpu, &cpuidle_coupled_poke_pending);
  296. }
  297. /**
  298. * cpuidle_coupled_poke - wake up a cpu that may be waiting
  299. * @cpu: target cpu
  300. *
  301. * Ensures that the target cpu exits it's waiting idle state (if it is in it)
  302. * and will see updates to waiting_count before it re-enters it's waiting idle
  303. * state.
  304. *
  305. * If cpuidle_coupled_poked_mask is already set for the target cpu, that cpu
  306. * either has or will soon have a pending IPI that will wake it out of idle,
  307. * or it is currently processing the IPI and is not in idle.
  308. */
  309. static void cpuidle_coupled_poke(int cpu)
  310. {
  311. struct call_single_data *csd = &per_cpu(cpuidle_coupled_poke_cb, cpu);
  312. if (!cpumask_test_and_set_cpu(cpu, &cpuidle_coupled_poke_pending))
  313. smp_call_function_single_async(cpu, csd);
  314. }
  315. /**
  316. * cpuidle_coupled_poke_others - wake up all other cpus that may be waiting
  317. * @dev: struct cpuidle_device for this cpu
  318. * @coupled: the struct coupled that contains the current cpu
  319. *
  320. * Calls cpuidle_coupled_poke on all other online cpus.
  321. */
  322. static void cpuidle_coupled_poke_others(int this_cpu,
  323. struct cpuidle_coupled *coupled)
  324. {
  325. int cpu;
  326. for_each_cpu(cpu, &coupled->coupled_cpus)
  327. if (cpu != this_cpu && cpu_online(cpu))
  328. cpuidle_coupled_poke(cpu);
  329. }
  330. /**
  331. * cpuidle_coupled_set_waiting - mark this cpu as in the wait loop
  332. * @dev: struct cpuidle_device for this cpu
  333. * @coupled: the struct coupled that contains the current cpu
  334. * @next_state: the index in drv->states of the requested state for this cpu
  335. *
  336. * Updates the requested idle state for the specified cpuidle device.
  337. * Returns the number of waiting cpus.
  338. */
  339. static int cpuidle_coupled_set_waiting(int cpu,
  340. struct cpuidle_coupled *coupled, int next_state)
  341. {
  342. coupled->requested_state[cpu] = next_state;
  343. /*
  344. * The atomic_inc_return provides a write barrier to order the write
  345. * to requested_state with the later write that increments ready_count.
  346. */
  347. return atomic_inc_return(&coupled->ready_waiting_counts) & WAITING_MASK;
  348. }
  349. /**
  350. * cpuidle_coupled_set_not_waiting - mark this cpu as leaving the wait loop
  351. * @dev: struct cpuidle_device for this cpu
  352. * @coupled: the struct coupled that contains the current cpu
  353. *
  354. * Removes the requested idle state for the specified cpuidle device.
  355. */
  356. static void cpuidle_coupled_set_not_waiting(int cpu,
  357. struct cpuidle_coupled *coupled)
  358. {
  359. /*
  360. * Decrementing waiting count can race with incrementing it in
  361. * cpuidle_coupled_set_waiting, but that's OK. Worst case, some
  362. * cpus will increment ready_count and then spin until they
  363. * notice that this cpu has cleared it's requested_state.
  364. */
  365. atomic_dec(&coupled->ready_waiting_counts);
  366. coupled->requested_state[cpu] = CPUIDLE_COUPLED_NOT_IDLE;
  367. }
  368. /**
  369. * cpuidle_coupled_set_done - mark this cpu as leaving the ready loop
  370. * @cpu: the current cpu
  371. * @coupled: the struct coupled that contains the current cpu
  372. *
  373. * Marks this cpu as no longer in the ready and waiting loops. Decrements
  374. * the waiting count first to prevent another cpu looping back in and seeing
  375. * this cpu as waiting just before it exits idle.
  376. */
  377. static void cpuidle_coupled_set_done(int cpu, struct cpuidle_coupled *coupled)
  378. {
  379. cpuidle_coupled_set_not_waiting(cpu, coupled);
  380. atomic_sub(MAX_WAITING_CPUS, &coupled->ready_waiting_counts);
  381. }
  382. /**
  383. * cpuidle_coupled_clear_pokes - spin until the poke interrupt is processed
  384. * @cpu - this cpu
  385. *
  386. * Turns on interrupts and spins until any outstanding poke interrupts have
  387. * been processed and the poke bit has been cleared.
  388. *
  389. * Other interrupts may also be processed while interrupts are enabled, so
  390. * need_resched() must be tested after this function returns to make sure
  391. * the interrupt didn't schedule work that should take the cpu out of idle.
  392. *
  393. * Returns 0 if no poke was pending, 1 if a poke was cleared.
  394. */
  395. static int cpuidle_coupled_clear_pokes(int cpu)
  396. {
  397. if (!cpumask_test_cpu(cpu, &cpuidle_coupled_poke_pending))
  398. return 0;
  399. local_irq_enable();
  400. while (cpumask_test_cpu(cpu, &cpuidle_coupled_poke_pending))
  401. cpu_relax();
  402. local_irq_disable();
  403. return 1;
  404. }
  405. static bool cpuidle_coupled_any_pokes_pending(struct cpuidle_coupled *coupled)
  406. {
  407. cpumask_t cpus;
  408. int ret;
  409. cpumask_and(&cpus, cpu_online_mask, &coupled->coupled_cpus);
  410. ret = cpumask_and(&cpus, &cpuidle_coupled_poke_pending, &cpus);
  411. return ret;
  412. }
  413. /**
  414. * cpuidle_enter_state_coupled - attempt to enter a state with coupled cpus
  415. * @dev: struct cpuidle_device for the current cpu
  416. * @drv: struct cpuidle_driver for the platform
  417. * @next_state: index of the requested state in drv->states
  418. *
  419. * Coordinate with coupled cpus to enter the target state. This is a two
  420. * stage process. In the first stage, the cpus are operating independently,
  421. * and may call into cpuidle_enter_state_coupled at completely different times.
  422. * To save as much power as possible, the first cpus to call this function will
  423. * go to an intermediate state (the cpuidle_device's safe state), and wait for
  424. * all the other cpus to call this function. Once all coupled cpus are idle,
  425. * the second stage will start. Each coupled cpu will spin until all cpus have
  426. * guaranteed that they will call the target_state.
  427. *
  428. * This function must be called with interrupts disabled. It may enable
  429. * interrupts while preparing for idle, and it will always return with
  430. * interrupts enabled.
  431. */
  432. int cpuidle_enter_state_coupled(struct cpuidle_device *dev,
  433. struct cpuidle_driver *drv, int next_state)
  434. {
  435. int entered_state = -1;
  436. struct cpuidle_coupled *coupled = dev->coupled;
  437. int w;
  438. if (!coupled)
  439. return -EINVAL;
  440. while (coupled->prevent) {
  441. cpuidle_coupled_clear_pokes(dev->cpu);
  442. if (need_resched()) {
  443. local_irq_enable();
  444. return entered_state;
  445. }
  446. entered_state = cpuidle_enter_state(dev, drv,
  447. drv->safe_state_index);
  448. local_irq_disable();
  449. }
  450. /* Read barrier ensures online_count is read after prevent is cleared */
  451. smp_rmb();
  452. reset:
  453. cpumask_clear_cpu(dev->cpu, &cpuidle_coupled_poked);
  454. w = cpuidle_coupled_set_waiting(dev->cpu, coupled, next_state);
  455. /*
  456. * If this is the last cpu to enter the waiting state, poke
  457. * all the other cpus out of their waiting state so they can
  458. * enter a deeper state. This can race with one of the cpus
  459. * exiting the waiting state due to an interrupt and
  460. * decrementing waiting_count, see comment below.
  461. */
  462. if (w == coupled->online_count) {
  463. cpumask_set_cpu(dev->cpu, &cpuidle_coupled_poked);
  464. cpuidle_coupled_poke_others(dev->cpu, coupled);
  465. }
  466. retry:
  467. /*
  468. * Wait for all coupled cpus to be idle, using the deepest state
  469. * allowed for a single cpu. If this was not the poking cpu, wait
  470. * for at least one poke before leaving to avoid a race where
  471. * two cpus could arrive at the waiting loop at the same time,
  472. * but the first of the two to arrive could skip the loop without
  473. * processing the pokes from the last to arrive.
  474. */
  475. while (!cpuidle_coupled_cpus_waiting(coupled) ||
  476. !cpumask_test_cpu(dev->cpu, &cpuidle_coupled_poked)) {
  477. if (cpuidle_coupled_clear_pokes(dev->cpu))
  478. continue;
  479. if (need_resched()) {
  480. cpuidle_coupled_set_not_waiting(dev->cpu, coupled);
  481. goto out;
  482. }
  483. if (coupled->prevent) {
  484. cpuidle_coupled_set_not_waiting(dev->cpu, coupled);
  485. goto out;
  486. }
  487. entered_state = cpuidle_enter_state(dev, drv,
  488. drv->safe_state_index);
  489. local_irq_disable();
  490. }
  491. cpuidle_coupled_clear_pokes(dev->cpu);
  492. if (need_resched()) {
  493. cpuidle_coupled_set_not_waiting(dev->cpu, coupled);
  494. goto out;
  495. }
  496. /*
  497. * Make sure final poke status for this cpu is visible before setting
  498. * cpu as ready.
  499. */
  500. smp_wmb();
  501. /*
  502. * All coupled cpus are probably idle. There is a small chance that
  503. * one of the other cpus just became active. Increment the ready count,
  504. * and spin until all coupled cpus have incremented the counter. Once a
  505. * cpu has incremented the ready counter, it cannot abort idle and must
  506. * spin until either all cpus have incremented the ready counter, or
  507. * another cpu leaves idle and decrements the waiting counter.
  508. */
  509. cpuidle_coupled_set_ready(coupled);
  510. while (!cpuidle_coupled_cpus_ready(coupled)) {
  511. /* Check if any other cpus bailed out of idle. */
  512. if (!cpuidle_coupled_cpus_waiting(coupled))
  513. if (!cpuidle_coupled_set_not_ready(coupled))
  514. goto retry;
  515. cpu_relax();
  516. }
  517. /*
  518. * Make sure read of all cpus ready is done before reading pending pokes
  519. */
  520. smp_rmb();
  521. /*
  522. * There is a small chance that a cpu left and reentered idle after this
  523. * cpu saw that all cpus were waiting. The cpu that reentered idle will
  524. * have sent this cpu a poke, which will still be pending after the
  525. * ready loop. The pending interrupt may be lost by the interrupt
  526. * controller when entering the deep idle state. It's not possible to
  527. * clear a pending interrupt without turning interrupts on and handling
  528. * it, and it's too late to turn on interrupts here, so reset the
  529. * coupled idle state of all cpus and retry.
  530. */
  531. if (cpuidle_coupled_any_pokes_pending(coupled)) {
  532. cpuidle_coupled_set_done(dev->cpu, coupled);
  533. /* Wait for all cpus to see the pending pokes */
  534. cpuidle_coupled_parallel_barrier(dev, &coupled->abort_barrier);
  535. goto reset;
  536. }
  537. /* all cpus have acked the coupled state */
  538. next_state = cpuidle_coupled_get_state(dev, coupled);
  539. entered_state = cpuidle_enter_state(dev, drv, next_state);
  540. cpuidle_coupled_set_done(dev->cpu, coupled);
  541. out:
  542. /*
  543. * Normal cpuidle states are expected to return with irqs enabled.
  544. * That leads to an inefficiency where a cpu receiving an interrupt
  545. * that brings it out of idle will process that interrupt before
  546. * exiting the idle enter function and decrementing ready_count. All
  547. * other cpus will need to spin waiting for the cpu that is processing
  548. * the interrupt. If the driver returns with interrupts disabled,
  549. * all other cpus will loop back into the safe idle state instead of
  550. * spinning, saving power.
  551. *
  552. * Calling local_irq_enable here allows coupled states to return with
  553. * interrupts disabled, but won't cause problems for drivers that
  554. * exit with interrupts enabled.
  555. */
  556. local_irq_enable();
  557. /*
  558. * Wait until all coupled cpus have exited idle. There is no risk that
  559. * a cpu exits and re-enters the ready state because this cpu has
  560. * already decremented its waiting_count.
  561. */
  562. while (!cpuidle_coupled_no_cpus_ready(coupled))
  563. cpu_relax();
  564. return entered_state;
  565. }
  566. static void cpuidle_coupled_update_online_cpus(struct cpuidle_coupled *coupled)
  567. {
  568. cpumask_t cpus;
  569. cpumask_and(&cpus, cpu_online_mask, &coupled->coupled_cpus);
  570. coupled->online_count = cpumask_weight(&cpus);
  571. }
  572. /**
  573. * cpuidle_coupled_register_device - register a coupled cpuidle device
  574. * @dev: struct cpuidle_device for the current cpu
  575. *
  576. * Called from cpuidle_register_device to handle coupled idle init. Finds the
  577. * cpuidle_coupled struct for this set of coupled cpus, or creates one if none
  578. * exists yet.
  579. */
  580. int cpuidle_coupled_register_device(struct cpuidle_device *dev)
  581. {
  582. int cpu;
  583. struct cpuidle_device *other_dev;
  584. struct call_single_data *csd;
  585. struct cpuidle_coupled *coupled;
  586. if (cpumask_empty(&dev->coupled_cpus))
  587. return 0;
  588. for_each_cpu(cpu, &dev->coupled_cpus) {
  589. other_dev = per_cpu(cpuidle_devices, cpu);
  590. if (other_dev && other_dev->coupled) {
  591. coupled = other_dev->coupled;
  592. goto have_coupled;
  593. }
  594. }
  595. /* No existing coupled info found, create a new one */
  596. coupled = kzalloc(sizeof(struct cpuidle_coupled), GFP_KERNEL);
  597. if (!coupled)
  598. return -ENOMEM;
  599. coupled->coupled_cpus = dev->coupled_cpus;
  600. have_coupled:
  601. dev->coupled = coupled;
  602. if (WARN_ON(!cpumask_equal(&dev->coupled_cpus, &coupled->coupled_cpus)))
  603. coupled->prevent++;
  604. cpuidle_coupled_update_online_cpus(coupled);
  605. coupled->refcnt++;
  606. csd = &per_cpu(cpuidle_coupled_poke_cb, dev->cpu);
  607. csd->func = cpuidle_coupled_handle_poke;
  608. csd->info = (void *)(unsigned long)dev->cpu;
  609. return 0;
  610. }
  611. /**
  612. * cpuidle_coupled_unregister_device - unregister a coupled cpuidle device
  613. * @dev: struct cpuidle_device for the current cpu
  614. *
  615. * Called from cpuidle_unregister_device to tear down coupled idle. Removes the
  616. * cpu from the coupled idle set, and frees the cpuidle_coupled_info struct if
  617. * this was the last cpu in the set.
  618. */
  619. void cpuidle_coupled_unregister_device(struct cpuidle_device *dev)
  620. {
  621. struct cpuidle_coupled *coupled = dev->coupled;
  622. if (cpumask_empty(&dev->coupled_cpus))
  623. return;
  624. if (--coupled->refcnt)
  625. kfree(coupled);
  626. dev->coupled = NULL;
  627. }
  628. /**
  629. * cpuidle_coupled_prevent_idle - prevent cpus from entering a coupled state
  630. * @coupled: the struct coupled that contains the cpu that is changing state
  631. *
  632. * Disables coupled cpuidle on a coupled set of cpus. Used to ensure that
  633. * cpu_online_mask doesn't change while cpus are coordinating coupled idle.
  634. */
  635. static void cpuidle_coupled_prevent_idle(struct cpuidle_coupled *coupled)
  636. {
  637. int cpu = get_cpu();
  638. /* Force all cpus out of the waiting loop. */
  639. coupled->prevent++;
  640. cpuidle_coupled_poke_others(cpu, coupled);
  641. put_cpu();
  642. while (!cpuidle_coupled_no_cpus_waiting(coupled))
  643. cpu_relax();
  644. }
  645. /**
  646. * cpuidle_coupled_allow_idle - allows cpus to enter a coupled state
  647. * @coupled: the struct coupled that contains the cpu that is changing state
  648. *
  649. * Enables coupled cpuidle on a coupled set of cpus. Used to ensure that
  650. * cpu_online_mask doesn't change while cpus are coordinating coupled idle.
  651. */
  652. static void cpuidle_coupled_allow_idle(struct cpuidle_coupled *coupled)
  653. {
  654. int cpu = get_cpu();
  655. /*
  656. * Write barrier ensures readers see the new online_count when they
  657. * see prevent == 0.
  658. */
  659. smp_wmb();
  660. coupled->prevent--;
  661. /* Force cpus out of the prevent loop. */
  662. cpuidle_coupled_poke_others(cpu, coupled);
  663. put_cpu();
  664. }
  665. /**
  666. * cpuidle_coupled_cpu_notify - notifier called during hotplug transitions
  667. * @nb: notifier block
  668. * @action: hotplug transition
  669. * @hcpu: target cpu number
  670. *
  671. * Called when a cpu is brought on or offline using hotplug. Updates the
  672. * coupled cpu set appropriately
  673. */
  674. static int cpuidle_coupled_cpu_notify(struct notifier_block *nb,
  675. unsigned long action, void *hcpu)
  676. {
  677. int cpu = (unsigned long)hcpu;
  678. struct cpuidle_device *dev;
  679. switch (action & ~CPU_TASKS_FROZEN) {
  680. case CPU_UP_PREPARE:
  681. case CPU_DOWN_PREPARE:
  682. case CPU_ONLINE:
  683. case CPU_DEAD:
  684. case CPU_UP_CANCELED:
  685. case CPU_DOWN_FAILED:
  686. break;
  687. default:
  688. return NOTIFY_OK;
  689. }
  690. mutex_lock(&cpuidle_lock);
  691. dev = per_cpu(cpuidle_devices, cpu);
  692. if (!dev || !dev->coupled)
  693. goto out;
  694. switch (action & ~CPU_TASKS_FROZEN) {
  695. case CPU_UP_PREPARE:
  696. case CPU_DOWN_PREPARE:
  697. cpuidle_coupled_prevent_idle(dev->coupled);
  698. break;
  699. case CPU_ONLINE:
  700. case CPU_DEAD:
  701. cpuidle_coupled_update_online_cpus(dev->coupled);
  702. /* Fall through */
  703. case CPU_UP_CANCELED:
  704. case CPU_DOWN_FAILED:
  705. cpuidle_coupled_allow_idle(dev->coupled);
  706. break;
  707. }
  708. out:
  709. mutex_unlock(&cpuidle_lock);
  710. return NOTIFY_OK;
  711. }
  712. static struct notifier_block cpuidle_coupled_cpu_notifier = {
  713. .notifier_call = cpuidle_coupled_cpu_notify,
  714. };
  715. static int __init cpuidle_coupled_init(void)
  716. {
  717. return register_cpu_notifier(&cpuidle_coupled_cpu_notifier);
  718. }
  719. core_initcall(cpuidle_coupled_init);