rcu.h 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573
  1. /*
  2. * Read-Copy Update definitions shared among RCU implementations.
  3. *
  4. * This program is free software; you can redistribute it and/or modify
  5. * it under the terms of the GNU General Public License as published by
  6. * the Free Software Foundation; either version 2 of the License, or
  7. * (at your option) any later version.
  8. *
  9. * This program is distributed in the hope that it will be useful,
  10. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. * GNU General Public License for more details.
  13. *
  14. * You should have received a copy of the GNU General Public License
  15. * along with this program; if not, you can access it online at
  16. * http://www.gnu.org/licenses/gpl-2.0.html.
  17. *
  18. * Copyright IBM Corporation, 2011
  19. *
  20. * Author: Paul E. McKenney <paulmck@linux.vnet.ibm.com>
  21. */
  22. #ifndef __LINUX_RCU_H
  23. #define __LINUX_RCU_H
  24. #include <trace/events/rcu.h>
  25. #ifdef CONFIG_RCU_TRACE
  26. #define RCU_TRACE(stmt) stmt
  27. #else /* #ifdef CONFIG_RCU_TRACE */
  28. #define RCU_TRACE(stmt)
  29. #endif /* #else #ifdef CONFIG_RCU_TRACE */
  30. /*
  31. * Process-level increment to ->dynticks_nesting field. This allows for
  32. * architectures that use half-interrupts and half-exceptions from
  33. * process context.
  34. *
  35. * DYNTICK_TASK_NEST_MASK defines a field of width DYNTICK_TASK_NEST_WIDTH
  36. * that counts the number of process-based reasons why RCU cannot
  37. * consider the corresponding CPU to be idle, and DYNTICK_TASK_NEST_VALUE
  38. * is the value used to increment or decrement this field.
  39. *
  40. * The rest of the bits could in principle be used to count interrupts,
  41. * but this would mean that a negative-one value in the interrupt
  42. * field could incorrectly zero out the DYNTICK_TASK_NEST_MASK field.
  43. * We therefore provide a two-bit guard field defined by DYNTICK_TASK_MASK
  44. * that is set to DYNTICK_TASK_FLAG upon initial exit from idle.
  45. * The DYNTICK_TASK_EXIT_IDLE value is thus the combined value used upon
  46. * initial exit from idle.
  47. */
  48. #define DYNTICK_TASK_NEST_WIDTH 7
  49. #define DYNTICK_TASK_NEST_VALUE ((LLONG_MAX >> DYNTICK_TASK_NEST_WIDTH) + 1)
  50. #define DYNTICK_TASK_NEST_MASK (LLONG_MAX - DYNTICK_TASK_NEST_VALUE + 1)
  51. #define DYNTICK_TASK_FLAG ((DYNTICK_TASK_NEST_VALUE / 8) * 2)
  52. #define DYNTICK_TASK_MASK ((DYNTICK_TASK_NEST_VALUE / 8) * 3)
  53. #define DYNTICK_TASK_EXIT_IDLE (DYNTICK_TASK_NEST_VALUE + \
  54. DYNTICK_TASK_FLAG)
  55. /*
  56. * Grace-period counter management.
  57. */
  58. #define RCU_SEQ_CTR_SHIFT 2
  59. #define RCU_SEQ_STATE_MASK ((1 << RCU_SEQ_CTR_SHIFT) - 1)
  60. /*
  61. * Return the counter portion of a sequence number previously returned
  62. * by rcu_seq_snap() or rcu_seq_current().
  63. */
  64. static inline unsigned long rcu_seq_ctr(unsigned long s)
  65. {
  66. return s >> RCU_SEQ_CTR_SHIFT;
  67. }
  68. /*
  69. * Return the state portion of a sequence number previously returned
  70. * by rcu_seq_snap() or rcu_seq_current().
  71. */
  72. static inline int rcu_seq_state(unsigned long s)
  73. {
  74. return s & RCU_SEQ_STATE_MASK;
  75. }
  76. /*
  77. * Set the state portion of the pointed-to sequence number.
  78. * The caller is responsible for preventing conflicting updates.
  79. */
  80. static inline void rcu_seq_set_state(unsigned long *sp, int newstate)
  81. {
  82. WARN_ON_ONCE(newstate & ~RCU_SEQ_STATE_MASK);
  83. WRITE_ONCE(*sp, (*sp & ~RCU_SEQ_STATE_MASK) + newstate);
  84. }
  85. /* Adjust sequence number for start of update-side operation. */
  86. static inline void rcu_seq_start(unsigned long *sp)
  87. {
  88. WRITE_ONCE(*sp, *sp + 1);
  89. smp_mb(); /* Ensure update-side operation after counter increment. */
  90. WARN_ON_ONCE(rcu_seq_state(*sp) != 1);
  91. }
  92. /* Adjust sequence number for end of update-side operation. */
  93. static inline void rcu_seq_end(unsigned long *sp)
  94. {
  95. smp_mb(); /* Ensure update-side operation before counter increment. */
  96. WARN_ON_ONCE(!rcu_seq_state(*sp));
  97. WRITE_ONCE(*sp, (*sp | RCU_SEQ_STATE_MASK) + 1);
  98. }
  99. /* Take a snapshot of the update side's sequence number. */
  100. static inline unsigned long rcu_seq_snap(unsigned long *sp)
  101. {
  102. unsigned long s;
  103. s = (READ_ONCE(*sp) + 2 * RCU_SEQ_STATE_MASK + 1) & ~RCU_SEQ_STATE_MASK;
  104. smp_mb(); /* Above access must not bleed into critical section. */
  105. return s;
  106. }
  107. /* Return the current value the update side's sequence number, no ordering. */
  108. static inline unsigned long rcu_seq_current(unsigned long *sp)
  109. {
  110. return READ_ONCE(*sp);
  111. }
  112. /*
  113. * Given a snapshot from rcu_seq_snap(), determine whether or not a
  114. * full update-side operation has occurred.
  115. */
  116. static inline bool rcu_seq_done(unsigned long *sp, unsigned long s)
  117. {
  118. return ULONG_CMP_GE(READ_ONCE(*sp), s);
  119. }
  120. /*
  121. * debug_rcu_head_queue()/debug_rcu_head_unqueue() are used internally
  122. * by call_rcu() and rcu callback execution, and are therefore not part of the
  123. * RCU API. Leaving in rcupdate.h because they are used by all RCU flavors.
  124. */
  125. #ifdef CONFIG_DEBUG_OBJECTS_RCU_HEAD
  126. # define STATE_RCU_HEAD_READY 0
  127. # define STATE_RCU_HEAD_QUEUED 1
  128. extern struct debug_obj_descr rcuhead_debug_descr;
  129. static inline int debug_rcu_head_queue(struct rcu_head *head)
  130. {
  131. int r1;
  132. r1 = debug_object_activate(head, &rcuhead_debug_descr);
  133. debug_object_active_state(head, &rcuhead_debug_descr,
  134. STATE_RCU_HEAD_READY,
  135. STATE_RCU_HEAD_QUEUED);
  136. return r1;
  137. }
  138. static inline void debug_rcu_head_unqueue(struct rcu_head *head)
  139. {
  140. debug_object_active_state(head, &rcuhead_debug_descr,
  141. STATE_RCU_HEAD_QUEUED,
  142. STATE_RCU_HEAD_READY);
  143. debug_object_deactivate(head, &rcuhead_debug_descr);
  144. }
  145. #else /* !CONFIG_DEBUG_OBJECTS_RCU_HEAD */
  146. static inline int debug_rcu_head_queue(struct rcu_head *head)
  147. {
  148. return 0;
  149. }
  150. static inline void debug_rcu_head_unqueue(struct rcu_head *head)
  151. {
  152. }
  153. #endif /* #else !CONFIG_DEBUG_OBJECTS_RCU_HEAD */
  154. void kfree(const void *);
  155. /*
  156. * Reclaim the specified callback, either by invoking it (non-lazy case)
  157. * or freeing it directly (lazy case). Return true if lazy, false otherwise.
  158. */
  159. static inline bool __rcu_reclaim(const char *rn, struct rcu_head *head)
  160. {
  161. unsigned long offset = (unsigned long)head->func;
  162. rcu_lock_acquire(&rcu_callback_map);
  163. if (__is_kfree_rcu_offset(offset)) {
  164. RCU_TRACE(trace_rcu_invoke_kfree_callback(rn, head, offset);)
  165. kfree((void *)head - offset);
  166. rcu_lock_release(&rcu_callback_map);
  167. return true;
  168. } else {
  169. RCU_TRACE(trace_rcu_invoke_callback(rn, head);)
  170. head->func(head);
  171. rcu_lock_release(&rcu_callback_map);
  172. return false;
  173. }
  174. }
  175. #ifdef CONFIG_RCU_STALL_COMMON
  176. extern int rcu_cpu_stall_suppress;
  177. int rcu_jiffies_till_stall_check(void);
  178. #endif /* #ifdef CONFIG_RCU_STALL_COMMON */
  179. /*
  180. * Strings used in tracepoints need to be exported via the
  181. * tracing system such that tools like perf and trace-cmd can
  182. * translate the string address pointers to actual text.
  183. */
  184. #define TPS(x) tracepoint_string(x)
  185. /*
  186. * Dump the ftrace buffer, but only one time per callsite per boot.
  187. */
  188. #define rcu_ftrace_dump(oops_dump_mode) \
  189. do { \
  190. static atomic_t ___rfd_beenhere = ATOMIC_INIT(0); \
  191. \
  192. if (!atomic_read(&___rfd_beenhere) && \
  193. !atomic_xchg(&___rfd_beenhere, 1)) \
  194. ftrace_dump(oops_dump_mode); \
  195. } while (0)
  196. void rcu_early_boot_tests(void);
  197. void rcu_test_sync_prims(void);
  198. /*
  199. * This function really isn't for public consumption, but RCU is special in
  200. * that context switches can allow the state machine to make progress.
  201. */
  202. extern void resched_cpu(int cpu);
  203. #if defined(SRCU) || !defined(TINY_RCU)
  204. #include <linux/rcu_node_tree.h>
  205. extern int rcu_num_lvls;
  206. extern int num_rcu_lvl[];
  207. extern int rcu_num_nodes;
  208. static bool rcu_fanout_exact;
  209. static int rcu_fanout_leaf;
  210. /*
  211. * Compute the per-level fanout, either using the exact fanout specified
  212. * or balancing the tree, depending on the rcu_fanout_exact boot parameter.
  213. */
  214. static inline void rcu_init_levelspread(int *levelspread, const int *levelcnt)
  215. {
  216. int i;
  217. if (rcu_fanout_exact) {
  218. levelspread[rcu_num_lvls - 1] = rcu_fanout_leaf;
  219. for (i = rcu_num_lvls - 2; i >= 0; i--)
  220. levelspread[i] = RCU_FANOUT;
  221. } else {
  222. int ccur;
  223. int cprv;
  224. cprv = nr_cpu_ids;
  225. for (i = rcu_num_lvls - 1; i >= 0; i--) {
  226. ccur = levelcnt[i];
  227. levelspread[i] = (cprv + ccur - 1) / ccur;
  228. cprv = ccur;
  229. }
  230. }
  231. }
  232. /*
  233. * Do a full breadth-first scan of the rcu_node structures for the
  234. * specified rcu_state structure.
  235. */
  236. #define rcu_for_each_node_breadth_first(rsp, rnp) \
  237. for ((rnp) = &(rsp)->node[0]; \
  238. (rnp) < &(rsp)->node[rcu_num_nodes]; (rnp)++)
  239. /*
  240. * Do a breadth-first scan of the non-leaf rcu_node structures for the
  241. * specified rcu_state structure. Note that if there is a singleton
  242. * rcu_node tree with but one rcu_node structure, this loop is a no-op.
  243. */
  244. #define rcu_for_each_nonleaf_node_breadth_first(rsp, rnp) \
  245. for ((rnp) = &(rsp)->node[0]; \
  246. (rnp) < (rsp)->level[rcu_num_lvls - 1]; (rnp)++)
  247. /*
  248. * Scan the leaves of the rcu_node hierarchy for the specified rcu_state
  249. * structure. Note that if there is a singleton rcu_node tree with but
  250. * one rcu_node structure, this loop -will- visit the rcu_node structure.
  251. * It is still a leaf node, even if it is also the root node.
  252. */
  253. #define rcu_for_each_leaf_node(rsp, rnp) \
  254. for ((rnp) = (rsp)->level[rcu_num_lvls - 1]; \
  255. (rnp) < &(rsp)->node[rcu_num_nodes]; (rnp)++)
  256. /*
  257. * Iterate over all possible CPUs in a leaf RCU node.
  258. */
  259. #define for_each_leaf_node_possible_cpu(rnp, cpu) \
  260. for ((cpu) = cpumask_next(rnp->grplo - 1, cpu_possible_mask); \
  261. cpu <= rnp->grphi; \
  262. cpu = cpumask_next((cpu), cpu_possible_mask))
  263. /*
  264. * Wrappers for the rcu_node::lock acquire and release.
  265. *
  266. * Because the rcu_nodes form a tree, the tree traversal locking will observe
  267. * different lock values, this in turn means that an UNLOCK of one level
  268. * followed by a LOCK of another level does not imply a full memory barrier;
  269. * and most importantly transitivity is lost.
  270. *
  271. * In order to restore full ordering between tree levels, augment the regular
  272. * lock acquire functions with smp_mb__after_unlock_lock().
  273. *
  274. * As ->lock of struct rcu_node is a __private field, therefore one should use
  275. * these wrappers rather than directly call raw_spin_{lock,unlock}* on ->lock.
  276. */
  277. #define raw_spin_lock_rcu_node(p) \
  278. do { \
  279. raw_spin_lock(&ACCESS_PRIVATE(p, lock)); \
  280. smp_mb__after_unlock_lock(); \
  281. } while (0)
  282. #define raw_spin_unlock_rcu_node(p) raw_spin_unlock(&ACCESS_PRIVATE(p, lock))
  283. #define raw_spin_lock_irq_rcu_node(p) \
  284. do { \
  285. raw_spin_lock_irq(&ACCESS_PRIVATE(p, lock)); \
  286. smp_mb__after_unlock_lock(); \
  287. } while (0)
  288. #define raw_spin_unlock_irq_rcu_node(p) \
  289. raw_spin_unlock_irq(&ACCESS_PRIVATE(p, lock))
  290. #define raw_spin_lock_irqsave_rcu_node(p, flags) \
  291. do { \
  292. raw_spin_lock_irqsave(&ACCESS_PRIVATE(p, lock), flags); \
  293. smp_mb__after_unlock_lock(); \
  294. } while (0)
  295. #define raw_spin_unlock_irqrestore_rcu_node(p, flags) \
  296. raw_spin_unlock_irqrestore(&ACCESS_PRIVATE(p, lock), flags) \
  297. #define raw_spin_trylock_rcu_node(p) \
  298. ({ \
  299. bool ___locked = raw_spin_trylock(&ACCESS_PRIVATE(p, lock)); \
  300. \
  301. if (___locked) \
  302. smp_mb__after_unlock_lock(); \
  303. ___locked; \
  304. })
  305. #endif /* #if defined(SRCU) || !defined(TINY_RCU) */
  306. #ifdef CONFIG_TINY_RCU
  307. /* Tiny RCU doesn't expedite, as its purpose in life is instead to be tiny. */
  308. static inline bool rcu_gp_is_normal(void) /* Internal RCU use. */
  309. {
  310. return true;
  311. }
  312. static inline bool rcu_gp_is_expedited(void) /* Internal RCU use. */
  313. {
  314. return false;
  315. }
  316. static inline void rcu_expedite_gp(void)
  317. {
  318. }
  319. static inline void rcu_unexpedite_gp(void)
  320. {
  321. }
  322. #else /* #ifdef CONFIG_TINY_RCU */
  323. bool rcu_gp_is_normal(void); /* Internal RCU use. */
  324. bool rcu_gp_is_expedited(void); /* Internal RCU use. */
  325. void rcu_expedite_gp(void);
  326. void rcu_unexpedite_gp(void);
  327. void rcupdate_announce_bootup_oddness(void);
  328. #endif /* #else #ifdef CONFIG_TINY_RCU */
  329. #define RCU_SCHEDULER_INACTIVE 0
  330. #define RCU_SCHEDULER_INIT 1
  331. #define RCU_SCHEDULER_RUNNING 2
  332. #ifdef CONFIG_TINY_RCU
  333. static inline void rcu_request_urgent_qs_task(struct task_struct *t) { }
  334. #else /* #ifdef CONFIG_TINY_RCU */
  335. void rcu_request_urgent_qs_task(struct task_struct *t);
  336. #endif /* #else #ifdef CONFIG_TINY_RCU */
  337. enum rcutorture_type {
  338. RCU_FLAVOR,
  339. RCU_BH_FLAVOR,
  340. RCU_SCHED_FLAVOR,
  341. RCU_TASKS_FLAVOR,
  342. SRCU_FLAVOR,
  343. INVALID_RCU_FLAVOR
  344. };
  345. #if defined(CONFIG_TREE_RCU) || defined(CONFIG_PREEMPT_RCU)
  346. void rcutorture_get_gp_data(enum rcutorture_type test_type, int *flags,
  347. unsigned long *gpnum, unsigned long *completed);
  348. void rcutorture_record_test_transition(void);
  349. void rcutorture_record_progress(unsigned long vernum);
  350. void do_trace_rcu_torture_read(const char *rcutorturename,
  351. struct rcu_head *rhp,
  352. unsigned long secs,
  353. unsigned long c_old,
  354. unsigned long c);
  355. #else
  356. static inline void rcutorture_get_gp_data(enum rcutorture_type test_type,
  357. int *flags,
  358. unsigned long *gpnum,
  359. unsigned long *completed)
  360. {
  361. *flags = 0;
  362. *gpnum = 0;
  363. *completed = 0;
  364. }
  365. static inline void rcutorture_record_test_transition(void)
  366. {
  367. }
  368. static inline void rcutorture_record_progress(unsigned long vernum)
  369. {
  370. }
  371. #ifdef CONFIG_RCU_TRACE
  372. void do_trace_rcu_torture_read(const char *rcutorturename,
  373. struct rcu_head *rhp,
  374. unsigned long secs,
  375. unsigned long c_old,
  376. unsigned long c);
  377. #else
  378. #define do_trace_rcu_torture_read(rcutorturename, rhp, secs, c_old, c) \
  379. do { } while (0)
  380. #endif
  381. #endif
  382. #ifdef CONFIG_TINY_SRCU
  383. static inline void srcutorture_get_gp_data(enum rcutorture_type test_type,
  384. struct srcu_struct *sp, int *flags,
  385. unsigned long *gpnum,
  386. unsigned long *completed)
  387. {
  388. if (test_type != SRCU_FLAVOR)
  389. return;
  390. *flags = 0;
  391. *completed = sp->srcu_idx;
  392. *gpnum = *completed;
  393. }
  394. #elif defined(CONFIG_TREE_SRCU)
  395. void srcutorture_get_gp_data(enum rcutorture_type test_type,
  396. struct srcu_struct *sp, int *flags,
  397. unsigned long *gpnum, unsigned long *completed);
  398. #endif
  399. #ifdef CONFIG_TINY_RCU
  400. /*
  401. * Return the number of grace periods started.
  402. */
  403. static inline unsigned long rcu_batches_started(void)
  404. {
  405. return 0;
  406. }
  407. /*
  408. * Return the number of bottom-half grace periods started.
  409. */
  410. static inline unsigned long rcu_batches_started_bh(void)
  411. {
  412. return 0;
  413. }
  414. /*
  415. * Return the number of sched grace periods started.
  416. */
  417. static inline unsigned long rcu_batches_started_sched(void)
  418. {
  419. return 0;
  420. }
  421. /*
  422. * Return the number of grace periods completed.
  423. */
  424. static inline unsigned long rcu_batches_completed(void)
  425. {
  426. return 0;
  427. }
  428. /*
  429. * Return the number of bottom-half grace periods completed.
  430. */
  431. static inline unsigned long rcu_batches_completed_bh(void)
  432. {
  433. return 0;
  434. }
  435. /*
  436. * Return the number of sched grace periods completed.
  437. */
  438. static inline unsigned long rcu_batches_completed_sched(void)
  439. {
  440. return 0;
  441. }
  442. /*
  443. * Return the number of expedited grace periods completed.
  444. */
  445. static inline unsigned long rcu_exp_batches_completed(void)
  446. {
  447. return 0;
  448. }
  449. /*
  450. * Return the number of expedited sched grace periods completed.
  451. */
  452. static inline unsigned long rcu_exp_batches_completed_sched(void)
  453. {
  454. return 0;
  455. }
  456. static inline unsigned long srcu_batches_completed(struct srcu_struct *sp)
  457. {
  458. return 0;
  459. }
  460. static inline void rcu_force_quiescent_state(void)
  461. {
  462. }
  463. static inline void rcu_bh_force_quiescent_state(void)
  464. {
  465. }
  466. static inline void rcu_sched_force_quiescent_state(void)
  467. {
  468. }
  469. static inline void show_rcu_gp_kthreads(void)
  470. {
  471. }
  472. #else /* #ifdef CONFIG_TINY_RCU */
  473. extern unsigned long rcutorture_testseq;
  474. extern unsigned long rcutorture_vernum;
  475. unsigned long rcu_batches_started(void);
  476. unsigned long rcu_batches_started_bh(void);
  477. unsigned long rcu_batches_started_sched(void);
  478. unsigned long rcu_batches_completed(void);
  479. unsigned long rcu_batches_completed_bh(void);
  480. unsigned long rcu_batches_completed_sched(void);
  481. unsigned long rcu_exp_batches_completed(void);
  482. unsigned long rcu_exp_batches_completed_sched(void);
  483. unsigned long srcu_batches_completed(struct srcu_struct *sp);
  484. void show_rcu_gp_kthreads(void);
  485. void rcu_force_quiescent_state(void);
  486. void rcu_bh_force_quiescent_state(void);
  487. void rcu_sched_force_quiescent_state(void);
  488. #endif /* #else #ifdef CONFIG_TINY_RCU */
  489. #ifdef CONFIG_RCU_NOCB_CPU
  490. bool rcu_is_nocb_cpu(int cpu);
  491. #else
  492. static inline bool rcu_is_nocb_cpu(int cpu) { return false; }
  493. #endif
  494. #endif /* __LINUX_RCU_H */