rcupdate.c 9.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313
  1. /*
  2. * Read-Copy Update mechanism for mutual exclusion
  3. *
  4. * This program is free software; you can redistribute it and/or modify
  5. * it under the terms of the GNU General Public License as published by
  6. * the Free Software Foundation; either version 2 of the License, or
  7. * (at your option) any later version.
  8. *
  9. * This program is distributed in the hope that it will be useful,
  10. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. * GNU General Public License for more details.
  13. *
  14. * You should have received a copy of the GNU General Public License
  15. * along with this program; if not, write to the Free Software
  16. * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
  17. *
  18. * Copyright IBM Corporation, 2001
  19. *
  20. * Authors: Dipankar Sarma <dipankar@in.ibm.com>
  21. * Manfred Spraul <manfred@colorfullife.com>
  22. *
  23. * Based on the original work by Paul McKenney <paulmck@us.ibm.com>
  24. * and inputs from Rusty Russell, Andrea Arcangeli and Andi Kleen.
  25. * Papers:
  26. * http://www.rdrop.com/users/paulmck/paper/rclockpdcsproof.pdf
  27. * http://lse.sourceforge.net/locking/rclock_OLS.2001.05.01c.sc.pdf (OLS2001)
  28. *
  29. * For detailed explanation of Read-Copy Update mechanism see -
  30. * http://lse.sourceforge.net/locking/rcupdate.html
  31. *
  32. */
  33. #include <linux/types.h>
  34. #include <linux/kernel.h>
  35. #include <linux/init.h>
  36. #include <linux/spinlock.h>
  37. #include <linux/smp.h>
  38. #include <linux/interrupt.h>
  39. #include <linux/sched.h>
  40. #include <asm/atomic.h>
  41. #include <linux/bitops.h>
  42. #include <linux/percpu.h>
  43. #include <linux/notifier.h>
  44. #include <linux/cpu.h>
  45. #include <linux/mutex.h>
  46. #include <linux/module.h>
  47. #include <linux/kernel_stat.h>
  48. enum rcu_barrier {
  49. RCU_BARRIER_STD,
  50. RCU_BARRIER_BH,
  51. RCU_BARRIER_SCHED,
  52. };
  53. static DEFINE_PER_CPU(struct rcu_head, rcu_barrier_head) = {NULL};
  54. static atomic_t rcu_barrier_cpu_count;
  55. static DEFINE_MUTEX(rcu_barrier_mutex);
  56. static struct completion rcu_barrier_completion;
  57. int rcu_scheduler_active __read_mostly;
  58. static atomic_t rcu_migrate_type_count = ATOMIC_INIT(0);
  59. static struct rcu_head rcu_migrate_head[3];
  60. static DECLARE_WAIT_QUEUE_HEAD(rcu_migrate_wq);
  61. /*
  62. * Awaken the corresponding synchronize_rcu() instance now that a
  63. * grace period has elapsed.
  64. */
  65. void wakeme_after_rcu(struct rcu_head *head)
  66. {
  67. struct rcu_synchronize *rcu;
  68. rcu = container_of(head, struct rcu_synchronize, head);
  69. complete(&rcu->completion);
  70. }
  71. #ifdef CONFIG_TREE_PREEMPT_RCU
  72. /**
  73. * synchronize_rcu - wait until a grace period has elapsed.
  74. *
  75. * Control will return to the caller some time after a full grace
  76. * period has elapsed, in other words after all currently executing RCU
  77. * read-side critical sections have completed. RCU read-side critical
  78. * sections are delimited by rcu_read_lock() and rcu_read_unlock(),
  79. * and may be nested.
  80. */
  81. void synchronize_rcu(void)
  82. {
  83. struct rcu_synchronize rcu;
  84. if (!rcu_scheduler_active)
  85. return;
  86. init_completion(&rcu.completion);
  87. /* Will wake me after RCU finished. */
  88. call_rcu(&rcu.head, wakeme_after_rcu);
  89. /* Wait for it. */
  90. wait_for_completion(&rcu.completion);
  91. }
  92. EXPORT_SYMBOL_GPL(synchronize_rcu);
  93. #endif /* #ifdef CONFIG_TREE_PREEMPT_RCU */
  94. /**
  95. * synchronize_sched - wait until an rcu-sched grace period has elapsed.
  96. *
  97. * Control will return to the caller some time after a full rcu-sched
  98. * grace period has elapsed, in other words after all currently executing
  99. * rcu-sched read-side critical sections have completed. These read-side
  100. * critical sections are delimited by rcu_read_lock_sched() and
  101. * rcu_read_unlock_sched(), and may be nested. Note that preempt_disable(),
  102. * local_irq_disable(), and so on may be used in place of
  103. * rcu_read_lock_sched().
  104. *
  105. * This means that all preempt_disable code sequences, including NMI and
  106. * hardware-interrupt handlers, in progress on entry will have completed
  107. * before this primitive returns. However, this does not guarantee that
  108. * softirq handlers will have completed, since in some kernels, these
  109. * handlers can run in process context, and can block.
  110. *
  111. * This primitive provides the guarantees made by the (now removed)
  112. * synchronize_kernel() API. In contrast, synchronize_rcu() only
  113. * guarantees that rcu_read_lock() sections will have completed.
  114. * In "classic RCU", these two guarantees happen to be one and
  115. * the same, but can differ in realtime RCU implementations.
  116. */
  117. void synchronize_sched(void)
  118. {
  119. struct rcu_synchronize rcu;
  120. if (rcu_blocking_is_gp())
  121. return;
  122. init_completion(&rcu.completion);
  123. /* Will wake me after RCU finished. */
  124. call_rcu_sched(&rcu.head, wakeme_after_rcu);
  125. /* Wait for it. */
  126. wait_for_completion(&rcu.completion);
  127. }
  128. EXPORT_SYMBOL_GPL(synchronize_sched);
  129. /**
  130. * synchronize_rcu_bh - wait until an rcu_bh grace period has elapsed.
  131. *
  132. * Control will return to the caller some time after a full rcu_bh grace
  133. * period has elapsed, in other words after all currently executing rcu_bh
  134. * read-side critical sections have completed. RCU read-side critical
  135. * sections are delimited by rcu_read_lock_bh() and rcu_read_unlock_bh(),
  136. * and may be nested.
  137. */
  138. void synchronize_rcu_bh(void)
  139. {
  140. struct rcu_synchronize rcu;
  141. if (rcu_blocking_is_gp())
  142. return;
  143. init_completion(&rcu.completion);
  144. /* Will wake me after RCU finished. */
  145. call_rcu_bh(&rcu.head, wakeme_after_rcu);
  146. /* Wait for it. */
  147. wait_for_completion(&rcu.completion);
  148. }
  149. EXPORT_SYMBOL_GPL(synchronize_rcu_bh);
  150. static void rcu_barrier_callback(struct rcu_head *notused)
  151. {
  152. if (atomic_dec_and_test(&rcu_barrier_cpu_count))
  153. complete(&rcu_barrier_completion);
  154. }
  155. /*
  156. * Called with preemption disabled, and from cross-cpu IRQ context.
  157. */
  158. static void rcu_barrier_func(void *type)
  159. {
  160. int cpu = smp_processor_id();
  161. struct rcu_head *head = &per_cpu(rcu_barrier_head, cpu);
  162. atomic_inc(&rcu_barrier_cpu_count);
  163. switch ((enum rcu_barrier)type) {
  164. case RCU_BARRIER_STD:
  165. call_rcu(head, rcu_barrier_callback);
  166. break;
  167. case RCU_BARRIER_BH:
  168. call_rcu_bh(head, rcu_barrier_callback);
  169. break;
  170. case RCU_BARRIER_SCHED:
  171. call_rcu_sched(head, rcu_barrier_callback);
  172. break;
  173. }
  174. }
  175. static inline void wait_migrated_callbacks(void)
  176. {
  177. wait_event(rcu_migrate_wq, !atomic_read(&rcu_migrate_type_count));
  178. smp_mb(); /* In case we didn't sleep. */
  179. }
  180. /*
  181. * Orchestrate the specified type of RCU barrier, waiting for all
  182. * RCU callbacks of the specified type to complete.
  183. */
  184. static void _rcu_barrier(enum rcu_barrier type)
  185. {
  186. BUG_ON(in_interrupt());
  187. /* Take cpucontrol mutex to protect against CPU hotplug */
  188. mutex_lock(&rcu_barrier_mutex);
  189. init_completion(&rcu_barrier_completion);
  190. /*
  191. * Initialize rcu_barrier_cpu_count to 1, then invoke
  192. * rcu_barrier_func() on each CPU, so that each CPU also has
  193. * incremented rcu_barrier_cpu_count. Only then is it safe to
  194. * decrement rcu_barrier_cpu_count -- otherwise the first CPU
  195. * might complete its grace period before all of the other CPUs
  196. * did their increment, causing this function to return too
  197. * early.
  198. */
  199. atomic_set(&rcu_barrier_cpu_count, 1);
  200. on_each_cpu(rcu_barrier_func, (void *)type, 1);
  201. if (atomic_dec_and_test(&rcu_barrier_cpu_count))
  202. complete(&rcu_barrier_completion);
  203. wait_for_completion(&rcu_barrier_completion);
  204. mutex_unlock(&rcu_barrier_mutex);
  205. wait_migrated_callbacks();
  206. }
  207. /**
  208. * rcu_barrier - Wait until all in-flight call_rcu() callbacks complete.
  209. */
  210. void rcu_barrier(void)
  211. {
  212. _rcu_barrier(RCU_BARRIER_STD);
  213. }
  214. EXPORT_SYMBOL_GPL(rcu_barrier);
  215. /**
  216. * rcu_barrier_bh - Wait until all in-flight call_rcu_bh() callbacks complete.
  217. */
  218. void rcu_barrier_bh(void)
  219. {
  220. _rcu_barrier(RCU_BARRIER_BH);
  221. }
  222. EXPORT_SYMBOL_GPL(rcu_barrier_bh);
  223. /**
  224. * rcu_barrier_sched - Wait for in-flight call_rcu_sched() callbacks.
  225. */
  226. void rcu_barrier_sched(void)
  227. {
  228. _rcu_barrier(RCU_BARRIER_SCHED);
  229. }
  230. EXPORT_SYMBOL_GPL(rcu_barrier_sched);
  231. static void rcu_migrate_callback(struct rcu_head *notused)
  232. {
  233. if (atomic_dec_and_test(&rcu_migrate_type_count))
  234. wake_up(&rcu_migrate_wq);
  235. }
  236. extern int rcu_cpu_notify(struct notifier_block *self,
  237. unsigned long action, void *hcpu);
  238. static int __cpuinit rcu_barrier_cpu_hotplug(struct notifier_block *self,
  239. unsigned long action, void *hcpu)
  240. {
  241. rcu_cpu_notify(self, action, hcpu);
  242. if (action == CPU_DYING) {
  243. /*
  244. * preempt_disable() in on_each_cpu() prevents stop_machine(),
  245. * so when "on_each_cpu(rcu_barrier_func, (void *)type, 1);"
  246. * returns, all online cpus have queued rcu_barrier_func(),
  247. * and the dead cpu(if it exist) queues rcu_migrate_callback()s.
  248. *
  249. * These callbacks ensure _rcu_barrier() waits for all
  250. * RCU callbacks of the specified type to complete.
  251. */
  252. atomic_set(&rcu_migrate_type_count, 3);
  253. call_rcu_bh(rcu_migrate_head, rcu_migrate_callback);
  254. call_rcu_sched(rcu_migrate_head + 1, rcu_migrate_callback);
  255. call_rcu(rcu_migrate_head + 2, rcu_migrate_callback);
  256. } else if (action == CPU_DOWN_PREPARE) {
  257. /* Don't need to wait until next removal operation. */
  258. /* rcu_migrate_head is protected by cpu_add_remove_lock */
  259. wait_migrated_callbacks();
  260. }
  261. return NOTIFY_OK;
  262. }
  263. void __init rcu_init(void)
  264. {
  265. int i;
  266. __rcu_init();
  267. cpu_notifier(rcu_barrier_cpu_hotplug, 0);
  268. /*
  269. * We don't need protection against CPU-hotplug here because
  270. * this is called early in boot, before either interrupts
  271. * or the scheduler are operational.
  272. */
  273. for_each_online_cpu(i)
  274. rcu_barrier_cpu_hotplug(NULL, CPU_UP_PREPARE, (void *)(long)i);
  275. }
  276. void rcu_scheduler_starting(void)
  277. {
  278. WARN_ON(num_online_cpus() != 1);
  279. WARN_ON(nr_context_switches() > 0);
  280. rcu_scheduler_active = 1;
  281. }