diff options
Diffstat (limited to 'kernel/rcutree_plugin.h')
-rw-r--r-- | kernel/rcutree_plugin.h | 110 |
1 files changed, 72 insertions, 38 deletions
diff --git a/kernel/rcutree_plugin.h b/kernel/rcutree_plugin.h index 47789369ea59..1cee04f627eb 100644 --- a/kernel/rcutree_plugin.h +++ b/kernel/rcutree_plugin.h | |||
@@ -64,22 +64,31 @@ EXPORT_SYMBOL_GPL(rcu_batches_completed); | |||
64 | * not in a quiescent state. There might be any number of tasks blocked | 64 | * not in a quiescent state. There might be any number of tasks blocked |
65 | * while in an RCU read-side critical section. | 65 | * while in an RCU read-side critical section. |
66 | */ | 66 | */ |
67 | static void rcu_preempt_qs_record(int cpu) | 67 | static void rcu_preempt_qs(int cpu) |
68 | { | 68 | { |
69 | struct rcu_data *rdp = &per_cpu(rcu_preempt_data, cpu); | 69 | struct rcu_data *rdp = &per_cpu(rcu_preempt_data, cpu); |
70 | rdp->passed_quiesc = 1; | ||
71 | rdp->passed_quiesc_completed = rdp->completed; | 70 | rdp->passed_quiesc_completed = rdp->completed; |
71 | barrier(); | ||
72 | rdp->passed_quiesc = 1; | ||
72 | } | 73 | } |
73 | 74 | ||
74 | /* | 75 | /* |
75 | * We have entered the scheduler or are between softirqs in ksoftirqd. | 76 | * We have entered the scheduler, and the current task might soon be |
76 | * If we are in an RCU read-side critical section, we need to reflect | 77 | * context-switched away from. If this task is in an RCU read-side |
77 | * that in the state of the rcu_node structure corresponding to this CPU. | 78 | * critical section, we will no longer be able to rely on the CPU to |
78 | * Caller must disable hardirqs. | 79 | * record that fact, so we enqueue the task on the appropriate entry |
80 | * of the blocked_tasks[] array. The task will dequeue itself when | ||
81 | * it exits the outermost enclosing RCU read-side critical section. | ||
82 | * Therefore, the current grace period cannot be permitted to complete | ||
83 | * until the blocked_tasks[] entry indexed by the low-order bit of | ||
84 | * rnp->gpnum empties. | ||
85 | * | ||
86 | * Caller must disable preemption. | ||
79 | */ | 87 | */ |
80 | static void rcu_preempt_qs(int cpu) | 88 | static void rcu_preempt_note_context_switch(int cpu) |
81 | { | 89 | { |
82 | struct task_struct *t = current; | 90 | struct task_struct *t = current; |
91 | unsigned long flags; | ||
83 | int phase; | 92 | int phase; |
84 | struct rcu_data *rdp; | 93 | struct rcu_data *rdp; |
85 | struct rcu_node *rnp; | 94 | struct rcu_node *rnp; |
@@ -90,7 +99,7 @@ static void rcu_preempt_qs(int cpu) | |||
90 | /* Possibly blocking in an RCU read-side critical section. */ | 99 | /* Possibly blocking in an RCU read-side critical section. */ |
91 | rdp = rcu_preempt_state.rda[cpu]; | 100 | rdp = rcu_preempt_state.rda[cpu]; |
92 | rnp = rdp->mynode; | 101 | rnp = rdp->mynode; |
93 | spin_lock(&rnp->lock); | 102 | spin_lock_irqsave(&rnp->lock, flags); |
94 | t->rcu_read_unlock_special |= RCU_READ_UNLOCK_BLOCKED; | 103 | t->rcu_read_unlock_special |= RCU_READ_UNLOCK_BLOCKED; |
95 | t->rcu_blocked_node = rnp; | 104 | t->rcu_blocked_node = rnp; |
96 | 105 | ||
@@ -103,11 +112,15 @@ static void rcu_preempt_qs(int cpu) | |||
103 | * state for the current grace period), then as long | 112 | * state for the current grace period), then as long |
104 | * as that task remains queued, the current grace period | 113 | * as that task remains queued, the current grace period |
105 | * cannot end. | 114 | * cannot end. |
115 | * | ||
116 | * But first, note that the current CPU must still be | ||
117 | * on line! | ||
106 | */ | 118 | */ |
107 | phase = !(rnp->qsmask & rdp->grpmask) ^ (rnp->gpnum & 0x1); | 119 | WARN_ON_ONCE((rdp->grpmask & rnp->qsmaskinit) == 0); |
120 | WARN_ON_ONCE(!list_empty(&t->rcu_node_entry)); | ||
121 | phase = (rnp->gpnum + !(rnp->qsmask & rdp->grpmask)) & 0x1; | ||
108 | list_add(&t->rcu_node_entry, &rnp->blocked_tasks[phase]); | 122 | list_add(&t->rcu_node_entry, &rnp->blocked_tasks[phase]); |
109 | smp_mb(); /* Ensure later ctxt swtch seen after above. */ | 123 | spin_unlock_irqrestore(&rnp->lock, flags); |
110 | spin_unlock(&rnp->lock); | ||
111 | } | 124 | } |
112 | 125 | ||
113 | /* | 126 | /* |
@@ -119,9 +132,10 @@ static void rcu_preempt_qs(int cpu) | |||
119 | * grace period, then the fact that the task has been enqueued | 132 | * grace period, then the fact that the task has been enqueued |
120 | * means that we continue to block the current grace period. | 133 | * means that we continue to block the current grace period. |
121 | */ | 134 | */ |
122 | rcu_preempt_qs_record(cpu); | 135 | rcu_preempt_qs(cpu); |
123 | t->rcu_read_unlock_special &= ~(RCU_READ_UNLOCK_NEED_QS | | 136 | local_irq_save(flags); |
124 | RCU_READ_UNLOCK_GOT_QS); | 137 | t->rcu_read_unlock_special &= ~RCU_READ_UNLOCK_NEED_QS; |
138 | local_irq_restore(flags); | ||
125 | } | 139 | } |
126 | 140 | ||
127 | /* | 141 | /* |
@@ -157,7 +171,7 @@ static void rcu_read_unlock_special(struct task_struct *t) | |||
157 | special = t->rcu_read_unlock_special; | 171 | special = t->rcu_read_unlock_special; |
158 | if (special & RCU_READ_UNLOCK_NEED_QS) { | 172 | if (special & RCU_READ_UNLOCK_NEED_QS) { |
159 | t->rcu_read_unlock_special &= ~RCU_READ_UNLOCK_NEED_QS; | 173 | t->rcu_read_unlock_special &= ~RCU_READ_UNLOCK_NEED_QS; |
160 | t->rcu_read_unlock_special |= RCU_READ_UNLOCK_GOT_QS; | 174 | rcu_preempt_qs(smp_processor_id()); |
161 | } | 175 | } |
162 | 176 | ||
163 | /* Hardware IRQ handlers cannot block. */ | 177 | /* Hardware IRQ handlers cannot block. */ |
@@ -177,10 +191,10 @@ static void rcu_read_unlock_special(struct task_struct *t) | |||
177 | */ | 191 | */ |
178 | for (;;) { | 192 | for (;;) { |
179 | rnp = t->rcu_blocked_node; | 193 | rnp = t->rcu_blocked_node; |
180 | spin_lock(&rnp->lock); | 194 | spin_lock(&rnp->lock); /* irqs already disabled. */ |
181 | if (rnp == t->rcu_blocked_node) | 195 | if (rnp == t->rcu_blocked_node) |
182 | break; | 196 | break; |
183 | spin_unlock(&rnp->lock); | 197 | spin_unlock(&rnp->lock); /* irqs remain disabled. */ |
184 | } | 198 | } |
185 | empty = list_empty(&rnp->blocked_tasks[rnp->gpnum & 0x1]); | 199 | empty = list_empty(&rnp->blocked_tasks[rnp->gpnum & 0x1]); |
186 | list_del_init(&t->rcu_node_entry); | 200 | list_del_init(&t->rcu_node_entry); |
@@ -194,9 +208,8 @@ static void rcu_read_unlock_special(struct task_struct *t) | |||
194 | */ | 208 | */ |
195 | if (!empty && rnp->qsmask == 0 && | 209 | if (!empty && rnp->qsmask == 0 && |
196 | list_empty(&rnp->blocked_tasks[rnp->gpnum & 0x1])) { | 210 | list_empty(&rnp->blocked_tasks[rnp->gpnum & 0x1])) { |
197 | t->rcu_read_unlock_special &= | 211 | struct rcu_node *rnp_p; |
198 | ~(RCU_READ_UNLOCK_NEED_QS | | 212 | |
199 | RCU_READ_UNLOCK_GOT_QS); | ||
200 | if (rnp->parent == NULL) { | 213 | if (rnp->parent == NULL) { |
201 | /* Only one rcu_node in the tree. */ | 214 | /* Only one rcu_node in the tree. */ |
202 | cpu_quiet_msk_finish(&rcu_preempt_state, flags); | 215 | cpu_quiet_msk_finish(&rcu_preempt_state, flags); |
@@ -205,9 +218,10 @@ static void rcu_read_unlock_special(struct task_struct *t) | |||
205 | /* Report up the rest of the hierarchy. */ | 218 | /* Report up the rest of the hierarchy. */ |
206 | mask = rnp->grpmask; | 219 | mask = rnp->grpmask; |
207 | spin_unlock_irqrestore(&rnp->lock, flags); | 220 | spin_unlock_irqrestore(&rnp->lock, flags); |
208 | rnp = rnp->parent; | 221 | rnp_p = rnp->parent; |
209 | spin_lock_irqsave(&rnp->lock, flags); | 222 | spin_lock_irqsave(&rnp_p->lock, flags); |
210 | cpu_quiet_msk(mask, &rcu_preempt_state, rnp, flags); | 223 | WARN_ON_ONCE(rnp->qsmask); |
224 | cpu_quiet_msk(mask, &rcu_preempt_state, rnp_p, flags); | ||
211 | return; | 225 | return; |
212 | } | 226 | } |
213 | spin_unlock(&rnp->lock); | 227 | spin_unlock(&rnp->lock); |
@@ -259,6 +273,19 @@ static void rcu_print_task_stall(struct rcu_node *rnp) | |||
259 | #endif /* #ifdef CONFIG_RCU_CPU_STALL_DETECTOR */ | 273 | #endif /* #ifdef CONFIG_RCU_CPU_STALL_DETECTOR */ |
260 | 274 | ||
261 | /* | 275 | /* |
276 | * Check that the list of blocked tasks for the newly completed grace | ||
277 | * period is in fact empty. It is a serious bug to complete a grace | ||
278 | * period that still has RCU readers blocked! This function must be | ||
279 | * invoked -before- updating this rnp's ->gpnum, and the rnp's ->lock | ||
280 | * must be held by the caller. | ||
281 | */ | ||
282 | static void rcu_preempt_check_blocked_tasks(struct rcu_node *rnp) | ||
283 | { | ||
284 | WARN_ON_ONCE(!list_empty(&rnp->blocked_tasks[rnp->gpnum & 0x1])); | ||
285 | WARN_ON_ONCE(rnp->qsmask); | ||
286 | } | ||
287 | |||
288 | /* | ||
262 | * Check for preempted RCU readers for the specified rcu_node structure. | 289 | * Check for preempted RCU readers for the specified rcu_node structure. |
263 | * If the caller needs a reliable answer, it must hold the rcu_node's | 290 | * If the caller needs a reliable answer, it must hold the rcu_node's |
264 | * ->lock. | 291 | * ->lock. |
@@ -280,7 +307,8 @@ static int rcu_preempted_readers(struct rcu_node *rnp) | |||
280 | * The caller must hold rnp->lock with irqs disabled. | 307 | * The caller must hold rnp->lock with irqs disabled. |
281 | */ | 308 | */ |
282 | static void rcu_preempt_offline_tasks(struct rcu_state *rsp, | 309 | static void rcu_preempt_offline_tasks(struct rcu_state *rsp, |
283 | struct rcu_node *rnp) | 310 | struct rcu_node *rnp, |
311 | struct rcu_data *rdp) | ||
284 | { | 312 | { |
285 | int i; | 313 | int i; |
286 | struct list_head *lp; | 314 | struct list_head *lp; |
@@ -292,6 +320,9 @@ static void rcu_preempt_offline_tasks(struct rcu_state *rsp, | |||
292 | WARN_ONCE(1, "Last CPU thought to be offlined?"); | 320 | WARN_ONCE(1, "Last CPU thought to be offlined?"); |
293 | return; /* Shouldn't happen: at least one CPU online. */ | 321 | return; /* Shouldn't happen: at least one CPU online. */ |
294 | } | 322 | } |
323 | WARN_ON_ONCE(rnp != rdp->mynode && | ||
324 | (!list_empty(&rnp->blocked_tasks[0]) || | ||
325 | !list_empty(&rnp->blocked_tasks[1]))); | ||
295 | 326 | ||
296 | /* | 327 | /* |
297 | * Move tasks up to root rcu_node. Rely on the fact that the | 328 | * Move tasks up to root rcu_node. Rely on the fact that the |
@@ -335,20 +366,12 @@ static void rcu_preempt_check_callbacks(int cpu) | |||
335 | struct task_struct *t = current; | 366 | struct task_struct *t = current; |
336 | 367 | ||
337 | if (t->rcu_read_lock_nesting == 0) { | 368 | if (t->rcu_read_lock_nesting == 0) { |
338 | t->rcu_read_unlock_special &= | 369 | t->rcu_read_unlock_special &= ~RCU_READ_UNLOCK_NEED_QS; |
339 | ~(RCU_READ_UNLOCK_NEED_QS | RCU_READ_UNLOCK_GOT_QS); | 370 | rcu_preempt_qs(cpu); |
340 | rcu_preempt_qs_record(cpu); | ||
341 | return; | 371 | return; |
342 | } | 372 | } |
343 | if (per_cpu(rcu_preempt_data, cpu).qs_pending) { | 373 | if (per_cpu(rcu_preempt_data, cpu).qs_pending) |
344 | if (t->rcu_read_unlock_special & RCU_READ_UNLOCK_GOT_QS) { | 374 | t->rcu_read_unlock_special |= RCU_READ_UNLOCK_NEED_QS; |
345 | rcu_preempt_qs_record(cpu); | ||
346 | t->rcu_read_unlock_special &= ~RCU_READ_UNLOCK_GOT_QS; | ||
347 | } else if (!(t->rcu_read_unlock_special & | ||
348 | RCU_READ_UNLOCK_NEED_QS)) { | ||
349 | t->rcu_read_unlock_special |= RCU_READ_UNLOCK_NEED_QS; | ||
350 | } | ||
351 | } | ||
352 | } | 375 | } |
353 | 376 | ||
354 | /* | 377 | /* |
@@ -434,7 +457,7 @@ EXPORT_SYMBOL_GPL(rcu_batches_completed); | |||
434 | * Because preemptable RCU does not exist, we never have to check for | 457 | * Because preemptable RCU does not exist, we never have to check for |
435 | * CPUs being in quiescent states. | 458 | * CPUs being in quiescent states. |
436 | */ | 459 | */ |
437 | static void rcu_preempt_qs(int cpu) | 460 | static void rcu_preempt_note_context_switch(int cpu) |
438 | { | 461 | { |
439 | } | 462 | } |
440 | 463 | ||
@@ -451,6 +474,16 @@ static void rcu_print_task_stall(struct rcu_node *rnp) | |||
451 | #endif /* #ifdef CONFIG_RCU_CPU_STALL_DETECTOR */ | 474 | #endif /* #ifdef CONFIG_RCU_CPU_STALL_DETECTOR */ |
452 | 475 | ||
453 | /* | 476 | /* |
477 | * Because there is no preemptable RCU, there can be no readers blocked, | ||
478 | * so there is no need to check for blocked tasks. So check only for | ||
479 | * bogus qsmask values. | ||
480 | */ | ||
481 | static void rcu_preempt_check_blocked_tasks(struct rcu_node *rnp) | ||
482 | { | ||
483 | WARN_ON_ONCE(rnp->qsmask); | ||
484 | } | ||
485 | |||
486 | /* | ||
454 | * Because preemptable RCU does not exist, there are never any preempted | 487 | * Because preemptable RCU does not exist, there are never any preempted |
455 | * RCU readers. | 488 | * RCU readers. |
456 | */ | 489 | */ |
@@ -466,7 +499,8 @@ static int rcu_preempted_readers(struct rcu_node *rnp) | |||
466 | * tasks that were blocked within RCU read-side critical sections. | 499 | * tasks that were blocked within RCU read-side critical sections. |
467 | */ | 500 | */ |
468 | static void rcu_preempt_offline_tasks(struct rcu_state *rsp, | 501 | static void rcu_preempt_offline_tasks(struct rcu_state *rsp, |
469 | struct rcu_node *rnp) | 502 | struct rcu_node *rnp, |
503 | struct rcu_data *rdp) | ||
470 | { | 504 | { |
471 | } | 505 | } |
472 | 506 | ||