Diffstat (limited to 'kernel/rcutree_plugin.h')
-rw-r--r--   kernel/rcutree_plugin.h   110
1 files changed, 72 insertions, 38 deletions
diff --git a/kernel/rcutree_plugin.h b/kernel/rcutree_plugin.h
index 47789369ea59..1cee04f627eb 100644
--- a/kernel/rcutree_plugin.h
+++ b/kernel/rcutree_plugin.h
@@ -64,22 +64,31 @@ EXPORT_SYMBOL_GPL(rcu_batches_completed);
  * not in a quiescent state. There might be any number of tasks blocked
  * while in an RCU read-side critical section.
  */
-static void rcu_preempt_qs_record(int cpu)
+static void rcu_preempt_qs(int cpu)
 {
 	struct rcu_data *rdp = &per_cpu(rcu_preempt_data, cpu);
-	rdp->passed_quiesc = 1;
 	rdp->passed_quiesc_completed = rdp->completed;
+	barrier();
+	rdp->passed_quiesc = 1;
 }
 
 /*
- * We have entered the scheduler or are between softirqs in ksoftirqd.
- * If we are in an RCU read-side critical section, we need to reflect
- * that in the state of the rcu_node structure corresponding to this CPU.
- * Caller must disable hardirqs.
+ * We have entered the scheduler, and the current task might soon be
+ * context-switched away from. If this task is in an RCU read-side
+ * critical section, we will no longer be able to rely on the CPU to
+ * record that fact, so we enqueue the task on the appropriate entry
+ * of the blocked_tasks[] array. The task will dequeue itself when
+ * it exits the outermost enclosing RCU read-side critical section.
+ * Therefore, the current grace period cannot be permitted to complete
+ * until the blocked_tasks[] entry indexed by the low-order bit of
+ * rnp->gpnum empties.
+ *
+ * Caller must disable preemption.
  */
-static void rcu_preempt_qs(int cpu)
+static void rcu_preempt_note_context_switch(int cpu)
 {
 	struct task_struct *t = current;
+	unsigned long flags;
 	int phase;
 	struct rcu_data *rdp;
 	struct rcu_node *rnp;
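
Why the barrier() above matters: ->passed_quiesc acts as "the grace-period number recorded in ->passed_quiesc_completed is valid", so the number must be stored first. A minimal standalone sketch of that ordering, with stand-in names (fake_rdp, record_qs) and a local barrier() definition rather than the kernel's:

/* Standalone sketch; fake_rdp, record_qs, and this barrier() are stand-ins. */
#define barrier() __asm__ __volatile__("" ::: "memory")

struct fake_rdp {
	long completed;               /* last grace period known to have ended */
	long passed_quiesc_completed; /* ->completed at the time the qs was noted */
	int passed_quiesc;            /* flag: a quiescent state has been noted */
};

static void record_qs(struct fake_rdp *rdp)
{
	rdp->passed_quiesc_completed = rdp->completed;
	barrier();  /* keep the compiler from publishing the flag first */
	rdp->passed_quiesc = 1;
}

If the compiler reordered the two stores, code running later on this CPU could observe the flag set while the recorded grace-period number was still stale, crediting the quiescent state to the wrong grace period.
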
@@ -90,7 +99,7 @@ static void rcu_preempt_qs(int cpu)
 		/* Possibly blocking in an RCU read-side critical section. */
 		rdp = rcu_preempt_state.rda[cpu];
 		rnp = rdp->mynode;
-		spin_lock(&rnp->lock);
+		spin_lock_irqsave(&rnp->lock, flags);
 		t->rcu_read_unlock_special |= RCU_READ_UNLOCK_BLOCKED;
 		t->rcu_blocked_node = rnp;
 
@@ -103,11 +112,15 @@ static void rcu_preempt_qs(int cpu)
 		 * state for the current grace period), then as long
 		 * as that task remains queued, the current grace period
 		 * cannot end.
+		 *
+		 * But first, note that the current CPU must still be
+		 * on line!
 		 */
-		phase = !(rnp->qsmask & rdp->grpmask) ^ (rnp->gpnum & 0x1);
+		WARN_ON_ONCE((rdp->grpmask & rnp->qsmaskinit) == 0);
+		WARN_ON_ONCE(!list_empty(&t->rcu_node_entry));
+		phase = (rnp->gpnum + !(rnp->qsmask & rdp->grpmask)) & 0x1;
 		list_add(&t->rcu_node_entry, &rnp->blocked_tasks[phase]);
-		smp_mb(); /* Ensure later ctxt swtch seen after above. */
-		spin_unlock(&rnp->lock);
+		spin_unlock_irqrestore(&rnp->lock, flags);
 	}
 
 	/*
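
A note on the rewritten phase calculation: (rnp->gpnum + !(rnp->qsmask & rdp->grpmask)) & 0x1 yields the same value as the old !(rnp->qsmask & rdp->grpmask) ^ (rnp->gpnum & 0x1), so the list choice is unchanged; the new form simply reads as "the current grace period's list, plus one if this CPU has already checked in". A stand-in sketch (blocked_list_index is not a kernel symbol):

/* Stand-in sketch of the blocked_tasks[] index choice; not kernel code. */
static int blocked_list_index(unsigned long gpnum, int cpu_still_owes_qs)
{
	/*
	 * CPU still owes a quiescent state: the task blocks the current
	 * grace period, so use the list indexed by gpnum's low-order bit.
	 * Otherwise it can only block the next grace period, so use the
	 * other list.
	 */
	return (int)((gpnum + !cpu_still_owes_qs) & 0x1);
}
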
@@ -119,9 +132,10 @@ static void rcu_preempt_qs(int cpu)
 	 * grace period, then the fact that the task has been enqueued
 	 * means that we continue to block the current grace period.
 	 */
-	rcu_preempt_qs_record(cpu);
-	t->rcu_read_unlock_special &= ~(RCU_READ_UNLOCK_NEED_QS |
-					RCU_READ_UNLOCK_GOT_QS);
+	rcu_preempt_qs(cpu);
+	local_irq_save(flags);
+	t->rcu_read_unlock_special &= ~RCU_READ_UNLOCK_NEED_QS;
+	local_irq_restore(flags);
 }
 
 /*
@@ -157,7 +171,7 @@ static void rcu_read_unlock_special(struct task_struct *t)
 	special = t->rcu_read_unlock_special;
 	if (special & RCU_READ_UNLOCK_NEED_QS) {
 		t->rcu_read_unlock_special &= ~RCU_READ_UNLOCK_NEED_QS;
-		t->rcu_read_unlock_special |= RCU_READ_UNLOCK_GOT_QS;
+		rcu_preempt_qs(smp_processor_id());
 	}
 
 	/* Hardware IRQ handlers cannot block. */
@@ -177,10 +191,10 @@ static void rcu_read_unlock_special(struct task_struct *t)
 		 */
 		for (;;) {
 			rnp = t->rcu_blocked_node;
-			spin_lock(&rnp->lock);
+			spin_lock(&rnp->lock);  /* irqs already disabled. */
 			if (rnp == t->rcu_blocked_node)
 				break;
-			spin_unlock(&rnp->lock);
+			spin_unlock(&rnp->lock);  /* irqs remain disabled. */
 		}
 		empty = list_empty(&rnp->blocked_tasks[rnp->gpnum & 0x1]);
 		list_del_init(&t->rcu_node_entry);
@@ -194,9 +208,8 @@ static void rcu_read_unlock_special(struct task_struct *t)
 		 */
 		if (!empty && rnp->qsmask == 0 &&
 		    list_empty(&rnp->blocked_tasks[rnp->gpnum & 0x1])) {
-			t->rcu_read_unlock_special &=
-				~(RCU_READ_UNLOCK_NEED_QS |
-				  RCU_READ_UNLOCK_GOT_QS);
+			struct rcu_node *rnp_p;
+
 			if (rnp->parent == NULL) {
 				/* Only one rcu_node in the tree. */
 				cpu_quiet_msk_finish(&rcu_preempt_state, flags);
@@ -205,9 +218,10 @@ static void rcu_read_unlock_special(struct task_struct *t)
 			/* Report up the rest of the hierarchy. */
 			mask = rnp->grpmask;
 			spin_unlock_irqrestore(&rnp->lock, flags);
-			rnp = rnp->parent;
-			spin_lock_irqsave(&rnp->lock, flags);
-			cpu_quiet_msk(mask, &rcu_preempt_state, rnp, flags);
+			rnp_p = rnp->parent;
+			spin_lock_irqsave(&rnp_p->lock, flags);
+			WARN_ON_ONCE(rnp->qsmask);
+			cpu_quiet_msk(mask, &rcu_preempt_state, rnp_p, flags);
 			return;
 		}
 		spin_unlock(&rnp->lock);
@@ -259,6 +273,19 @@ static void rcu_print_task_stall(struct rcu_node *rnp)
 #endif /* #ifdef CONFIG_RCU_CPU_STALL_DETECTOR */
 
 /*
+ * Check that the list of blocked tasks for the newly completed grace
+ * period is in fact empty. It is a serious bug to complete a grace
+ * period that still has RCU readers blocked! This function must be
+ * invoked -before- updating this rnp's ->gpnum, and the rnp's ->lock
+ * must be held by the caller.
+ */
+static void rcu_preempt_check_blocked_tasks(struct rcu_node *rnp)
+{
+	WARN_ON_ONCE(!list_empty(&rnp->blocked_tasks[rnp->gpnum & 0x1]));
+	WARN_ON_ONCE(rnp->qsmask);
+}
+
+/*
  * Check for preempted RCU readers for the specified rcu_node structure.
  * If the caller needs a reliable answer, it must hold the rcu_node's
  * ->lock.
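
The ordering constraint in the new helper's comment, made concrete: a hypothetical caller sketch with stand-in types (the real call site is in the grace-period-start code outside this file), showing the check running against the outgoing grace period's list before ->gpnum advances:

/* Hypothetical, self-contained sketch; these types and callers are not the kernel's. */
struct fake_rnp {
	unsigned long gpnum;   /* grace-period number for this node */
	unsigned long qsmask;  /* CPUs still owing a quiescent state */
	int blocked[2];        /* nonzero if blocked_tasks[i] would be non-empty */
};

static int check_blocked_tasks(struct fake_rnp *rnp)
{
	/* Outgoing grace period's list must be empty and qsmask must be zero. */
	return rnp->blocked[rnp->gpnum & 0x1] || rnp->qsmask;  /* nonzero == bug */
}

static void start_gp_on_node(struct fake_rnp *rnp, unsigned long new_gpnum)
{
	/* With the node's lock held: check first, only then advance ->gpnum. */
	(void)check_blocked_tasks(rnp);  /* the kernel WARN_ON_ONCE()s instead */
	rnp->gpnum = new_gpnum;
}
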
@@ -280,7 +307,8 @@ static int rcu_preempted_readers(struct rcu_node *rnp)
  * The caller must hold rnp->lock with irqs disabled.
  */
 static void rcu_preempt_offline_tasks(struct rcu_state *rsp,
-				      struct rcu_node *rnp)
+				      struct rcu_node *rnp,
+				      struct rcu_data *rdp)
 {
 	int i;
 	struct list_head *lp;
@@ -292,6 +320,9 @@ static void rcu_preempt_offline_tasks(struct rcu_state *rsp,
 		WARN_ONCE(1, "Last CPU thought to be offlined?");
 		return;  /* Shouldn't happen: at least one CPU online. */
 	}
+	WARN_ON_ONCE(rnp != rdp->mynode &&
+		     (!list_empty(&rnp->blocked_tasks[0]) ||
+		      !list_empty(&rnp->blocked_tasks[1])));
 
 	/*
 	 * Move tasks up to root rcu_node. Rely on the fact that the
@@ -335,20 +366,12 @@ static void rcu_preempt_check_callbacks(int cpu)
 	struct task_struct *t = current;
 
 	if (t->rcu_read_lock_nesting == 0) {
-		t->rcu_read_unlock_special &=
-			~(RCU_READ_UNLOCK_NEED_QS | RCU_READ_UNLOCK_GOT_QS);
-		rcu_preempt_qs_record(cpu);
+		t->rcu_read_unlock_special &= ~RCU_READ_UNLOCK_NEED_QS;
+		rcu_preempt_qs(cpu);
 		return;
 	}
-	if (per_cpu(rcu_preempt_data, cpu).qs_pending) {
-		if (t->rcu_read_unlock_special & RCU_READ_UNLOCK_GOT_QS) {
-			rcu_preempt_qs_record(cpu);
-			t->rcu_read_unlock_special &= ~RCU_READ_UNLOCK_GOT_QS;
-		} else if (!(t->rcu_read_unlock_special &
-			     RCU_READ_UNLOCK_NEED_QS)) {
-			t->rcu_read_unlock_special |= RCU_READ_UNLOCK_NEED_QS;
-		}
-	}
+	if (per_cpu(rcu_preempt_data, cpu).qs_pending)
+		t->rcu_read_unlock_special |= RCU_READ_UNLOCK_NEED_QS;
 }
 
 /*
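
Net effect of dropping RCU_READ_UNLOCK_GOT_QS: the quiescent state is now reported directly from the outermost rcu_read_unlock() (via rcu_preempt_qs()) rather than being latched and collected at a later scheduling-clock tick. A rough standalone sketch of the resulting two paths, using stand-in names rather than kernel code:

/* Illustrative stand-ins only; not the kernel's types or functions. */
enum { FAKE_NEED_QS = 0x1 };

struct fake_task {
	int rcu_read_lock_nesting;
	int rcu_read_unlock_special;
};

/* Scheduling-clock tick: report now, or ask rcu_read_unlock() to do it. */
static void tick_check(struct fake_task *t, int qs_pending, void (*report_qs)(void))
{
	if (t->rcu_read_lock_nesting == 0) {
		t->rcu_read_unlock_special &= ~FAKE_NEED_QS;
		report_qs();  /* stands in for rcu_preempt_qs(cpu) */
		return;
	}
	if (qs_pending)
		t->rcu_read_unlock_special |= FAKE_NEED_QS;
}

/* Outermost rcu_read_unlock(): report immediately if a qs was requested. */
static void unlock_special(struct fake_task *t, void (*report_qs)(void))
{
	if (t->rcu_read_unlock_special & FAKE_NEED_QS) {
		t->rcu_read_unlock_special &= ~FAKE_NEED_QS;
		report_qs();  /* stands in for rcu_preempt_qs(smp_processor_id()) */
	}
}
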
@@ -434,7 +457,7 @@ EXPORT_SYMBOL_GPL(rcu_batches_completed);
  * Because preemptable RCU does not exist, we never have to check for
  * CPUs being in quiescent states.
  */
-static void rcu_preempt_qs(int cpu)
+static void rcu_preempt_note_context_switch(int cpu)
 {
 }
 
@@ -451,6 +474,16 @@ static void rcu_print_task_stall(struct rcu_node *rnp)
 #endif /* #ifdef CONFIG_RCU_CPU_STALL_DETECTOR */
 
 /*
+ * Because there is no preemptable RCU, there can be no readers blocked,
+ * so there is no need to check for blocked tasks. So check only for
+ * bogus qsmask values.
+ */
+static void rcu_preempt_check_blocked_tasks(struct rcu_node *rnp)
+{
+	WARN_ON_ONCE(rnp->qsmask);
+}
+
+/*
  * Because preemptable RCU does not exist, there are never any preempted
  * RCU readers.
  */
@@ -466,7 +499,8 @@ static int rcu_preempted_readers(struct rcu_node *rnp)
  * tasks that were blocked within RCU read-side critical sections.
  */
 static void rcu_preempt_offline_tasks(struct rcu_state *rsp,
-				      struct rcu_node *rnp)
+				      struct rcu_node *rnp,
+				      struct rcu_data *rdp)
 {
 }
 
