aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorTejun Heo <tj@kernel.org>2011-12-13 18:33:42 -0500
committerJens Axboe <axboe@kernel.dk>2011-12-13 18:33:42 -0500
commit7e5a8794492e43e9eebb68a98a23be055888ccd0 (patch)
treecc049a23b2c994f910d3101860bc1c2ecb7aa35f
parent3d3c2379feb177a5fd55bb0ed76776dc9d4f3243 (diff)
block, cfq: move io_cq exit/release to blk-ioc.c
With kmem_cache managed by blk-ioc, io_cq exit/release can be moved to blk-ioc too. The odd ->io_cq->exit/release() callbacks are replaced with elevator_ops->elevator_exit_icq_fn() with unlinking from both ioc and q, and freeing automatically handled by blk-ioc. The elevator operation only need to perform exit operation specific to the elevator - in cfq's case, exiting the cfqq's. Also, clearing of io_cq's on q detach is moved to block core and automatically performed on elevator switch and q release. Because the q io_cq points to might be freed before RCU callback for the io_cq runs, blk-ioc code should remember to which cache the io_cq needs to be freed when the io_cq is released. New field io_cq->__rcu_icq_cache is added for this purpose. As both the new field and rcu_head are used only after io_cq is released and the q/ioc_node fields aren't, they are put into unions. Signed-off-by: Tejun Heo <tj@kernel.org> Signed-off-by: Jens Axboe <axboe@kernel.dk>
-rw-r--r--block/blk-ioc.c76
-rw-r--r--block/blk-sysfs.c6
-rw-r--r--block/blk.h1
-rw-r--r--block/cfq-iosched.c47
-rw-r--r--block/elevator.c3
-rw-r--r--include/linux/elevator.h5
-rw-r--r--include/linux/iocontext.h20
7 files changed, 97 insertions, 61 deletions
diff --git a/block/blk-ioc.c b/block/blk-ioc.c
index 87ecc98b8ade..0910a5584d38 100644
--- a/block/blk-ioc.c
+++ b/block/blk-ioc.c
@@ -44,6 +44,51 @@ EXPORT_SYMBOL(get_io_context);
44#define ioc_release_depth_dec(q) do { } while (0) 44#define ioc_release_depth_dec(q) do { } while (0)
45#endif 45#endif
46 46
47static void icq_free_icq_rcu(struct rcu_head *head)
48{
49 struct io_cq *icq = container_of(head, struct io_cq, __rcu_head);
50
51 kmem_cache_free(icq->__rcu_icq_cache, icq);
52}
53
54/*
55 * Exit and free an icq. Called with both ioc and q locked.
56 */
57static void ioc_exit_icq(struct io_cq *icq)
58{
59 struct io_context *ioc = icq->ioc;
60 struct request_queue *q = icq->q;
61 struct elevator_type *et = q->elevator->type;
62
63 lockdep_assert_held(&ioc->lock);
64 lockdep_assert_held(q->queue_lock);
65
66 radix_tree_delete(&ioc->icq_tree, icq->q->id);
67 hlist_del_init(&icq->ioc_node);
68 list_del_init(&icq->q_node);
69
70 /*
71 * Both setting lookup hint to and clearing it from @icq are done
72 * under queue_lock. If it's not pointing to @icq now, it never
73 * will. Hint assignment itself can race safely.
74 */
75 if (rcu_dereference_raw(ioc->icq_hint) == icq)
76 rcu_assign_pointer(ioc->icq_hint, NULL);
77
78 if (et->ops.elevator_exit_icq_fn) {
79 ioc_release_depth_inc(q);
80 et->ops.elevator_exit_icq_fn(icq);
81 ioc_release_depth_dec(q);
82 }
83
84 /*
85 * @icq->q might have gone away by the time RCU callback runs
86 * making it impossible to determine icq_cache. Record it in @icq.
87 */
88 icq->__rcu_icq_cache = et->icq_cache;
89 call_rcu(&icq->__rcu_head, icq_free_icq_rcu);
90}
91
47/* 92/*
48 * Slow path for ioc release in put_io_context(). Performs double-lock 93 * Slow path for ioc release in put_io_context(). Performs double-lock
49 * dancing to unlink all icq's and then frees ioc. 94 * dancing to unlink all icq's and then frees ioc.
@@ -87,10 +132,7 @@ static void ioc_release_fn(struct work_struct *work)
87 spin_lock(&ioc->lock); 132 spin_lock(&ioc->lock);
88 continue; 133 continue;
89 } 134 }
90 ioc_release_depth_inc(this_q); 135 ioc_exit_icq(icq);
91 icq->exit(icq);
92 icq->release(icq);
93 ioc_release_depth_dec(this_q);
94 } 136 }
95 137
96 if (last_q) { 138 if (last_q) {
@@ -167,10 +209,7 @@ void put_io_context(struct io_context *ioc, struct request_queue *locked_q)
167 last_q = this_q; 209 last_q = this_q;
168 continue; 210 continue;
169 } 211 }
170 ioc_release_depth_inc(this_q); 212 ioc_exit_icq(icq);
171 icq->exit(icq);
172 icq->release(icq);
173 ioc_release_depth_dec(this_q);
174 } 213 }
175 214
176 if (last_q && last_q != locked_q) 215 if (last_q && last_q != locked_q)
@@ -203,6 +242,27 @@ void exit_io_context(struct task_struct *task)
203 put_io_context(ioc, NULL); 242 put_io_context(ioc, NULL);
204} 243}
205 244
245/**
246 * ioc_clear_queue - break any ioc association with the specified queue
247 * @q: request_queue being cleared
248 *
249 * Walk @q->icq_list and exit all io_cq's. Must be called with @q locked.
250 */
251void ioc_clear_queue(struct request_queue *q)
252{
253 lockdep_assert_held(q->queue_lock);
254
255 while (!list_empty(&q->icq_list)) {
256 struct io_cq *icq = list_entry(q->icq_list.next,
257 struct io_cq, q_node);
258 struct io_context *ioc = icq->ioc;
259
260 spin_lock(&ioc->lock);
261 ioc_exit_icq(icq);
262 spin_unlock(&ioc->lock);
263 }
264}
265
206void create_io_context_slowpath(struct task_struct *task, gfp_t gfp_flags, 266void create_io_context_slowpath(struct task_struct *task, gfp_t gfp_flags,
207 int node) 267 int node)
208{ 268{
diff --git a/block/blk-sysfs.c b/block/blk-sysfs.c
index 5b4b4ab5e785..cf150011d808 100644
--- a/block/blk-sysfs.c
+++ b/block/blk-sysfs.c
@@ -479,8 +479,12 @@ static void blk_release_queue(struct kobject *kobj)
479 479
480 blk_sync_queue(q); 480 blk_sync_queue(q);
481 481
482 if (q->elevator) 482 if (q->elevator) {
483 spin_lock_irq(q->queue_lock);
484 ioc_clear_queue(q);
485 spin_unlock_irq(q->queue_lock);
483 elevator_exit(q->elevator); 486 elevator_exit(q->elevator);
487 }
484 488
485 blk_throtl_exit(q); 489 blk_throtl_exit(q);
486 490
diff --git a/block/blk.h b/block/blk.h
index 3c510a4b5054..ed4d9bf2ab16 100644
--- a/block/blk.h
+++ b/block/blk.h
@@ -200,6 +200,7 @@ static inline int blk_do_io_stat(struct request *rq)
200 */ 200 */
201void get_io_context(struct io_context *ioc); 201void get_io_context(struct io_context *ioc);
202struct io_cq *ioc_lookup_icq(struct io_context *ioc, struct request_queue *q); 202struct io_cq *ioc_lookup_icq(struct io_context *ioc, struct request_queue *q);
203void ioc_clear_queue(struct request_queue *q);
203 204
204void create_io_context_slowpath(struct task_struct *task, gfp_t gfp_mask, 205void create_io_context_slowpath(struct task_struct *task, gfp_t gfp_mask,
205 int node); 206 int node);
diff --git a/block/cfq-iosched.c b/block/cfq-iosched.c
index 06e59abcb57f..f6d315551496 100644
--- a/block/cfq-iosched.c
+++ b/block/cfq-iosched.c
@@ -2674,26 +2674,6 @@ static void cfq_put_queue(struct cfq_queue *cfqq)
2674 cfq_put_cfqg(cfqg); 2674 cfq_put_cfqg(cfqg);
2675} 2675}
2676 2676
2677static void cfq_icq_free_rcu(struct rcu_head *head)
2678{
2679 kmem_cache_free(cfq_icq_pool,
2680 icq_to_cic(container_of(head, struct io_cq, rcu_head)));
2681}
2682
2683static void cfq_icq_free(struct io_cq *icq)
2684{
2685 call_rcu(&icq->rcu_head, cfq_icq_free_rcu);
2686}
2687
2688static void cfq_release_icq(struct io_cq *icq)
2689{
2690 struct io_context *ioc = icq->ioc;
2691
2692 radix_tree_delete(&ioc->icq_tree, icq->q->id);
2693 hlist_del(&icq->ioc_node);
2694 cfq_icq_free(icq);
2695}
2696
2697static void cfq_put_cooperator(struct cfq_queue *cfqq) 2677static void cfq_put_cooperator(struct cfq_queue *cfqq)
2698{ 2678{
2699 struct cfq_queue *__cfqq, *next; 2679 struct cfq_queue *__cfqq, *next;
@@ -2731,17 +2711,6 @@ static void cfq_exit_icq(struct io_cq *icq)
2731{ 2711{
2732 struct cfq_io_cq *cic = icq_to_cic(icq); 2712 struct cfq_io_cq *cic = icq_to_cic(icq);
2733 struct cfq_data *cfqd = cic_to_cfqd(cic); 2713 struct cfq_data *cfqd = cic_to_cfqd(cic);
2734 struct io_context *ioc = icq->ioc;
2735
2736 list_del_init(&icq->q_node);
2737
2738 /*
2739 * Both setting lookup hint to and clearing it from @icq are done
2740 * under queue_lock. If it's not pointing to @icq now, it never
2741 * will. Hint assignment itself can race safely.
2742 */
2743 if (rcu_dereference_raw(ioc->icq_hint) == icq)
2744 rcu_assign_pointer(ioc->icq_hint, NULL);
2745 2714
2746 if (cic->cfqq[BLK_RW_ASYNC]) { 2715 if (cic->cfqq[BLK_RW_ASYNC]) {
2747 cfq_exit_cfqq(cfqd, cic->cfqq[BLK_RW_ASYNC]); 2716 cfq_exit_cfqq(cfqd, cic->cfqq[BLK_RW_ASYNC]);
@@ -2764,8 +2733,6 @@ static struct cfq_io_cq *cfq_alloc_cic(struct cfq_data *cfqd, gfp_t gfp_mask)
2764 cic->ttime.last_end_request = jiffies; 2733 cic->ttime.last_end_request = jiffies;
2765 INIT_LIST_HEAD(&cic->icq.q_node); 2734 INIT_LIST_HEAD(&cic->icq.q_node);
2766 INIT_HLIST_NODE(&cic->icq.ioc_node); 2735 INIT_HLIST_NODE(&cic->icq.ioc_node);
2767 cic->icq.exit = cfq_exit_icq;
2768 cic->icq.release = cfq_release_icq;
2769 } 2736 }
2770 2737
2771 return cic; 2738 return cic;
@@ -3034,7 +3001,7 @@ out:
3034 if (ret) 3001 if (ret)
3035 printk(KERN_ERR "cfq: icq link failed!\n"); 3002 printk(KERN_ERR "cfq: icq link failed!\n");
3036 if (icq) 3003 if (icq)
3037 cfq_icq_free(icq); 3004 kmem_cache_free(cfq_icq_pool, icq);
3038 return ret; 3005 return ret;
3039} 3006}
3040 3007
@@ -3774,17 +3741,6 @@ static void cfq_exit_queue(struct elevator_queue *e)
3774 if (cfqd->active_queue) 3741 if (cfqd->active_queue)
3775 __cfq_slice_expired(cfqd, cfqd->active_queue, 0); 3742 __cfq_slice_expired(cfqd, cfqd->active_queue, 0);
3776 3743
3777 while (!list_empty(&q->icq_list)) {
3778 struct io_cq *icq = list_entry(q->icq_list.next,
3779 struct io_cq, q_node);
3780 struct io_context *ioc = icq->ioc;
3781
3782 spin_lock(&ioc->lock);
3783 cfq_exit_icq(icq);
3784 cfq_release_icq(icq);
3785 spin_unlock(&ioc->lock);
3786 }
3787
3788 cfq_put_async_queues(cfqd); 3744 cfq_put_async_queues(cfqd);
3789 cfq_release_cfq_groups(cfqd); 3745 cfq_release_cfq_groups(cfqd);
3790 3746
@@ -4019,6 +3975,7 @@ static struct elevator_type iosched_cfq = {
4019 .elevator_completed_req_fn = cfq_completed_request, 3975 .elevator_completed_req_fn = cfq_completed_request,
4020 .elevator_former_req_fn = elv_rb_former_request, 3976 .elevator_former_req_fn = elv_rb_former_request,
4021 .elevator_latter_req_fn = elv_rb_latter_request, 3977 .elevator_latter_req_fn = elv_rb_latter_request,
3978 .elevator_exit_icq_fn = cfq_exit_icq,
4022 .elevator_set_req_fn = cfq_set_request, 3979 .elevator_set_req_fn = cfq_set_request,
4023 .elevator_put_req_fn = cfq_put_request, 3980 .elevator_put_req_fn = cfq_put_request,
4024 .elevator_may_queue_fn = cfq_may_queue, 3981 .elevator_may_queue_fn = cfq_may_queue,
diff --git a/block/elevator.c b/block/elevator.c
index cca049fb45c8..91e18f8af9be 100644
--- a/block/elevator.c
+++ b/block/elevator.c
@@ -979,8 +979,9 @@ static int elevator_switch(struct request_queue *q, struct elevator_type *new_e)
979 goto fail_register; 979 goto fail_register;
980 } 980 }
981 981
982 /* done, replace the old one with new one and turn off BYPASS */ 982 /* done, clear io_cq's, switch elevators and turn off BYPASS */
983 spin_lock_irq(q->queue_lock); 983 spin_lock_irq(q->queue_lock);
984 ioc_clear_queue(q);
984 old_elevator = q->elevator; 985 old_elevator = q->elevator;
985 q->elevator = e; 986 q->elevator = e;
986 spin_unlock_irq(q->queue_lock); 987 spin_unlock_irq(q->queue_lock);
diff --git a/include/linux/elevator.h b/include/linux/elevator.h
index d3d3e28cbfd4..06e4dd568717 100644
--- a/include/linux/elevator.h
+++ b/include/linux/elevator.h
@@ -5,6 +5,8 @@
5 5
6#ifdef CONFIG_BLOCK 6#ifdef CONFIG_BLOCK
7 7
8struct io_cq;
9
8typedef int (elevator_merge_fn) (struct request_queue *, struct request **, 10typedef int (elevator_merge_fn) (struct request_queue *, struct request **,
9 struct bio *); 11 struct bio *);
10 12
@@ -24,6 +26,7 @@ typedef struct request *(elevator_request_list_fn) (struct request_queue *, stru
24typedef void (elevator_completed_req_fn) (struct request_queue *, struct request *); 26typedef void (elevator_completed_req_fn) (struct request_queue *, struct request *);
25typedef int (elevator_may_queue_fn) (struct request_queue *, int); 27typedef int (elevator_may_queue_fn) (struct request_queue *, int);
26 28
29typedef void (elevator_exit_icq_fn) (struct io_cq *);
27typedef int (elevator_set_req_fn) (struct request_queue *, struct request *, gfp_t); 30typedef int (elevator_set_req_fn) (struct request_queue *, struct request *, gfp_t);
28typedef void (elevator_put_req_fn) (struct request *); 31typedef void (elevator_put_req_fn) (struct request *);
29typedef void (elevator_activate_req_fn) (struct request_queue *, struct request *); 32typedef void (elevator_activate_req_fn) (struct request_queue *, struct request *);
@@ -56,6 +59,8 @@ struct elevator_ops
56 elevator_request_list_fn *elevator_former_req_fn; 59 elevator_request_list_fn *elevator_former_req_fn;
57 elevator_request_list_fn *elevator_latter_req_fn; 60 elevator_request_list_fn *elevator_latter_req_fn;
58 61
62 elevator_exit_icq_fn *elevator_exit_icq_fn;
63
59 elevator_set_req_fn *elevator_set_req_fn; 64 elevator_set_req_fn *elevator_set_req_fn;
60 elevator_put_req_fn *elevator_put_req_fn; 65 elevator_put_req_fn *elevator_put_req_fn;
61 66
diff --git a/include/linux/iocontext.h b/include/linux/iocontext.h
index d15ca6591f96..ac390a34c0e7 100644
--- a/include/linux/iocontext.h
+++ b/include/linux/iocontext.h
@@ -14,14 +14,22 @@ struct io_cq {
14 struct request_queue *q; 14 struct request_queue *q;
15 struct io_context *ioc; 15 struct io_context *ioc;
16 16
17 struct list_head q_node; 17 /*
18 struct hlist_node ioc_node; 18 * q_node and ioc_node link io_cq through icq_list of q and ioc
19 * respectively. Both fields are unused once ioc_exit_icq() is
20 * called and shared with __rcu_icq_cache and __rcu_head which are
21 * used for RCU free of io_cq.
22 */
23 union {
24 struct list_head q_node;
25 struct kmem_cache *__rcu_icq_cache;
26 };
27 union {
28 struct hlist_node ioc_node;
29 struct rcu_head __rcu_head;
30 };
19 31
20 unsigned long changed; 32 unsigned long changed;
21 struct rcu_head rcu_head;
22
23 void (*exit)(struct io_cq *);
24 void (*release)(struct io_cq *);
25}; 33};
26 34
27/* 35/*