aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
author: Ming Lei <tom.leiming@gmail.com> 2014-05-31 12:43:37 -0400
committer: Jens Axboe <axboe@fb.com> 2014-06-03 23:04:39 -0400
commit: cb96a42cc1f50ba1c7b1e9b2343bec80b926107f (patch)
tree: c69f953fcd7d04288903abe73a0f92f155882bfd
parent: 1aecfe4887713838c79bc52f774609a57db4f988 (diff)
blk-mq: fix schedule from atomic context
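blk_mq_put_ctx() has to be called before io_schedule() in bt_get(): the ctx is held until blk_mq_put_ctx() calls put_cpu(), so sleeping while still holding it means scheduling from atomic context. This patch fixes the problem by taking an approach similar to the one percpu_ida allocation uses for this situation.

Signed-off-by: Ming Lei <tom.leiming@gmail.com>
Signed-off-by: Jens Axboe <axboe@fb.com>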
-rw-r--r-- block/blk-mq-tag.c 48
-rw-r--r-- block/blk-mq-tag.h 2
-rw-r--r-- block/blk-mq.c 36
-rw-r--r-- block/blk-mq.h 23
4 files changed, 78 insertions, 31 deletions
diff --git a/block/blk-mq-tag.c b/block/blk-mq-tag.c
index d90c4aeb7dd3..1aab39f71d95 100644
--- a/block/blk-mq-tag.c
+++ b/block/blk-mq-tag.c
@@ -221,8 +221,10 @@ static struct bt_wait_state *bt_wait_ptr(struct blk_mq_bitmap_tags *bt,
221 return bs; 221 return bs;
222} 222}
223 223
224static int bt_get(struct blk_mq_bitmap_tags *bt, struct blk_mq_hw_ctx *hctx, 224static int bt_get(struct blk_mq_alloc_data *data,
225 unsigned int *last_tag, gfp_t gfp) 225 struct blk_mq_bitmap_tags *bt,
226 struct blk_mq_hw_ctx *hctx,
227 unsigned int *last_tag)
226{ 228{
227 struct bt_wait_state *bs; 229 struct bt_wait_state *bs;
228 DEFINE_WAIT(wait); 230 DEFINE_WAIT(wait);
@@ -232,7 +234,7 @@ static int bt_get(struct blk_mq_bitmap_tags *bt, struct blk_mq_hw_ctx *hctx,
232 if (tag != -1) 234 if (tag != -1)
233 return tag; 235 return tag;
234 236
235 if (!(gfp & __GFP_WAIT)) 237 if (!(data->gfp & __GFP_WAIT))
236 return -1; 238 return -1;
237 239
238 bs = bt_wait_ptr(bt, hctx); 240 bs = bt_wait_ptr(bt, hctx);
@@ -249,50 +251,62 @@ static int bt_get(struct blk_mq_bitmap_tags *bt, struct blk_mq_hw_ctx *hctx,
249 if (was_empty) 251 if (was_empty)
250 atomic_set(&bs->wait_cnt, bt->wake_cnt); 252 atomic_set(&bs->wait_cnt, bt->wake_cnt);
251 253
254 blk_mq_put_ctx(data->ctx);
255
252 io_schedule(); 256 io_schedule();
257
258 data->ctx = blk_mq_get_ctx(data->q);
259 data->hctx = data->q->mq_ops->map_queue(data->q,
260 data->ctx->cpu);
261 if (data->reserved) {
262 bt = &data->hctx->tags->breserved_tags;
263 } else {
264 last_tag = &data->ctx->last_tag;
265 hctx = data->hctx;
266 bt = &hctx->tags->bitmap_tags;
267 }
268 finish_wait(&bs->wait, &wait);
269 bs = bt_wait_ptr(bt, hctx);
253 } while (1); 270 } while (1);
254 271
255 finish_wait(&bs->wait, &wait); 272 finish_wait(&bs->wait, &wait);
256 return tag; 273 return tag;
257} 274}
258 275
259static unsigned int __blk_mq_get_tag(struct blk_mq_tags *tags, 276static unsigned int __blk_mq_get_tag(struct blk_mq_alloc_data *data)
260 struct blk_mq_hw_ctx *hctx,
261 unsigned int *last_tag, gfp_t gfp)
262{ 277{
263 int tag; 278 int tag;
264 279
265 tag = bt_get(&tags->bitmap_tags, hctx, last_tag, gfp); 280 tag = bt_get(data, &data->hctx->tags->bitmap_tags, data->hctx,
281 &data->ctx->last_tag);
266 if (tag >= 0) 282 if (tag >= 0)
267 return tag + tags->nr_reserved_tags; 283 return tag + data->hctx->tags->nr_reserved_tags;
268 284
269 return BLK_MQ_TAG_FAIL; 285 return BLK_MQ_TAG_FAIL;
270} 286}
271 287
272static unsigned int __blk_mq_get_reserved_tag(struct blk_mq_tags *tags, 288static unsigned int __blk_mq_get_reserved_tag(struct blk_mq_alloc_data *data)
273 gfp_t gfp)
274{ 289{
275 int tag, zero = 0; 290 int tag, zero = 0;
276 291
277 if (unlikely(!tags->nr_reserved_tags)) { 292 if (unlikely(!data->hctx->tags->nr_reserved_tags)) {
278 WARN_ON_ONCE(1); 293 WARN_ON_ONCE(1);
279 return BLK_MQ_TAG_FAIL; 294 return BLK_MQ_TAG_FAIL;
280 } 295 }
281 296
282 tag = bt_get(&tags->breserved_tags, NULL, &zero, gfp); 297 tag = bt_get(data, &data->hctx->tags->breserved_tags, NULL, &zero);
283 if (tag < 0) 298 if (tag < 0)
284 return BLK_MQ_TAG_FAIL; 299 return BLK_MQ_TAG_FAIL;
285 300
286 return tag; 301 return tag;
287} 302}
288 303
289unsigned int blk_mq_get_tag(struct blk_mq_hw_ctx *hctx, unsigned int *last_tag, 304unsigned int blk_mq_get_tag(struct blk_mq_alloc_data *data)
290 gfp_t gfp, bool reserved)
291{ 305{
292 if (!reserved) 306 if (!data->reserved)
293 return __blk_mq_get_tag(hctx->tags, hctx, last_tag, gfp); 307 return __blk_mq_get_tag(data);
294 308
295 return __blk_mq_get_reserved_tag(hctx->tags, gfp); 309 return __blk_mq_get_reserved_tag(data);
296} 310}
297 311
298static struct bt_wait_state *bt_wake_ptr(struct blk_mq_bitmap_tags *bt) 312static struct bt_wait_state *bt_wake_ptr(struct blk_mq_bitmap_tags *bt)
diff --git a/block/blk-mq-tag.h b/block/blk-mq-tag.h
index c959de58d2a5..98696a65d4d4 100644
--- a/block/blk-mq-tag.h
+++ b/block/blk-mq-tag.h
@@ -48,7 +48,7 @@ struct blk_mq_tags {
48extern struct blk_mq_tags *blk_mq_init_tags(unsigned int nr_tags, unsigned int reserved_tags, int node); 48extern struct blk_mq_tags *blk_mq_init_tags(unsigned int nr_tags, unsigned int reserved_tags, int node);
49extern void blk_mq_free_tags(struct blk_mq_tags *tags); 49extern void blk_mq_free_tags(struct blk_mq_tags *tags);
50 50
51extern unsigned int blk_mq_get_tag(struct blk_mq_hw_ctx *hctx, unsigned int *last_tag, gfp_t gfp, bool reserved); 51extern unsigned int blk_mq_get_tag(struct blk_mq_alloc_data *data);
52extern void blk_mq_put_tag(struct blk_mq_hw_ctx *hctx, unsigned int tag, unsigned int *last_tag); 52extern void blk_mq_put_tag(struct blk_mq_hw_ctx *hctx, unsigned int tag, unsigned int *last_tag);
53extern bool blk_mq_has_free_tags(struct blk_mq_tags *tags); 53extern bool blk_mq_has_free_tags(struct blk_mq_tags *tags);
54extern ssize_t blk_mq_tag_sysfs_show(struct blk_mq_tags *tags, char *page); 54extern ssize_t blk_mq_tag_sysfs_show(struct blk_mq_tags *tags, char *page);
diff --git a/block/blk-mq.c b/block/blk-mq.c
index b9230c522c6b..43eb3156e110 100644
--- a/block/blk-mq.c
+++ b/block/blk-mq.c
@@ -210,24 +210,23 @@ static void blk_mq_rq_ctx_init(struct request_queue *q, struct blk_mq_ctx *ctx,
210} 210}
211 211
212static struct request * 212static struct request *
213__blk_mq_alloc_request(struct request_queue *q, struct blk_mq_hw_ctx *hctx, 213__blk_mq_alloc_request(struct blk_mq_alloc_data *data, int rw)
214 struct blk_mq_ctx *ctx, int rw, gfp_t gfp, bool reserved)
215{ 214{
216 struct request *rq; 215 struct request *rq;
217 unsigned int tag; 216 unsigned int tag;
218 217
219 tag = blk_mq_get_tag(hctx, &ctx->last_tag, gfp, reserved); 218 tag = blk_mq_get_tag(data);
220 if (tag != BLK_MQ_TAG_FAIL) { 219 if (tag != BLK_MQ_TAG_FAIL) {
221 rq = hctx->tags->rqs[tag]; 220 rq = data->hctx->tags->rqs[tag];
222 221
223 rq->cmd_flags = 0; 222 rq->cmd_flags = 0;
224 if (blk_mq_tag_busy(hctx)) { 223 if (blk_mq_tag_busy(data->hctx)) {
225 rq->cmd_flags = REQ_MQ_INFLIGHT; 224 rq->cmd_flags = REQ_MQ_INFLIGHT;
226 atomic_inc(&hctx->nr_active); 225 atomic_inc(&data->hctx->nr_active);
227 } 226 }
228 227
229 rq->tag = tag; 228 rq->tag = tag;
230 blk_mq_rq_ctx_init(q, ctx, rq, rw); 229 blk_mq_rq_ctx_init(data->q, data->ctx, rq, rw);
231 return rq; 230 return rq;
232 } 231 }
233 232
@@ -240,22 +239,27 @@ struct request *blk_mq_alloc_request(struct request_queue *q, int rw, gfp_t gfp,
240 struct blk_mq_ctx *ctx; 239 struct blk_mq_ctx *ctx;
241 struct blk_mq_hw_ctx *hctx; 240 struct blk_mq_hw_ctx *hctx;
242 struct request *rq; 241 struct request *rq;
242 struct blk_mq_alloc_data alloc_data;
243 243
244 if (blk_mq_queue_enter(q)) 244 if (blk_mq_queue_enter(q))
245 return NULL; 245 return NULL;
246 246
247 ctx = blk_mq_get_ctx(q); 247 ctx = blk_mq_get_ctx(q);
248 hctx = q->mq_ops->map_queue(q, ctx->cpu); 248 hctx = q->mq_ops->map_queue(q, ctx->cpu);
249 blk_mq_set_alloc_data(&alloc_data, q, gfp & ~__GFP_WAIT,
250 reserved, ctx, hctx);
249 251
250 rq = __blk_mq_alloc_request(q, hctx, ctx, rw, gfp & ~__GFP_WAIT, 252 rq = __blk_mq_alloc_request(&alloc_data, rw);
251 reserved);
252 if (!rq && (gfp & __GFP_WAIT)) { 253 if (!rq && (gfp & __GFP_WAIT)) {
253 __blk_mq_run_hw_queue(hctx); 254 __blk_mq_run_hw_queue(hctx);
254 blk_mq_put_ctx(ctx); 255 blk_mq_put_ctx(ctx);
255 256
256 ctx = blk_mq_get_ctx(q); 257 ctx = blk_mq_get_ctx(q);
257 hctx = q->mq_ops->map_queue(q, ctx->cpu); 258 hctx = q->mq_ops->map_queue(q, ctx->cpu);
258 rq = __blk_mq_alloc_request(q, hctx, ctx, rw, gfp, reserved); 259 blk_mq_set_alloc_data(&alloc_data, q, gfp, reserved, ctx,
260 hctx);
261 rq = __blk_mq_alloc_request(&alloc_data, rw);
262 ctx = alloc_data.ctx;
259 } 263 }
260 blk_mq_put_ctx(ctx); 264 blk_mq_put_ctx(ctx);
261 return rq; 265 return rq;
@@ -1136,6 +1140,7 @@ static struct request *blk_mq_map_request(struct request_queue *q,
1136 struct blk_mq_ctx *ctx; 1140 struct blk_mq_ctx *ctx;
1137 struct request *rq; 1141 struct request *rq;
1138 int rw = bio_data_dir(bio); 1142 int rw = bio_data_dir(bio);
1143 struct blk_mq_alloc_data alloc_data;
1139 1144
1140 if (unlikely(blk_mq_queue_enter(q))) { 1145 if (unlikely(blk_mq_queue_enter(q))) {
1141 bio_endio(bio, -EIO); 1146 bio_endio(bio, -EIO);
@@ -1149,7 +1154,9 @@ static struct request *blk_mq_map_request(struct request_queue *q,
1149 rw |= REQ_SYNC; 1154 rw |= REQ_SYNC;
1150 1155
1151 trace_block_getrq(q, bio, rw); 1156 trace_block_getrq(q, bio, rw);
1152 rq = __blk_mq_alloc_request(q, hctx, ctx, rw, GFP_ATOMIC, false); 1157 blk_mq_set_alloc_data(&alloc_data, q, GFP_ATOMIC, false, ctx,
1158 hctx);
1159 rq = __blk_mq_alloc_request(&alloc_data, rw);
1153 if (unlikely(!rq)) { 1160 if (unlikely(!rq)) {
1154 __blk_mq_run_hw_queue(hctx); 1161 __blk_mq_run_hw_queue(hctx);
1155 blk_mq_put_ctx(ctx); 1162 blk_mq_put_ctx(ctx);
@@ -1157,8 +1164,11 @@ static struct request *blk_mq_map_request(struct request_queue *q,
1157 1164
1158 ctx = blk_mq_get_ctx(q); 1165 ctx = blk_mq_get_ctx(q);
1159 hctx = q->mq_ops->map_queue(q, ctx->cpu); 1166 hctx = q->mq_ops->map_queue(q, ctx->cpu);
1160 rq = __blk_mq_alloc_request(q, hctx, ctx, rw, 1167 blk_mq_set_alloc_data(&alloc_data, q,
1161 __GFP_WAIT|GFP_ATOMIC, false); 1168 __GFP_WAIT|GFP_ATOMIC, false, ctx, hctx);
1169 rq = __blk_mq_alloc_request(&alloc_data, rw);
1170 ctx = alloc_data.ctx;
1171 hctx = alloc_data.hctx;
1162 } 1172 }
1163 1173
1164 hctx->queued++; 1174 hctx->queued++;
diff --git a/block/blk-mq.h b/block/blk-mq.h
index 57a7968e47b3..26460884c6cd 100644
--- a/block/blk-mq.h
+++ b/block/blk-mq.h
@@ -91,4 +91,27 @@ static inline void blk_mq_put_ctx(struct blk_mq_ctx *ctx)
91 put_cpu(); 91 put_cpu();
92} 92}
93 93
94struct blk_mq_alloc_data {
95 /* input parameter */
96 struct request_queue *q;
97 gfp_t gfp;
98 bool reserved;
99
100 /* input & output parameter */
101 struct blk_mq_ctx *ctx;
102 struct blk_mq_hw_ctx *hctx;
103};
104
105static inline void blk_mq_set_alloc_data(struct blk_mq_alloc_data *data,
106 struct request_queue *q, gfp_t gfp, bool reserved,
107 struct blk_mq_ctx *ctx,
108 struct blk_mq_hw_ctx *hctx)
109{
110 data->q = q;
111 data->gfp = gfp;
112 data->reserved = reserved;
113 data->ctx = ctx;
114 data->hctx = hctx;
115}
116
94#endif 117#endif