aboutsummaryrefslogtreecommitdiffstats
path: root/fs/exofs/ios.c
diff options
context:
space:
mode:
Diffstat (limited to 'fs/exofs/ios.c')
-rw-r--r--fs/exofs/ios.c327
1 files changed, 273 insertions, 54 deletions
diff --git a/fs/exofs/ios.c b/fs/exofs/ios.c
index 2b81f99fd62c..6e446b2670b9 100644
--- a/fs/exofs/ios.c
+++ b/fs/exofs/ios.c
@@ -23,6 +23,7 @@
23 */ 23 */
24 24
25#include <scsi/scsi_device.h> 25#include <scsi/scsi_device.h>
26#include <asm/div64.h>
26 27
27#include "exofs.h" 28#include "exofs.h"
28 29
@@ -110,7 +111,17 @@ void exofs_put_io_state(struct exofs_io_state *ios)
110unsigned exofs_layout_od_id(struct exofs_layout *layout, 111unsigned exofs_layout_od_id(struct exofs_layout *layout,
111 osd_id obj_no, unsigned layout_index) 112 osd_id obj_no, unsigned layout_index)
112{ 113{
113 return layout_index; 114/* switch (layout->lay_func) {
115 case LAYOUT_MOVING_WINDOW:
116 {*/
117 unsigned dev_mod = obj_no;
118
119 return (layout_index + dev_mod * layout->mirrors_p1) %
120 layout->s_numdevs;
121/* }
122 case LAYOUT_FUNC_IMPLICT:
123 return layout->devs[layout_index];
124 }*/
114} 125}
115 126
116static inline struct osd_dev *exofs_ios_od(struct exofs_io_state *ios, 127static inline struct osd_dev *exofs_ios_od(struct exofs_io_state *ios,
@@ -225,8 +236,8 @@ int exofs_check_io(struct exofs_io_state *ios, u64 *resid)
225 _clear_bio(ios->per_dev[i].bio); 236 _clear_bio(ios->per_dev[i].bio);
226 EXOFS_DBGMSG("start read offset passed end of file " 237 EXOFS_DBGMSG("start read offset passed end of file "
227 "offset=0x%llx, length=0x%llx\n", 238 "offset=0x%llx, length=0x%llx\n",
228 _LLU(ios->offset), 239 _LLU(ios->per_dev[i].offset),
229 _LLU(ios->length)); 240 _LLU(ios->per_dev[i].length));
230 241
231 continue; /* we recovered */ 242 continue; /* we recovered */
232 } 243 }
@@ -248,6 +259,127 @@ int exofs_check_io(struct exofs_io_state *ios, u64 *resid)
248 return acumulated_lin_err; 259 return acumulated_lin_err;
249} 260}
250 261
262/* REMOVEME: After review
263 Some quoteing from the standard
264
265 L = logical offset into the file
266 W = number of data components in a stripe
267 S = W * stripe_unit (S is Stripe length)
268 N = L / S (N is the stripe Number)
269 C = (L-(N*S)) / stripe_unit (C is the component)
270 O = (N*stripe_unit)+(L%stripe_unit) (O is the object's offset)
271*/
272
273static void _offset_dev_unit_off(struct exofs_io_state *ios, u64 file_offset,
274 u64 *obj_offset, unsigned *dev, unsigned *unit_off)
275{
276 unsigned stripe_unit = ios->layout->stripe_unit;
277 unsigned stripe_length = stripe_unit * ios->layout->group_width;
278 u64 stripe_no = file_offset;
279 unsigned stripe_mod = do_div(stripe_no, stripe_length);
280
281 *unit_off = stripe_mod % stripe_unit;
282 *obj_offset = stripe_no * stripe_unit + *unit_off;
283 *dev = stripe_mod / stripe_unit * ios->layout->mirrors_p1;
284}
285
286static int _add_stripe_unit(struct exofs_io_state *ios, unsigned *cur_bvec,
287 struct exofs_per_dev_state *per_dev, int cur_len)
288{
289 unsigned bv = *cur_bvec;
290 struct request_queue *q =
291 osd_request_queue(exofs_ios_od(ios, per_dev->dev));
292
293 per_dev->length += cur_len;
294
295 if (per_dev->bio == NULL) {
296 unsigned pages_in_stripe = ios->layout->group_width *
297 (ios->layout->stripe_unit / PAGE_SIZE);
298 unsigned bio_size = (ios->bio->bi_vcnt + pages_in_stripe) /
299 ios->layout->group_width;
300
301 per_dev->bio = bio_kmalloc(GFP_KERNEL, bio_size);
302 if (unlikely(!per_dev->bio)) {
303 EXOFS_DBGMSG("Faild to allocate BIO size=%u\n",
304 bio_size);
305 return -ENOMEM;
306 }
307 }
308
309 while (cur_len > 0) {
310 int added_len;
311 struct bio_vec *bvec = &ios->bio->bi_io_vec[bv];
312
313 BUG_ON(ios->bio->bi_vcnt <= bv);
314 cur_len -= bvec->bv_len;
315
316 added_len = bio_add_pc_page(q, per_dev->bio, bvec->bv_page,
317 bvec->bv_len, bvec->bv_offset);
318 if (unlikely(bvec->bv_len != added_len))
319 return -ENOMEM;
320 ++bv;
321 }
322 BUG_ON(cur_len);
323
324 *cur_bvec = bv;
325 return 0;
326}
327
328static int _prepare_for_striping(struct exofs_io_state *ios)
329{
330 u64 length = ios->length;
331 u64 offset = ios->offset;
332 unsigned stripe_unit = ios->layout->stripe_unit;
333 unsigned comp = 0;
334 unsigned stripes = 0;
335 unsigned cur_bvec = 0;
336 int ret;
337
338 if (!ios->bio) {
339 if (ios->kern_buff) {
340 struct exofs_per_dev_state *per_dev = &ios->per_dev[0];
341 unsigned unit_off;
342
343 _offset_dev_unit_off(ios, offset, &per_dev->offset,
344 &per_dev->dev, &unit_off);
345 /* no cross device without page array */
346 BUG_ON((ios->layout->group_width > 1) &&
347 (unit_off + length > stripe_unit));
348 }
349 ios->numdevs = ios->layout->mirrors_p1;
350 return 0;
351 }
352
353 while (length) {
354 struct exofs_per_dev_state *per_dev = &ios->per_dev[comp];
355 unsigned cur_len;
356
357 if (!per_dev->length) {
358 unsigned unit_off;
359
360 _offset_dev_unit_off(ios, offset, &per_dev->offset,
361 &per_dev->dev, &unit_off);
362 stripes++;
363 cur_len = min_t(u64, stripe_unit - unit_off, length);
364 offset += cur_len;
365 } else {
366 cur_len = min_t(u64, stripe_unit, length);
367 }
368
369 ret = _add_stripe_unit(ios, &cur_bvec, per_dev, cur_len);
370 if (unlikely(ret))
371 goto out;
372
373 comp += ios->layout->mirrors_p1;
374 comp %= ios->layout->s_numdevs;
375
376 length -= cur_len;
377 }
378out:
379 ios->numdevs = stripes * ios->layout->mirrors_p1;
380 return ret;
381}
382
251int exofs_sbi_create(struct exofs_io_state *ios) 383int exofs_sbi_create(struct exofs_io_state *ios)
252{ 384{
253 int i, ret; 385 int i, ret;
@@ -296,61 +428,71 @@ out:
296 return ret; 428 return ret;
297} 429}
298 430
299int exofs_sbi_write(struct exofs_io_state *ios) 431static int _sbi_write_mirror(struct exofs_io_state *ios, int cur_comp)
300{ 432{
301 int i, ret; 433 struct exofs_per_dev_state *master_dev = &ios->per_dev[cur_comp];
434 unsigned dev = ios->per_dev[cur_comp].dev;
435 unsigned last_comp = cur_comp + ios->layout->mirrors_p1;
436 int ret = 0;
302 437
303 for (i = 0; i < ios->layout->s_numdevs; i++) { 438 for (; cur_comp < last_comp; ++cur_comp, ++dev) {
439 struct exofs_per_dev_state *per_dev = &ios->per_dev[cur_comp];
304 struct osd_request *or; 440 struct osd_request *or;
305 441
306 or = osd_start_request(exofs_ios_od(ios, i), GFP_KERNEL); 442 or = osd_start_request(exofs_ios_od(ios, dev), GFP_KERNEL);
307 if (unlikely(!or)) { 443 if (unlikely(!or)) {
308 EXOFS_ERR("%s: osd_start_request failed\n", __func__); 444 EXOFS_ERR("%s: osd_start_request failed\n", __func__);
309 ret = -ENOMEM; 445 ret = -ENOMEM;
310 goto out; 446 goto out;
311 } 447 }
312 ios->per_dev[i].or = or; 448 per_dev->or = or;
313 ios->numdevs++; 449 per_dev->offset = master_dev->offset;
314 450
315 if (ios->bio) { 451 if (ios->bio) {
316 struct bio *bio; 452 struct bio *bio;
317 453
318 if (i != 0) { 454 if (per_dev != master_dev) {
319 bio = bio_kmalloc(GFP_KERNEL, 455 bio = bio_kmalloc(GFP_KERNEL,
320 ios->bio->bi_max_vecs); 456 master_dev->bio->bi_max_vecs);
321 if (unlikely(!bio)) { 457 if (unlikely(!bio)) {
322 EXOFS_DBGMSG( 458 EXOFS_DBGMSG(
323 "Faild to allocate BIO size=%u\n", 459 "Faild to allocate BIO size=%u\n",
324 ios->bio->bi_max_vecs); 460 master_dev->bio->bi_max_vecs);
325 ret = -ENOMEM; 461 ret = -ENOMEM;
326 goto out; 462 goto out;
327 } 463 }
328 464
329 __bio_clone(bio, ios->bio); 465 __bio_clone(bio, master_dev->bio);
330 bio->bi_bdev = NULL; 466 bio->bi_bdev = NULL;
331 bio->bi_next = NULL; 467 bio->bi_next = NULL;
332 ios->per_dev[i].bio = bio; 468 per_dev->length = master_dev->length;
469 per_dev->bio = bio;
470 per_dev->dev = dev;
333 } else { 471 } else {
334 bio = ios->bio; 472 bio = master_dev->bio;
473 /* FIXME: bio_set_dir() */
474 bio->bi_rw |= (1 << BIO_RW);
335 } 475 }
336 476
337 osd_req_write(or, &ios->obj, ios->offset, bio, 477 osd_req_write(or, &ios->obj, per_dev->offset, bio,
338 ios->length); 478 per_dev->length);
339 EXOFS_DBGMSG("write(0x%llx) offset=0x%llx " 479 EXOFS_DBGMSG("write(0x%llx) offset=0x%llx "
340 "length=0x%llx dev=%d\n", 480 "length=0x%llx dev=%d\n",
341 _LLU(ios->obj.id), _LLU(ios->offset), 481 _LLU(ios->obj.id), _LLU(per_dev->offset),
342 _LLU(ios->length), i); 482 _LLU(per_dev->length), dev);
343 } else if (ios->kern_buff) { 483 } else if (ios->kern_buff) {
344 osd_req_write_kern(or, &ios->obj, ios->offset, 484 ret = osd_req_write_kern(or, &ios->obj, per_dev->offset,
345 ios->kern_buff, ios->length); 485 ios->kern_buff, ios->length);
486 if (unlikely(ret))
487 goto out;
346 EXOFS_DBGMSG2("write_kern(0x%llx) offset=0x%llx " 488 EXOFS_DBGMSG2("write_kern(0x%llx) offset=0x%llx "
347 "length=0x%llx dev=%d\n", 489 "length=0x%llx dev=%d\n",
348 _LLU(ios->obj.id), _LLU(ios->offset), 490 _LLU(ios->obj.id), _LLU(per_dev->offset),
349 _LLU(ios->length), i); 491 _LLU(ios->length), dev);
350 } else { 492 } else {
351 osd_req_set_attributes(or, &ios->obj); 493 osd_req_set_attributes(or, &ios->obj);
352 EXOFS_DBGMSG2("obj(0x%llx) set_attributes=%d dev=%d\n", 494 EXOFS_DBGMSG2("obj(0x%llx) set_attributes=%d dev=%d\n",
353 _LLU(ios->obj.id), ios->out_attr_len, i); 495 _LLU(ios->obj.id), ios->out_attr_len, dev);
354 } 496 }
355 497
356 if (ios->out_attr) 498 if (ios->out_attr)
@@ -361,40 +503,57 @@ int exofs_sbi_write(struct exofs_io_state *ios)
361 osd_req_add_get_attr_list(or, ios->in_attr, 503 osd_req_add_get_attr_list(or, ios->in_attr,
362 ios->in_attr_len); 504 ios->in_attr_len);
363 } 505 }
364 ret = exofs_io_execute(ios);
365 506
366out: 507out:
367 return ret; 508 return ret;
368} 509}
369 510
370int exofs_sbi_read(struct exofs_io_state *ios) 511int exofs_sbi_write(struct exofs_io_state *ios)
512{
513 int i;
514 int ret;
515
516 ret = _prepare_for_striping(ios);
517 if (unlikely(ret))
518 return ret;
519
520 for (i = 0; i < ios->numdevs; i += ios->layout->mirrors_p1) {
521 ret = _sbi_write_mirror(ios, i);
522 if (unlikely(ret))
523 return ret;
524 }
525
526 ret = exofs_io_execute(ios);
527 return ret;
528}
529
530static int _sbi_read_mirror(struct exofs_io_state *ios, unsigned cur_comp)
371{ 531{
372 struct osd_request *or; 532 struct osd_request *or;
373 struct exofs_per_dev_state *per_dev = &ios->per_dev[0]; 533 struct exofs_per_dev_state *per_dev = &ios->per_dev[cur_comp];
374 unsigned first_dev = (unsigned)ios->obj.id; 534 unsigned first_dev = (unsigned)ios->obj.id;
375 535
376 first_dev %= ios->layout->s_numdevs; 536 first_dev = per_dev->dev + first_dev % ios->layout->mirrors_p1;
377 or = osd_start_request(exofs_ios_od(ios, first_dev), GFP_KERNEL); 537 or = osd_start_request(exofs_ios_od(ios, first_dev), GFP_KERNEL);
378 if (unlikely(!or)) { 538 if (unlikely(!or)) {
379 EXOFS_ERR("%s: osd_start_request failed\n", __func__); 539 EXOFS_ERR("%s: osd_start_request failed\n", __func__);
380 return -ENOMEM; 540 return -ENOMEM;
381 } 541 }
382 per_dev->or = or; 542 per_dev->or = or;
383 ios->numdevs++;
384 543
385 if (ios->bio) { 544 if (ios->bio) {
386 osd_req_read(or, &ios->obj, ios->offset, ios->bio, ios->length); 545 osd_req_read(or, &ios->obj, per_dev->offset,
546 per_dev->bio, per_dev->length);
387 EXOFS_DBGMSG("read(0x%llx) offset=0x%llx length=0x%llx" 547 EXOFS_DBGMSG("read(0x%llx) offset=0x%llx length=0x%llx"
388 " dev=%d\n", _LLU(ios->obj.id), 548 " dev=%d\n", _LLU(ios->obj.id),
389 _LLU(ios->offset), _LLU(ios->length), 549 _LLU(per_dev->offset), _LLU(per_dev->length),
390 first_dev); 550 first_dev);
391 } else if (ios->kern_buff) { 551 } else if (ios->kern_buff) {
392 int ret = osd_req_read_kern(or, &ios->obj, ios->offset, 552 int ret = osd_req_read_kern(or, &ios->obj, per_dev->offset,
393 ios->kern_buff, ios->length); 553 ios->kern_buff, ios->length);
394
395 EXOFS_DBGMSG2("read_kern(0x%llx) offset=0x%llx " 554 EXOFS_DBGMSG2("read_kern(0x%llx) offset=0x%llx "
396 "length=0x%llx dev=%d ret=>%d\n", 555 "length=0x%llx dev=%d ret=>%d\n",
397 _LLU(ios->obj.id), _LLU(ios->offset), 556 _LLU(ios->obj.id), _LLU(per_dev->offset),
398 _LLU(ios->length), first_dev, ret); 557 _LLU(ios->length), first_dev, ret);
399 if (unlikely(ret)) 558 if (unlikely(ret))
400 return ret; 559 return ret;
@@ -403,14 +562,32 @@ int exofs_sbi_read(struct exofs_io_state *ios)
403 EXOFS_DBGMSG2("obj(0x%llx) get_attributes=%d dev=%d\n", 562 EXOFS_DBGMSG2("obj(0x%llx) get_attributes=%d dev=%d\n",
404 _LLU(ios->obj.id), ios->in_attr_len, first_dev); 563 _LLU(ios->obj.id), ios->in_attr_len, first_dev);
405 } 564 }
406
407 if (ios->out_attr) 565 if (ios->out_attr)
408 osd_req_add_set_attr_list(or, ios->out_attr, ios->out_attr_len); 566 osd_req_add_set_attr_list(or, ios->out_attr, ios->out_attr_len);
409 567
410 if (ios->in_attr) 568 if (ios->in_attr)
411 osd_req_add_get_attr_list(or, ios->in_attr, ios->in_attr_len); 569 osd_req_add_get_attr_list(or, ios->in_attr, ios->in_attr_len);
412 570
413 return exofs_io_execute(ios); 571 return 0;
572}
573
574int exofs_sbi_read(struct exofs_io_state *ios)
575{
576 int i;
577 int ret;
578
579 ret = _prepare_for_striping(ios);
580 if (unlikely(ret))
581 return ret;
582
583 for (i = 0; i < ios->numdevs; i += ios->layout->mirrors_p1) {
584 ret = _sbi_read_mirror(ios, i);
585 if (unlikely(ret))
586 return ret;
587 }
588
589 ret = exofs_io_execute(ios);
590 return ret;
414} 591}
415 592
416int extract_attr_from_ios(struct exofs_io_state *ios, struct osd_attr *attr) 593int extract_attr_from_ios(struct exofs_io_state *ios, struct osd_attr *attr)
@@ -434,42 +611,84 @@ int extract_attr_from_ios(struct exofs_io_state *ios, struct osd_attr *attr)
434 return -EIO; 611 return -EIO;
435} 612}
436 613
614static int _truncate_mirrors(struct exofs_io_state *ios, unsigned cur_comp,
615 struct osd_attr *attr)
616{
617 int last_comp = cur_comp + ios->layout->mirrors_p1;
618
619 for (; cur_comp < last_comp; ++cur_comp) {
620 struct exofs_per_dev_state *per_dev = &ios->per_dev[cur_comp];
621 struct osd_request *or;
622
623 or = osd_start_request(exofs_ios_od(ios, cur_comp), GFP_KERNEL);
624 if (unlikely(!or)) {
625 EXOFS_ERR("%s: osd_start_request failed\n", __func__);
626 return -ENOMEM;
627 }
628 per_dev->or = or;
629
630 osd_req_set_attributes(or, &ios->obj);
631 osd_req_add_set_attr_list(or, attr, 1);
632 }
633
634 return 0;
635}
636
437int exofs_oi_truncate(struct exofs_i_info *oi, u64 size) 637int exofs_oi_truncate(struct exofs_i_info *oi, u64 size)
438{ 638{
439 struct exofs_sb_info *sbi = oi->vfs_inode.i_sb->s_fs_info; 639 struct exofs_sb_info *sbi = oi->vfs_inode.i_sb->s_fs_info;
440 struct exofs_io_state *ios; 640 struct exofs_io_state *ios;
441 struct osd_attr attr; 641 struct exofs_trunc_attr {
442 __be64 newsize; 642 struct osd_attr attr;
643 __be64 newsize;
644 } *size_attrs;
645 u64 this_obj_size;
646 unsigned dev;
647 unsigned unit_off;
443 int i, ret; 648 int i, ret;
444 649
445 if (exofs_get_io_state(&sbi->layout, &ios)) 650 ret = exofs_get_io_state(&sbi->layout, &ios);
446 return -ENOMEM; 651 if (unlikely(ret))
652 return ret;
653
654 size_attrs = kcalloc(ios->layout->group_width, sizeof(*size_attrs),
655 GFP_KERNEL);
656 if (unlikely(!size_attrs)) {
657 ret = -ENOMEM;
658 goto out;
659 }
447 660
448 ios->obj.id = exofs_oi_objno(oi); 661 ios->obj.id = exofs_oi_objno(oi);
449 ios->cred = oi->i_cred; 662 ios->cred = oi->i_cred;
450 663
451 newsize = cpu_to_be64(size); 664 ios->numdevs = ios->layout->s_numdevs;
452 attr = g_attr_logical_length; 665 _offset_dev_unit_off(ios, size, &this_obj_size, &dev, &unit_off);
453 attr.val_ptr = &newsize;
454 666
455 for (i = 0; i < sbi->layout.s_numdevs; i++) { 667 for (i = 0; i < ios->layout->group_width; ++i) {
456 struct osd_request *or; 668 struct exofs_trunc_attr *size_attr = &size_attrs[i];
669 u64 obj_size;
457 670
458 or = osd_start_request(exofs_ios_od(ios, i), GFP_KERNEL); 671 if (i < dev)
459 if (unlikely(!or)) { 672 obj_size = this_obj_size +
460 EXOFS_ERR("%s: osd_start_request failed\n", __func__); 673 ios->layout->stripe_unit - unit_off;
461 ret = -ENOMEM; 674 else if (i == dev)
462 goto out; 675 obj_size = this_obj_size;
463 } 676 else /* i > dev */
464 ios->per_dev[i].or = or; 677 obj_size = this_obj_size - unit_off;
465 ios->numdevs++;
466 678
467 osd_req_set_attributes(or, &ios->obj); 679 size_attr->newsize = cpu_to_be64(obj_size);
468 osd_req_add_set_attr_list(or, &attr, 1); 680 size_attr->attr = g_attr_logical_length;
681 size_attr->attr.val_ptr = &size_attr->newsize;
682
683 ret = _truncate_mirrors(ios, i * ios->layout->mirrors_p1,
684 &size_attr->attr);
685 if (unlikely(ret))
686 goto out;
469 } 687 }
470 ret = exofs_io_execute(ios); 688 ret = exofs_io_execute(ios);
471 689
472out: 690out:
691 kfree(size_attrs);
473 exofs_put_io_state(ios); 692 exofs_put_io_state(ios);
474 return ret; 693 return ret;
475} 694}