diff options
author | Yehuda Sadeh <yehuda@hq.newdream.net> | 2010-04-06 18:14:15 -0400 |
---|---|---|
committer | Sage Weil <sage@newdream.net> | 2010-10-20 18:37:28 -0400 |
commit | 3d14c5d2b6e15c21d8e5467dc62d33127c23a644 (patch) | |
tree | 7d123c47847df9d1e865b6b78dc7da3fe739b704 | |
parent | ae1533b62b3369e6ae32338f4a77d64d0e88f676 (diff) |
ceph: factor out libceph from Ceph file system
This factors out protocol and low-level storage parts of ceph into a
separate libceph module living in net/ceph and include/linux/ceph. This
is mostly a matter of moving files around. However, a few key pieces
of the interface change as well:
- ceph_client becomes ceph_fs_client and ceph_client, where the latter
captures the mon and osd clients, and the fs_client gets the mds client
and file system specific pieces.
- Mount option parsing and debugfs setup is correspondingly broken into
two pieces.
- The mon client gets a generic handler callback for otherwise unknown
messages (mds map, in this case).
- The basic supported/required feature bits can be expanded (and are by
ceph_fs_client).
No functional change, aside from some subtle error handling cases that got
cleaned up in the refactoring process.
Signed-off-by: Sage Weil <sage@newdream.net>
-rw-r--r-- | MAINTAINERS | 2 | ||||
-rw-r--r-- | fs/ceph/Kconfig | 14 | ||||
-rw-r--r-- | fs/ceph/Makefile | 11 | ||||
-rw-r--r-- | fs/ceph/README | 20 | ||||
-rw-r--r-- | fs/ceph/addr.c | 65 | ||||
-rw-r--r-- | fs/ceph/caps.c | 35 | ||||
-rw-r--r-- | fs/ceph/ceph_frag.c | 3 | ||||
-rw-r--r-- | fs/ceph/debugfs.c | 407 | ||||
-rw-r--r-- | fs/ceph/dir.c | 55 | ||||
-rw-r--r-- | fs/ceph/export.c | 5 | ||||
-rw-r--r-- | fs/ceph/file.c | 207 | ||||
-rw-r--r-- | fs/ceph/inode.c | 19 | ||||
-rw-r--r-- | fs/ceph/ioctl.c | 11 | ||||
-rw-r--r-- | fs/ceph/locks.c | 6 | ||||
-rw-r--r-- | fs/ceph/mds_client.c | 86 | ||||
-rw-r--r-- | fs/ceph/mds_client.h | 20 | ||||
-rw-r--r-- | fs/ceph/mdsmap.c | 11 | ||||
-rw-r--r-- | fs/ceph/snap.c | 10 | ||||
-rw-r--r-- | fs/ceph/strings.c (renamed from fs/ceph/ceph_strings.c) | 82 | ||||
-rw-r--r-- | fs/ceph/super.c | 1154 | ||||
-rw-r--r-- | fs/ceph/super.h | 397 | ||||
-rw-r--r-- | fs/ceph/xattr.c | 15 | ||||
-rw-r--r-- | include/linux/ceph/auth.h (renamed from fs/ceph/auth.h) | 4 | ||||
-rw-r--r-- | include/linux/ceph/buffer.h (renamed from fs/ceph/buffer.h) | 0 | ||||
-rw-r--r-- | include/linux/ceph/ceph_debug.h (renamed from fs/ceph/ceph_debug.h) | 5 | ||||
-rw-r--r-- | include/linux/ceph/ceph_frag.h (renamed from fs/ceph/ceph_frag.h) | 0 | ||||
-rw-r--r-- | include/linux/ceph/ceph_fs.h (renamed from fs/ceph/ceph_fs.h) | 0 | ||||
-rw-r--r-- | include/linux/ceph/ceph_hash.h (renamed from fs/ceph/ceph_hash.h) | 0 | ||||
-rw-r--r-- | include/linux/ceph/debugfs.h | 33 | ||||
-rw-r--r-- | include/linux/ceph/decode.h (renamed from fs/ceph/decode.h) | 0 | ||||
-rw-r--r-- | include/linux/ceph/libceph.h | 249 | ||||
-rw-r--r-- | include/linux/ceph/mdsmap.h (renamed from fs/ceph/mdsmap.h) | 0 | ||||
-rw-r--r-- | include/linux/ceph/messenger.h (renamed from fs/ceph/messenger.h) | 8 | ||||
-rw-r--r-- | include/linux/ceph/mon_client.h (renamed from fs/ceph/mon_client.h) | 1 | ||||
-rw-r--r-- | include/linux/ceph/msgpool.h (renamed from fs/ceph/msgpool.h) | 0 | ||||
-rw-r--r-- | include/linux/ceph/msgr.h (renamed from fs/ceph/msgr.h) | 0 | ||||
-rw-r--r-- | include/linux/ceph/osd_client.h (renamed from fs/ceph/osd_client.h) | 1 | ||||
-rw-r--r-- | include/linux/ceph/osdmap.h (renamed from fs/ceph/osdmap.h) | 2 | ||||
-rw-r--r-- | include/linux/ceph/pagelist.h (renamed from fs/ceph/pagelist.h) | 0 | ||||
-rw-r--r-- | include/linux/ceph/rados.h (renamed from fs/ceph/rados.h) | 0 | ||||
-rw-r--r-- | include/linux/ceph/types.h (renamed from fs/ceph/types.h) | 0 | ||||
-rw-r--r-- | include/linux/crush/crush.h (renamed from fs/ceph/crush/crush.h) | 0 | ||||
-rw-r--r-- | include/linux/crush/hash.h (renamed from fs/ceph/crush/hash.h) | 0 | ||||
-rw-r--r-- | include/linux/crush/mapper.h (renamed from fs/ceph/crush/mapper.h) | 0 | ||||
-rw-r--r-- | net/Kconfig | 1 | ||||
-rw-r--r-- | net/Makefile | 1 | ||||
-rw-r--r-- | net/ceph/Kconfig | 28 | ||||
-rw-r--r-- | net/ceph/Makefile | 37 | ||||
-rw-r--r-- | net/ceph/armor.c (renamed from fs/ceph/armor.c) | 0 | ||||
-rw-r--r-- | net/ceph/auth.c (renamed from fs/ceph/auth.c) | 10 | ||||
-rw-r--r-- | net/ceph/auth_none.c (renamed from fs/ceph/auth_none.c) | 7 | ||||
-rw-r--r-- | net/ceph/auth_none.h (renamed from fs/ceph/auth_none.h) | 3 | ||||
-rw-r--r-- | net/ceph/auth_x.c (renamed from fs/ceph/auth_x.c) | 9 | ||||
-rw-r--r-- | net/ceph/auth_x.h (renamed from fs/ceph/auth_x.h) | 3 | ||||
-rw-r--r-- | net/ceph/auth_x_protocol.h (renamed from fs/ceph/auth_x_protocol.h) | 0 | ||||
-rw-r--r-- | net/ceph/buffer.c (renamed from fs/ceph/buffer.c) | 9 | ||||
-rw-r--r-- | net/ceph/ceph_common.c | 529 | ||||
-rw-r--r-- | net/ceph/ceph_fs.c (renamed from fs/ceph/ceph_fs.c) | 5 | ||||
-rw-r--r-- | net/ceph/ceph_hash.c (renamed from fs/ceph/ceph_hash.c) | 2 | ||||
-rw-r--r-- | net/ceph/ceph_strings.c | 84 | ||||
-rw-r--r-- | net/ceph/crush/crush.c (renamed from fs/ceph/crush/crush.c) | 2 | ||||
-rw-r--r-- | net/ceph/crush/hash.c (renamed from fs/ceph/crush/hash.c) | 2 | ||||
-rw-r--r-- | net/ceph/crush/mapper.c (renamed from fs/ceph/crush/mapper.c) | 4 | ||||
-rw-r--r-- | net/ceph/crypto.c (renamed from fs/ceph/crypto.c) | 4 | ||||
-rw-r--r-- | net/ceph/crypto.h (renamed from fs/ceph/crypto.h) | 4 | ||||
-rw-r--r-- | net/ceph/debugfs.c | 268 | ||||
-rw-r--r-- | net/ceph/messenger.c (renamed from fs/ceph/messenger.c) | 77 | ||||
-rw-r--r-- | net/ceph/mon_client.c (renamed from fs/ceph/mon_client.c) | 73 | ||||
-rw-r--r-- | net/ceph/msgpool.c (renamed from fs/ceph/msgpool.c) | 4 | ||||
-rw-r--r-- | net/ceph/osd_client.c (renamed from fs/ceph/osd_client.c) | 54 | ||||
-rw-r--r-- | net/ceph/osdmap.c (renamed from fs/ceph/osdmap.c) | 17 | ||||
-rw-r--r-- | net/ceph/pagelist.c (renamed from fs/ceph/pagelist.c) | 6 | ||||
-rw-r--r-- | net/ceph/pagevec.c | 223 |
73 files changed, 2566 insertions, 1838 deletions
diff --git a/MAINTAINERS b/MAINTAINERS index 7679bf32f7bb..48d05654d456 100644 --- a/MAINTAINERS +++ b/MAINTAINERS | |||
@@ -1527,6 +1527,8 @@ T: git git://git.kernel.org/pub/scm/linux/kernel/git/sage/ceph-client.git | |||
1527 | S: Supported | 1527 | S: Supported |
1528 | F: Documentation/filesystems/ceph.txt | 1528 | F: Documentation/filesystems/ceph.txt |
1529 | F: fs/ceph | 1529 | F: fs/ceph |
1530 | F: net/ceph | ||
1531 | F: include/linux/ceph | ||
1530 | 1532 | ||
1531 | CERTIFIED WIRELESS USB (WUSB) SUBSYSTEM: | 1533 | CERTIFIED WIRELESS USB (WUSB) SUBSYSTEM: |
1532 | M: David Vrabel <david.vrabel@csr.com> | 1534 | M: David Vrabel <david.vrabel@csr.com> |
diff --git a/fs/ceph/Kconfig b/fs/ceph/Kconfig index 0fcd2640c23f..9eb134ea6eb2 100644 --- a/fs/ceph/Kconfig +++ b/fs/ceph/Kconfig | |||
@@ -1,9 +1,11 @@ | |||
1 | config CEPH_FS | 1 | config CEPH_FS |
2 | tristate "Ceph distributed file system (EXPERIMENTAL)" | 2 | tristate "Ceph distributed file system (EXPERIMENTAL)" |
3 | depends on INET && EXPERIMENTAL | 3 | depends on INET && EXPERIMENTAL |
4 | select CEPH_LIB | ||
4 | select LIBCRC32C | 5 | select LIBCRC32C |
5 | select CRYPTO_AES | 6 | select CRYPTO_AES |
6 | select CRYPTO | 7 | select CRYPTO |
8 | default n | ||
7 | help | 9 | help |
8 | Choose Y or M here to include support for mounting the | 10 | Choose Y or M here to include support for mounting the |
9 | experimental Ceph distributed file system. Ceph is an extremely | 11 | experimental Ceph distributed file system. Ceph is an extremely |
@@ -14,15 +16,3 @@ config CEPH_FS | |||
14 | 16 | ||
15 | If unsure, say N. | 17 | If unsure, say N. |
16 | 18 | ||
17 | config CEPH_FS_PRETTYDEBUG | ||
18 | bool "Include file:line in ceph debug output" | ||
19 | depends on CEPH_FS | ||
20 | default n | ||
21 | help | ||
22 | If you say Y here, debug output will include a filename and | ||
23 | line to aid debugging. This icnreases kernel size and slows | ||
24 | execution slightly when debug call sites are enabled (e.g., | ||
25 | via CONFIG_DYNAMIC_DEBUG). | ||
26 | |||
27 | If unsure, say N. | ||
28 | |||
diff --git a/fs/ceph/Makefile b/fs/ceph/Makefile index 278e1172600d..9e6c4f2e8ff1 100644 --- a/fs/ceph/Makefile +++ b/fs/ceph/Makefile | |||
@@ -8,15 +8,8 @@ obj-$(CONFIG_CEPH_FS) += ceph.o | |||
8 | 8 | ||
9 | ceph-objs := super.o inode.o dir.o file.o locks.o addr.o ioctl.o \ | 9 | ceph-objs := super.o inode.o dir.o file.o locks.o addr.o ioctl.o \ |
10 | export.o caps.o snap.o xattr.o \ | 10 | export.o caps.o snap.o xattr.o \ |
11 | messenger.o msgpool.o buffer.o pagelist.o \ | 11 | mds_client.o mdsmap.o strings.o ceph_frag.o \ |
12 | mds_client.o mdsmap.o \ | 12 | debugfs.o |
13 | mon_client.o \ | ||
14 | osd_client.o osdmap.o crush/crush.o crush/mapper.o crush/hash.o \ | ||
15 | debugfs.o \ | ||
16 | auth.o auth_none.o \ | ||
17 | crypto.o armor.o \ | ||
18 | auth_x.o \ | ||
19 | ceph_fs.o ceph_strings.o ceph_hash.o ceph_frag.o | ||
20 | 13 | ||
21 | else | 14 | else |
22 | #Otherwise we were called directly from the command | 15 | #Otherwise we were called directly from the command |
diff --git a/fs/ceph/README b/fs/ceph/README deleted file mode 100644 index 18352fab37c0..000000000000 --- a/fs/ceph/README +++ /dev/null | |||
@@ -1,20 +0,0 @@ | |||
1 | # | ||
2 | # The following files are shared by (and manually synchronized | ||
3 | # between) the Ceph userland and kernel client. | ||
4 | # | ||
5 | # userland kernel | ||
6 | src/include/ceph_fs.h fs/ceph/ceph_fs.h | ||
7 | src/include/ceph_fs.cc fs/ceph/ceph_fs.c | ||
8 | src/include/msgr.h fs/ceph/msgr.h | ||
9 | src/include/rados.h fs/ceph/rados.h | ||
10 | src/include/ceph_strings.cc fs/ceph/ceph_strings.c | ||
11 | src/include/ceph_frag.h fs/ceph/ceph_frag.h | ||
12 | src/include/ceph_frag.cc fs/ceph/ceph_frag.c | ||
13 | src/include/ceph_hash.h fs/ceph/ceph_hash.h | ||
14 | src/include/ceph_hash.cc fs/ceph/ceph_hash.c | ||
15 | src/crush/crush.c fs/ceph/crush/crush.c | ||
16 | src/crush/crush.h fs/ceph/crush/crush.h | ||
17 | src/crush/mapper.c fs/ceph/crush/mapper.c | ||
18 | src/crush/mapper.h fs/ceph/crush/mapper.h | ||
19 | src/crush/hash.h fs/ceph/crush/hash.h | ||
20 | src/crush/hash.c fs/ceph/crush/hash.c | ||
diff --git a/fs/ceph/addr.c b/fs/ceph/addr.c index efbc604001c8..51bcc5ce3230 100644 --- a/fs/ceph/addr.c +++ b/fs/ceph/addr.c | |||
@@ -1,4 +1,4 @@ | |||
1 | #include "ceph_debug.h" | 1 | #include <linux/ceph/ceph_debug.h> |
2 | 2 | ||
3 | #include <linux/backing-dev.h> | 3 | #include <linux/backing-dev.h> |
4 | #include <linux/fs.h> | 4 | #include <linux/fs.h> |
@@ -10,7 +10,8 @@ | |||
10 | #include <linux/task_io_accounting_ops.h> | 10 | #include <linux/task_io_accounting_ops.h> |
11 | 11 | ||
12 | #include "super.h" | 12 | #include "super.h" |
13 | #include "osd_client.h" | 13 | #include "mds_client.h" |
14 | #include <linux/ceph/osd_client.h> | ||
14 | 15 | ||
15 | /* | 16 | /* |
16 | * Ceph address space ops. | 17 | * Ceph address space ops. |
@@ -193,7 +194,8 @@ static int readpage_nounlock(struct file *filp, struct page *page) | |||
193 | { | 194 | { |
194 | struct inode *inode = filp->f_dentry->d_inode; | 195 | struct inode *inode = filp->f_dentry->d_inode; |
195 | struct ceph_inode_info *ci = ceph_inode(inode); | 196 | struct ceph_inode_info *ci = ceph_inode(inode); |
196 | struct ceph_osd_client *osdc = &ceph_inode_to_client(inode)->osdc; | 197 | struct ceph_osd_client *osdc = |
198 | &ceph_inode_to_client(inode)->client->osdc; | ||
197 | int err = 0; | 199 | int err = 0; |
198 | u64 len = PAGE_CACHE_SIZE; | 200 | u64 len = PAGE_CACHE_SIZE; |
199 | 201 | ||
@@ -265,7 +267,8 @@ static int ceph_readpages(struct file *file, struct address_space *mapping, | |||
265 | { | 267 | { |
266 | struct inode *inode = file->f_dentry->d_inode; | 268 | struct inode *inode = file->f_dentry->d_inode; |
267 | struct ceph_inode_info *ci = ceph_inode(inode); | 269 | struct ceph_inode_info *ci = ceph_inode(inode); |
268 | struct ceph_osd_client *osdc = &ceph_inode_to_client(inode)->osdc; | 270 | struct ceph_osd_client *osdc = |
271 | &ceph_inode_to_client(inode)->client->osdc; | ||
269 | int rc = 0; | 272 | int rc = 0; |
270 | struct page **pages; | 273 | struct page **pages; |
271 | loff_t offset; | 274 | loff_t offset; |
@@ -365,7 +368,7 @@ static int writepage_nounlock(struct page *page, struct writeback_control *wbc) | |||
365 | { | 368 | { |
366 | struct inode *inode; | 369 | struct inode *inode; |
367 | struct ceph_inode_info *ci; | 370 | struct ceph_inode_info *ci; |
368 | struct ceph_client *client; | 371 | struct ceph_fs_client *fsc; |
369 | struct ceph_osd_client *osdc; | 372 | struct ceph_osd_client *osdc; |
370 | loff_t page_off = page->index << PAGE_CACHE_SHIFT; | 373 | loff_t page_off = page->index << PAGE_CACHE_SHIFT; |
371 | int len = PAGE_CACHE_SIZE; | 374 | int len = PAGE_CACHE_SIZE; |
@@ -383,8 +386,8 @@ static int writepage_nounlock(struct page *page, struct writeback_control *wbc) | |||
383 | } | 386 | } |
384 | inode = page->mapping->host; | 387 | inode = page->mapping->host; |
385 | ci = ceph_inode(inode); | 388 | ci = ceph_inode(inode); |
386 | client = ceph_inode_to_client(inode); | 389 | fsc = ceph_inode_to_client(inode); |
387 | osdc = &client->osdc; | 390 | osdc = &fsc->client->osdc; |
388 | 391 | ||
389 | /* verify this is a writeable snap context */ | 392 | /* verify this is a writeable snap context */ |
390 | snapc = (void *)page->private; | 393 | snapc = (void *)page->private; |
@@ -414,10 +417,10 @@ static int writepage_nounlock(struct page *page, struct writeback_control *wbc) | |||
414 | dout("writepage %p page %p index %lu on %llu~%u snapc %p\n", | 417 | dout("writepage %p page %p index %lu on %llu~%u snapc %p\n", |
415 | inode, page, page->index, page_off, len, snapc); | 418 | inode, page, page->index, page_off, len, snapc); |
416 | 419 | ||
417 | writeback_stat = atomic_long_inc_return(&client->writeback_count); | 420 | writeback_stat = atomic_long_inc_return(&fsc->writeback_count); |
418 | if (writeback_stat > | 421 | if (writeback_stat > |
419 | CONGESTION_ON_THRESH(client->mount_args->congestion_kb)) | 422 | CONGESTION_ON_THRESH(fsc->mount_options->congestion_kb)) |
420 | set_bdi_congested(&client->backing_dev_info, BLK_RW_ASYNC); | 423 | set_bdi_congested(&fsc->backing_dev_info, BLK_RW_ASYNC); |
421 | 424 | ||
422 | set_page_writeback(page); | 425 | set_page_writeback(page); |
423 | err = ceph_osdc_writepages(osdc, ceph_vino(inode), | 426 | err = ceph_osdc_writepages(osdc, ceph_vino(inode), |
@@ -496,7 +499,7 @@ static void writepages_finish(struct ceph_osd_request *req, | |||
496 | struct address_space *mapping = inode->i_mapping; | 499 | struct address_space *mapping = inode->i_mapping; |
497 | __s32 rc = -EIO; | 500 | __s32 rc = -EIO; |
498 | u64 bytes = 0; | 501 | u64 bytes = 0; |
499 | struct ceph_client *client = ceph_inode_to_client(inode); | 502 | struct ceph_fs_client *fsc = ceph_inode_to_client(inode); |
500 | long writeback_stat; | 503 | long writeback_stat; |
501 | unsigned issued = ceph_caps_issued(ci); | 504 | unsigned issued = ceph_caps_issued(ci); |
502 | 505 | ||
@@ -529,10 +532,10 @@ static void writepages_finish(struct ceph_osd_request *req, | |||
529 | WARN_ON(!PageUptodate(page)); | 532 | WARN_ON(!PageUptodate(page)); |
530 | 533 | ||
531 | writeback_stat = | 534 | writeback_stat = |
532 | atomic_long_dec_return(&client->writeback_count); | 535 | atomic_long_dec_return(&fsc->writeback_count); |
533 | if (writeback_stat < | 536 | if (writeback_stat < |
534 | CONGESTION_OFF_THRESH(client->mount_args->congestion_kb)) | 537 | CONGESTION_OFF_THRESH(fsc->mount_options->congestion_kb)) |
535 | clear_bdi_congested(&client->backing_dev_info, | 538 | clear_bdi_congested(&fsc->backing_dev_info, |
536 | BLK_RW_ASYNC); | 539 | BLK_RW_ASYNC); |
537 | 540 | ||
538 | ceph_put_snap_context((void *)page->private); | 541 | ceph_put_snap_context((void *)page->private); |
@@ -569,13 +572,13 @@ static void writepages_finish(struct ceph_osd_request *req, | |||
569 | * mempool. we avoid the mempool if we can because req->r_num_pages | 572 | * mempool. we avoid the mempool if we can because req->r_num_pages |
570 | * may be less than the maximum write size. | 573 | * may be less than the maximum write size. |
571 | */ | 574 | */ |
572 | static void alloc_page_vec(struct ceph_client *client, | 575 | static void alloc_page_vec(struct ceph_fs_client *fsc, |
573 | struct ceph_osd_request *req) | 576 | struct ceph_osd_request *req) |
574 | { | 577 | { |
575 | req->r_pages = kmalloc(sizeof(struct page *) * req->r_num_pages, | 578 | req->r_pages = kmalloc(sizeof(struct page *) * req->r_num_pages, |
576 | GFP_NOFS); | 579 | GFP_NOFS); |
577 | if (!req->r_pages) { | 580 | if (!req->r_pages) { |
578 | req->r_pages = mempool_alloc(client->wb_pagevec_pool, GFP_NOFS); | 581 | req->r_pages = mempool_alloc(fsc->wb_pagevec_pool, GFP_NOFS); |
579 | req->r_pages_from_pool = 1; | 582 | req->r_pages_from_pool = 1; |
580 | WARN_ON(!req->r_pages); | 583 | WARN_ON(!req->r_pages); |
581 | } | 584 | } |
@@ -590,7 +593,7 @@ static int ceph_writepages_start(struct address_space *mapping, | |||
590 | struct inode *inode = mapping->host; | 593 | struct inode *inode = mapping->host; |
591 | struct backing_dev_info *bdi = mapping->backing_dev_info; | 594 | struct backing_dev_info *bdi = mapping->backing_dev_info; |
592 | struct ceph_inode_info *ci = ceph_inode(inode); | 595 | struct ceph_inode_info *ci = ceph_inode(inode); |
593 | struct ceph_client *client; | 596 | struct ceph_fs_client *fsc; |
594 | pgoff_t index, start, end; | 597 | pgoff_t index, start, end; |
595 | int range_whole = 0; | 598 | int range_whole = 0; |
596 | int should_loop = 1; | 599 | int should_loop = 1; |
@@ -617,13 +620,13 @@ static int ceph_writepages_start(struct address_space *mapping, | |||
617 | wbc->sync_mode == WB_SYNC_NONE ? "NONE" : | 620 | wbc->sync_mode == WB_SYNC_NONE ? "NONE" : |
618 | (wbc->sync_mode == WB_SYNC_ALL ? "ALL" : "HOLD")); | 621 | (wbc->sync_mode == WB_SYNC_ALL ? "ALL" : "HOLD")); |
619 | 622 | ||
620 | client = ceph_inode_to_client(inode); | 623 | fsc = ceph_inode_to_client(inode); |
621 | if (client->mount_state == CEPH_MOUNT_SHUTDOWN) { | 624 | if (fsc->mount_state == CEPH_MOUNT_SHUTDOWN) { |
622 | pr_warning("writepage_start %p on forced umount\n", inode); | 625 | pr_warning("writepage_start %p on forced umount\n", inode); |
623 | return -EIO; /* we're in a forced umount, don't write! */ | 626 | return -EIO; /* we're in a forced umount, don't write! */ |
624 | } | 627 | } |
625 | if (client->mount_args->wsize && client->mount_args->wsize < wsize) | 628 | if (fsc->mount_options->wsize && fsc->mount_options->wsize < wsize) |
626 | wsize = client->mount_args->wsize; | 629 | wsize = fsc->mount_options->wsize; |
627 | if (wsize < PAGE_CACHE_SIZE) | 630 | if (wsize < PAGE_CACHE_SIZE) |
628 | wsize = PAGE_CACHE_SIZE; | 631 | wsize = PAGE_CACHE_SIZE; |
629 | max_pages_ever = wsize >> PAGE_CACHE_SHIFT; | 632 | max_pages_ever = wsize >> PAGE_CACHE_SHIFT; |
@@ -769,7 +772,7 @@ get_more_pages: | |||
769 | offset = (unsigned long long)page->index | 772 | offset = (unsigned long long)page->index |
770 | << PAGE_CACHE_SHIFT; | 773 | << PAGE_CACHE_SHIFT; |
771 | len = wsize; | 774 | len = wsize; |
772 | req = ceph_osdc_new_request(&client->osdc, | 775 | req = ceph_osdc_new_request(&fsc->client->osdc, |
773 | &ci->i_layout, | 776 | &ci->i_layout, |
774 | ceph_vino(inode), | 777 | ceph_vino(inode), |
775 | offset, &len, | 778 | offset, &len, |
@@ -782,7 +785,7 @@ get_more_pages: | |||
782 | &inode->i_mtime, true, 1); | 785 | &inode->i_mtime, true, 1); |
783 | max_pages = req->r_num_pages; | 786 | max_pages = req->r_num_pages; |
784 | 787 | ||
785 | alloc_page_vec(client, req); | 788 | alloc_page_vec(fsc, req); |
786 | req->r_callback = writepages_finish; | 789 | req->r_callback = writepages_finish; |
787 | req->r_inode = inode; | 790 | req->r_inode = inode; |
788 | } | 791 | } |
@@ -794,10 +797,10 @@ get_more_pages: | |||
794 | inode, page, page->index); | 797 | inode, page, page->index); |
795 | 798 | ||
796 | writeback_stat = | 799 | writeback_stat = |
797 | atomic_long_inc_return(&client->writeback_count); | 800 | atomic_long_inc_return(&fsc->writeback_count); |
798 | if (writeback_stat > CONGESTION_ON_THRESH( | 801 | if (writeback_stat > CONGESTION_ON_THRESH( |
799 | client->mount_args->congestion_kb)) { | 802 | fsc->mount_options->congestion_kb)) { |
800 | set_bdi_congested(&client->backing_dev_info, | 803 | set_bdi_congested(&fsc->backing_dev_info, |
801 | BLK_RW_ASYNC); | 804 | BLK_RW_ASYNC); |
802 | } | 805 | } |
803 | 806 | ||
@@ -846,7 +849,7 @@ get_more_pages: | |||
846 | op->payload_len = cpu_to_le32(len); | 849 | op->payload_len = cpu_to_le32(len); |
847 | req->r_request->hdr.data_len = cpu_to_le32(len); | 850 | req->r_request->hdr.data_len = cpu_to_le32(len); |
848 | 851 | ||
849 | ceph_osdc_start_request(&client->osdc, req, true); | 852 | ceph_osdc_start_request(&fsc->client->osdc, req, true); |
850 | req = NULL; | 853 | req = NULL; |
851 | 854 | ||
852 | /* continue? */ | 855 | /* continue? */ |
@@ -915,7 +918,7 @@ static int ceph_update_writeable_page(struct file *file, | |||
915 | { | 918 | { |
916 | struct inode *inode = file->f_dentry->d_inode; | 919 | struct inode *inode = file->f_dentry->d_inode; |
917 | struct ceph_inode_info *ci = ceph_inode(inode); | 920 | struct ceph_inode_info *ci = ceph_inode(inode); |
918 | struct ceph_mds_client *mdsc = &ceph_inode_to_client(inode)->mdsc; | 921 | struct ceph_mds_client *mdsc = ceph_inode_to_client(inode)->mdsc; |
919 | loff_t page_off = pos & PAGE_CACHE_MASK; | 922 | loff_t page_off = pos & PAGE_CACHE_MASK; |
920 | int pos_in_page = pos & ~PAGE_CACHE_MASK; | 923 | int pos_in_page = pos & ~PAGE_CACHE_MASK; |
921 | int end_in_page = pos_in_page + len; | 924 | int end_in_page = pos_in_page + len; |
@@ -1053,8 +1056,8 @@ static int ceph_write_end(struct file *file, struct address_space *mapping, | |||
1053 | struct page *page, void *fsdata) | 1056 | struct page *page, void *fsdata) |
1054 | { | 1057 | { |
1055 | struct inode *inode = file->f_dentry->d_inode; | 1058 | struct inode *inode = file->f_dentry->d_inode; |
1056 | struct ceph_client *client = ceph_inode_to_client(inode); | 1059 | struct ceph_fs_client *fsc = ceph_inode_to_client(inode); |
1057 | struct ceph_mds_client *mdsc = &client->mdsc; | 1060 | struct ceph_mds_client *mdsc = fsc->mdsc; |
1058 | unsigned from = pos & (PAGE_CACHE_SIZE - 1); | 1061 | unsigned from = pos & (PAGE_CACHE_SIZE - 1); |
1059 | int check_cap = 0; | 1062 | int check_cap = 0; |
1060 | 1063 | ||
@@ -1123,7 +1126,7 @@ static int ceph_page_mkwrite(struct vm_area_struct *vma, struct vm_fault *vmf) | |||
1123 | { | 1126 | { |
1124 | struct inode *inode = vma->vm_file->f_dentry->d_inode; | 1127 | struct inode *inode = vma->vm_file->f_dentry->d_inode; |
1125 | struct page *page = vmf->page; | 1128 | struct page *page = vmf->page; |
1126 | struct ceph_mds_client *mdsc = &ceph_inode_to_client(inode)->mdsc; | 1129 | struct ceph_mds_client *mdsc = ceph_inode_to_client(inode)->mdsc; |
1127 | loff_t off = page->index << PAGE_CACHE_SHIFT; | 1130 | loff_t off = page->index << PAGE_CACHE_SHIFT; |
1128 | loff_t size, len; | 1131 | loff_t size, len; |
1129 | int ret; | 1132 | int ret; |
diff --git a/fs/ceph/caps.c b/fs/ceph/caps.c index 5e9da996a151..3cff67cbb9c0 100644 --- a/fs/ceph/caps.c +++ b/fs/ceph/caps.c | |||
@@ -1,4 +1,4 @@ | |||
1 | #include "ceph_debug.h" | 1 | #include <linux/ceph/ceph_debug.h> |
2 | 2 | ||
3 | #include <linux/fs.h> | 3 | #include <linux/fs.h> |
4 | #include <linux/kernel.h> | 4 | #include <linux/kernel.h> |
@@ -9,8 +9,9 @@ | |||
9 | #include <linux/writeback.h> | 9 | #include <linux/writeback.h> |
10 | 10 | ||
11 | #include "super.h" | 11 | #include "super.h" |
12 | #include "decode.h" | 12 | #include "mds_client.h" |
13 | #include "messenger.h" | 13 | #include <linux/ceph/decode.h> |
14 | #include <linux/ceph/messenger.h> | ||
14 | 15 | ||
15 | /* | 16 | /* |
16 | * Capability management | 17 | * Capability management |
@@ -287,11 +288,11 @@ void ceph_put_cap(struct ceph_mds_client *mdsc, struct ceph_cap *cap) | |||
287 | spin_unlock(&mdsc->caps_list_lock); | 288 | spin_unlock(&mdsc->caps_list_lock); |
288 | } | 289 | } |
289 | 290 | ||
290 | void ceph_reservation_status(struct ceph_client *client, | 291 | void ceph_reservation_status(struct ceph_fs_client *fsc, |
291 | int *total, int *avail, int *used, int *reserved, | 292 | int *total, int *avail, int *used, int *reserved, |
292 | int *min) | 293 | int *min) |
293 | { | 294 | { |
294 | struct ceph_mds_client *mdsc = &client->mdsc; | 295 | struct ceph_mds_client *mdsc = fsc->mdsc; |
295 | 296 | ||
296 | if (total) | 297 | if (total) |
297 | *total = mdsc->caps_total_count; | 298 | *total = mdsc->caps_total_count; |
@@ -399,7 +400,7 @@ static void __insert_cap_node(struct ceph_inode_info *ci, | |||
399 | static void __cap_set_timeouts(struct ceph_mds_client *mdsc, | 400 | static void __cap_set_timeouts(struct ceph_mds_client *mdsc, |
400 | struct ceph_inode_info *ci) | 401 | struct ceph_inode_info *ci) |
401 | { | 402 | { |
402 | struct ceph_mount_args *ma = mdsc->client->mount_args; | 403 | struct ceph_mount_options *ma = mdsc->fsc->mount_options; |
403 | 404 | ||
404 | ci->i_hold_caps_min = round_jiffies(jiffies + | 405 | ci->i_hold_caps_min = round_jiffies(jiffies + |
405 | ma->caps_wanted_delay_min * HZ); | 406 | ma->caps_wanted_delay_min * HZ); |
@@ -515,7 +516,7 @@ int ceph_add_cap(struct inode *inode, | |||
515 | unsigned seq, unsigned mseq, u64 realmino, int flags, | 516 | unsigned seq, unsigned mseq, u64 realmino, int flags, |
516 | struct ceph_cap_reservation *caps_reservation) | 517 | struct ceph_cap_reservation *caps_reservation) |
517 | { | 518 | { |
518 | struct ceph_mds_client *mdsc = &ceph_inode_to_client(inode)->mdsc; | 519 | struct ceph_mds_client *mdsc = ceph_inode_to_client(inode)->mdsc; |
519 | struct ceph_inode_info *ci = ceph_inode(inode); | 520 | struct ceph_inode_info *ci = ceph_inode(inode); |
520 | struct ceph_cap *new_cap = NULL; | 521 | struct ceph_cap *new_cap = NULL; |
521 | struct ceph_cap *cap; | 522 | struct ceph_cap *cap; |
@@ -873,7 +874,7 @@ void __ceph_remove_cap(struct ceph_cap *cap) | |||
873 | struct ceph_mds_session *session = cap->session; | 874 | struct ceph_mds_session *session = cap->session; |
874 | struct ceph_inode_info *ci = cap->ci; | 875 | struct ceph_inode_info *ci = cap->ci; |
875 | struct ceph_mds_client *mdsc = | 876 | struct ceph_mds_client *mdsc = |
876 | &ceph_sb_to_client(ci->vfs_inode.i_sb)->mdsc; | 877 | ceph_sb_to_client(ci->vfs_inode.i_sb)->mdsc; |
877 | int removed = 0; | 878 | int removed = 0; |
878 | 879 | ||
879 | dout("__ceph_remove_cap %p from %p\n", cap, &ci->vfs_inode); | 880 | dout("__ceph_remove_cap %p from %p\n", cap, &ci->vfs_inode); |
@@ -1210,7 +1211,7 @@ void __ceph_flush_snaps(struct ceph_inode_info *ci, | |||
1210 | int mds; | 1211 | int mds; |
1211 | struct ceph_cap_snap *capsnap; | 1212 | struct ceph_cap_snap *capsnap; |
1212 | u32 mseq; | 1213 | u32 mseq; |
1213 | struct ceph_mds_client *mdsc = &ceph_inode_to_client(inode)->mdsc; | 1214 | struct ceph_mds_client *mdsc = ceph_inode_to_client(inode)->mdsc; |
1214 | struct ceph_mds_session *session = NULL; /* if session != NULL, we hold | 1215 | struct ceph_mds_session *session = NULL; /* if session != NULL, we hold |
1215 | session->s_mutex */ | 1216 | session->s_mutex */ |
1216 | u64 next_follows = 0; /* keep track of how far we've gotten through the | 1217 | u64 next_follows = 0; /* keep track of how far we've gotten through the |
@@ -1336,7 +1337,7 @@ static void ceph_flush_snaps(struct ceph_inode_info *ci) | |||
1336 | void __ceph_mark_dirty_caps(struct ceph_inode_info *ci, int mask) | 1337 | void __ceph_mark_dirty_caps(struct ceph_inode_info *ci, int mask) |
1337 | { | 1338 | { |
1338 | struct ceph_mds_client *mdsc = | 1339 | struct ceph_mds_client *mdsc = |
1339 | &ceph_sb_to_client(ci->vfs_inode.i_sb)->mdsc; | 1340 | ceph_sb_to_client(ci->vfs_inode.i_sb)->mdsc; |
1340 | struct inode *inode = &ci->vfs_inode; | 1341 | struct inode *inode = &ci->vfs_inode; |
1341 | int was = ci->i_dirty_caps; | 1342 | int was = ci->i_dirty_caps; |
1342 | int dirty = 0; | 1343 | int dirty = 0; |
@@ -1378,7 +1379,7 @@ void __ceph_mark_dirty_caps(struct ceph_inode_info *ci, int mask) | |||
1378 | static int __mark_caps_flushing(struct inode *inode, | 1379 | static int __mark_caps_flushing(struct inode *inode, |
1379 | struct ceph_mds_session *session) | 1380 | struct ceph_mds_session *session) |
1380 | { | 1381 | { |
1381 | struct ceph_mds_client *mdsc = &ceph_sb_to_client(inode->i_sb)->mdsc; | 1382 | struct ceph_mds_client *mdsc = ceph_sb_to_client(inode->i_sb)->mdsc; |
1382 | struct ceph_inode_info *ci = ceph_inode(inode); | 1383 | struct ceph_inode_info *ci = ceph_inode(inode); |
1383 | int flushing; | 1384 | int flushing; |
1384 | 1385 | ||
@@ -1462,8 +1463,8 @@ static int try_nonblocking_invalidate(struct inode *inode) | |||
1462 | void ceph_check_caps(struct ceph_inode_info *ci, int flags, | 1463 | void ceph_check_caps(struct ceph_inode_info *ci, int flags, |
1463 | struct ceph_mds_session *session) | 1464 | struct ceph_mds_session *session) |
1464 | { | 1465 | { |
1465 | struct ceph_client *client = ceph_inode_to_client(&ci->vfs_inode); | 1466 | struct ceph_fs_client *fsc = ceph_inode_to_client(&ci->vfs_inode); |
1466 | struct ceph_mds_client *mdsc = &client->mdsc; | 1467 | struct ceph_mds_client *mdsc = fsc->mdsc; |
1467 | struct inode *inode = &ci->vfs_inode; | 1468 | struct inode *inode = &ci->vfs_inode; |
1468 | struct ceph_cap *cap; | 1469 | struct ceph_cap *cap; |
1469 | int file_wanted, used; | 1470 | int file_wanted, used; |
@@ -1706,7 +1707,7 @@ ack: | |||
1706 | static int try_flush_caps(struct inode *inode, struct ceph_mds_session *session, | 1707 | static int try_flush_caps(struct inode *inode, struct ceph_mds_session *session, |
1707 | unsigned *flush_tid) | 1708 | unsigned *flush_tid) |
1708 | { | 1709 | { |
1709 | struct ceph_mds_client *mdsc = &ceph_sb_to_client(inode->i_sb)->mdsc; | 1710 | struct ceph_mds_client *mdsc = ceph_sb_to_client(inode->i_sb)->mdsc; |
1710 | struct ceph_inode_info *ci = ceph_inode(inode); | 1711 | struct ceph_inode_info *ci = ceph_inode(inode); |
1711 | int unlock_session = session ? 0 : 1; | 1712 | int unlock_session = session ? 0 : 1; |
1712 | int flushing = 0; | 1713 | int flushing = 0; |
@@ -1872,7 +1873,7 @@ int ceph_write_inode(struct inode *inode, struct writeback_control *wbc) | |||
1872 | caps_are_flushed(inode, flush_tid)); | 1873 | caps_are_flushed(inode, flush_tid)); |
1873 | } else { | 1874 | } else { |
1874 | struct ceph_mds_client *mdsc = | 1875 | struct ceph_mds_client *mdsc = |
1875 | &ceph_sb_to_client(inode->i_sb)->mdsc; | 1876 | ceph_sb_to_client(inode->i_sb)->mdsc; |
1876 | 1877 | ||
1877 | spin_lock(&inode->i_lock); | 1878 | spin_lock(&inode->i_lock); |
1878 | if (__ceph_caps_dirty(ci)) | 1879 | if (__ceph_caps_dirty(ci)) |
@@ -2465,7 +2466,7 @@ static void handle_cap_flush_ack(struct inode *inode, u64 flush_tid, | |||
2465 | __releases(inode->i_lock) | 2466 | __releases(inode->i_lock) |
2466 | { | 2467 | { |
2467 | struct ceph_inode_info *ci = ceph_inode(inode); | 2468 | struct ceph_inode_info *ci = ceph_inode(inode); |
2468 | struct ceph_mds_client *mdsc = &ceph_sb_to_client(inode->i_sb)->mdsc; | 2469 | struct ceph_mds_client *mdsc = ceph_sb_to_client(inode->i_sb)->mdsc; |
2469 | unsigned seq = le32_to_cpu(m->seq); | 2470 | unsigned seq = le32_to_cpu(m->seq); |
2470 | int dirty = le32_to_cpu(m->dirty); | 2471 | int dirty = le32_to_cpu(m->dirty); |
2471 | int cleaned = 0; | 2472 | int cleaned = 0; |
@@ -2713,7 +2714,7 @@ void ceph_handle_caps(struct ceph_mds_session *session, | |||
2713 | struct ceph_msg *msg) | 2714 | struct ceph_msg *msg) |
2714 | { | 2715 | { |
2715 | struct ceph_mds_client *mdsc = session->s_mdsc; | 2716 | struct ceph_mds_client *mdsc = session->s_mdsc; |
2716 | struct super_block *sb = mdsc->client->sb; | 2717 | struct super_block *sb = mdsc->fsc->sb; |
2717 | struct inode *inode; | 2718 | struct inode *inode; |
2718 | struct ceph_cap *cap; | 2719 | struct ceph_cap *cap; |
2719 | struct ceph_mds_caps *h; | 2720 | struct ceph_mds_caps *h; |
diff --git a/fs/ceph/ceph_frag.c b/fs/ceph/ceph_frag.c index ab6cf35c4091..bdce8b1fbd06 100644 --- a/fs/ceph/ceph_frag.c +++ b/fs/ceph/ceph_frag.c | |||
@@ -1,7 +1,8 @@ | |||
1 | /* | 1 | /* |
2 | * Ceph 'frag' type | 2 | * Ceph 'frag' type |
3 | */ | 3 | */ |
4 | #include "types.h" | 4 | #include <linux/module.h> |
5 | #include <linux/ceph/types.h> | ||
5 | 6 | ||
6 | int ceph_frag_compare(__u32 a, __u32 b) | 7 | int ceph_frag_compare(__u32 a, __u32 b) |
7 | { | 8 | { |
diff --git a/fs/ceph/debugfs.c b/fs/ceph/debugfs.c index 6fd8b20a8611..94fe1d284c3a 100644 --- a/fs/ceph/debugfs.c +++ b/fs/ceph/debugfs.c | |||
@@ -1,4 +1,4 @@ | |||
1 | #include "ceph_debug.h" | 1 | #include <linux/ceph/ceph_debug.h> |
2 | 2 | ||
3 | #include <linux/device.h> | 3 | #include <linux/device.h> |
4 | #include <linux/slab.h> | 4 | #include <linux/slab.h> |
@@ -7,143 +7,48 @@ | |||
7 | #include <linux/debugfs.h> | 7 | #include <linux/debugfs.h> |
8 | #include <linux/seq_file.h> | 8 | #include <linux/seq_file.h> |
9 | 9 | ||
10 | #include "super.h" | 10 | #include <linux/ceph/libceph.h> |
11 | #include "mds_client.h" | 11 | #include <linux/ceph/mon_client.h> |
12 | #include "mon_client.h" | 12 | #include <linux/ceph/auth.h> |
13 | #include "auth.h" | 13 | #include <linux/ceph/debugfs.h> |
14 | 14 | ||
15 | #ifdef CONFIG_DEBUG_FS | 15 | #ifdef CONFIG_DEBUG_FS |
16 | 16 | ||
17 | /* | 17 | #include "super.h" |
18 | * Implement /sys/kernel/debug/ceph fun | 18 | #include "mds_client.h" |
19 | * | ||
20 | * /sys/kernel/debug/ceph/client* - an instance of the ceph client | ||
21 | * .../osdmap - current osdmap | ||
22 | * .../mdsmap - current mdsmap | ||
23 | * .../monmap - current monmap | ||
24 | * .../osdc - active osd requests | ||
25 | * .../mdsc - active mds requests | ||
26 | * .../monc - mon client state | ||
27 | * .../dentry_lru - dump contents of dentry lru | ||
28 | * .../caps - expose cap (reservation) stats | ||
29 | * .../bdi - symlink to ../../bdi/something | ||
30 | */ | ||
31 | |||
32 | static struct dentry *ceph_debugfs_dir; | ||
33 | |||
34 | static int monmap_show(struct seq_file *s, void *p) | ||
35 | { | ||
36 | int i; | ||
37 | struct ceph_client *client = s->private; | ||
38 | |||
39 | if (client->monc.monmap == NULL) | ||
40 | return 0; | ||
41 | |||
42 | seq_printf(s, "epoch %d\n", client->monc.monmap->epoch); | ||
43 | for (i = 0; i < client->monc.monmap->num_mon; i++) { | ||
44 | struct ceph_entity_inst *inst = | ||
45 | &client->monc.monmap->mon_inst[i]; | ||
46 | |||
47 | seq_printf(s, "\t%s%lld\t%s\n", | ||
48 | ENTITY_NAME(inst->name), | ||
49 | pr_addr(&inst->addr.in_addr)); | ||
50 | } | ||
51 | return 0; | ||
52 | } | ||
53 | 19 | ||
54 | static int mdsmap_show(struct seq_file *s, void *p) | 20 | static int mdsmap_show(struct seq_file *s, void *p) |
55 | { | 21 | { |
56 | int i; | 22 | int i; |
57 | struct ceph_client *client = s->private; | 23 | struct ceph_fs_client *fsc = s->private; |
58 | 24 | ||
59 | if (client->mdsc.mdsmap == NULL) | 25 | if (fsc->mdsc == NULL || fsc->mdsc->mdsmap == NULL) |
60 | return 0; | 26 | return 0; |
61 | seq_printf(s, "epoch %d\n", client->mdsc.mdsmap->m_epoch); | 27 | seq_printf(s, "epoch %d\n", fsc->mdsc->mdsmap->m_epoch); |
62 | seq_printf(s, "root %d\n", client->mdsc.mdsmap->m_root); | 28 | seq_printf(s, "root %d\n", fsc->mdsc->mdsmap->m_root); |
63 | seq_printf(s, "session_timeout %d\n", | 29 | seq_printf(s, "session_timeout %d\n", |
64 | client->mdsc.mdsmap->m_session_timeout); | 30 | fsc->mdsc->mdsmap->m_session_timeout); |
65 | seq_printf(s, "session_autoclose %d\n", | 31 | seq_printf(s, "session_autoclose %d\n", |
66 | client->mdsc.mdsmap->m_session_autoclose); | 32 | fsc->mdsc->mdsmap->m_session_autoclose); |
67 | for (i = 0; i < client->mdsc.mdsmap->m_max_mds; i++) { | 33 | for (i = 0; i < fsc->mdsc->mdsmap->m_max_mds; i++) { |
68 | struct ceph_entity_addr *addr = | 34 | struct ceph_entity_addr *addr = |
69 | &client->mdsc.mdsmap->m_info[i].addr; | 35 | &fsc->mdsc->mdsmap->m_info[i].addr; |
70 | int state = client->mdsc.mdsmap->m_info[i].state; | 36 | int state = fsc->mdsc->mdsmap->m_info[i].state; |
71 | 37 | ||
72 | seq_printf(s, "\tmds%d\t%s\t(%s)\n", i, pr_addr(&addr->in_addr), | 38 | seq_printf(s, "\tmds%d\t%s\t(%s)\n", i, |
39 | ceph_pr_addr(&addr->in_addr), | ||
73 | ceph_mds_state_name(state)); | 40 | ceph_mds_state_name(state)); |
74 | } | 41 | } |
75 | return 0; | 42 | return 0; |
76 | } | 43 | } |
77 | 44 | ||
78 | static int osdmap_show(struct seq_file *s, void *p) | 45 | /* |
79 | { | 46 | * mdsc debugfs |
80 | int i; | 47 | */ |
81 | struct ceph_client *client = s->private; | ||
82 | struct rb_node *n; | ||
83 | |||
84 | if (client->osdc.osdmap == NULL) | ||
85 | return 0; | ||
86 | seq_printf(s, "epoch %d\n", client->osdc.osdmap->epoch); | ||
87 | seq_printf(s, "flags%s%s\n", | ||
88 | (client->osdc.osdmap->flags & CEPH_OSDMAP_NEARFULL) ? | ||
89 | " NEARFULL" : "", | ||
90 | (client->osdc.osdmap->flags & CEPH_OSDMAP_FULL) ? | ||
91 | " FULL" : ""); | ||
92 | for (n = rb_first(&client->osdc.osdmap->pg_pools); n; n = rb_next(n)) { | ||
93 | struct ceph_pg_pool_info *pool = | ||
94 | rb_entry(n, struct ceph_pg_pool_info, node); | ||
95 | seq_printf(s, "pg_pool %d pg_num %d / %d, lpg_num %d / %d\n", | ||
96 | pool->id, pool->v.pg_num, pool->pg_num_mask, | ||
97 | pool->v.lpg_num, pool->lpg_num_mask); | ||
98 | } | ||
99 | for (i = 0; i < client->osdc.osdmap->max_osd; i++) { | ||
100 | struct ceph_entity_addr *addr = | ||
101 | &client->osdc.osdmap->osd_addr[i]; | ||
102 | int state = client->osdc.osdmap->osd_state[i]; | ||
103 | char sb[64]; | ||
104 | |||
105 | seq_printf(s, "\tosd%d\t%s\t%3d%%\t(%s)\n", | ||
106 | i, pr_addr(&addr->in_addr), | ||
107 | ((client->osdc.osdmap->osd_weight[i]*100) >> 16), | ||
108 | ceph_osdmap_state_str(sb, sizeof(sb), state)); | ||
109 | } | ||
110 | return 0; | ||
111 | } | ||
112 | |||
113 | static int monc_show(struct seq_file *s, void *p) | ||
114 | { | ||
115 | struct ceph_client *client = s->private; | ||
116 | struct ceph_mon_generic_request *req; | ||
117 | struct ceph_mon_client *monc = &client->monc; | ||
118 | struct rb_node *rp; | ||
119 | |||
120 | mutex_lock(&monc->mutex); | ||
121 | |||
122 | if (monc->have_mdsmap) | ||
123 | seq_printf(s, "have mdsmap %u\n", (unsigned)monc->have_mdsmap); | ||
124 | if (monc->have_osdmap) | ||
125 | seq_printf(s, "have osdmap %u\n", (unsigned)monc->have_osdmap); | ||
126 | if (monc->want_next_osdmap) | ||
127 | seq_printf(s, "want next osdmap\n"); | ||
128 | |||
129 | for (rp = rb_first(&monc->generic_request_tree); rp; rp = rb_next(rp)) { | ||
130 | __u16 op; | ||
131 | req = rb_entry(rp, struct ceph_mon_generic_request, node); | ||
132 | op = le16_to_cpu(req->request->hdr.type); | ||
133 | if (op == CEPH_MSG_STATFS) | ||
134 | seq_printf(s, "%lld statfs\n", req->tid); | ||
135 | else | ||
136 | seq_printf(s, "%lld unknown\n", req->tid); | ||
137 | } | ||
138 | |||
139 | mutex_unlock(&monc->mutex); | ||
140 | return 0; | ||
141 | } | ||
142 | |||
143 | static int mdsc_show(struct seq_file *s, void *p) | 48 | static int mdsc_show(struct seq_file *s, void *p) |
144 | { | 49 | { |
145 | struct ceph_client *client = s->private; | 50 | struct ceph_fs_client *fsc = s->private; |
146 | struct ceph_mds_client *mdsc = &client->mdsc; | 51 | struct ceph_mds_client *mdsc = fsc->mdsc; |
147 | struct ceph_mds_request *req; | 52 | struct ceph_mds_request *req; |
148 | struct rb_node *rp; | 53 | struct rb_node *rp; |
149 | int pathlen; | 54 | int pathlen; |
@@ -214,61 +119,12 @@ static int mdsc_show(struct seq_file *s, void *p) | |||
214 | return 0; | 119 | return 0; |
215 | } | 120 | } |
216 | 121 | ||
217 | static int osdc_show(struct seq_file *s, void *pp) | ||
218 | { | ||
219 | struct ceph_client *client = s->private; | ||
220 | struct ceph_osd_client *osdc = &client->osdc; | ||
221 | struct rb_node *p; | ||
222 | |||
223 | mutex_lock(&osdc->request_mutex); | ||
224 | for (p = rb_first(&osdc->requests); p; p = rb_next(p)) { | ||
225 | struct ceph_osd_request *req; | ||
226 | struct ceph_osd_request_head *head; | ||
227 | struct ceph_osd_op *op; | ||
228 | int num_ops; | ||
229 | int opcode, olen; | ||
230 | int i; | ||
231 | |||
232 | req = rb_entry(p, struct ceph_osd_request, r_node); | ||
233 | |||
234 | seq_printf(s, "%lld\tosd%d\t%d.%x\t", req->r_tid, | ||
235 | req->r_osd ? req->r_osd->o_osd : -1, | ||
236 | le32_to_cpu(req->r_pgid.pool), | ||
237 | le16_to_cpu(req->r_pgid.ps)); | ||
238 | |||
239 | head = req->r_request->front.iov_base; | ||
240 | op = (void *)(head + 1); | ||
241 | |||
242 | num_ops = le16_to_cpu(head->num_ops); | ||
243 | olen = le32_to_cpu(head->object_len); | ||
244 | seq_printf(s, "%.*s", olen, | ||
245 | (const char *)(head->ops + num_ops)); | ||
246 | |||
247 | if (req->r_reassert_version.epoch) | ||
248 | seq_printf(s, "\t%u'%llu", | ||
249 | (unsigned)le32_to_cpu(req->r_reassert_version.epoch), | ||
250 | le64_to_cpu(req->r_reassert_version.version)); | ||
251 | else | ||
252 | seq_printf(s, "\t"); | ||
253 | |||
254 | for (i = 0; i < num_ops; i++) { | ||
255 | opcode = le16_to_cpu(op->op); | ||
256 | seq_printf(s, "\t%s", ceph_osd_op_name(opcode)); | ||
257 | op++; | ||
258 | } | ||
259 | |||
260 | seq_printf(s, "\n"); | ||
261 | } | ||
262 | mutex_unlock(&osdc->request_mutex); | ||
263 | return 0; | ||
264 | } | ||
265 | |||
266 | static int caps_show(struct seq_file *s, void *p) | 122 | static int caps_show(struct seq_file *s, void *p) |
267 | { | 123 | { |
268 | struct ceph_client *client = s->private; | 124 | struct ceph_fs_client *fsc = s->private; |
269 | int total, avail, used, reserved, min; | 125 | int total, avail, used, reserved, min; |
270 | 126 | ||
271 | ceph_reservation_status(client, &total, &avail, &used, &reserved, &min); | 127 | ceph_reservation_status(fsc, &total, &avail, &used, &reserved, &min); |
272 | seq_printf(s, "total\t\t%d\n" | 128 | seq_printf(s, "total\t\t%d\n" |
273 | "avail\t\t%d\n" | 129 | "avail\t\t%d\n" |
274 | "used\t\t%d\n" | 130 | "used\t\t%d\n" |
@@ -280,8 +136,8 @@ static int caps_show(struct seq_file *s, void *p) | |||
280 | 136 | ||
281 | static int dentry_lru_show(struct seq_file *s, void *ptr) | 137 | static int dentry_lru_show(struct seq_file *s, void *ptr) |
282 | { | 138 | { |
283 | struct ceph_client *client = s->private; | 139 | struct ceph_fs_client *fsc = s->private; |
284 | struct ceph_mds_client *mdsc = &client->mdsc; | 140 | struct ceph_mds_client *mdsc = fsc->mdsc; |
285 | struct ceph_dentry_info *di; | 141 | struct ceph_dentry_info *di; |
286 | 142 | ||
287 | spin_lock(&mdsc->dentry_lru_lock); | 143 | spin_lock(&mdsc->dentry_lru_lock); |
@@ -295,199 +151,124 @@ static int dentry_lru_show(struct seq_file *s, void *ptr) | |||
295 | return 0; | 151 | return 0; |
296 | } | 152 | } |
297 | 153 | ||
298 | #define DEFINE_SHOW_FUNC(name) \ | 154 | CEPH_DEFINE_SHOW_FUNC(mdsmap_show) |
299 | static int name##_open(struct inode *inode, struct file *file) \ | 155 | CEPH_DEFINE_SHOW_FUNC(mdsc_show) |
300 | { \ | 156 | CEPH_DEFINE_SHOW_FUNC(caps_show) |
301 | struct seq_file *sf; \ | 157 | CEPH_DEFINE_SHOW_FUNC(dentry_lru_show) |
302 | int ret; \ | 158 | |
303 | \ | ||
304 | ret = single_open(file, name, NULL); \ | ||
305 | sf = file->private_data; \ | ||
306 | sf->private = inode->i_private; \ | ||
307 | return ret; \ | ||
308 | } \ | ||
309 | \ | ||
310 | static const struct file_operations name##_fops = { \ | ||
311 | .open = name##_open, \ | ||
312 | .read = seq_read, \ | ||
313 | .llseek = seq_lseek, \ | ||
314 | .release = single_release, \ | ||
315 | }; | ||
316 | |||
317 | DEFINE_SHOW_FUNC(monmap_show) | ||
318 | DEFINE_SHOW_FUNC(mdsmap_show) | ||
319 | DEFINE_SHOW_FUNC(osdmap_show) | ||
320 | DEFINE_SHOW_FUNC(monc_show) | ||
321 | DEFINE_SHOW_FUNC(mdsc_show) | ||
322 | DEFINE_SHOW_FUNC(osdc_show) | ||
323 | DEFINE_SHOW_FUNC(dentry_lru_show) | ||
324 | DEFINE_SHOW_FUNC(caps_show) | ||
325 | 159 | ||
160 | /* | ||
161 | * debugfs | ||
162 | */ | ||
326 | static int congestion_kb_set(void *data, u64 val) | 163 | static int congestion_kb_set(void *data, u64 val) |
327 | { | 164 | { |
328 | struct ceph_client *client = (struct ceph_client *)data; | 165 | struct ceph_fs_client *fsc = (struct ceph_fs_client *)data; |
329 | |||
330 | if (client) | ||
331 | client->mount_args->congestion_kb = (int)val; | ||
332 | 166 | ||
167 | fsc->mount_options->congestion_kb = (int)val; | ||
333 | return 0; | 168 | return 0; |
334 | } | 169 | } |
335 | 170 | ||
336 | static int congestion_kb_get(void *data, u64 *val) | 171 | static int congestion_kb_get(void *data, u64 *val) |
337 | { | 172 | { |
338 | struct ceph_client *client = (struct ceph_client *)data; | 173 | struct ceph_fs_client *fsc = (struct ceph_fs_client *)data; |
339 | |||
340 | if (client) | ||
341 | *val = (u64)client->mount_args->congestion_kb; | ||
342 | 174 | ||
175 | *val = (u64)fsc->mount_options->congestion_kb; | ||
343 | return 0; | 176 | return 0; |
344 | } | 177 | } |
345 | 178 | ||
346 | |||
347 | DEFINE_SIMPLE_ATTRIBUTE(congestion_kb_fops, congestion_kb_get, | 179 | DEFINE_SIMPLE_ATTRIBUTE(congestion_kb_fops, congestion_kb_get, |
348 | congestion_kb_set, "%llu\n"); | 180 | congestion_kb_set, "%llu\n"); |
349 | 181 | ||
350 | int __init ceph_debugfs_init(void) | ||
351 | { | ||
352 | ceph_debugfs_dir = debugfs_create_dir("ceph", NULL); | ||
353 | if (!ceph_debugfs_dir) | ||
354 | return -ENOMEM; | ||
355 | return 0; | ||
356 | } | ||
357 | 182 | ||
358 | void ceph_debugfs_cleanup(void) | 183 | void ceph_fs_debugfs_cleanup(struct ceph_fs_client *fsc) |
359 | { | 184 | { |
360 | debugfs_remove(ceph_debugfs_dir); | 185 | dout("ceph_fs_debugfs_cleanup\n"); |
186 | debugfs_remove(fsc->debugfs_bdi); | ||
187 | debugfs_remove(fsc->debugfs_congestion_kb); | ||
188 | debugfs_remove(fsc->debugfs_mdsmap); | ||
189 | debugfs_remove(fsc->debugfs_caps); | ||
190 | debugfs_remove(fsc->debugfs_mdsc); | ||
191 | debugfs_remove(fsc->debugfs_dentry_lru); | ||
361 | } | 192 | } |
362 | 193 | ||
363 | int ceph_debugfs_client_init(struct ceph_client *client) | 194 | int ceph_fs_debugfs_init(struct ceph_fs_client *fsc) |
364 | { | 195 | { |
365 | int ret = 0; | 196 | char name[100]; |
366 | char name[80]; | 197 | int err = -ENOMEM; |
367 | |||
368 | snprintf(name, sizeof(name), "%pU.client%lld", &client->fsid, | ||
369 | client->monc.auth->global_id); | ||
370 | |||
371 | client->debugfs_dir = debugfs_create_dir(name, ceph_debugfs_dir); | ||
372 | if (!client->debugfs_dir) | ||
373 | goto out; | ||
374 | 198 | ||
375 | client->monc.debugfs_file = debugfs_create_file("monc", | 199 | dout("ceph_fs_debugfs_init\n"); |
376 | 0600, | 200 | fsc->debugfs_congestion_kb = |
377 | client->debugfs_dir, | 201 | debugfs_create_file("writeback_congestion_kb", |
378 | client, | 202 | 0600, |
379 | &monc_show_fops); | 203 | fsc->client->debugfs_dir, |
380 | if (!client->monc.debugfs_file) | 204 | fsc, |
381 | goto out; | 205 | &congestion_kb_fops); |
382 | 206 | if (!fsc->debugfs_congestion_kb) | |
383 | client->mdsc.debugfs_file = debugfs_create_file("mdsc", | ||
384 | 0600, | ||
385 | client->debugfs_dir, | ||
386 | client, | ||
387 | &mdsc_show_fops); | ||
388 | if (!client->mdsc.debugfs_file) | ||
389 | goto out; | 207 | goto out; |
390 | 208 | ||
391 | client->osdc.debugfs_file = debugfs_create_file("osdc", | 209 | dout("a\n"); |
392 | 0600, | ||
393 | client->debugfs_dir, | ||
394 | client, | ||
395 | &osdc_show_fops); | ||
396 | if (!client->osdc.debugfs_file) | ||
397 | goto out; | ||
398 | 210 | ||
399 | client->debugfs_monmap = debugfs_create_file("monmap", | 211 | snprintf(name, sizeof(name), "../../bdi/%s", |
400 | 0600, | 212 | dev_name(fsc->backing_dev_info.dev)); |
401 | client->debugfs_dir, | 213 | fsc->debugfs_bdi = |
402 | client, | 214 | debugfs_create_symlink("bdi", |
403 | &monmap_show_fops); | 215 | fsc->client->debugfs_dir, |
404 | if (!client->debugfs_monmap) | 216 | name); |
217 | if (!fsc->debugfs_bdi) | ||
405 | goto out; | 218 | goto out; |
406 | 219 | ||
407 | client->debugfs_mdsmap = debugfs_create_file("mdsmap", | 220 | dout("b\n"); |
221 | fsc->debugfs_mdsmap = debugfs_create_file("mdsmap", | ||
408 | 0600, | 222 | 0600, |
409 | client->debugfs_dir, | 223 | fsc->client->debugfs_dir, |
410 | client, | 224 | fsc, |
411 | &mdsmap_show_fops); | 225 | &mdsmap_show_fops); |
412 | if (!client->debugfs_mdsmap) | 226 | if (!fsc->debugfs_mdsmap) |
413 | goto out; | 227 | goto out; |
414 | 228 | ||
415 | client->debugfs_osdmap = debugfs_create_file("osdmap", | 229 | dout("ca\n"); |
416 | 0600, | 230 | fsc->debugfs_mdsc = debugfs_create_file("mdsc", |
417 | client->debugfs_dir, | 231 | 0600, |
418 | client, | 232 | fsc->client->debugfs_dir, |
419 | &osdmap_show_fops); | 233 | fsc, |
420 | if (!client->debugfs_osdmap) | 234 | &mdsc_show_fops); |
235 | if (!fsc->debugfs_mdsc) | ||
421 | goto out; | 236 | goto out; |
422 | 237 | ||
423 | client->debugfs_dentry_lru = debugfs_create_file("dentry_lru", | 238 | dout("da\n"); |
424 | 0600, | 239 | fsc->debugfs_caps = debugfs_create_file("caps", |
425 | client->debugfs_dir, | ||
426 | client, | ||
427 | &dentry_lru_show_fops); | ||
428 | if (!client->debugfs_dentry_lru) | ||
429 | goto out; | ||
430 | |||
431 | client->debugfs_caps = debugfs_create_file("caps", | ||
432 | 0400, | 240 | 0400, |
433 | client->debugfs_dir, | 241 | fsc->client->debugfs_dir, |
434 | client, | 242 | fsc, |
435 | &caps_show_fops); | 243 | &caps_show_fops); |
436 | if (!client->debugfs_caps) | 244 | if (!fsc->debugfs_caps) |
437 | goto out; | 245 | goto out; |
438 | 246 | ||
439 | client->debugfs_congestion_kb = | 247 | dout("ea\n"); |
440 | debugfs_create_file("writeback_congestion_kb", | 248 | fsc->debugfs_dentry_lru = debugfs_create_file("dentry_lru", |
441 | 0600, | 249 | 0600, |
442 | client->debugfs_dir, | 250 | fsc->client->debugfs_dir, |
443 | client, | 251 | fsc, |
444 | &congestion_kb_fops); | 252 | &dentry_lru_show_fops); |
445 | if (!client->debugfs_congestion_kb) | 253 | if (!fsc->debugfs_dentry_lru) |
446 | goto out; | 254 | goto out; |
447 | 255 | ||
448 | sprintf(name, "../../bdi/%s", dev_name(client->sb->s_bdi->dev)); | ||
449 | client->debugfs_bdi = debugfs_create_symlink("bdi", client->debugfs_dir, | ||
450 | name); | ||
451 | |||
452 | return 0; | 256 | return 0; |
453 | 257 | ||
454 | out: | 258 | out: |
455 | ceph_debugfs_client_cleanup(client); | 259 | ceph_fs_debugfs_cleanup(fsc); |
456 | return ret; | 260 | return err; |
457 | } | 261 | } |
458 | 262 | ||
459 | void ceph_debugfs_client_cleanup(struct ceph_client *client) | ||
460 | { | ||
461 | debugfs_remove(client->debugfs_bdi); | ||
462 | debugfs_remove(client->debugfs_caps); | ||
463 | debugfs_remove(client->debugfs_dentry_lru); | ||
464 | debugfs_remove(client->debugfs_osdmap); | ||
465 | debugfs_remove(client->debugfs_mdsmap); | ||
466 | debugfs_remove(client->debugfs_monmap); | ||
467 | debugfs_remove(client->osdc.debugfs_file); | ||
468 | debugfs_remove(client->mdsc.debugfs_file); | ||
469 | debugfs_remove(client->monc.debugfs_file); | ||
470 | debugfs_remove(client->debugfs_congestion_kb); | ||
471 | debugfs_remove(client->debugfs_dir); | ||
472 | } | ||
473 | 263 | ||
474 | #else /* CONFIG_DEBUG_FS */ | 264 | #else /* CONFIG_DEBUG_FS */ |
475 | 265 | ||
476 | int __init ceph_debugfs_init(void) | 266 | int ceph_fs_debugfs_init(struct ceph_fs_client *fsc) |
477 | { | ||
478 | return 0; | ||
479 | } | ||
480 | |||
481 | void ceph_debugfs_cleanup(void) | ||
482 | { | ||
483 | } | ||
484 | |||
485 | int ceph_debugfs_client_init(struct ceph_client *client) | ||
486 | { | 267 | { |
487 | return 0; | 268 | return 0; |
488 | } | 269 | } |
489 | 270 | ||
490 | void ceph_debugfs_client_cleanup(struct ceph_client *client) | 271 | void ceph_fs_debugfs_cleanup(struct ceph_fs_client *fsc) |
491 | { | 272 | { |
492 | } | 273 | } |
493 | 274 | ||
diff --git a/fs/ceph/dir.c b/fs/ceph/dir.c index a1986eb52045..a8d2aacc612b 100644 --- a/fs/ceph/dir.c +++ b/fs/ceph/dir.c | |||
@@ -1,4 +1,4 @@ | |||
1 | #include "ceph_debug.h" | 1 | #include <linux/ceph/ceph_debug.h> |
2 | 2 | ||
3 | #include <linux/spinlock.h> | 3 | #include <linux/spinlock.h> |
4 | #include <linux/fs_struct.h> | 4 | #include <linux/fs_struct.h> |
@@ -7,6 +7,7 @@ | |||
7 | #include <linux/sched.h> | 7 | #include <linux/sched.h> |
8 | 8 | ||
9 | #include "super.h" | 9 | #include "super.h" |
10 | #include "mds_client.h" | ||
10 | 11 | ||
11 | /* | 12 | /* |
12 | * Directory operations: readdir, lookup, create, link, unlink, | 13 | * Directory operations: readdir, lookup, create, link, unlink, |
@@ -227,15 +228,15 @@ static int ceph_readdir(struct file *filp, void *dirent, filldir_t filldir) | |||
227 | struct ceph_file_info *fi = filp->private_data; | 228 | struct ceph_file_info *fi = filp->private_data; |
228 | struct inode *inode = filp->f_dentry->d_inode; | 229 | struct inode *inode = filp->f_dentry->d_inode; |
229 | struct ceph_inode_info *ci = ceph_inode(inode); | 230 | struct ceph_inode_info *ci = ceph_inode(inode); |
230 | struct ceph_client *client = ceph_inode_to_client(inode); | 231 | struct ceph_fs_client *fsc = ceph_inode_to_client(inode); |
231 | struct ceph_mds_client *mdsc = &client->mdsc; | 232 | struct ceph_mds_client *mdsc = fsc->mdsc; |
232 | unsigned frag = fpos_frag(filp->f_pos); | 233 | unsigned frag = fpos_frag(filp->f_pos); |
233 | int off = fpos_off(filp->f_pos); | 234 | int off = fpos_off(filp->f_pos); |
234 | int err; | 235 | int err; |
235 | u32 ftype; | 236 | u32 ftype; |
236 | struct ceph_mds_reply_info_parsed *rinfo; | 237 | struct ceph_mds_reply_info_parsed *rinfo; |
237 | const int max_entries = client->mount_args->max_readdir; | 238 | const int max_entries = fsc->mount_options->max_readdir; |
238 | const int max_bytes = client->mount_args->max_readdir_bytes; | 239 | const int max_bytes = fsc->mount_options->max_readdir_bytes; |
239 | 240 | ||
240 | dout("readdir %p filp %p frag %u off %u\n", inode, filp, frag, off); | 241 | dout("readdir %p filp %p frag %u off %u\n", inode, filp, frag, off); |
241 | if (fi->at_end) | 242 | if (fi->at_end) |
@@ -267,7 +268,7 @@ static int ceph_readdir(struct file *filp, void *dirent, filldir_t filldir) | |||
267 | /* can we use the dcache? */ | 268 | /* can we use the dcache? */ |
268 | spin_lock(&inode->i_lock); | 269 | spin_lock(&inode->i_lock); |
269 | if ((filp->f_pos == 2 || fi->dentry) && | 270 | if ((filp->f_pos == 2 || fi->dentry) && |
270 | !ceph_test_opt(client, NOASYNCREADDIR) && | 271 | !ceph_test_mount_opt(fsc, NOASYNCREADDIR) && |
271 | ceph_snap(inode) != CEPH_SNAPDIR && | 272 | ceph_snap(inode) != CEPH_SNAPDIR && |
272 | (ci->i_ceph_flags & CEPH_I_COMPLETE) && | 273 | (ci->i_ceph_flags & CEPH_I_COMPLETE) && |
273 | __ceph_caps_issued_mask(ci, CEPH_CAP_FILE_SHARED, 1)) { | 274 | __ceph_caps_issued_mask(ci, CEPH_CAP_FILE_SHARED, 1)) { |
@@ -487,14 +488,14 @@ static loff_t ceph_dir_llseek(struct file *file, loff_t offset, int origin) | |||
487 | struct dentry *ceph_finish_lookup(struct ceph_mds_request *req, | 488 | struct dentry *ceph_finish_lookup(struct ceph_mds_request *req, |
488 | struct dentry *dentry, int err) | 489 | struct dentry *dentry, int err) |
489 | { | 490 | { |
490 | struct ceph_client *client = ceph_sb_to_client(dentry->d_sb); | 491 | struct ceph_fs_client *fsc = ceph_sb_to_client(dentry->d_sb); |
491 | struct inode *parent = dentry->d_parent->d_inode; | 492 | struct inode *parent = dentry->d_parent->d_inode; |
492 | 493 | ||
493 | /* .snap dir? */ | 494 | /* .snap dir? */ |
494 | if (err == -ENOENT && | 495 | if (err == -ENOENT && |
495 | ceph_vino(parent).ino != CEPH_INO_ROOT && /* no .snap in root dir */ | 496 | ceph_vino(parent).ino != CEPH_INO_ROOT && /* no .snap in root dir */ |
496 | strcmp(dentry->d_name.name, | 497 | strcmp(dentry->d_name.name, |
497 | client->mount_args->snapdir_name) == 0) { | 498 | fsc->mount_options->snapdir_name) == 0) { |
498 | struct inode *inode = ceph_get_snapdir(parent); | 499 | struct inode *inode = ceph_get_snapdir(parent); |
499 | dout("ENOENT on snapdir %p '%.*s', linking to snapdir %p\n", | 500 | dout("ENOENT on snapdir %p '%.*s', linking to snapdir %p\n", |
500 | dentry, dentry->d_name.len, dentry->d_name.name, inode); | 501 | dentry, dentry->d_name.len, dentry->d_name.name, inode); |
@@ -539,8 +540,8 @@ static int is_root_ceph_dentry(struct inode *inode, struct dentry *dentry) | |||
539 | static struct dentry *ceph_lookup(struct inode *dir, struct dentry *dentry, | 540 | static struct dentry *ceph_lookup(struct inode *dir, struct dentry *dentry, |
540 | struct nameidata *nd) | 541 | struct nameidata *nd) |
541 | { | 542 | { |
542 | struct ceph_client *client = ceph_sb_to_client(dir->i_sb); | 543 | struct ceph_fs_client *fsc = ceph_sb_to_client(dir->i_sb); |
543 | struct ceph_mds_client *mdsc = &client->mdsc; | 544 | struct ceph_mds_client *mdsc = fsc->mdsc; |
544 | struct ceph_mds_request *req; | 545 | struct ceph_mds_request *req; |
545 | int op; | 546 | int op; |
546 | int err; | 547 | int err; |
@@ -572,7 +573,7 @@ static struct dentry *ceph_lookup(struct inode *dir, struct dentry *dentry, | |||
572 | spin_lock(&dir->i_lock); | 573 | spin_lock(&dir->i_lock); |
573 | dout(" dir %p flags are %d\n", dir, ci->i_ceph_flags); | 574 | dout(" dir %p flags are %d\n", dir, ci->i_ceph_flags); |
574 | if (strncmp(dentry->d_name.name, | 575 | if (strncmp(dentry->d_name.name, |
575 | client->mount_args->snapdir_name, | 576 | fsc->mount_options->snapdir_name, |
576 | dentry->d_name.len) && | 577 | dentry->d_name.len) && |
577 | !is_root_ceph_dentry(dir, dentry) && | 578 | !is_root_ceph_dentry(dir, dentry) && |
578 | (ci->i_ceph_flags & CEPH_I_COMPLETE) && | 579 | (ci->i_ceph_flags & CEPH_I_COMPLETE) && |
@@ -629,8 +630,8 @@ int ceph_handle_notrace_create(struct inode *dir, struct dentry *dentry) | |||
629 | static int ceph_mknod(struct inode *dir, struct dentry *dentry, | 630 | static int ceph_mknod(struct inode *dir, struct dentry *dentry, |
630 | int mode, dev_t rdev) | 631 | int mode, dev_t rdev) |
631 | { | 632 | { |
632 | struct ceph_client *client = ceph_sb_to_client(dir->i_sb); | 633 | struct ceph_fs_client *fsc = ceph_sb_to_client(dir->i_sb); |
633 | struct ceph_mds_client *mdsc = &client->mdsc; | 634 | struct ceph_mds_client *mdsc = fsc->mdsc; |
634 | struct ceph_mds_request *req; | 635 | struct ceph_mds_request *req; |
635 | int err; | 636 | int err; |
636 | 637 | ||
@@ -685,8 +686,8 @@ static int ceph_create(struct inode *dir, struct dentry *dentry, int mode, | |||
685 | static int ceph_symlink(struct inode *dir, struct dentry *dentry, | 686 | static int ceph_symlink(struct inode *dir, struct dentry *dentry, |
686 | const char *dest) | 687 | const char *dest) |
687 | { | 688 | { |
688 | struct ceph_client *client = ceph_sb_to_client(dir->i_sb); | 689 | struct ceph_fs_client *fsc = ceph_sb_to_client(dir->i_sb); |
689 | struct ceph_mds_client *mdsc = &client->mdsc; | 690 | struct ceph_mds_client *mdsc = fsc->mdsc; |
690 | struct ceph_mds_request *req; | 691 | struct ceph_mds_request *req; |
691 | int err; | 692 | int err; |
692 | 693 | ||
@@ -716,8 +717,8 @@ static int ceph_symlink(struct inode *dir, struct dentry *dentry, | |||
716 | 717 | ||
717 | static int ceph_mkdir(struct inode *dir, struct dentry *dentry, int mode) | 718 | static int ceph_mkdir(struct inode *dir, struct dentry *dentry, int mode) |
718 | { | 719 | { |
719 | struct ceph_client *client = ceph_sb_to_client(dir->i_sb); | 720 | struct ceph_fs_client *fsc = ceph_sb_to_client(dir->i_sb); |
720 | struct ceph_mds_client *mdsc = &client->mdsc; | 721 | struct ceph_mds_client *mdsc = fsc->mdsc; |
721 | struct ceph_mds_request *req; | 722 | struct ceph_mds_request *req; |
722 | int err = -EROFS; | 723 | int err = -EROFS; |
723 | int op; | 724 | int op; |
@@ -758,8 +759,8 @@ out: | |||
758 | static int ceph_link(struct dentry *old_dentry, struct inode *dir, | 759 | static int ceph_link(struct dentry *old_dentry, struct inode *dir, |
759 | struct dentry *dentry) | 760 | struct dentry *dentry) |
760 | { | 761 | { |
761 | struct ceph_client *client = ceph_sb_to_client(dir->i_sb); | 762 | struct ceph_fs_client *fsc = ceph_sb_to_client(dir->i_sb); |
762 | struct ceph_mds_client *mdsc = &client->mdsc; | 763 | struct ceph_mds_client *mdsc = fsc->mdsc; |
763 | struct ceph_mds_request *req; | 764 | struct ceph_mds_request *req; |
764 | int err; | 765 | int err; |
765 | 766 | ||
@@ -813,8 +814,8 @@ static int drop_caps_for_unlink(struct inode *inode) | |||
813 | */ | 814 | */ |
814 | static int ceph_unlink(struct inode *dir, struct dentry *dentry) | 815 | static int ceph_unlink(struct inode *dir, struct dentry *dentry) |
815 | { | 816 | { |
816 | struct ceph_client *client = ceph_sb_to_client(dir->i_sb); | 817 | struct ceph_fs_client *fsc = ceph_sb_to_client(dir->i_sb); |
817 | struct ceph_mds_client *mdsc = &client->mdsc; | 818 | struct ceph_mds_client *mdsc = fsc->mdsc; |
818 | struct inode *inode = dentry->d_inode; | 819 | struct inode *inode = dentry->d_inode; |
819 | struct ceph_mds_request *req; | 820 | struct ceph_mds_request *req; |
820 | int err = -EROFS; | 821 | int err = -EROFS; |
@@ -854,8 +855,8 @@ out: | |||
854 | static int ceph_rename(struct inode *old_dir, struct dentry *old_dentry, | 855 | static int ceph_rename(struct inode *old_dir, struct dentry *old_dentry, |
855 | struct inode *new_dir, struct dentry *new_dentry) | 856 | struct inode *new_dir, struct dentry *new_dentry) |
856 | { | 857 | { |
857 | struct ceph_client *client = ceph_sb_to_client(old_dir->i_sb); | 858 | struct ceph_fs_client *fsc = ceph_sb_to_client(old_dir->i_sb); |
858 | struct ceph_mds_client *mdsc = &client->mdsc; | 859 | struct ceph_mds_client *mdsc = fsc->mdsc; |
859 | struct ceph_mds_request *req; | 860 | struct ceph_mds_request *req; |
860 | int err; | 861 | int err; |
861 | 862 | ||
@@ -1076,7 +1077,7 @@ static ssize_t ceph_read_dir(struct file *file, char __user *buf, size_t size, | |||
1076 | struct ceph_inode_info *ci = ceph_inode(inode); | 1077 | struct ceph_inode_info *ci = ceph_inode(inode); |
1077 | int left; | 1078 | int left; |
1078 | 1079 | ||
1079 | if (!ceph_test_opt(ceph_sb_to_client(inode->i_sb), DIRSTAT)) | 1080 | if (!ceph_test_mount_opt(ceph_sb_to_client(inode->i_sb), DIRSTAT)) |
1080 | return -EISDIR; | 1081 | return -EISDIR; |
1081 | 1082 | ||
1082 | if (!cf->dir_info) { | 1083 | if (!cf->dir_info) { |
@@ -1177,7 +1178,7 @@ void ceph_dentry_lru_add(struct dentry *dn) | |||
1177 | dout("dentry_lru_add %p %p '%.*s'\n", di, dn, | 1178 | dout("dentry_lru_add %p %p '%.*s'\n", di, dn, |
1178 | dn->d_name.len, dn->d_name.name); | 1179 | dn->d_name.len, dn->d_name.name); |
1179 | if (di) { | 1180 | if (di) { |
1180 | mdsc = &ceph_sb_to_client(dn->d_sb)->mdsc; | 1181 | mdsc = ceph_sb_to_client(dn->d_sb)->mdsc; |
1181 | spin_lock(&mdsc->dentry_lru_lock); | 1182 | spin_lock(&mdsc->dentry_lru_lock); |
1182 | list_add_tail(&di->lru, &mdsc->dentry_lru); | 1183 | list_add_tail(&di->lru, &mdsc->dentry_lru); |
1183 | mdsc->num_dentry++; | 1184 | mdsc->num_dentry++; |
@@ -1193,7 +1194,7 @@ void ceph_dentry_lru_touch(struct dentry *dn) | |||
1193 | dout("dentry_lru_touch %p %p '%.*s' (offset %lld)\n", di, dn, | 1194 | dout("dentry_lru_touch %p %p '%.*s' (offset %lld)\n", di, dn, |
1194 | dn->d_name.len, dn->d_name.name, di->offset); | 1195 | dn->d_name.len, dn->d_name.name, di->offset); |
1195 | if (di) { | 1196 | if (di) { |
1196 | mdsc = &ceph_sb_to_client(dn->d_sb)->mdsc; | 1197 | mdsc = ceph_sb_to_client(dn->d_sb)->mdsc; |
1197 | spin_lock(&mdsc->dentry_lru_lock); | 1198 | spin_lock(&mdsc->dentry_lru_lock); |
1198 | list_move_tail(&di->lru, &mdsc->dentry_lru); | 1199 | list_move_tail(&di->lru, &mdsc->dentry_lru); |
1199 | spin_unlock(&mdsc->dentry_lru_lock); | 1200 | spin_unlock(&mdsc->dentry_lru_lock); |
@@ -1208,7 +1209,7 @@ void ceph_dentry_lru_del(struct dentry *dn) | |||
1208 | dout("dentry_lru_del %p %p '%.*s'\n", di, dn, | 1209 | dout("dentry_lru_del %p %p '%.*s'\n", di, dn, |
1209 | dn->d_name.len, dn->d_name.name); | 1210 | dn->d_name.len, dn->d_name.name); |
1210 | if (di) { | 1211 | if (di) { |
1211 | mdsc = &ceph_sb_to_client(dn->d_sb)->mdsc; | 1212 | mdsc = ceph_sb_to_client(dn->d_sb)->mdsc; |
1212 | spin_lock(&mdsc->dentry_lru_lock); | 1213 | spin_lock(&mdsc->dentry_lru_lock); |
1213 | list_del_init(&di->lru); | 1214 | list_del_init(&di->lru); |
1214 | mdsc->num_dentry--; | 1215 | mdsc->num_dentry--; |
diff --git a/fs/ceph/export.c b/fs/ceph/export.c index e38423e82f2e..2297d9426992 100644 --- a/fs/ceph/export.c +++ b/fs/ceph/export.c | |||
@@ -1,10 +1,11 @@ | |||
1 | #include "ceph_debug.h" | 1 | #include <linux/ceph/ceph_debug.h> |
2 | 2 | ||
3 | #include <linux/exportfs.h> | 3 | #include <linux/exportfs.h> |
4 | #include <linux/slab.h> | 4 | #include <linux/slab.h> |
5 | #include <asm/unaligned.h> | 5 | #include <asm/unaligned.h> |
6 | 6 | ||
7 | #include "super.h" | 7 | #include "super.h" |
8 | #include "mds_client.h" | ||
8 | 9 | ||
9 | /* | 10 | /* |
10 | * NFS export support | 11 | * NFS export support |
@@ -120,7 +121,7 @@ static struct dentry *__fh_to_dentry(struct super_block *sb, | |||
120 | static struct dentry *__cfh_to_dentry(struct super_block *sb, | 121 | static struct dentry *__cfh_to_dentry(struct super_block *sb, |
121 | struct ceph_nfs_confh *cfh) | 122 | struct ceph_nfs_confh *cfh) |
122 | { | 123 | { |
123 | struct ceph_mds_client *mdsc = &ceph_sb_to_client(sb)->mdsc; | 124 | struct ceph_mds_client *mdsc = ceph_sb_to_client(sb)->mdsc; |
124 | struct inode *inode; | 125 | struct inode *inode; |
125 | struct dentry *dentry; | 126 | struct dentry *dentry; |
126 | struct ceph_vino vino; | 127 | struct ceph_vino vino; |
diff --git a/fs/ceph/file.c b/fs/ceph/file.c index 66e4da6dba22..e77c28cf3690 100644 --- a/fs/ceph/file.c +++ b/fs/ceph/file.c | |||
@@ -1,5 +1,6 @@ | |||
1 | #include "ceph_debug.h" | 1 | #include <linux/ceph/ceph_debug.h> |
2 | 2 | ||
3 | #include <linux/module.h> | ||
3 | #include <linux/sched.h> | 4 | #include <linux/sched.h> |
4 | #include <linux/slab.h> | 5 | #include <linux/slab.h> |
5 | #include <linux/file.h> | 6 | #include <linux/file.h> |
@@ -38,8 +39,8 @@ | |||
38 | static struct ceph_mds_request * | 39 | static struct ceph_mds_request * |
39 | prepare_open_request(struct super_block *sb, int flags, int create_mode) | 40 | prepare_open_request(struct super_block *sb, int flags, int create_mode) |
40 | { | 41 | { |
41 | struct ceph_client *client = ceph_sb_to_client(sb); | 42 | struct ceph_fs_client *fsc = ceph_sb_to_client(sb); |
42 | struct ceph_mds_client *mdsc = &client->mdsc; | 43 | struct ceph_mds_client *mdsc = fsc->mdsc; |
43 | struct ceph_mds_request *req; | 44 | struct ceph_mds_request *req; |
44 | int want_auth = USE_ANY_MDS; | 45 | int want_auth = USE_ANY_MDS; |
45 | int op = (flags & O_CREAT) ? CEPH_MDS_OP_CREATE : CEPH_MDS_OP_OPEN; | 46 | int op = (flags & O_CREAT) ? CEPH_MDS_OP_CREATE : CEPH_MDS_OP_OPEN; |
@@ -117,8 +118,8 @@ static int ceph_init_file(struct inode *inode, struct file *file, int fmode) | |||
117 | int ceph_open(struct inode *inode, struct file *file) | 118 | int ceph_open(struct inode *inode, struct file *file) |
118 | { | 119 | { |
119 | struct ceph_inode_info *ci = ceph_inode(inode); | 120 | struct ceph_inode_info *ci = ceph_inode(inode); |
120 | struct ceph_client *client = ceph_sb_to_client(inode->i_sb); | 121 | struct ceph_fs_client *fsc = ceph_sb_to_client(inode->i_sb); |
121 | struct ceph_mds_client *mdsc = &client->mdsc; | 122 | struct ceph_mds_client *mdsc = fsc->mdsc; |
122 | struct ceph_mds_request *req; | 123 | struct ceph_mds_request *req; |
123 | struct ceph_file_info *cf = file->private_data; | 124 | struct ceph_file_info *cf = file->private_data; |
124 | struct inode *parent_inode = file->f_dentry->d_parent->d_inode; | 125 | struct inode *parent_inode = file->f_dentry->d_parent->d_inode; |
@@ -216,8 +217,8 @@ struct dentry *ceph_lookup_open(struct inode *dir, struct dentry *dentry, | |||
216 | struct nameidata *nd, int mode, | 217 | struct nameidata *nd, int mode, |
217 | int locked_dir) | 218 | int locked_dir) |
218 | { | 219 | { |
219 | struct ceph_client *client = ceph_sb_to_client(dir->i_sb); | 220 | struct ceph_fs_client *fsc = ceph_sb_to_client(dir->i_sb); |
220 | struct ceph_mds_client *mdsc = &client->mdsc; | 221 | struct ceph_mds_client *mdsc = fsc->mdsc; |
221 | struct file *file = nd->intent.open.file; | 222 | struct file *file = nd->intent.open.file; |
222 | struct inode *parent_inode = get_dentry_parent_inode(file->f_dentry); | 223 | struct inode *parent_inode = get_dentry_parent_inode(file->f_dentry); |
223 | struct ceph_mds_request *req; | 224 | struct ceph_mds_request *req; |
@@ -270,163 +271,6 @@ int ceph_release(struct inode *inode, struct file *file) | |||
270 | } | 271 | } |
271 | 272 | ||
272 | /* | 273 | /* |
273 | * build a vector of user pages | ||
274 | */ | ||
275 | static struct page **get_direct_page_vector(const char __user *data, | ||
276 | int num_pages, | ||
277 | loff_t off, size_t len) | ||
278 | { | ||
279 | struct page **pages; | ||
280 | int rc; | ||
281 | |||
282 | pages = kmalloc(sizeof(*pages) * num_pages, GFP_NOFS); | ||
283 | if (!pages) | ||
284 | return ERR_PTR(-ENOMEM); | ||
285 | |||
286 | down_read(¤t->mm->mmap_sem); | ||
287 | rc = get_user_pages(current, current->mm, (unsigned long)data, | ||
288 | num_pages, 0, 0, pages, NULL); | ||
289 | up_read(¤t->mm->mmap_sem); | ||
290 | if (rc < 0) | ||
291 | goto fail; | ||
292 | return pages; | ||
293 | |||
294 | fail: | ||
295 | kfree(pages); | ||
296 | return ERR_PTR(rc); | ||
297 | } | ||
298 | |||
299 | static void put_page_vector(struct page **pages, int num_pages) | ||
300 | { | ||
301 | int i; | ||
302 | |||
303 | for (i = 0; i < num_pages; i++) | ||
304 | put_page(pages[i]); | ||
305 | kfree(pages); | ||
306 | } | ||
307 | |||
308 | void ceph_release_page_vector(struct page **pages, int num_pages) | ||
309 | { | ||
310 | int i; | ||
311 | |||
312 | for (i = 0; i < num_pages; i++) | ||
313 | __free_pages(pages[i], 0); | ||
314 | kfree(pages); | ||
315 | } | ||
316 | |||
317 | /* | ||
318 | * allocate a vector new pages | ||
319 | */ | ||
320 | static struct page **ceph_alloc_page_vector(int num_pages, gfp_t flags) | ||
321 | { | ||
322 | struct page **pages; | ||
323 | int i; | ||
324 | |||
325 | pages = kmalloc(sizeof(*pages) * num_pages, flags); | ||
326 | if (!pages) | ||
327 | return ERR_PTR(-ENOMEM); | ||
328 | for (i = 0; i < num_pages; i++) { | ||
329 | pages[i] = __page_cache_alloc(flags); | ||
330 | if (pages[i] == NULL) { | ||
331 | ceph_release_page_vector(pages, i); | ||
332 | return ERR_PTR(-ENOMEM); | ||
333 | } | ||
334 | } | ||
335 | return pages; | ||
336 | } | ||
337 | |||
338 | /* | ||
339 | * copy user data into a page vector | ||
340 | */ | ||
341 | static int copy_user_to_page_vector(struct page **pages, | ||
342 | const char __user *data, | ||
343 | loff_t off, size_t len) | ||
344 | { | ||
345 | int i = 0; | ||
346 | int po = off & ~PAGE_CACHE_MASK; | ||
347 | int left = len; | ||
348 | int l, bad; | ||
349 | |||
350 | while (left > 0) { | ||
351 | l = min_t(int, PAGE_CACHE_SIZE-po, left); | ||
352 | bad = copy_from_user(page_address(pages[i]) + po, data, l); | ||
353 | if (bad == l) | ||
354 | return -EFAULT; | ||
355 | data += l - bad; | ||
356 | left -= l - bad; | ||
357 | po += l - bad; | ||
358 | if (po == PAGE_CACHE_SIZE) { | ||
359 | po = 0; | ||
360 | i++; | ||
361 | } | ||
362 | } | ||
363 | return len; | ||
364 | } | ||
365 | |||
366 | /* | ||
367 | * copy user data from a page vector into a user pointer | ||
368 | */ | ||
369 | static int copy_page_vector_to_user(struct page **pages, char __user *data, | ||
370 | loff_t off, size_t len) | ||
371 | { | ||
372 | int i = 0; | ||
373 | int po = off & ~PAGE_CACHE_MASK; | ||
374 | int left = len; | ||
375 | int l, bad; | ||
376 | |||
377 | while (left > 0) { | ||
378 | l = min_t(int, left, PAGE_CACHE_SIZE-po); | ||
379 | bad = copy_to_user(data, page_address(pages[i]) + po, l); | ||
380 | if (bad == l) | ||
381 | return -EFAULT; | ||
382 | data += l - bad; | ||
383 | left -= l - bad; | ||
384 | if (po) { | ||
385 | po += l - bad; | ||
386 | if (po == PAGE_CACHE_SIZE) | ||
387 | po = 0; | ||
388 | } | ||
389 | i++; | ||
390 | } | ||
391 | return len; | ||
392 | } | ||
393 | |||
394 | /* | ||
395 | * Zero an extent within a page vector. Offset is relative to the | ||
396 | * start of the first page. | ||
397 | */ | ||
398 | static void zero_page_vector_range(int off, int len, struct page **pages) | ||
399 | { | ||
400 | int i = off >> PAGE_CACHE_SHIFT; | ||
401 | |||
402 | off &= ~PAGE_CACHE_MASK; | ||
403 | |||
404 | dout("zero_page_vector_page %u~%u\n", off, len); | ||
405 | |||
406 | /* leading partial page? */ | ||
407 | if (off) { | ||
408 | int end = min((int)PAGE_CACHE_SIZE, off + len); | ||
409 | dout("zeroing %d %p head from %d\n", i, pages[i], | ||
410 | (int)off); | ||
411 | zero_user_segment(pages[i], off, end); | ||
412 | len -= (end - off); | ||
413 | i++; | ||
414 | } | ||
415 | while (len >= PAGE_CACHE_SIZE) { | ||
416 | dout("zeroing %d %p len=%d\n", i, pages[i], len); | ||
417 | zero_user_segment(pages[i], 0, PAGE_CACHE_SIZE); | ||
418 | len -= PAGE_CACHE_SIZE; | ||
419 | i++; | ||
420 | } | ||
421 | /* trailing partial page? */ | ||
422 | if (len) { | ||
423 | dout("zeroing %d %p tail to %d\n", i, pages[i], (int)len); | ||
424 | zero_user_segment(pages[i], 0, len); | ||
425 | } | ||
426 | } | ||
427 | |||
428 | |||
429 | /* | ||
430 | * Read a range of bytes striped over one or more objects. Iterate over | 274 | * Read a range of bytes striped over one or more objects. Iterate over |
431 | * objects we stripe over. (That's not atomic, but good enough for now.) | 275 | * objects we stripe over. (That's not atomic, but good enough for now.) |
432 | * | 276 | * |
@@ -438,7 +282,7 @@ static int striped_read(struct inode *inode, | |||
438 | struct page **pages, int num_pages, | 282 | struct page **pages, int num_pages, |
439 | int *checkeof) | 283 | int *checkeof) |
440 | { | 284 | { |
441 | struct ceph_client *client = ceph_inode_to_client(inode); | 285 | struct ceph_fs_client *fsc = ceph_inode_to_client(inode); |
442 | struct ceph_inode_info *ci = ceph_inode(inode); | 286 | struct ceph_inode_info *ci = ceph_inode(inode); |
443 | u64 pos, this_len; | 287 | u64 pos, this_len; |
444 | int page_off = off & ~PAGE_CACHE_MASK; /* first byte's offset in page */ | 288 | int page_off = off & ~PAGE_CACHE_MASK; /* first byte's offset in page */ |
@@ -459,7 +303,7 @@ static int striped_read(struct inode *inode, | |||
459 | 303 | ||
460 | more: | 304 | more: |
461 | this_len = left; | 305 | this_len = left; |
462 | ret = ceph_osdc_readpages(&client->osdc, ceph_vino(inode), | 306 | ret = ceph_osdc_readpages(&fsc->client->osdc, ceph_vino(inode), |
463 | &ci->i_layout, pos, &this_len, | 307 | &ci->i_layout, pos, &this_len, |
464 | ci->i_truncate_seq, | 308 | ci->i_truncate_seq, |
465 | ci->i_truncate_size, | 309 | ci->i_truncate_size, |
@@ -477,8 +321,8 @@ more: | |||
477 | 321 | ||
478 | if (read < pos - off) { | 322 | if (read < pos - off) { |
479 | dout(" zero gap %llu to %llu\n", off + read, pos); | 323 | dout(" zero gap %llu to %llu\n", off + read, pos); |
480 | zero_page_vector_range(page_off + read, | 324 | ceph_zero_page_vector_range(page_off + read, |
481 | pos - off - read, pages); | 325 | pos - off - read, pages); |
482 | } | 326 | } |
483 | pos += ret; | 327 | pos += ret; |
484 | read = pos - off; | 328 | read = pos - off; |
@@ -495,8 +339,8 @@ more: | |||
495 | /* was original extent fully inside i_size? */ | 339 | /* was original extent fully inside i_size? */ |
496 | if (pos + left <= inode->i_size) { | 340 | if (pos + left <= inode->i_size) { |
497 | dout("zero tail\n"); | 341 | dout("zero tail\n"); |
498 | zero_page_vector_range(page_off + read, len - read, | 342 | ceph_zero_page_vector_range(page_off + read, len - read, |
499 | pages); | 343 | pages); |
500 | read = len; | 344 | read = len; |
501 | goto out; | 345 | goto out; |
502 | } | 346 | } |
@@ -531,7 +375,7 @@ static ssize_t ceph_sync_read(struct file *file, char __user *data, | |||
531 | (file->f_flags & O_DIRECT) ? "O_DIRECT" : ""); | 375 | (file->f_flags & O_DIRECT) ? "O_DIRECT" : ""); |
532 | 376 | ||
533 | if (file->f_flags & O_DIRECT) { | 377 | if (file->f_flags & O_DIRECT) { |
534 | pages = get_direct_page_vector(data, num_pages, off, len); | 378 | pages = ceph_get_direct_page_vector(data, num_pages, off, len); |
535 | 379 | ||
536 | /* | 380 | /* |
537 | * flush any page cache pages in this range. this | 381 | * flush any page cache pages in this range. this |
@@ -552,13 +396,13 @@ static ssize_t ceph_sync_read(struct file *file, char __user *data, | |||
552 | ret = striped_read(inode, off, len, pages, num_pages, checkeof); | 396 | ret = striped_read(inode, off, len, pages, num_pages, checkeof); |
553 | 397 | ||
554 | if (ret >= 0 && (file->f_flags & O_DIRECT) == 0) | 398 | if (ret >= 0 && (file->f_flags & O_DIRECT) == 0) |
555 | ret = copy_page_vector_to_user(pages, data, off, ret); | 399 | ret = ceph_copy_page_vector_to_user(pages, data, off, ret); |
556 | if (ret >= 0) | 400 | if (ret >= 0) |
557 | *poff = off + ret; | 401 | *poff = off + ret; |
558 | 402 | ||
559 | done: | 403 | done: |
560 | if (file->f_flags & O_DIRECT) | 404 | if (file->f_flags & O_DIRECT) |
561 | put_page_vector(pages, num_pages); | 405 | ceph_put_page_vector(pages, num_pages); |
562 | else | 406 | else |
563 | ceph_release_page_vector(pages, num_pages); | 407 | ceph_release_page_vector(pages, num_pages); |
564 | dout("sync_read result %d\n", ret); | 408 | dout("sync_read result %d\n", ret); |
@@ -594,7 +438,7 @@ static ssize_t ceph_sync_write(struct file *file, const char __user *data, | |||
594 | { | 438 | { |
595 | struct inode *inode = file->f_dentry->d_inode; | 439 | struct inode *inode = file->f_dentry->d_inode; |
596 | struct ceph_inode_info *ci = ceph_inode(inode); | 440 | struct ceph_inode_info *ci = ceph_inode(inode); |
597 | struct ceph_client *client = ceph_inode_to_client(inode); | 441 | struct ceph_fs_client *fsc = ceph_inode_to_client(inode); |
598 | struct ceph_osd_request *req; | 442 | struct ceph_osd_request *req; |
599 | struct page **pages; | 443 | struct page **pages; |
600 | int num_pages; | 444 | int num_pages; |
@@ -642,7 +486,7 @@ static ssize_t ceph_sync_write(struct file *file, const char __user *data, | |||
642 | */ | 486 | */ |
643 | more: | 487 | more: |
644 | len = left; | 488 | len = left; |
645 | req = ceph_osdc_new_request(&client->osdc, &ci->i_layout, | 489 | req = ceph_osdc_new_request(&fsc->client->osdc, &ci->i_layout, |
646 | ceph_vino(inode), pos, &len, | 490 | ceph_vino(inode), pos, &len, |
647 | CEPH_OSD_OP_WRITE, flags, | 491 | CEPH_OSD_OP_WRITE, flags, |
648 | ci->i_snap_realm->cached_context, | 492 | ci->i_snap_realm->cached_context, |
@@ -655,7 +499,7 @@ more: | |||
655 | num_pages = calc_pages_for(pos, len); | 499 | num_pages = calc_pages_for(pos, len); |
656 | 500 | ||
657 | if (file->f_flags & O_DIRECT) { | 501 | if (file->f_flags & O_DIRECT) { |
658 | pages = get_direct_page_vector(data, num_pages, pos, len); | 502 | pages = ceph_get_direct_page_vector(data, num_pages, pos, len); |
659 | if (IS_ERR(pages)) { | 503 | if (IS_ERR(pages)) { |
660 | ret = PTR_ERR(pages); | 504 | ret = PTR_ERR(pages); |
661 | goto out; | 505 | goto out; |
@@ -673,7 +517,7 @@ more: | |||
673 | ret = PTR_ERR(pages); | 517 | ret = PTR_ERR(pages); |
674 | goto out; | 518 | goto out; |
675 | } | 519 | } |
676 | ret = copy_user_to_page_vector(pages, data, pos, len); | 520 | ret = ceph_copy_user_to_page_vector(pages, data, pos, len); |
677 | if (ret < 0) { | 521 | if (ret < 0) { |
678 | ceph_release_page_vector(pages, num_pages); | 522 | ceph_release_page_vector(pages, num_pages); |
679 | goto out; | 523 | goto out; |
@@ -689,7 +533,7 @@ more: | |||
689 | req->r_num_pages = num_pages; | 533 | req->r_num_pages = num_pages; |
690 | req->r_inode = inode; | 534 | req->r_inode = inode; |
691 | 535 | ||
692 | ret = ceph_osdc_start_request(&client->osdc, req, false); | 536 | ret = ceph_osdc_start_request(&fsc->client->osdc, req, false); |
693 | if (!ret) { | 537 | if (!ret) { |
694 | if (req->r_safe_callback) { | 538 | if (req->r_safe_callback) { |
695 | /* | 539 | /* |
@@ -701,11 +545,11 @@ more: | |||
701 | spin_unlock(&ci->i_unsafe_lock); | 545 | spin_unlock(&ci->i_unsafe_lock); |
702 | ceph_get_cap_refs(ci, CEPH_CAP_FILE_WR); | 546 | ceph_get_cap_refs(ci, CEPH_CAP_FILE_WR); |
703 | } | 547 | } |
704 | ret = ceph_osdc_wait_request(&client->osdc, req); | 548 | ret = ceph_osdc_wait_request(&fsc->client->osdc, req); |
705 | } | 549 | } |
706 | 550 | ||
707 | if (file->f_flags & O_DIRECT) | 551 | if (file->f_flags & O_DIRECT) |
708 | put_page_vector(pages, num_pages); | 552 | ceph_put_page_vector(pages, num_pages); |
709 | else if (file->f_flags & O_SYNC) | 553 | else if (file->f_flags & O_SYNC) |
710 | ceph_release_page_vector(pages, num_pages); | 554 | ceph_release_page_vector(pages, num_pages); |
711 | 555 | ||
@@ -814,7 +658,8 @@ static ssize_t ceph_aio_write(struct kiocb *iocb, const struct iovec *iov, | |||
814 | struct ceph_file_info *fi = file->private_data; | 658 | struct ceph_file_info *fi = file->private_data; |
815 | struct inode *inode = file->f_dentry->d_inode; | 659 | struct inode *inode = file->f_dentry->d_inode; |
816 | struct ceph_inode_info *ci = ceph_inode(inode); | 660 | struct ceph_inode_info *ci = ceph_inode(inode); |
817 | struct ceph_osd_client *osdc = &ceph_sb_to_client(inode->i_sb)->osdc; | 661 | struct ceph_osd_client *osdc = |
662 | &ceph_sb_to_client(inode->i_sb)->client->osdc; | ||
818 | loff_t endoff = pos + iov->iov_len; | 663 | loff_t endoff = pos + iov->iov_len; |
819 | int want, got = 0; | 664 | int want, got = 0; |
820 | int ret, err; | 665 | int ret, err; |
diff --git a/fs/ceph/inode.c b/fs/ceph/inode.c index 62377ec37edf..1d6a45b5a04c 100644 --- a/fs/ceph/inode.c +++ b/fs/ceph/inode.c | |||
@@ -1,4 +1,4 @@ | |||
1 | #include "ceph_debug.h" | 1 | #include <linux/ceph/ceph_debug.h> |
2 | 2 | ||
3 | #include <linux/module.h> | 3 | #include <linux/module.h> |
4 | #include <linux/fs.h> | 4 | #include <linux/fs.h> |
@@ -13,7 +13,8 @@ | |||
13 | #include <linux/pagevec.h> | 13 | #include <linux/pagevec.h> |
14 | 14 | ||
15 | #include "super.h" | 15 | #include "super.h" |
16 | #include "decode.h" | 16 | #include "mds_client.h" |
17 | #include <linux/ceph/decode.h> | ||
17 | 18 | ||
18 | /* | 19 | /* |
19 | * Ceph inode operations | 20 | * Ceph inode operations |
@@ -384,7 +385,7 @@ void ceph_destroy_inode(struct inode *inode) | |||
384 | */ | 385 | */ |
385 | if (ci->i_snap_realm) { | 386 | if (ci->i_snap_realm) { |
386 | struct ceph_mds_client *mdsc = | 387 | struct ceph_mds_client *mdsc = |
387 | &ceph_sb_to_client(ci->vfs_inode.i_sb)->mdsc; | 388 | ceph_sb_to_client(ci->vfs_inode.i_sb)->mdsc; |
388 | struct ceph_snap_realm *realm = ci->i_snap_realm; | 389 | struct ceph_snap_realm *realm = ci->i_snap_realm; |
389 | 390 | ||
390 | dout(" dropping residual ref to snap realm %p\n", realm); | 391 | dout(" dropping residual ref to snap realm %p\n", realm); |
@@ -685,7 +686,7 @@ static int fill_inode(struct inode *inode, | |||
685 | } | 686 | } |
686 | 687 | ||
687 | /* it may be better to set st_size in getattr instead? */ | 688 | /* it may be better to set st_size in getattr instead? */ |
688 | if (ceph_test_opt(ceph_sb_to_client(inode->i_sb), RBYTES)) | 689 | if (ceph_test_mount_opt(ceph_sb_to_client(inode->i_sb), RBYTES)) |
689 | inode->i_size = ci->i_rbytes; | 690 | inode->i_size = ci->i_rbytes; |
690 | break; | 691 | break; |
691 | default: | 692 | default: |
@@ -901,7 +902,7 @@ int ceph_fill_trace(struct super_block *sb, struct ceph_mds_request *req, | |||
901 | struct inode *in = NULL; | 902 | struct inode *in = NULL; |
902 | struct ceph_mds_reply_inode *ininfo; | 903 | struct ceph_mds_reply_inode *ininfo; |
903 | struct ceph_vino vino; | 904 | struct ceph_vino vino; |
904 | struct ceph_client *client = ceph_sb_to_client(sb); | 905 | struct ceph_fs_client *fsc = ceph_sb_to_client(sb); |
905 | int i = 0; | 906 | int i = 0; |
906 | int err = 0; | 907 | int err = 0; |
907 | 908 | ||
@@ -965,7 +966,7 @@ int ceph_fill_trace(struct super_block *sb, struct ceph_mds_request *req, | |||
965 | */ | 966 | */ |
966 | if (rinfo->head->is_dentry && !req->r_aborted && | 967 | if (rinfo->head->is_dentry && !req->r_aborted && |
967 | (rinfo->head->is_target || strncmp(req->r_dentry->d_name.name, | 968 | (rinfo->head->is_target || strncmp(req->r_dentry->d_name.name, |
968 | client->mount_args->snapdir_name, | 969 | fsc->mount_options->snapdir_name, |
969 | req->r_dentry->d_name.len))) { | 970 | req->r_dentry->d_name.len))) { |
970 | /* | 971 | /* |
971 | * lookup link rename : null -> possibly existing inode | 972 | * lookup link rename : null -> possibly existing inode |
@@ -1533,7 +1534,7 @@ int ceph_setattr(struct dentry *dentry, struct iattr *attr) | |||
1533 | struct inode *parent_inode = dentry->d_parent->d_inode; | 1534 | struct inode *parent_inode = dentry->d_parent->d_inode; |
1534 | const unsigned int ia_valid = attr->ia_valid; | 1535 | const unsigned int ia_valid = attr->ia_valid; |
1535 | struct ceph_mds_request *req; | 1536 | struct ceph_mds_request *req; |
1536 | struct ceph_mds_client *mdsc = &ceph_sb_to_client(dentry->d_sb)->mdsc; | 1537 | struct ceph_mds_client *mdsc = ceph_sb_to_client(dentry->d_sb)->mdsc; |
1537 | int issued; | 1538 | int issued; |
1538 | int release = 0, dirtied = 0; | 1539 | int release = 0, dirtied = 0; |
1539 | int mask = 0; | 1540 | int mask = 0; |
@@ -1728,8 +1729,8 @@ out: | |||
1728 | */ | 1729 | */ |
1729 | int ceph_do_getattr(struct inode *inode, int mask) | 1730 | int ceph_do_getattr(struct inode *inode, int mask) |
1730 | { | 1731 | { |
1731 | struct ceph_client *client = ceph_sb_to_client(inode->i_sb); | 1732 | struct ceph_fs_client *fsc = ceph_sb_to_client(inode->i_sb); |
1732 | struct ceph_mds_client *mdsc = &client->mdsc; | 1733 | struct ceph_mds_client *mdsc = fsc->mdsc; |
1733 | struct ceph_mds_request *req; | 1734 | struct ceph_mds_request *req; |
1734 | int err; | 1735 | int err; |
1735 | 1736 | ||
diff --git a/fs/ceph/ioctl.c b/fs/ceph/ioctl.c index 76e307d2aba1..899578b0c46b 100644 --- a/fs/ceph/ioctl.c +++ b/fs/ceph/ioctl.c | |||
@@ -1,8 +1,10 @@ | |||
1 | #include <linux/in.h> | 1 | #include <linux/in.h> |
2 | 2 | ||
3 | #include "ioctl.h" | ||
4 | #include "super.h" | 3 | #include "super.h" |
5 | #include "ceph_debug.h" | 4 | #include "mds_client.h" |
5 | #include <linux/ceph/ceph_debug.h> | ||
6 | |||
7 | #include "ioctl.h" | ||
6 | 8 | ||
7 | 9 | ||
8 | /* | 10 | /* |
@@ -37,7 +39,7 @@ static long ceph_ioctl_set_layout(struct file *file, void __user *arg) | |||
37 | { | 39 | { |
38 | struct inode *inode = file->f_dentry->d_inode; | 40 | struct inode *inode = file->f_dentry->d_inode; |
39 | struct inode *parent_inode = file->f_dentry->d_parent->d_inode; | 41 | struct inode *parent_inode = file->f_dentry->d_parent->d_inode; |
40 | struct ceph_mds_client *mdsc = &ceph_sb_to_client(inode->i_sb)->mdsc; | 42 | struct ceph_mds_client *mdsc = ceph_sb_to_client(inode->i_sb)->mdsc; |
41 | struct ceph_mds_request *req; | 43 | struct ceph_mds_request *req; |
42 | struct ceph_ioctl_layout l; | 44 | struct ceph_ioctl_layout l; |
43 | int err, i; | 45 | int err, i; |
@@ -98,7 +100,8 @@ static long ceph_ioctl_get_dataloc(struct file *file, void __user *arg) | |||
98 | struct ceph_ioctl_dataloc dl; | 100 | struct ceph_ioctl_dataloc dl; |
99 | struct inode *inode = file->f_dentry->d_inode; | 101 | struct inode *inode = file->f_dentry->d_inode; |
100 | struct ceph_inode_info *ci = ceph_inode(inode); | 102 | struct ceph_inode_info *ci = ceph_inode(inode); |
101 | struct ceph_osd_client *osdc = &ceph_sb_to_client(inode->i_sb)->osdc; | 103 | struct ceph_osd_client *osdc = |
104 | &ceph_sb_to_client(inode->i_sb)->client->osdc; | ||
102 | u64 len = 1, olen; | 105 | u64 len = 1, olen; |
103 | u64 tmp; | 106 | u64 tmp; |
104 | struct ceph_object_layout ol; | 107 | struct ceph_object_layout ol; |
diff --git a/fs/ceph/locks.c b/fs/ceph/locks.c index ff4e753aae92..087afe9ca367 100644 --- a/fs/ceph/locks.c +++ b/fs/ceph/locks.c | |||
@@ -1,11 +1,11 @@ | |||
1 | #include "ceph_debug.h" | 1 | #include <linux/ceph/ceph_debug.h> |
2 | 2 | ||
3 | #include <linux/file.h> | 3 | #include <linux/file.h> |
4 | #include <linux/namei.h> | 4 | #include <linux/namei.h> |
5 | 5 | ||
6 | #include "super.h" | 6 | #include "super.h" |
7 | #include "mds_client.h" | 7 | #include "mds_client.h" |
8 | #include "pagelist.h" | 8 | #include <linux/ceph/pagelist.h> |
9 | 9 | ||
10 | /** | 10 | /** |
11 | * Implement fcntl and flock locking functions. | 11 | * Implement fcntl and flock locking functions. |
@@ -16,7 +16,7 @@ static int ceph_lock_message(u8 lock_type, u16 operation, struct file *file, | |||
16 | { | 16 | { |
17 | struct inode *inode = file->f_dentry->d_inode; | 17 | struct inode *inode = file->f_dentry->d_inode; |
18 | struct ceph_mds_client *mdsc = | 18 | struct ceph_mds_client *mdsc = |
19 | &ceph_sb_to_client(inode->i_sb)->mdsc; | 19 | ceph_sb_to_client(inode->i_sb)->mdsc; |
20 | struct ceph_mds_request *req; | 20 | struct ceph_mds_request *req; |
21 | int err; | 21 | int err; |
22 | 22 | ||
diff --git a/fs/ceph/mds_client.c b/fs/ceph/mds_client.c index fad95f8f2608..33568239a08e 100644 --- a/fs/ceph/mds_client.c +++ b/fs/ceph/mds_client.c | |||
@@ -1,17 +1,20 @@ | |||
1 | #include "ceph_debug.h" | 1 | #include <linux/ceph/ceph_debug.h> |
2 | 2 | ||
3 | #include <linux/wait.h> | 3 | #include <linux/wait.h> |
4 | #include <linux/slab.h> | 4 | #include <linux/slab.h> |
5 | #include <linux/sched.h> | 5 | #include <linux/sched.h> |
6 | #include <linux/smp_lock.h> | 6 | #include <linux/smp_lock.h> |
7 | #include <linux/debugfs.h> | ||
8 | #include <linux/seq_file.h> | ||
7 | 9 | ||
8 | #include "mds_client.h" | ||
9 | #include "mon_client.h" | ||
10 | #include "super.h" | 10 | #include "super.h" |
11 | #include "messenger.h" | 11 | #include "mds_client.h" |
12 | #include "decode.h" | 12 | |
13 | #include "auth.h" | 13 | #include <linux/ceph/messenger.h> |
14 | #include "pagelist.h" | 14 | #include <linux/ceph/decode.h> |
15 | #include <linux/ceph/pagelist.h> | ||
16 | #include <linux/ceph/auth.h> | ||
17 | #include <linux/ceph/debugfs.h> | ||
15 | 18 | ||
16 | /* | 19 | /* |
17 | * A cluster of MDS (metadata server) daemons is responsible for | 20 | * A cluster of MDS (metadata server) daemons is responsible for |
@@ -286,8 +289,9 @@ void ceph_put_mds_session(struct ceph_mds_session *s) | |||
286 | atomic_read(&s->s_ref), atomic_read(&s->s_ref)-1); | 289 | atomic_read(&s->s_ref), atomic_read(&s->s_ref)-1); |
287 | if (atomic_dec_and_test(&s->s_ref)) { | 290 | if (atomic_dec_and_test(&s->s_ref)) { |
288 | if (s->s_authorizer) | 291 | if (s->s_authorizer) |
289 | s->s_mdsc->client->monc.auth->ops->destroy_authorizer( | 292 | s->s_mdsc->fsc->client->monc.auth->ops->destroy_authorizer( |
290 | s->s_mdsc->client->monc.auth, s->s_authorizer); | 293 | s->s_mdsc->fsc->client->monc.auth, |
294 | s->s_authorizer); | ||
291 | kfree(s); | 295 | kfree(s); |
292 | } | 296 | } |
293 | } | 297 | } |
@@ -344,7 +348,7 @@ static struct ceph_mds_session *register_session(struct ceph_mds_client *mdsc, | |||
344 | s->s_seq = 0; | 348 | s->s_seq = 0; |
345 | mutex_init(&s->s_mutex); | 349 | mutex_init(&s->s_mutex); |
346 | 350 | ||
347 | ceph_con_init(mdsc->client->msgr, &s->s_con); | 351 | ceph_con_init(mdsc->fsc->client->msgr, &s->s_con); |
348 | s->s_con.private = s; | 352 | s->s_con.private = s; |
349 | s->s_con.ops = &mds_con_ops; | 353 | s->s_con.ops = &mds_con_ops; |
350 | s->s_con.peer_name.type = CEPH_ENTITY_TYPE_MDS; | 354 | s->s_con.peer_name.type = CEPH_ENTITY_TYPE_MDS; |
@@ -599,7 +603,7 @@ static int __choose_mds(struct ceph_mds_client *mdsc, | |||
599 | } else if (req->r_dentry) { | 603 | } else if (req->r_dentry) { |
600 | struct inode *dir = req->r_dentry->d_parent->d_inode; | 604 | struct inode *dir = req->r_dentry->d_parent->d_inode; |
601 | 605 | ||
602 | if (dir->i_sb != mdsc->client->sb) { | 606 | if (dir->i_sb != mdsc->fsc->sb) { |
603 | /* not this fs! */ | 607 | /* not this fs! */ |
604 | inode = req->r_dentry->d_inode; | 608 | inode = req->r_dentry->d_inode; |
605 | } else if (ceph_snap(dir) != CEPH_NOSNAP) { | 609 | } else if (ceph_snap(dir) != CEPH_NOSNAP) { |
@@ -884,7 +888,7 @@ static int remove_session_caps_cb(struct inode *inode, struct ceph_cap *cap, | |||
884 | __ceph_remove_cap(cap); | 888 | __ceph_remove_cap(cap); |
885 | if (!__ceph_is_any_real_caps(ci)) { | 889 | if (!__ceph_is_any_real_caps(ci)) { |
886 | struct ceph_mds_client *mdsc = | 890 | struct ceph_mds_client *mdsc = |
887 | &ceph_sb_to_client(inode->i_sb)->mdsc; | 891 | ceph_sb_to_client(inode->i_sb)->mdsc; |
888 | 892 | ||
889 | spin_lock(&mdsc->cap_dirty_lock); | 893 | spin_lock(&mdsc->cap_dirty_lock); |
890 | if (!list_empty(&ci->i_dirty_item)) { | 894 | if (!list_empty(&ci->i_dirty_item)) { |
@@ -1146,7 +1150,7 @@ int ceph_add_cap_releases(struct ceph_mds_client *mdsc, | |||
1146 | struct ceph_msg *msg, *partial = NULL; | 1150 | struct ceph_msg *msg, *partial = NULL; |
1147 | struct ceph_mds_cap_release *head; | 1151 | struct ceph_mds_cap_release *head; |
1148 | int err = -ENOMEM; | 1152 | int err = -ENOMEM; |
1149 | int extra = mdsc->client->mount_args->cap_release_safety; | 1153 | int extra = mdsc->fsc->mount_options->cap_release_safety; |
1150 | int num; | 1154 | int num; |
1151 | 1155 | ||
1152 | dout("add_cap_releases %p mds%d extra %d\n", session, session->s_mds, | 1156 | dout("add_cap_releases %p mds%d extra %d\n", session, session->s_mds, |
@@ -2085,7 +2089,7 @@ static void handle_reply(struct ceph_mds_session *session, struct ceph_msg *msg) | |||
2085 | 2089 | ||
2086 | /* insert trace into our cache */ | 2090 | /* insert trace into our cache */ |
2087 | mutex_lock(&req->r_fill_mutex); | 2091 | mutex_lock(&req->r_fill_mutex); |
2088 | err = ceph_fill_trace(mdsc->client->sb, req, req->r_session); | 2092 | err = ceph_fill_trace(mdsc->fsc->sb, req, req->r_session); |
2089 | if (err == 0) { | 2093 | if (err == 0) { |
2090 | if (result == 0 && rinfo->dir_nr) | 2094 | if (result == 0 && rinfo->dir_nr) |
2091 | ceph_readdir_prepopulate(req, req->r_session); | 2095 | ceph_readdir_prepopulate(req, req->r_session); |
@@ -2613,7 +2617,7 @@ static void handle_lease(struct ceph_mds_client *mdsc, | |||
2613 | struct ceph_mds_session *session, | 2617 | struct ceph_mds_session *session, |
2614 | struct ceph_msg *msg) | 2618 | struct ceph_msg *msg) |
2615 | { | 2619 | { |
2616 | struct super_block *sb = mdsc->client->sb; | 2620 | struct super_block *sb = mdsc->fsc->sb; |
2617 | struct inode *inode; | 2621 | struct inode *inode; |
2618 | struct ceph_inode_info *ci; | 2622 | struct ceph_inode_info *ci; |
2619 | struct dentry *parent, *dentry; | 2623 | struct dentry *parent, *dentry; |
@@ -2891,10 +2895,16 @@ static void delayed_work(struct work_struct *work) | |||
2891 | schedule_delayed(mdsc); | 2895 | schedule_delayed(mdsc); |
2892 | } | 2896 | } |
2893 | 2897 | ||
2898 | int ceph_mdsc_init(struct ceph_fs_client *fsc) | ||
2894 | 2899 | ||
2895 | int ceph_mdsc_init(struct ceph_mds_client *mdsc, struct ceph_client *client) | ||
2896 | { | 2900 | { |
2897 | mdsc->client = client; | 2901 | struct ceph_mds_client *mdsc; |
2902 | |||
2903 | mdsc = kzalloc(sizeof(struct ceph_mds_client), GFP_NOFS); | ||
2904 | if (!mdsc) | ||
2905 | return -ENOMEM; | ||
2906 | mdsc->fsc = fsc; | ||
2907 | fsc->mdsc = mdsc; | ||
2898 | mutex_init(&mdsc->mutex); | 2908 | mutex_init(&mdsc->mutex); |
2899 | mdsc->mdsmap = kzalloc(sizeof(*mdsc->mdsmap), GFP_NOFS); | 2909 | mdsc->mdsmap = kzalloc(sizeof(*mdsc->mdsmap), GFP_NOFS); |
2900 | if (mdsc->mdsmap == NULL) | 2910 | if (mdsc->mdsmap == NULL) |
@@ -2927,7 +2937,7 @@ int ceph_mdsc_init(struct ceph_mds_client *mdsc, struct ceph_client *client) | |||
2927 | INIT_LIST_HEAD(&mdsc->dentry_lru); | 2937 | INIT_LIST_HEAD(&mdsc->dentry_lru); |
2928 | 2938 | ||
2929 | ceph_caps_init(mdsc); | 2939 | ceph_caps_init(mdsc); |
2930 | ceph_adjust_min_caps(mdsc, client->min_caps); | 2940 | ceph_adjust_min_caps(mdsc, fsc->min_caps); |
2931 | 2941 | ||
2932 | return 0; | 2942 | return 0; |
2933 | } | 2943 | } |
@@ -2939,7 +2949,7 @@ int ceph_mdsc_init(struct ceph_mds_client *mdsc, struct ceph_client *client) | |||
2939 | static void wait_requests(struct ceph_mds_client *mdsc) | 2949 | static void wait_requests(struct ceph_mds_client *mdsc) |
2940 | { | 2950 | { |
2941 | struct ceph_mds_request *req; | 2951 | struct ceph_mds_request *req; |
2942 | struct ceph_client *client = mdsc->client; | 2952 | struct ceph_fs_client *fsc = mdsc->fsc; |
2943 | 2953 | ||
2944 | mutex_lock(&mdsc->mutex); | 2954 | mutex_lock(&mdsc->mutex); |
2945 | if (__get_oldest_req(mdsc)) { | 2955 | if (__get_oldest_req(mdsc)) { |
@@ -2947,7 +2957,7 @@ static void wait_requests(struct ceph_mds_client *mdsc) | |||
2947 | 2957 | ||
2948 | dout("wait_requests waiting for requests\n"); | 2958 | dout("wait_requests waiting for requests\n"); |
2949 | wait_for_completion_timeout(&mdsc->safe_umount_waiters, | 2959 | wait_for_completion_timeout(&mdsc->safe_umount_waiters, |
2950 | client->mount_args->mount_timeout * HZ); | 2960 | fsc->client->options->mount_timeout * HZ); |
2951 | 2961 | ||
2952 | /* tear down remaining requests */ | 2962 | /* tear down remaining requests */ |
2953 | mutex_lock(&mdsc->mutex); | 2963 | mutex_lock(&mdsc->mutex); |
@@ -3030,7 +3040,7 @@ void ceph_mdsc_sync(struct ceph_mds_client *mdsc) | |||
3030 | { | 3040 | { |
3031 | u64 want_tid, want_flush; | 3041 | u64 want_tid, want_flush; |
3032 | 3042 | ||
3033 | if (mdsc->client->mount_state == CEPH_MOUNT_SHUTDOWN) | 3043 | if (mdsc->fsc->mount_state == CEPH_MOUNT_SHUTDOWN) |
3034 | return; | 3044 | return; |
3035 | 3045 | ||
3036 | dout("sync\n"); | 3046 | dout("sync\n"); |
@@ -3053,7 +3063,7 @@ bool done_closing_sessions(struct ceph_mds_client *mdsc) | |||
3053 | { | 3063 | { |
3054 | int i, n = 0; | 3064 | int i, n = 0; |
3055 | 3065 | ||
3056 | if (mdsc->client->mount_state == CEPH_MOUNT_SHUTDOWN) | 3066 | if (mdsc->fsc->mount_state == CEPH_MOUNT_SHUTDOWN) |
3057 | return true; | 3067 | return true; |
3058 | 3068 | ||
3059 | mutex_lock(&mdsc->mutex); | 3069 | mutex_lock(&mdsc->mutex); |
@@ -3071,8 +3081,8 @@ void ceph_mdsc_close_sessions(struct ceph_mds_client *mdsc) | |||
3071 | { | 3081 | { |
3072 | struct ceph_mds_session *session; | 3082 | struct ceph_mds_session *session; |
3073 | int i; | 3083 | int i; |
3074 | struct ceph_client *client = mdsc->client; | 3084 | struct ceph_fs_client *fsc = mdsc->fsc; |
3075 | unsigned long timeout = client->mount_args->mount_timeout * HZ; | 3085 | unsigned long timeout = fsc->client->options->mount_timeout * HZ; |
3076 | 3086 | ||
3077 | dout("close_sessions\n"); | 3087 | dout("close_sessions\n"); |
3078 | 3088 | ||
@@ -3119,7 +3129,7 @@ void ceph_mdsc_close_sessions(struct ceph_mds_client *mdsc) | |||
3119 | dout("stopped\n"); | 3129 | dout("stopped\n"); |
3120 | } | 3130 | } |
3121 | 3131 | ||
3122 | void ceph_mdsc_stop(struct ceph_mds_client *mdsc) | 3132 | static void ceph_mdsc_stop(struct ceph_mds_client *mdsc) |
3123 | { | 3133 | { |
3124 | dout("stop\n"); | 3134 | dout("stop\n"); |
3125 | cancel_delayed_work_sync(&mdsc->delayed_work); /* cancel timer */ | 3135 | cancel_delayed_work_sync(&mdsc->delayed_work); /* cancel timer */ |
@@ -3129,6 +3139,15 @@ void ceph_mdsc_stop(struct ceph_mds_client *mdsc) | |||
3129 | ceph_caps_finalize(mdsc); | 3139 | ceph_caps_finalize(mdsc); |
3130 | } | 3140 | } |
3131 | 3141 | ||
3142 | void ceph_mdsc_destroy(struct ceph_fs_client *fsc) | ||
3143 | { | ||
3144 | struct ceph_mds_client *mdsc = fsc->mdsc; | ||
3145 | |||
3146 | ceph_mdsc_stop(mdsc); | ||
3147 | fsc->mdsc = NULL; | ||
3148 | kfree(mdsc); | ||
3149 | } | ||
3150 | |||
3132 | 3151 | ||
3133 | /* | 3152 | /* |
3134 | * handle mds map update. | 3153 | * handle mds map update. |
@@ -3145,14 +3164,14 @@ void ceph_mdsc_handle_map(struct ceph_mds_client *mdsc, struct ceph_msg *msg) | |||
3145 | 3164 | ||
3146 | ceph_decode_need(&p, end, sizeof(fsid)+2*sizeof(u32), bad); | 3165 | ceph_decode_need(&p, end, sizeof(fsid)+2*sizeof(u32), bad); |
3147 | ceph_decode_copy(&p, &fsid, sizeof(fsid)); | 3166 | ceph_decode_copy(&p, &fsid, sizeof(fsid)); |
3148 | if (ceph_check_fsid(mdsc->client, &fsid) < 0) | 3167 | if (ceph_check_fsid(mdsc->fsc->client, &fsid) < 0) |
3149 | return; | 3168 | return; |
3150 | epoch = ceph_decode_32(&p); | 3169 | epoch = ceph_decode_32(&p); |
3151 | maplen = ceph_decode_32(&p); | 3170 | maplen = ceph_decode_32(&p); |
3152 | dout("handle_map epoch %u len %d\n", epoch, (int)maplen); | 3171 | dout("handle_map epoch %u len %d\n", epoch, (int)maplen); |
3153 | 3172 | ||
3154 | /* do we need it? */ | 3173 | /* do we need it? */ |
3155 | ceph_monc_got_mdsmap(&mdsc->client->monc, epoch); | 3174 | ceph_monc_got_mdsmap(&mdsc->fsc->client->monc, epoch); |
3156 | mutex_lock(&mdsc->mutex); | 3175 | mutex_lock(&mdsc->mutex); |
3157 | if (mdsc->mdsmap && epoch <= mdsc->mdsmap->m_epoch) { | 3176 | if (mdsc->mdsmap && epoch <= mdsc->mdsmap->m_epoch) { |
3158 | dout("handle_map epoch %u <= our %u\n", | 3177 | dout("handle_map epoch %u <= our %u\n", |
@@ -3176,7 +3195,7 @@ void ceph_mdsc_handle_map(struct ceph_mds_client *mdsc, struct ceph_msg *msg) | |||
3176 | } else { | 3195 | } else { |
3177 | mdsc->mdsmap = newmap; /* first mds map */ | 3196 | mdsc->mdsmap = newmap; /* first mds map */ |
3178 | } | 3197 | } |
3179 | mdsc->client->sb->s_maxbytes = mdsc->mdsmap->m_max_file_size; | 3198 | mdsc->fsc->sb->s_maxbytes = mdsc->mdsmap->m_max_file_size; |
3180 | 3199 | ||
3181 | __wake_requests(mdsc, &mdsc->waiting_for_map); | 3200 | __wake_requests(mdsc, &mdsc->waiting_for_map); |
3182 | 3201 | ||
@@ -3277,7 +3296,7 @@ static int get_authorizer(struct ceph_connection *con, | |||
3277 | { | 3296 | { |
3278 | struct ceph_mds_session *s = con->private; | 3297 | struct ceph_mds_session *s = con->private; |
3279 | struct ceph_mds_client *mdsc = s->s_mdsc; | 3298 | struct ceph_mds_client *mdsc = s->s_mdsc; |
3280 | struct ceph_auth_client *ac = mdsc->client->monc.auth; | 3299 | struct ceph_auth_client *ac = mdsc->fsc->client->monc.auth; |
3281 | int ret = 0; | 3300 | int ret = 0; |
3282 | 3301 | ||
3283 | if (force_new && s->s_authorizer) { | 3302 | if (force_new && s->s_authorizer) { |
@@ -3311,7 +3330,7 @@ static int verify_authorizer_reply(struct ceph_connection *con, int len) | |||
3311 | { | 3330 | { |
3312 | struct ceph_mds_session *s = con->private; | 3331 | struct ceph_mds_session *s = con->private; |
3313 | struct ceph_mds_client *mdsc = s->s_mdsc; | 3332 | struct ceph_mds_client *mdsc = s->s_mdsc; |
3314 | struct ceph_auth_client *ac = mdsc->client->monc.auth; | 3333 | struct ceph_auth_client *ac = mdsc->fsc->client->monc.auth; |
3315 | 3334 | ||
3316 | return ac->ops->verify_authorizer_reply(ac, s->s_authorizer, len); | 3335 | return ac->ops->verify_authorizer_reply(ac, s->s_authorizer, len); |
3317 | } | 3336 | } |
@@ -3320,12 +3339,12 @@ static int invalidate_authorizer(struct ceph_connection *con) | |||
3320 | { | 3339 | { |
3321 | struct ceph_mds_session *s = con->private; | 3340 | struct ceph_mds_session *s = con->private; |
3322 | struct ceph_mds_client *mdsc = s->s_mdsc; | 3341 | struct ceph_mds_client *mdsc = s->s_mdsc; |
3323 | struct ceph_auth_client *ac = mdsc->client->monc.auth; | 3342 | struct ceph_auth_client *ac = mdsc->fsc->client->monc.auth; |
3324 | 3343 | ||
3325 | if (ac->ops->invalidate_authorizer) | 3344 | if (ac->ops->invalidate_authorizer) |
3326 | ac->ops->invalidate_authorizer(ac, CEPH_ENTITY_TYPE_MDS); | 3345 | ac->ops->invalidate_authorizer(ac, CEPH_ENTITY_TYPE_MDS); |
3327 | 3346 | ||
3328 | return ceph_monc_validate_auth(&mdsc->client->monc); | 3347 | return ceph_monc_validate_auth(&mdsc->fsc->client->monc); |
3329 | } | 3348 | } |
3330 | 3349 | ||
3331 | static const struct ceph_connection_operations mds_con_ops = { | 3350 | static const struct ceph_connection_operations mds_con_ops = { |
@@ -3338,7 +3357,4 @@ static const struct ceph_connection_operations mds_con_ops = { | |||
3338 | .peer_reset = peer_reset, | 3357 | .peer_reset = peer_reset, |
3339 | }; | 3358 | }; |
3340 | 3359 | ||
3341 | |||
3342 | |||
3343 | |||
3344 | /* eof */ | 3360 | /* eof */ |
diff --git a/fs/ceph/mds_client.h b/fs/ceph/mds_client.h index c98267ce6d2a..d66d63c72355 100644 --- a/fs/ceph/mds_client.h +++ b/fs/ceph/mds_client.h | |||
@@ -8,9 +8,9 @@ | |||
8 | #include <linux/rbtree.h> | 8 | #include <linux/rbtree.h> |
9 | #include <linux/spinlock.h> | 9 | #include <linux/spinlock.h> |
10 | 10 | ||
11 | #include "types.h" | 11 | #include <linux/ceph/types.h> |
12 | #include "messenger.h" | 12 | #include <linux/ceph/messenger.h> |
13 | #include "mdsmap.h" | 13 | #include <linux/ceph/mdsmap.h> |
14 | 14 | ||
15 | /* | 15 | /* |
16 | * Some lock dependencies: | 16 | * Some lock dependencies: |
@@ -26,7 +26,7 @@ | |||
26 | * | 26 | * |
27 | */ | 27 | */ |
28 | 28 | ||
29 | struct ceph_client; | 29 | struct ceph_fs_client; |
30 | struct ceph_cap; | 30 | struct ceph_cap; |
31 | 31 | ||
32 | /* | 32 | /* |
@@ -230,7 +230,7 @@ struct ceph_mds_request { | |||
230 | * mds client state | 230 | * mds client state |
231 | */ | 231 | */ |
232 | struct ceph_mds_client { | 232 | struct ceph_mds_client { |
233 | struct ceph_client *client; | 233 | struct ceph_fs_client *fsc; |
234 | struct mutex mutex; /* all nested structures */ | 234 | struct mutex mutex; /* all nested structures */ |
235 | 235 | ||
236 | struct ceph_mdsmap *mdsmap; | 236 | struct ceph_mdsmap *mdsmap; |
@@ -289,11 +289,6 @@ struct ceph_mds_client { | |||
289 | int caps_avail_count; /* unused, unreserved */ | 289 | int caps_avail_count; /* unused, unreserved */ |
290 | int caps_min_count; /* keep at least this many | 290 | int caps_min_count; /* keep at least this many |
291 | (unreserved) */ | 291 | (unreserved) */ |
292 | |||
293 | #ifdef CONFIG_DEBUG_FS | ||
294 | struct dentry *debugfs_file; | ||
295 | #endif | ||
296 | |||
297 | spinlock_t dentry_lru_lock; | 292 | spinlock_t dentry_lru_lock; |
298 | struct list_head dentry_lru; | 293 | struct list_head dentry_lru; |
299 | int num_dentry; | 294 | int num_dentry; |
@@ -316,10 +311,9 @@ extern void ceph_put_mds_session(struct ceph_mds_session *s); | |||
316 | extern int ceph_send_msg_mds(struct ceph_mds_client *mdsc, | 311 | extern int ceph_send_msg_mds(struct ceph_mds_client *mdsc, |
317 | struct ceph_msg *msg, int mds); | 312 | struct ceph_msg *msg, int mds); |
318 | 313 | ||
319 | extern int ceph_mdsc_init(struct ceph_mds_client *mdsc, | 314 | extern int ceph_mdsc_init(struct ceph_fs_client *fsc); |
320 | struct ceph_client *client); | ||
321 | extern void ceph_mdsc_close_sessions(struct ceph_mds_client *mdsc); | 315 | extern void ceph_mdsc_close_sessions(struct ceph_mds_client *mdsc); |
322 | extern void ceph_mdsc_stop(struct ceph_mds_client *mdsc); | 316 | extern void ceph_mdsc_destroy(struct ceph_fs_client *fsc); |
323 | 317 | ||
324 | extern void ceph_mdsc_sync(struct ceph_mds_client *mdsc); | 318 | extern void ceph_mdsc_sync(struct ceph_mds_client *mdsc); |
325 | 319 | ||
diff --git a/fs/ceph/mdsmap.c b/fs/ceph/mdsmap.c index 040be6d1150b..73b7d44e8a35 100644 --- a/fs/ceph/mdsmap.c +++ b/fs/ceph/mdsmap.c | |||
@@ -1,4 +1,4 @@ | |||
1 | #include "ceph_debug.h" | 1 | #include <linux/ceph/ceph_debug.h> |
2 | 2 | ||
3 | #include <linux/bug.h> | 3 | #include <linux/bug.h> |
4 | #include <linux/err.h> | 4 | #include <linux/err.h> |
@@ -6,9 +6,9 @@ | |||
6 | #include <linux/slab.h> | 6 | #include <linux/slab.h> |
7 | #include <linux/types.h> | 7 | #include <linux/types.h> |
8 | 8 | ||
9 | #include "mdsmap.h" | 9 | #include <linux/ceph/mdsmap.h> |
10 | #include "messenger.h" | 10 | #include <linux/ceph/messenger.h> |
11 | #include "decode.h" | 11 | #include <linux/ceph/decode.h> |
12 | 12 | ||
13 | #include "super.h" | 13 | #include "super.h" |
14 | 14 | ||
@@ -117,7 +117,8 @@ struct ceph_mdsmap *ceph_mdsmap_decode(void **p, void *end) | |||
117 | } | 117 | } |
118 | 118 | ||
119 | dout("mdsmap_decode %d/%d %lld mds%d.%d %s %s\n", | 119 | dout("mdsmap_decode %d/%d %lld mds%d.%d %s %s\n", |
120 | i+1, n, global_id, mds, inc, pr_addr(&addr.in_addr), | 120 | i+1, n, global_id, mds, inc, |
121 | ceph_pr_addr(&addr.in_addr), | ||
121 | ceph_mds_state_name(state)); | 122 | ceph_mds_state_name(state)); |
122 | if (mds >= 0 && mds < m->m_max_mds && state > 0) { | 123 | if (mds >= 0 && mds < m->m_max_mds && state > 0) { |
123 | m->m_info[mds].global_id = global_id; | 124 | m->m_info[mds].global_id = global_id; |
diff --git a/fs/ceph/snap.c b/fs/ceph/snap.c index 190b6c4a6f2b..39c243acd062 100644 --- a/fs/ceph/snap.c +++ b/fs/ceph/snap.c | |||
@@ -1,10 +1,12 @@ | |||
1 | #include "ceph_debug.h" | 1 | #include <linux/ceph/ceph_debug.h> |
2 | 2 | ||
3 | #include <linux/sort.h> | 3 | #include <linux/sort.h> |
4 | #include <linux/slab.h> | 4 | #include <linux/slab.h> |
5 | 5 | ||
6 | #include "super.h" | 6 | #include "super.h" |
7 | #include "decode.h" | 7 | #include "mds_client.h" |
8 | |||
9 | #include <linux/ceph/decode.h> | ||
8 | 10 | ||
9 | /* | 11 | /* |
10 | * Snapshots in ceph are driven in large part by cooperation from the | 12 | * Snapshots in ceph are driven in large part by cooperation from the |
@@ -526,7 +528,7 @@ int __ceph_finish_cap_snap(struct ceph_inode_info *ci, | |||
526 | struct ceph_cap_snap *capsnap) | 528 | struct ceph_cap_snap *capsnap) |
527 | { | 529 | { |
528 | struct inode *inode = &ci->vfs_inode; | 530 | struct inode *inode = &ci->vfs_inode; |
529 | struct ceph_mds_client *mdsc = &ceph_sb_to_client(inode->i_sb)->mdsc; | 531 | struct ceph_mds_client *mdsc = ceph_sb_to_client(inode->i_sb)->mdsc; |
530 | 532 | ||
531 | BUG_ON(capsnap->writing); | 533 | BUG_ON(capsnap->writing); |
532 | capsnap->size = inode->i_size; | 534 | capsnap->size = inode->i_size; |
@@ -747,7 +749,7 @@ void ceph_handle_snap(struct ceph_mds_client *mdsc, | |||
747 | struct ceph_mds_session *session, | 749 | struct ceph_mds_session *session, |
748 | struct ceph_msg *msg) | 750 | struct ceph_msg *msg) |
749 | { | 751 | { |
750 | struct super_block *sb = mdsc->client->sb; | 752 | struct super_block *sb = mdsc->fsc->sb; |
751 | int mds = session->s_mds; | 753 | int mds = session->s_mds; |
752 | u64 split; | 754 | u64 split; |
753 | int op; | 755 | int op; |
diff --git a/fs/ceph/ceph_strings.c b/fs/ceph/strings.c index c6179d3a26a2..cd5097d7c804 100644 --- a/fs/ceph/ceph_strings.c +++ b/fs/ceph/strings.c | |||
@@ -1,71 +1,9 @@ | |||
1 | /* | 1 | /* |
2 | * Ceph string constants | 2 | * Ceph fs string constants |
3 | */ | 3 | */ |
4 | #include "types.h" | 4 | #include <linux/module.h> |
5 | #include <linux/ceph/types.h> | ||
5 | 6 | ||
6 | const char *ceph_entity_type_name(int type) | ||
7 | { | ||
8 | switch (type) { | ||
9 | case CEPH_ENTITY_TYPE_MDS: return "mds"; | ||
10 | case CEPH_ENTITY_TYPE_OSD: return "osd"; | ||
11 | case CEPH_ENTITY_TYPE_MON: return "mon"; | ||
12 | case CEPH_ENTITY_TYPE_CLIENT: return "client"; | ||
13 | case CEPH_ENTITY_TYPE_AUTH: return "auth"; | ||
14 | default: return "unknown"; | ||
15 | } | ||
16 | } | ||
17 | |||
18 | const char *ceph_osd_op_name(int op) | ||
19 | { | ||
20 | switch (op) { | ||
21 | case CEPH_OSD_OP_READ: return "read"; | ||
22 | case CEPH_OSD_OP_STAT: return "stat"; | ||
23 | |||
24 | case CEPH_OSD_OP_MASKTRUNC: return "masktrunc"; | ||
25 | |||
26 | case CEPH_OSD_OP_WRITE: return "write"; | ||
27 | case CEPH_OSD_OP_DELETE: return "delete"; | ||
28 | case CEPH_OSD_OP_TRUNCATE: return "truncate"; | ||
29 | case CEPH_OSD_OP_ZERO: return "zero"; | ||
30 | case CEPH_OSD_OP_WRITEFULL: return "writefull"; | ||
31 | case CEPH_OSD_OP_ROLLBACK: return "rollback"; | ||
32 | |||
33 | case CEPH_OSD_OP_APPEND: return "append"; | ||
34 | case CEPH_OSD_OP_STARTSYNC: return "startsync"; | ||
35 | case CEPH_OSD_OP_SETTRUNC: return "settrunc"; | ||
36 | case CEPH_OSD_OP_TRIMTRUNC: return "trimtrunc"; | ||
37 | |||
38 | case CEPH_OSD_OP_TMAPUP: return "tmapup"; | ||
39 | case CEPH_OSD_OP_TMAPGET: return "tmapget"; | ||
40 | case CEPH_OSD_OP_TMAPPUT: return "tmapput"; | ||
41 | |||
42 | case CEPH_OSD_OP_GETXATTR: return "getxattr"; | ||
43 | case CEPH_OSD_OP_GETXATTRS: return "getxattrs"; | ||
44 | case CEPH_OSD_OP_SETXATTR: return "setxattr"; | ||
45 | case CEPH_OSD_OP_SETXATTRS: return "setxattrs"; | ||
46 | case CEPH_OSD_OP_RESETXATTRS: return "resetxattrs"; | ||
47 | case CEPH_OSD_OP_RMXATTR: return "rmxattr"; | ||
48 | case CEPH_OSD_OP_CMPXATTR: return "cmpxattr"; | ||
49 | |||
50 | case CEPH_OSD_OP_PULL: return "pull"; | ||
51 | case CEPH_OSD_OP_PUSH: return "push"; | ||
52 | case CEPH_OSD_OP_BALANCEREADS: return "balance-reads"; | ||
53 | case CEPH_OSD_OP_UNBALANCEREADS: return "unbalance-reads"; | ||
54 | case CEPH_OSD_OP_SCRUB: return "scrub"; | ||
55 | |||
56 | case CEPH_OSD_OP_WRLOCK: return "wrlock"; | ||
57 | case CEPH_OSD_OP_WRUNLOCK: return "wrunlock"; | ||
58 | case CEPH_OSD_OP_RDLOCK: return "rdlock"; | ||
59 | case CEPH_OSD_OP_RDUNLOCK: return "rdunlock"; | ||
60 | case CEPH_OSD_OP_UPLOCK: return "uplock"; | ||
61 | case CEPH_OSD_OP_DNLOCK: return "dnlock"; | ||
62 | |||
63 | case CEPH_OSD_OP_CALL: return "call"; | ||
64 | |||
65 | case CEPH_OSD_OP_PGLS: return "pgls"; | ||
66 | } | ||
67 | return "???"; | ||
68 | } | ||
69 | 7 | ||
70 | const char *ceph_mds_state_name(int s) | 8 | const char *ceph_mds_state_name(int s) |
71 | { | 9 | { |
@@ -177,17 +115,3 @@ const char *ceph_snap_op_name(int o) | |||
177 | } | 115 | } |
178 | return "???"; | 116 | return "???"; |
179 | } | 117 | } |
180 | |||
181 | const char *ceph_pool_op_name(int op) | ||
182 | { | ||
183 | switch (op) { | ||
184 | case POOL_OP_CREATE: return "create"; | ||
185 | case POOL_OP_DELETE: return "delete"; | ||
186 | case POOL_OP_AUID_CHANGE: return "auid change"; | ||
187 | case POOL_OP_CREATE_SNAP: return "create snap"; | ||
188 | case POOL_OP_DELETE_SNAP: return "delete snap"; | ||
189 | case POOL_OP_CREATE_UNMANAGED_SNAP: return "create unmanaged snap"; | ||
190 | case POOL_OP_DELETE_UNMANAGED_SNAP: return "delete unmanaged snap"; | ||
191 | } | ||
192 | return "???"; | ||
193 | } | ||
diff --git a/fs/ceph/super.c b/fs/ceph/super.c index 9922628532b2..d6e0e0421891 100644 --- a/fs/ceph/super.c +++ b/fs/ceph/super.c | |||
@@ -1,5 +1,5 @@ | |||
1 | 1 | ||
2 | #include "ceph_debug.h" | 2 | #include <linux/ceph/ceph_debug.h> |
3 | 3 | ||
4 | #include <linux/backing-dev.h> | 4 | #include <linux/backing-dev.h> |
5 | #include <linux/ctype.h> | 5 | #include <linux/ctype.h> |
@@ -15,10 +15,13 @@ | |||
15 | #include <linux/statfs.h> | 15 | #include <linux/statfs.h> |
16 | #include <linux/string.h> | 16 | #include <linux/string.h> |
17 | 17 | ||
18 | #include "decode.h" | ||
19 | #include "super.h" | 18 | #include "super.h" |
20 | #include "mon_client.h" | 19 | #include "mds_client.h" |
21 | #include "auth.h" | 20 | |
21 | #include <linux/ceph/decode.h> | ||
22 | #include <linux/ceph/mon_client.h> | ||
23 | #include <linux/ceph/auth.h> | ||
24 | #include <linux/ceph/debugfs.h> | ||
22 | 25 | ||
23 | /* | 26 | /* |
24 | * Ceph superblock operations | 27 | * Ceph superblock operations |
@@ -26,36 +29,22 @@ | |||
26 | * Handle the basics of mounting, unmounting. | 29 | * Handle the basics of mounting, unmounting. |
27 | */ | 30 | */ |
28 | 31 | ||
29 | |||
30 | /* | ||
31 | * find filename portion of a path (/foo/bar/baz -> baz) | ||
32 | */ | ||
33 | const char *ceph_file_part(const char *s, int len) | ||
34 | { | ||
35 | const char *e = s + len; | ||
36 | |||
37 | while (e != s && *(e-1) != '/') | ||
38 | e--; | ||
39 | return e; | ||
40 | } | ||
41 | |||
42 | |||
43 | /* | 32 | /* |
44 | * super ops | 33 | * super ops |
45 | */ | 34 | */ |
46 | static void ceph_put_super(struct super_block *s) | 35 | static void ceph_put_super(struct super_block *s) |
47 | { | 36 | { |
48 | struct ceph_client *client = ceph_sb_to_client(s); | 37 | struct ceph_fs_client *fsc = ceph_sb_to_client(s); |
49 | 38 | ||
50 | dout("put_super\n"); | 39 | dout("put_super\n"); |
51 | ceph_mdsc_close_sessions(&client->mdsc); | 40 | ceph_mdsc_close_sessions(fsc->mdsc); |
52 | 41 | ||
53 | /* | 42 | /* |
54 | * ensure we release the bdi before put_anon_super releases | 43 | * ensure we release the bdi before put_anon_super releases |
55 | * the device name. | 44 | * the device name. |
56 | */ | 45 | */ |
57 | if (s->s_bdi == &client->backing_dev_info) { | 46 | if (s->s_bdi == &fsc->backing_dev_info) { |
58 | bdi_unregister(&client->backing_dev_info); | 47 | bdi_unregister(&fsc->backing_dev_info); |
59 | s->s_bdi = NULL; | 48 | s->s_bdi = NULL; |
60 | } | 49 | } |
61 | 50 | ||
@@ -64,14 +53,14 @@ static void ceph_put_super(struct super_block *s) | |||
64 | 53 | ||
65 | static int ceph_statfs(struct dentry *dentry, struct kstatfs *buf) | 54 | static int ceph_statfs(struct dentry *dentry, struct kstatfs *buf) |
66 | { | 55 | { |
67 | struct ceph_client *client = ceph_inode_to_client(dentry->d_inode); | 56 | struct ceph_fs_client *fsc = ceph_inode_to_client(dentry->d_inode); |
68 | struct ceph_monmap *monmap = client->monc.monmap; | 57 | struct ceph_monmap *monmap = fsc->client->monc.monmap; |
69 | struct ceph_statfs st; | 58 | struct ceph_statfs st; |
70 | u64 fsid; | 59 | u64 fsid; |
71 | int err; | 60 | int err; |
72 | 61 | ||
73 | dout("statfs\n"); | 62 | dout("statfs\n"); |
74 | err = ceph_monc_do_statfs(&client->monc, &st); | 63 | err = ceph_monc_do_statfs(&fsc->client->monc, &st); |
75 | if (err < 0) | 64 | if (err < 0) |
76 | return err; | 65 | return err; |
77 | 66 | ||
@@ -104,238 +93,28 @@ static int ceph_statfs(struct dentry *dentry, struct kstatfs *buf) | |||
104 | 93 | ||
105 | static int ceph_sync_fs(struct super_block *sb, int wait) | 94 | static int ceph_sync_fs(struct super_block *sb, int wait) |
106 | { | 95 | { |
107 | struct ceph_client *client = ceph_sb_to_client(sb); | 96 | struct ceph_fs_client *fsc = ceph_sb_to_client(sb); |
108 | 97 | ||
109 | if (!wait) { | 98 | if (!wait) { |
110 | dout("sync_fs (non-blocking)\n"); | 99 | dout("sync_fs (non-blocking)\n"); |
111 | ceph_flush_dirty_caps(&client->mdsc); | 100 | ceph_flush_dirty_caps(fsc->mdsc); |
112 | dout("sync_fs (non-blocking) done\n"); | 101 | dout("sync_fs (non-blocking) done\n"); |
113 | return 0; | 102 | return 0; |
114 | } | 103 | } |
115 | 104 | ||
116 | dout("sync_fs (blocking)\n"); | 105 | dout("sync_fs (blocking)\n"); |
117 | ceph_osdc_sync(&ceph_sb_to_client(sb)->osdc); | 106 | ceph_osdc_sync(&fsc->client->osdc); |
118 | ceph_mdsc_sync(&ceph_sb_to_client(sb)->mdsc); | 107 | ceph_mdsc_sync(fsc->mdsc); |
119 | dout("sync_fs (blocking) done\n"); | 108 | dout("sync_fs (blocking) done\n"); |
120 | return 0; | 109 | return 0; |
121 | } | 110 | } |
122 | 111 | ||
123 | static int default_congestion_kb(void) | ||
124 | { | ||
125 | int congestion_kb; | ||
126 | |||
127 | /* | ||
128 | * Copied from NFS | ||
129 | * | ||
130 | * congestion size, scale with available memory. | ||
131 | * | ||
132 | * 64MB: 8192k | ||
133 | * 128MB: 11585k | ||
134 | * 256MB: 16384k | ||
135 | * 512MB: 23170k | ||
136 | * 1GB: 32768k | ||
137 | * 2GB: 46340k | ||
138 | * 4GB: 65536k | ||
139 | * 8GB: 92681k | ||
140 | * 16GB: 131072k | ||
141 | * | ||
142 | * This allows larger machines to have larger/more transfers. | ||
143 | * Limit the default to 256M | ||
144 | */ | ||
145 | congestion_kb = (16*int_sqrt(totalram_pages)) << (PAGE_SHIFT-10); | ||
146 | if (congestion_kb > 256*1024) | ||
147 | congestion_kb = 256*1024; | ||
148 | |||
149 | return congestion_kb; | ||
150 | } | ||
151 | |||
152 | /** | ||
153 | * ceph_show_options - Show mount options in /proc/mounts | ||
154 | * @m: seq_file to write to | ||
155 | * @mnt: mount descriptor | ||
156 | */ | ||
157 | static int ceph_show_options(struct seq_file *m, struct vfsmount *mnt) | ||
158 | { | ||
159 | struct ceph_client *client = ceph_sb_to_client(mnt->mnt_sb); | ||
160 | struct ceph_mount_args *args = client->mount_args; | ||
161 | |||
162 | if (args->flags & CEPH_OPT_FSID) | ||
163 | seq_printf(m, ",fsid=%pU", &args->fsid); | ||
164 | if (args->flags & CEPH_OPT_NOSHARE) | ||
165 | seq_puts(m, ",noshare"); | ||
166 | if (args->flags & CEPH_OPT_DIRSTAT) | ||
167 | seq_puts(m, ",dirstat"); | ||
168 | if ((args->flags & CEPH_OPT_RBYTES) == 0) | ||
169 | seq_puts(m, ",norbytes"); | ||
170 | if (args->flags & CEPH_OPT_NOCRC) | ||
171 | seq_puts(m, ",nocrc"); | ||
172 | if (args->flags & CEPH_OPT_NOASYNCREADDIR) | ||
173 | seq_puts(m, ",noasyncreaddir"); | ||
174 | |||
175 | if (args->mount_timeout != CEPH_MOUNT_TIMEOUT_DEFAULT) | ||
176 | seq_printf(m, ",mount_timeout=%d", args->mount_timeout); | ||
177 | if (args->osd_idle_ttl != CEPH_OSD_IDLE_TTL_DEFAULT) | ||
178 | seq_printf(m, ",osd_idle_ttl=%d", args->osd_idle_ttl); | ||
179 | if (args->osd_timeout != CEPH_OSD_TIMEOUT_DEFAULT) | ||
180 | seq_printf(m, ",osdtimeout=%d", args->osd_timeout); | ||
181 | if (args->osd_keepalive_timeout != CEPH_OSD_KEEPALIVE_DEFAULT) | ||
182 | seq_printf(m, ",osdkeepalivetimeout=%d", | ||
183 | args->osd_keepalive_timeout); | ||
184 | if (args->wsize) | ||
185 | seq_printf(m, ",wsize=%d", args->wsize); | ||
186 | if (args->rsize != CEPH_MOUNT_RSIZE_DEFAULT) | ||
187 | seq_printf(m, ",rsize=%d", args->rsize); | ||
188 | if (args->congestion_kb != default_congestion_kb()) | ||
189 | seq_printf(m, ",write_congestion_kb=%d", args->congestion_kb); | ||
190 | if (args->caps_wanted_delay_min != CEPH_CAPS_WANTED_DELAY_MIN_DEFAULT) | ||
191 | seq_printf(m, ",caps_wanted_delay_min=%d", | ||
192 | args->caps_wanted_delay_min); | ||
193 | if (args->caps_wanted_delay_max != CEPH_CAPS_WANTED_DELAY_MAX_DEFAULT) | ||
194 | seq_printf(m, ",caps_wanted_delay_max=%d", | ||
195 | args->caps_wanted_delay_max); | ||
196 | if (args->cap_release_safety != CEPH_CAP_RELEASE_SAFETY_DEFAULT) | ||
197 | seq_printf(m, ",cap_release_safety=%d", | ||
198 | args->cap_release_safety); | ||
199 | if (args->max_readdir != CEPH_MAX_READDIR_DEFAULT) | ||
200 | seq_printf(m, ",readdir_max_entries=%d", args->max_readdir); | ||
201 | if (args->max_readdir_bytes != CEPH_MAX_READDIR_BYTES_DEFAULT) | ||
202 | seq_printf(m, ",readdir_max_bytes=%d", args->max_readdir_bytes); | ||
203 | if (strcmp(args->snapdir_name, CEPH_SNAPDIRNAME_DEFAULT)) | ||
204 | seq_printf(m, ",snapdirname=%s", args->snapdir_name); | ||
205 | if (args->name) | ||
206 | seq_printf(m, ",name=%s", args->name); | ||
207 | if (args->secret) | ||
208 | seq_puts(m, ",secret=<hidden>"); | ||
209 | return 0; | ||
210 | } | ||
211 | |||
212 | /* | ||
213 | * caches | ||
214 | */ | ||
215 | struct kmem_cache *ceph_inode_cachep; | ||
216 | struct kmem_cache *ceph_cap_cachep; | ||
217 | struct kmem_cache *ceph_dentry_cachep; | ||
218 | struct kmem_cache *ceph_file_cachep; | ||
219 | |||
220 | static void ceph_inode_init_once(void *foo) | ||
221 | { | ||
222 | struct ceph_inode_info *ci = foo; | ||
223 | inode_init_once(&ci->vfs_inode); | ||
224 | } | ||
225 | |||
226 | static int __init init_caches(void) | ||
227 | { | ||
228 | ceph_inode_cachep = kmem_cache_create("ceph_inode_info", | ||
229 | sizeof(struct ceph_inode_info), | ||
230 | __alignof__(struct ceph_inode_info), | ||
231 | (SLAB_RECLAIM_ACCOUNT|SLAB_MEM_SPREAD), | ||
232 | ceph_inode_init_once); | ||
233 | if (ceph_inode_cachep == NULL) | ||
234 | return -ENOMEM; | ||
235 | |||
236 | ceph_cap_cachep = KMEM_CACHE(ceph_cap, | ||
237 | SLAB_RECLAIM_ACCOUNT|SLAB_MEM_SPREAD); | ||
238 | if (ceph_cap_cachep == NULL) | ||
239 | goto bad_cap; | ||
240 | |||
241 | ceph_dentry_cachep = KMEM_CACHE(ceph_dentry_info, | ||
242 | SLAB_RECLAIM_ACCOUNT|SLAB_MEM_SPREAD); | ||
243 | if (ceph_dentry_cachep == NULL) | ||
244 | goto bad_dentry; | ||
245 | |||
246 | ceph_file_cachep = KMEM_CACHE(ceph_file_info, | ||
247 | SLAB_RECLAIM_ACCOUNT|SLAB_MEM_SPREAD); | ||
248 | if (ceph_file_cachep == NULL) | ||
249 | goto bad_file; | ||
250 | |||
251 | return 0; | ||
252 | |||
253 | bad_file: | ||
254 | kmem_cache_destroy(ceph_dentry_cachep); | ||
255 | bad_dentry: | ||
256 | kmem_cache_destroy(ceph_cap_cachep); | ||
257 | bad_cap: | ||
258 | kmem_cache_destroy(ceph_inode_cachep); | ||
259 | return -ENOMEM; | ||
260 | } | ||
261 | |||
262 | static void destroy_caches(void) | ||
263 | { | ||
264 | kmem_cache_destroy(ceph_inode_cachep); | ||
265 | kmem_cache_destroy(ceph_cap_cachep); | ||
266 | kmem_cache_destroy(ceph_dentry_cachep); | ||
267 | kmem_cache_destroy(ceph_file_cachep); | ||
268 | } | ||
269 | |||
270 | |||
271 | /* | ||
272 | * ceph_umount_begin - initiate forced umount. Tear down down the | ||
273 | * mount, skipping steps that may hang while waiting for server(s). | ||
274 | */ | ||
275 | static void ceph_umount_begin(struct super_block *sb) | ||
276 | { | ||
277 | struct ceph_client *client = ceph_sb_to_client(sb); | ||
278 | |||
279 | dout("ceph_umount_begin - starting forced umount\n"); | ||
280 | if (!client) | ||
281 | return; | ||
282 | client->mount_state = CEPH_MOUNT_SHUTDOWN; | ||
283 | return; | ||
284 | } | ||
285 | |||
286 | static const struct super_operations ceph_super_ops = { | ||
287 | .alloc_inode = ceph_alloc_inode, | ||
288 | .destroy_inode = ceph_destroy_inode, | ||
289 | .write_inode = ceph_write_inode, | ||
290 | .sync_fs = ceph_sync_fs, | ||
291 | .put_super = ceph_put_super, | ||
292 | .show_options = ceph_show_options, | ||
293 | .statfs = ceph_statfs, | ||
294 | .umount_begin = ceph_umount_begin, | ||
295 | }; | ||
296 | |||
297 | |||
298 | const char *ceph_msg_type_name(int type) | ||
299 | { | ||
300 | switch (type) { | ||
301 | case CEPH_MSG_SHUTDOWN: return "shutdown"; | ||
302 | case CEPH_MSG_PING: return "ping"; | ||
303 | case CEPH_MSG_AUTH: return "auth"; | ||
304 | case CEPH_MSG_AUTH_REPLY: return "auth_reply"; | ||
305 | case CEPH_MSG_MON_MAP: return "mon_map"; | ||
306 | case CEPH_MSG_MON_GET_MAP: return "mon_get_map"; | ||
307 | case CEPH_MSG_MON_SUBSCRIBE: return "mon_subscribe"; | ||
308 | case CEPH_MSG_MON_SUBSCRIBE_ACK: return "mon_subscribe_ack"; | ||
309 | case CEPH_MSG_STATFS: return "statfs"; | ||
310 | case CEPH_MSG_STATFS_REPLY: return "statfs_reply"; | ||
311 | case CEPH_MSG_MDS_MAP: return "mds_map"; | ||
312 | case CEPH_MSG_CLIENT_SESSION: return "client_session"; | ||
313 | case CEPH_MSG_CLIENT_RECONNECT: return "client_reconnect"; | ||
314 | case CEPH_MSG_CLIENT_REQUEST: return "client_request"; | ||
315 | case CEPH_MSG_CLIENT_REQUEST_FORWARD: return "client_request_forward"; | ||
316 | case CEPH_MSG_CLIENT_REPLY: return "client_reply"; | ||
317 | case CEPH_MSG_CLIENT_CAPS: return "client_caps"; | ||
318 | case CEPH_MSG_CLIENT_CAPRELEASE: return "client_cap_release"; | ||
319 | case CEPH_MSG_CLIENT_SNAP: return "client_snap"; | ||
320 | case CEPH_MSG_CLIENT_LEASE: return "client_lease"; | ||
321 | case CEPH_MSG_OSD_MAP: return "osd_map"; | ||
322 | case CEPH_MSG_OSD_OP: return "osd_op"; | ||
323 | case CEPH_MSG_OSD_OPREPLY: return "osd_opreply"; | ||
324 | default: return "unknown"; | ||
325 | } | ||
326 | } | ||
327 | |||
328 | |||
329 | /* | 112 | /* |
330 | * mount options | 113 | * mount options |
331 | */ | 114 | */ |
332 | enum { | 115 | enum { |
333 | Opt_wsize, | 116 | Opt_wsize, |
334 | Opt_rsize, | 117 | Opt_rsize, |
335 | Opt_osdtimeout, | ||
336 | Opt_osdkeepalivetimeout, | ||
337 | Opt_mount_timeout, | ||
338 | Opt_osd_idle_ttl, | ||
339 | Opt_caps_wanted_delay_min, | 118 | Opt_caps_wanted_delay_min, |
340 | Opt_caps_wanted_delay_max, | 119 | Opt_caps_wanted_delay_max, |
341 | Opt_cap_release_safety, | 120 | Opt_cap_release_safety, |
@@ -344,29 +123,19 @@ enum { | |||
344 | Opt_congestion_kb, | 123 | Opt_congestion_kb, |
345 | Opt_last_int, | 124 | Opt_last_int, |
346 | /* int args above */ | 125 | /* int args above */ |
347 | Opt_fsid, | ||
348 | Opt_snapdirname, | 126 | Opt_snapdirname, |
349 | Opt_name, | ||
350 | Opt_secret, | ||
351 | Opt_last_string, | 127 | Opt_last_string, |
352 | /* string args above */ | 128 | /* string args above */ |
353 | Opt_ip, | ||
354 | Opt_noshare, | ||
355 | Opt_dirstat, | 129 | Opt_dirstat, |
356 | Opt_nodirstat, | 130 | Opt_nodirstat, |
357 | Opt_rbytes, | 131 | Opt_rbytes, |
358 | Opt_norbytes, | 132 | Opt_norbytes, |
359 | Opt_nocrc, | ||
360 | Opt_noasyncreaddir, | 133 | Opt_noasyncreaddir, |
361 | }; | 134 | }; |
362 | 135 | ||
363 | static match_table_t arg_tokens = { | 136 | static match_table_t fsopt_tokens = { |
364 | {Opt_wsize, "wsize=%d"}, | 137 | {Opt_wsize, "wsize=%d"}, |
365 | {Opt_rsize, "rsize=%d"}, | 138 | {Opt_rsize, "rsize=%d"}, |
366 | {Opt_osdtimeout, "osdtimeout=%d"}, | ||
367 | {Opt_osdkeepalivetimeout, "osdkeepalive=%d"}, | ||
368 | {Opt_mount_timeout, "mount_timeout=%d"}, | ||
369 | {Opt_osd_idle_ttl, "osd_idle_ttl=%d"}, | ||
370 | {Opt_caps_wanted_delay_min, "caps_wanted_delay_min=%d"}, | 139 | {Opt_caps_wanted_delay_min, "caps_wanted_delay_min=%d"}, |
371 | {Opt_caps_wanted_delay_max, "caps_wanted_delay_max=%d"}, | 140 | {Opt_caps_wanted_delay_max, "caps_wanted_delay_max=%d"}, |
372 | {Opt_cap_release_safety, "cap_release_safety=%d"}, | 141 | {Opt_cap_release_safety, "cap_release_safety=%d"}, |
@@ -374,403 +143,459 @@ static match_table_t arg_tokens = { | |||
374 | {Opt_readdir_max_bytes, "readdir_max_bytes=%d"}, | 143 | {Opt_readdir_max_bytes, "readdir_max_bytes=%d"}, |
375 | {Opt_congestion_kb, "write_congestion_kb=%d"}, | 144 | {Opt_congestion_kb, "write_congestion_kb=%d"}, |
376 | /* int args above */ | 145 | /* int args above */ |
377 | {Opt_fsid, "fsid=%s"}, | ||
378 | {Opt_snapdirname, "snapdirname=%s"}, | 146 | {Opt_snapdirname, "snapdirname=%s"}, |
379 | {Opt_name, "name=%s"}, | ||
380 | {Opt_secret, "secret=%s"}, | ||
381 | /* string args above */ | 147 | /* string args above */ |
382 | {Opt_ip, "ip=%s"}, | ||
383 | {Opt_noshare, "noshare"}, | ||
384 | {Opt_dirstat, "dirstat"}, | 148 | {Opt_dirstat, "dirstat"}, |
385 | {Opt_nodirstat, "nodirstat"}, | 149 | {Opt_nodirstat, "nodirstat"}, |
386 | {Opt_rbytes, "rbytes"}, | 150 | {Opt_rbytes, "rbytes"}, |
387 | {Opt_norbytes, "norbytes"}, | 151 | {Opt_norbytes, "norbytes"}, |
388 | {Opt_nocrc, "nocrc"}, | ||
389 | {Opt_noasyncreaddir, "noasyncreaddir"}, | 152 | {Opt_noasyncreaddir, "noasyncreaddir"}, |
390 | {-1, NULL} | 153 | {-1, NULL} |
391 | }; | 154 | }; |
392 | 155 | ||
393 | static int parse_fsid(const char *str, struct ceph_fsid *fsid) | 156 | static int parse_fsopt_token(char *c, void *private) |
394 | { | 157 | { |
395 | int i = 0; | 158 | struct ceph_mount_options *fsopt = private; |
396 | char tmp[3]; | 159 | substring_t argstr[MAX_OPT_ARGS]; |
397 | int err = -EINVAL; | 160 | int token, intval, ret; |
398 | int d; | 161 | |
399 | 162 | token = match_token((char *)c, fsopt_tokens, argstr); | |
400 | dout("parse_fsid '%s'\n", str); | 163 | if (token < 0) |
401 | tmp[2] = 0; | 164 | return -EINVAL; |
402 | while (*str && i < 16) { | 165 | |
403 | if (ispunct(*str)) { | 166 | if (token < Opt_last_int) { |
404 | str++; | 167 | ret = match_int(&argstr[0], &intval); |
405 | continue; | 168 | if (ret < 0) { |
169 | pr_err("bad mount option arg (not int) " | ||
170 | "at '%s'\n", c); | ||
171 | return ret; | ||
406 | } | 172 | } |
407 | if (!isxdigit(str[0]) || !isxdigit(str[1])) | 173 | dout("got int token %d val %d\n", token, intval); |
408 | break; | 174 | } else if (token > Opt_last_int && token < Opt_last_string) { |
409 | tmp[0] = str[0]; | 175 | dout("got string token %d val %s\n", token, |
410 | tmp[1] = str[1]; | 176 | argstr[0].from); |
411 | if (sscanf(tmp, "%x", &d) < 1) | 177 | } else { |
412 | break; | 178 | dout("got token %d\n", token); |
413 | fsid->fsid[i] = d & 0xff; | ||
414 | i++; | ||
415 | str += 2; | ||
416 | } | 179 | } |
417 | 180 | ||
418 | if (i == 16) | 181 | switch (token) { |
419 | err = 0; | 182 | case Opt_snapdirname: |
420 | dout("parse_fsid ret %d got fsid %pU", err, fsid); | 183 | kfree(fsopt->snapdir_name); |
421 | return err; | 184 | fsopt->snapdir_name = kstrndup(argstr[0].from, |
185 | argstr[0].to-argstr[0].from, | ||
186 | GFP_KERNEL); | ||
187 | if (!fsopt->snapdir_name) | ||
188 | return -ENOMEM; | ||
189 | break; | ||
190 | |||
191 | /* misc */ | ||
192 | case Opt_wsize: | ||
193 | fsopt->wsize = intval; | ||
194 | break; | ||
195 | case Opt_rsize: | ||
196 | fsopt->rsize = intval; | ||
197 | break; | ||
198 | case Opt_caps_wanted_delay_min: | ||
199 | fsopt->caps_wanted_delay_min = intval; | ||
200 | break; | ||
201 | case Opt_caps_wanted_delay_max: | ||
202 | fsopt->caps_wanted_delay_max = intval; | ||
203 | break; | ||
204 | case Opt_readdir_max_entries: | ||
205 | fsopt->max_readdir = intval; | ||
206 | break; | ||
207 | case Opt_readdir_max_bytes: | ||
208 | fsopt->max_readdir_bytes = intval; | ||
209 | break; | ||
210 | case Opt_congestion_kb: | ||
211 | fsopt->congestion_kb = intval; | ||
212 | break; | ||
213 | case Opt_dirstat: | ||
214 | fsopt->flags |= CEPH_MOUNT_OPT_DIRSTAT; | ||
215 | break; | ||
216 | case Opt_nodirstat: | ||
217 | fsopt->flags &= ~CEPH_MOUNT_OPT_DIRSTAT; | ||
218 | break; | ||
219 | case Opt_rbytes: | ||
220 | fsopt->flags |= CEPH_MOUNT_OPT_RBYTES; | ||
221 | break; | ||
222 | case Opt_norbytes: | ||
223 | fsopt->flags &= ~CEPH_MOUNT_OPT_RBYTES; | ||
224 | break; | ||
225 | case Opt_noasyncreaddir: | ||
226 | fsopt->flags |= CEPH_MOUNT_OPT_NOASYNCREADDIR; | ||
227 | break; | ||
228 | default: | ||
229 | BUG_ON(token); | ||
230 | } | ||
231 | return 0; | ||
422 | } | 232 | } |
423 | 233 | ||
424 | static struct ceph_mount_args *parse_mount_args(int flags, char *options, | 234 | static void destroy_mount_options(struct ceph_mount_options *args) |
425 | const char *dev_name, | ||
426 | const char **path) | ||
427 | { | 235 | { |
428 | struct ceph_mount_args *args; | 236 | dout("destroy_mount_options %p\n", args); |
429 | const char *c; | 237 | kfree(args->snapdir_name); |
430 | int err = -ENOMEM; | 238 | kfree(args); |
431 | substring_t argstr[MAX_OPT_ARGS]; | 239 | } |
432 | 240 | ||
433 | args = kzalloc(sizeof(*args), GFP_KERNEL); | 241 | static int strcmp_null(const char *s1, const char *s2) |
434 | if (!args) | 242 | { |
435 | return ERR_PTR(-ENOMEM); | 243 | if (!s1 && !s2) |
436 | args->mon_addr = kcalloc(CEPH_MAX_MON, sizeof(*args->mon_addr), | 244 | return 0; |
437 | GFP_KERNEL); | 245 | if (s1 && !s2) |
438 | if (!args->mon_addr) | 246 | return -1; |
439 | goto out; | 247 | if (!s1 && s2) |
248 | return 1; | ||
249 | return strcmp(s1, s2); | ||
250 | } | ||
440 | 251 | ||
441 | dout("parse_mount_args %p, dev_name '%s'\n", args, dev_name); | 252 | static int compare_mount_options(struct ceph_mount_options *new_fsopt, |
442 | 253 | struct ceph_options *new_opt, | |
443 | /* start with defaults */ | 254 | struct ceph_fs_client *fsc) |
444 | args->sb_flags = flags; | 255 | { |
445 | args->flags = CEPH_OPT_DEFAULT; | 256 | struct ceph_mount_options *fsopt1 = new_fsopt; |
446 | args->osd_timeout = CEPH_OSD_TIMEOUT_DEFAULT; | 257 | struct ceph_mount_options *fsopt2 = fsc->mount_options; |
447 | args->osd_keepalive_timeout = CEPH_OSD_KEEPALIVE_DEFAULT; | 258 | int ofs = offsetof(struct ceph_mount_options, snapdir_name); |
448 | args->mount_timeout = CEPH_MOUNT_TIMEOUT_DEFAULT; /* seconds */ | 259 | int ret; |
449 | args->osd_idle_ttl = CEPH_OSD_IDLE_TTL_DEFAULT; /* seconds */ | ||
450 | args->caps_wanted_delay_min = CEPH_CAPS_WANTED_DELAY_MIN_DEFAULT; | ||
451 | args->caps_wanted_delay_max = CEPH_CAPS_WANTED_DELAY_MAX_DEFAULT; | ||
452 | args->rsize = CEPH_MOUNT_RSIZE_DEFAULT; | ||
453 | args->snapdir_name = kstrdup(CEPH_SNAPDIRNAME_DEFAULT, GFP_KERNEL); | ||
454 | args->cap_release_safety = CEPH_CAP_RELEASE_SAFETY_DEFAULT; | ||
455 | args->max_readdir = CEPH_MAX_READDIR_DEFAULT; | ||
456 | args->max_readdir_bytes = CEPH_MAX_READDIR_BYTES_DEFAULT; | ||
457 | args->congestion_kb = default_congestion_kb(); | ||
458 | |||
459 | /* ip1[:port1][,ip2[:port2]...]:/subdir/in/fs */ | ||
460 | err = -EINVAL; | ||
461 | if (!dev_name) | ||
462 | goto out; | ||
463 | *path = strstr(dev_name, ":/"); | ||
464 | if (*path == NULL) { | ||
465 | pr_err("device name is missing path (no :/ in %s)\n", | ||
466 | dev_name); | ||
467 | goto out; | ||
468 | } | ||
469 | 260 | ||
470 | /* get mon ip(s) */ | 261 | ret = memcmp(fsopt1, fsopt2, ofs); |
471 | err = ceph_parse_ips(dev_name, *path, args->mon_addr, | 262 | if (ret) |
472 | CEPH_MAX_MON, &args->num_mon); | 263 | return ret; |
473 | if (err < 0) | 264 | |
474 | goto out; | 265 | ret = strcmp_null(fsopt1->snapdir_name, fsopt2->snapdir_name); |
266 | if (ret) | ||
267 | return ret; | ||
268 | |||
269 | return ceph_compare_options(new_opt, fsc->client); | ||
270 | } | ||
271 | |||
272 | static int parse_mount_options(struct ceph_mount_options **pfsopt, | ||
273 | struct ceph_options **popt, | ||
274 | int flags, char *options, | ||
275 | const char *dev_name, | ||
276 | const char **path) | ||
277 | { | ||
278 | struct ceph_mount_options *fsopt; | ||
279 | const char *dev_name_end; | ||
280 | int err = -ENOMEM; | ||
281 | |||
282 | fsopt = kzalloc(sizeof(*fsopt), GFP_KERNEL); | ||
283 | if (!fsopt) | ||
284 | return -ENOMEM; | ||
285 | |||
286 | dout("parse_mount_options %p, dev_name '%s'\n", fsopt, dev_name); | ||
287 | |||
288 | fsopt->sb_flags = flags; | ||
289 | fsopt->flags = CEPH_MOUNT_OPT_DEFAULT; | ||
290 | |||
291 | fsopt->rsize = CEPH_MOUNT_RSIZE_DEFAULT; | ||
292 | fsopt->snapdir_name = kstrdup(CEPH_SNAPDIRNAME_DEFAULT, GFP_KERNEL); | ||
293 | fsopt->cap_release_safety = CEPH_CAP_RELEASE_SAFETY_DEFAULT; | ||
294 | fsopt->max_readdir = CEPH_MAX_READDIR_DEFAULT; | ||
295 | fsopt->max_readdir_bytes = CEPH_MAX_READDIR_BYTES_DEFAULT; | ||
296 | fsopt->congestion_kb = default_congestion_kb(); | ||
297 | |||
298 | /* ip1[:port1][,ip2[:port2]...]:/subdir/in/fs */ | ||
299 | err = -EINVAL; | ||
300 | if (!dev_name) | ||
301 | goto out; | ||
302 | *path = strstr(dev_name, ":/"); | ||
303 | if (*path == NULL) { | ||
304 | pr_err("device name is missing path (no :/ in %s)\n", | ||
305 | dev_name); | ||
306 | goto out; | ||
307 | } | ||
308 | dev_name_end = *path; | ||
309 | dout("device name '%.*s'\n", (int)(dev_name_end - dev_name), dev_name); | ||
475 | 310 | ||
476 | /* path on server */ | 311 | /* path on server */ |
477 | *path += 2; | 312 | *path += 2; |
478 | dout("server path '%s'\n", *path); | 313 | dout("server path '%s'\n", *path); |
479 | 314 | ||
480 | /* parse mount options */ | 315 | err = ceph_parse_options(popt, options, dev_name, dev_name_end, |
481 | while ((c = strsep(&options, ",")) != NULL) { | 316 | parse_fsopt_token, (void *)fsopt); |
482 | int token, intval, ret; | 317 | if (err) |
483 | if (!*c) | 318 | goto out; |
484 | continue; | 319 | |
485 | err = -EINVAL; | 320 | /* success */ |
486 | token = match_token((char *)c, arg_tokens, argstr); | 321 | *pfsopt = fsopt; |
487 | if (token < 0) { | 322 | return 0; |
488 | pr_err("bad mount option at '%s'\n", c); | ||
489 | goto out; | ||
490 | } | ||
491 | if (token < Opt_last_int) { | ||
492 | ret = match_int(&argstr[0], &intval); | ||
493 | if (ret < 0) { | ||
494 | pr_err("bad mount option arg (not int) " | ||
495 | "at '%s'\n", c); | ||
496 | continue; | ||
497 | } | ||
498 | dout("got int token %d val %d\n", token, intval); | ||
499 | } else if (token > Opt_last_int && token < Opt_last_string) { | ||
500 | dout("got string token %d val %s\n", token, | ||
501 | argstr[0].from); | ||
502 | } else { | ||
503 | dout("got token %d\n", token); | ||
504 | } | ||
505 | switch (token) { | ||
506 | case Opt_ip: | ||
507 | err = ceph_parse_ips(argstr[0].from, | ||
508 | argstr[0].to, | ||
509 | &args->my_addr, | ||
510 | 1, NULL); | ||
511 | if (err < 0) | ||
512 | goto out; | ||
513 | args->flags |= CEPH_OPT_MYIP; | ||
514 | break; | ||
515 | |||
516 | case Opt_fsid: | ||
517 | err = parse_fsid(argstr[0].from, &args->fsid); | ||
518 | if (err == 0) | ||
519 | args->flags |= CEPH_OPT_FSID; | ||
520 | break; | ||
521 | case Opt_snapdirname: | ||
522 | kfree(args->snapdir_name); | ||
523 | args->snapdir_name = kstrndup(argstr[0].from, | ||
524 | argstr[0].to-argstr[0].from, | ||
525 | GFP_KERNEL); | ||
526 | break; | ||
527 | case Opt_name: | ||
528 | args->name = kstrndup(argstr[0].from, | ||
529 | argstr[0].to-argstr[0].from, | ||
530 | GFP_KERNEL); | ||
531 | break; | ||
532 | case Opt_secret: | ||
533 | args->secret = kstrndup(argstr[0].from, | ||
534 | argstr[0].to-argstr[0].from, | ||
535 | GFP_KERNEL); | ||
536 | break; | ||
537 | |||
538 | /* misc */ | ||
539 | case Opt_wsize: | ||
540 | args->wsize = intval; | ||
541 | break; | ||
542 | case Opt_rsize: | ||
543 | args->rsize = intval; | ||
544 | break; | ||
545 | case Opt_osdtimeout: | ||
546 | args->osd_timeout = intval; | ||
547 | break; | ||
548 | case Opt_osdkeepalivetimeout: | ||
549 | args->osd_keepalive_timeout = intval; | ||
550 | break; | ||
551 | case Opt_osd_idle_ttl: | ||
552 | args->osd_idle_ttl = intval; | ||
553 | break; | ||
554 | case Opt_mount_timeout: | ||
555 | args->mount_timeout = intval; | ||
556 | break; | ||
557 | case Opt_caps_wanted_delay_min: | ||
558 | args->caps_wanted_delay_min = intval; | ||
559 | break; | ||
560 | case Opt_caps_wanted_delay_max: | ||
561 | args->caps_wanted_delay_max = intval; | ||
562 | break; | ||
563 | case Opt_readdir_max_entries: | ||
564 | args->max_readdir = intval; | ||
565 | break; | ||
566 | case Opt_readdir_max_bytes: | ||
567 | args->max_readdir_bytes = intval; | ||
568 | break; | ||
569 | case Opt_congestion_kb: | ||
570 | args->congestion_kb = intval; | ||
571 | break; | ||
572 | |||
573 | case Opt_noshare: | ||
574 | args->flags |= CEPH_OPT_NOSHARE; | ||
575 | break; | ||
576 | |||
577 | case Opt_dirstat: | ||
578 | args->flags |= CEPH_OPT_DIRSTAT; | ||
579 | break; | ||
580 | case Opt_nodirstat: | ||
581 | args->flags &= ~CEPH_OPT_DIRSTAT; | ||
582 | break; | ||
583 | case Opt_rbytes: | ||
584 | args->flags |= CEPH_OPT_RBYTES; | ||
585 | break; | ||
586 | case Opt_norbytes: | ||
587 | args->flags &= ~CEPH_OPT_RBYTES; | ||
588 | break; | ||
589 | case Opt_nocrc: | ||
590 | args->flags |= CEPH_OPT_NOCRC; | ||
591 | break; | ||
592 | case Opt_noasyncreaddir: | ||
593 | args->flags |= CEPH_OPT_NOASYNCREADDIR; | ||
594 | break; | ||
595 | |||
596 | default: | ||
597 | BUG_ON(token); | ||
598 | } | ||
599 | } | ||
600 | return args; | ||
601 | 323 | ||
602 | out: | 324 | out: |
603 | kfree(args->mon_addr); | 325 | destroy_mount_options(fsopt); |
604 | kfree(args); | 326 | return err; |
605 | return ERR_PTR(err); | ||
606 | } | 327 | } |
607 | 328 | ||
608 | static void destroy_mount_args(struct ceph_mount_args *args) | 329 | /** |
330 | * ceph_show_options - Show mount options in /proc/mounts | ||
331 | * @m: seq_file to write to | ||
332 | * @mnt: mount descriptor | ||
333 | */ | ||
334 | static int ceph_show_options(struct seq_file *m, struct vfsmount *mnt) | ||
609 | { | 335 | { |
610 | dout("destroy_mount_args %p\n", args); | 336 | struct ceph_fs_client *fsc = ceph_sb_to_client(mnt->mnt_sb); |
611 | kfree(args->snapdir_name); | 337 | struct ceph_mount_options *fsopt = fsc->mount_options; |
612 | args->snapdir_name = NULL; | 338 | struct ceph_options *opt = fsc->client->options; |
613 | kfree(args->name); | 339 | |
614 | args->name = NULL; | 340 | if (opt->flags & CEPH_OPT_FSID) |
615 | kfree(args->secret); | 341 | seq_printf(m, ",fsid=%pU", &opt->fsid); |
616 | args->secret = NULL; | 342 | if (opt->flags & CEPH_OPT_NOSHARE) |
617 | kfree(args); | 343 | seq_puts(m, ",noshare"); |
344 | if (opt->flags & CEPH_OPT_NOCRC) | ||
345 | seq_puts(m, ",nocrc"); | ||
346 | |||
347 | if (opt->name) | ||
348 | seq_printf(m, ",name=%s", opt->name); | ||
349 | if (opt->secret) | ||
350 | seq_puts(m, ",secret=<hidden>"); | ||
351 | |||
352 | if (opt->mount_timeout != CEPH_MOUNT_TIMEOUT_DEFAULT) | ||
353 | seq_printf(m, ",mount_timeout=%d", opt->mount_timeout); | ||
354 | if (opt->osd_idle_ttl != CEPH_OSD_IDLE_TTL_DEFAULT) | ||
355 | seq_printf(m, ",osd_idle_ttl=%d", opt->osd_idle_ttl); | ||
356 | if (opt->osd_timeout != CEPH_OSD_TIMEOUT_DEFAULT) | ||
357 | seq_printf(m, ",osdtimeout=%d", opt->osd_timeout); | ||
358 | if (opt->osd_keepalive_timeout != CEPH_OSD_KEEPALIVE_DEFAULT) | ||
359 | seq_printf(m, ",osdkeepalivetimeout=%d", | ||
360 | opt->osd_keepalive_timeout); | ||
361 | |||
362 | if (fsopt->flags & CEPH_MOUNT_OPT_DIRSTAT) | ||
363 | seq_puts(m, ",dirstat"); | ||
364 | if ((fsopt->flags & CEPH_MOUNT_OPT_RBYTES) == 0) | ||
365 | seq_puts(m, ",norbytes"); | ||
366 | if (fsopt->flags & CEPH_MOUNT_OPT_NOASYNCREADDIR) | ||
367 | seq_puts(m, ",noasyncreaddir"); | ||
368 | |||
369 | if (fsopt->wsize) | ||
370 | seq_printf(m, ",wsize=%d", fsopt->wsize); | ||
371 | if (fsopt->rsize != CEPH_MOUNT_RSIZE_DEFAULT) | ||
372 | seq_printf(m, ",rsize=%d", fsopt->rsize); | ||
373 | if (fsopt->congestion_kb != default_congestion_kb()) | ||
374 | seq_printf(m, ",write_congestion_kb=%d", fsopt->congestion_kb); | ||
375 | if (fsopt->caps_wanted_delay_min != CEPH_CAPS_WANTED_DELAY_MIN_DEFAULT) | ||
376 | seq_printf(m, ",caps_wanted_delay_min=%d", | ||
377 | fsopt->caps_wanted_delay_min); | ||
378 | if (fsopt->caps_wanted_delay_max != CEPH_CAPS_WANTED_DELAY_MAX_DEFAULT) | ||
379 | seq_printf(m, ",caps_wanted_delay_max=%d", | ||
380 | fsopt->caps_wanted_delay_max); | ||
381 | if (fsopt->cap_release_safety != CEPH_CAP_RELEASE_SAFETY_DEFAULT) | ||
382 | seq_printf(m, ",cap_release_safety=%d", | ||
383 | fsopt->cap_release_safety); | ||
384 | if (fsopt->max_readdir != CEPH_MAX_READDIR_DEFAULT) | ||
385 | seq_printf(m, ",readdir_max_entries=%d", fsopt->max_readdir); | ||
386 | if (fsopt->max_readdir_bytes != CEPH_MAX_READDIR_BYTES_DEFAULT) | ||
387 | seq_printf(m, ",readdir_max_bytes=%d", fsopt->max_readdir_bytes); | ||
388 | if (strcmp(fsopt->snapdir_name, CEPH_SNAPDIRNAME_DEFAULT)) | ||
389 | seq_printf(m, ",snapdirname=%s", fsopt->snapdir_name); | ||
390 | return 0; | ||
618 | } | 391 | } |
619 | 392 | ||
620 | /* | 393 | /* |
621 | * create a fresh client instance | 394 | * handle any mon messages the standard library doesn't understand. |
395 | * return error if we don't either. | ||
622 | */ | 396 | */ |
623 | static struct ceph_client *ceph_create_client(struct ceph_mount_args *args) | 397 | static int extra_mon_dispatch(struct ceph_client *client, struct ceph_msg *msg) |
624 | { | 398 | { |
625 | struct ceph_client *client; | 399 | struct ceph_fs_client *fsc = client->private; |
400 | int type = le16_to_cpu(msg->hdr.type); | ||
401 | |||
402 | switch (type) { | ||
403 | case CEPH_MSG_MDS_MAP: | ||
404 | ceph_mdsc_handle_map(fsc->mdsc, msg); | ||
405 | return 0; | ||
406 | |||
407 | default: | ||
408 | return -1; | ||
409 | } | ||
410 | } | ||
411 | |||
412 | /* | ||
413 | * create a new fs client | ||
414 | */ | ||
415 | struct ceph_fs_client *create_fs_client(struct ceph_mount_options *fsopt, | ||
416 | struct ceph_options *opt) | ||
417 | { | ||
418 | struct ceph_fs_client *fsc; | ||
626 | int err = -ENOMEM; | 419 | int err = -ENOMEM; |
627 | 420 | ||
628 | client = kzalloc(sizeof(*client), GFP_KERNEL); | 421 | fsc = kzalloc(sizeof(*fsc), GFP_KERNEL); |
629 | if (client == NULL) | 422 | if (!fsc) |
630 | return ERR_PTR(-ENOMEM); | 423 | return ERR_PTR(-ENOMEM); |
631 | 424 | ||
632 | mutex_init(&client->mount_mutex); | 425 | fsc->client = ceph_create_client(opt, fsc); |
633 | 426 | if (IS_ERR(fsc->client)) { | |
634 | init_waitqueue_head(&client->auth_wq); | 427 | err = PTR_ERR(fsc->client); |
428 | goto fail; | ||
429 | } | ||
430 | fsc->client->extra_mon_dispatch = extra_mon_dispatch; | ||
431 | fsc->client->supported_features |= CEPH_FEATURE_FLOCK; | ||
432 | fsc->client->monc.want_mdsmap = 1; | ||
635 | 433 | ||
636 | client->sb = NULL; | 434 | fsc->mount_options = fsopt; |
637 | client->mount_state = CEPH_MOUNT_MOUNTING; | ||
638 | client->mount_args = args; | ||
639 | 435 | ||
640 | client->msgr = NULL; | 436 | fsc->sb = NULL; |
437 | fsc->mount_state = CEPH_MOUNT_MOUNTING; | ||
641 | 438 | ||
642 | client->auth_err = 0; | 439 | atomic_long_set(&fsc->writeback_count, 0); |
643 | atomic_long_set(&client->writeback_count, 0); | ||
644 | 440 | ||
645 | err = bdi_init(&client->backing_dev_info); | 441 | err = bdi_init(&fsc->backing_dev_info); |
646 | if (err < 0) | 442 | if (err < 0) |
647 | goto fail; | 443 | goto fail_client; |
648 | 444 | ||
649 | err = -ENOMEM; | 445 | err = -ENOMEM; |
650 | client->wb_wq = create_workqueue("ceph-writeback"); | 446 | fsc->wb_wq = create_workqueue("ceph-writeback"); |
651 | if (client->wb_wq == NULL) | 447 | if (fsc->wb_wq == NULL) |
652 | goto fail_bdi; | 448 | goto fail_bdi; |
653 | client->pg_inv_wq = create_singlethread_workqueue("ceph-pg-invalid"); | 449 | fsc->pg_inv_wq = create_singlethread_workqueue("ceph-pg-invalid"); |
654 | if (client->pg_inv_wq == NULL) | 450 | if (fsc->pg_inv_wq == NULL) |
655 | goto fail_wb_wq; | 451 | goto fail_wb_wq; |
656 | client->trunc_wq = create_singlethread_workqueue("ceph-trunc"); | 452 | fsc->trunc_wq = create_singlethread_workqueue("ceph-trunc"); |
657 | if (client->trunc_wq == NULL) | 453 | if (fsc->trunc_wq == NULL) |
658 | goto fail_pg_inv_wq; | 454 | goto fail_pg_inv_wq; |
659 | 455 | ||
660 | /* set up mempools */ | 456 | /* set up mempools */ |
661 | err = -ENOMEM; | 457 | err = -ENOMEM; |
662 | client->wb_pagevec_pool = mempool_create_kmalloc_pool(10, | 458 | fsc->wb_pagevec_pool = mempool_create_kmalloc_pool(10, |
663 | client->mount_args->wsize >> PAGE_CACHE_SHIFT); | 459 | fsc->mount_options->wsize >> PAGE_CACHE_SHIFT); |
664 | if (!client->wb_pagevec_pool) | 460 | if (!fsc->wb_pagevec_pool) |
665 | goto fail_trunc_wq; | 461 | goto fail_trunc_wq; |
666 | 462 | ||
667 | /* caps */ | 463 | /* caps */ |
668 | client->min_caps = args->max_readdir; | 464 | fsc->min_caps = fsopt->max_readdir; |
465 | |||
466 | return fsc; | ||
669 | 467 | ||
670 | /* subsystems */ | ||
671 | err = ceph_monc_init(&client->monc, client); | ||
672 | if (err < 0) | ||
673 | goto fail_mempool; | ||
674 | err = ceph_osdc_init(&client->osdc, client); | ||
675 | if (err < 0) | ||
676 | goto fail_monc; | ||
677 | err = ceph_mdsc_init(&client->mdsc, client); | ||
678 | if (err < 0) | ||
679 | goto fail_osdc; | ||
680 | return client; | ||
681 | |||
682 | fail_osdc: | ||
683 | ceph_osdc_stop(&client->osdc); | ||
684 | fail_monc: | ||
685 | ceph_monc_stop(&client->monc); | ||
686 | fail_mempool: | ||
687 | mempool_destroy(client->wb_pagevec_pool); | ||
688 | fail_trunc_wq: | 468 | fail_trunc_wq: |
689 | destroy_workqueue(client->trunc_wq); | 469 | destroy_workqueue(fsc->trunc_wq); |
690 | fail_pg_inv_wq: | 470 | fail_pg_inv_wq: |
691 | destroy_workqueue(client->pg_inv_wq); | 471 | destroy_workqueue(fsc->pg_inv_wq); |
692 | fail_wb_wq: | 472 | fail_wb_wq: |
693 | destroy_workqueue(client->wb_wq); | 473 | destroy_workqueue(fsc->wb_wq); |
694 | fail_bdi: | 474 | fail_bdi: |
695 | bdi_destroy(&client->backing_dev_info); | 475 | bdi_destroy(&fsc->backing_dev_info); |
476 | fail_client: | ||
477 | ceph_destroy_client(fsc->client); | ||
696 | fail: | 478 | fail: |
697 | kfree(client); | 479 | kfree(fsc); |
698 | return ERR_PTR(err); | 480 | return ERR_PTR(err); |
699 | } | 481 | } |
700 | 482 | ||
701 | static void ceph_destroy_client(struct ceph_client *client) | 483 | void destroy_fs_client(struct ceph_fs_client *fsc) |
702 | { | 484 | { |
703 | dout("destroy_client %p\n", client); | 485 | dout("destroy_fs_client %p\n", fsc); |
704 | 486 | ||
705 | /* unmount */ | 487 | destroy_workqueue(fsc->wb_wq); |
706 | ceph_mdsc_stop(&client->mdsc); | 488 | destroy_workqueue(fsc->pg_inv_wq); |
707 | ceph_osdc_stop(&client->osdc); | 489 | destroy_workqueue(fsc->trunc_wq); |
708 | 490 | ||
709 | /* | 491 | bdi_destroy(&fsc->backing_dev_info); |
710 | * make sure mds and osd connections close out before destroying | ||
711 | * the auth module, which is needed to free those connections' | ||
712 | * ceph_authorizers. | ||
713 | */ | ||
714 | ceph_msgr_flush(); | ||
715 | |||
716 | ceph_monc_stop(&client->monc); | ||
717 | 492 | ||
718 | ceph_debugfs_client_cleanup(client); | 493 | mempool_destroy(fsc->wb_pagevec_pool); |
719 | destroy_workqueue(client->wb_wq); | ||
720 | destroy_workqueue(client->pg_inv_wq); | ||
721 | destroy_workqueue(client->trunc_wq); | ||
722 | 494 | ||
723 | bdi_destroy(&client->backing_dev_info); | 495 | destroy_mount_options(fsc->mount_options); |
724 | 496 | ||
725 | if (client->msgr) | 497 | ceph_fs_debugfs_cleanup(fsc); |
726 | ceph_messenger_destroy(client->msgr); | ||
727 | mempool_destroy(client->wb_pagevec_pool); | ||
728 | 498 | ||
729 | destroy_mount_args(client->mount_args); | 499 | ceph_destroy_client(fsc->client); |
730 | 500 | ||
731 | kfree(client); | 501 | kfree(fsc); |
732 | dout("destroy_client %p done\n", client); | 502 | dout("destroy_fs_client %p done\n", fsc); |
733 | } | 503 | } |
734 | 504 | ||
735 | /* | 505 | /* |
736 | * Initially learn our fsid, or verify an fsid matches. | 506 | * caches |
737 | */ | 507 | */ |
738 | int ceph_check_fsid(struct ceph_client *client, struct ceph_fsid *fsid) | 508 | struct kmem_cache *ceph_inode_cachep; |
509 | struct kmem_cache *ceph_cap_cachep; | ||
510 | struct kmem_cache *ceph_dentry_cachep; | ||
511 | struct kmem_cache *ceph_file_cachep; | ||
512 | |||
513 | static void ceph_inode_init_once(void *foo) | ||
739 | { | 514 | { |
740 | if (client->have_fsid) { | 515 | struct ceph_inode_info *ci = foo; |
741 | if (ceph_fsid_compare(&client->fsid, fsid)) { | 516 | inode_init_once(&ci->vfs_inode); |
742 | pr_err("bad fsid, had %pU got %pU", | 517 | } |
743 | &client->fsid, fsid); | 518 | |
744 | return -1; | 519 | static int __init init_caches(void) |
745 | } | 520 | { |
746 | } else { | 521 | ceph_inode_cachep = kmem_cache_create("ceph_inode_info", |
747 | pr_info("client%lld fsid %pU\n", client->monc.auth->global_id, | 522 | sizeof(struct ceph_inode_info), |
748 | fsid); | 523 | __alignof__(struct ceph_inode_info), |
749 | memcpy(&client->fsid, fsid, sizeof(*fsid)); | 524 | (SLAB_RECLAIM_ACCOUNT|SLAB_MEM_SPREAD), |
750 | ceph_debugfs_client_init(client); | 525 | ceph_inode_init_once); |
751 | client->have_fsid = true; | 526 | if (ceph_inode_cachep == NULL) |
752 | } | 527 | return -ENOMEM; |
528 | |||
529 | ceph_cap_cachep = KMEM_CACHE(ceph_cap, | ||
530 | SLAB_RECLAIM_ACCOUNT|SLAB_MEM_SPREAD); | ||
531 | if (ceph_cap_cachep == NULL) | ||
532 | goto bad_cap; | ||
533 | |||
534 | ceph_dentry_cachep = KMEM_CACHE(ceph_dentry_info, | ||
535 | SLAB_RECLAIM_ACCOUNT|SLAB_MEM_SPREAD); | ||
536 | if (ceph_dentry_cachep == NULL) | ||
537 | goto bad_dentry; | ||
538 | |||
539 | ceph_file_cachep = KMEM_CACHE(ceph_file_info, | ||
540 | SLAB_RECLAIM_ACCOUNT|SLAB_MEM_SPREAD); | ||
541 | if (ceph_file_cachep == NULL) | ||
542 | goto bad_file; | ||
543 | |||
753 | return 0; | 544 | return 0; |
545 | |||
546 | bad_file: | ||
547 | kmem_cache_destroy(ceph_dentry_cachep); | ||
548 | bad_dentry: | ||
549 | kmem_cache_destroy(ceph_cap_cachep); | ||
550 | bad_cap: | ||
551 | kmem_cache_destroy(ceph_inode_cachep); | ||
552 | return -ENOMEM; | ||
754 | } | 553 | } |
755 | 554 | ||
555 | static void destroy_caches(void) | ||
556 | { | ||
557 | kmem_cache_destroy(ceph_inode_cachep); | ||
558 | kmem_cache_destroy(ceph_cap_cachep); | ||
559 | kmem_cache_destroy(ceph_dentry_cachep); | ||
560 | kmem_cache_destroy(ceph_file_cachep); | ||
561 | } | ||
562 | |||
563 | |||
756 | /* | 564 | /* |
757 | * true if we have the mon map (and have thus joined the cluster) | 565 | * ceph_umount_begin - initiate forced umount. Tear down down the |
566 | * mount, skipping steps that may hang while waiting for server(s). | ||
758 | */ | 567 | */ |
759 | static int have_mon_and_osd_map(struct ceph_client *client) | 568 | static void ceph_umount_begin(struct super_block *sb) |
760 | { | 569 | { |
761 | return client->monc.monmap && client->monc.monmap->epoch && | 570 | struct ceph_fs_client *fsc = ceph_sb_to_client(sb); |
762 | client->osdc.osdmap && client->osdc.osdmap->epoch; | 571 | |
572 | dout("ceph_umount_begin - starting forced umount\n"); | ||
573 | if (!fsc) | ||
574 | return; | ||
575 | fsc->mount_state = CEPH_MOUNT_SHUTDOWN; | ||
576 | return; | ||
763 | } | 577 | } |
764 | 578 | ||
579 | static const struct super_operations ceph_super_ops = { | ||
580 | .alloc_inode = ceph_alloc_inode, | ||
581 | .destroy_inode = ceph_destroy_inode, | ||
582 | .write_inode = ceph_write_inode, | ||
583 | .sync_fs = ceph_sync_fs, | ||
584 | .put_super = ceph_put_super, | ||
585 | .show_options = ceph_show_options, | ||
586 | .statfs = ceph_statfs, | ||
587 | .umount_begin = ceph_umount_begin, | ||
588 | }; | ||
589 | |||
765 | /* | 590 | /* |
766 | * Bootstrap mount by opening the root directory. Note the mount | 591 | * Bootstrap mount by opening the root directory. Note the mount |
767 | * @started time from caller, and time out if this takes too long. | 592 | * @started time from caller, and time out if this takes too long. |
768 | */ | 593 | */ |
769 | static struct dentry *open_root_dentry(struct ceph_client *client, | 594 | static struct dentry *open_root_dentry(struct ceph_fs_client *fsc, |
770 | const char *path, | 595 | const char *path, |
771 | unsigned long started) | 596 | unsigned long started) |
772 | { | 597 | { |
773 | struct ceph_mds_client *mdsc = &client->mdsc; | 598 | struct ceph_mds_client *mdsc = fsc->mdsc; |
774 | struct ceph_mds_request *req = NULL; | 599 | struct ceph_mds_request *req = NULL; |
775 | int err; | 600 | int err; |
776 | struct dentry *root; | 601 | struct dentry *root; |
@@ -784,14 +609,14 @@ static struct dentry *open_root_dentry(struct ceph_client *client, | |||
784 | req->r_ino1.ino = CEPH_INO_ROOT; | 609 | req->r_ino1.ino = CEPH_INO_ROOT; |
785 | req->r_ino1.snap = CEPH_NOSNAP; | 610 | req->r_ino1.snap = CEPH_NOSNAP; |
786 | req->r_started = started; | 611 | req->r_started = started; |
787 | req->r_timeout = client->mount_args->mount_timeout * HZ; | 612 | req->r_timeout = fsc->client->options->mount_timeout * HZ; |
788 | req->r_args.getattr.mask = cpu_to_le32(CEPH_STAT_CAP_INODE); | 613 | req->r_args.getattr.mask = cpu_to_le32(CEPH_STAT_CAP_INODE); |
789 | req->r_num_caps = 2; | 614 | req->r_num_caps = 2; |
790 | err = ceph_mdsc_do_request(mdsc, NULL, req); | 615 | err = ceph_mdsc_do_request(mdsc, NULL, req); |
791 | if (err == 0) { | 616 | if (err == 0) { |
792 | dout("open_root_inode success\n"); | 617 | dout("open_root_inode success\n"); |
793 | if (ceph_ino(req->r_target_inode) == CEPH_INO_ROOT && | 618 | if (ceph_ino(req->r_target_inode) == CEPH_INO_ROOT && |
794 | client->sb->s_root == NULL) | 619 | fsc->sb->s_root == NULL) |
795 | root = d_alloc_root(req->r_target_inode); | 620 | root = d_alloc_root(req->r_target_inode); |
796 | else | 621 | else |
797 | root = d_obtain_alias(req->r_target_inode); | 622 | root = d_obtain_alias(req->r_target_inode); |
@@ -804,105 +629,86 @@ static struct dentry *open_root_dentry(struct ceph_client *client, | |||
804 | return root; | 629 | return root; |
805 | } | 630 | } |
806 | 631 | ||
632 | |||
633 | |||
634 | |||
807 | /* | 635 | /* |
808 | * mount: join the ceph cluster, and open root directory. | 636 | * mount: join the ceph cluster, and open root directory. |
809 | */ | 637 | */ |
810 | static int ceph_mount(struct ceph_client *client, struct vfsmount *mnt, | 638 | static int ceph_mount(struct ceph_fs_client *fsc, struct vfsmount *mnt, |
811 | const char *path) | 639 | const char *path) |
812 | { | 640 | { |
813 | struct ceph_entity_addr *myaddr = NULL; | ||
814 | int err; | 641 | int err; |
815 | unsigned long timeout = client->mount_args->mount_timeout * HZ; | ||
816 | unsigned long started = jiffies; /* note the start time */ | 642 | unsigned long started = jiffies; /* note the start time */ |
817 | struct dentry *root; | 643 | struct dentry *root; |
644 | int first = 0; /* first vfsmount for this super_block */ | ||
818 | 645 | ||
819 | dout("mount start\n"); | 646 | dout("mount start\n"); |
820 | mutex_lock(&client->mount_mutex); | 647 | mutex_lock(&fsc->client->mount_mutex); |
821 | |||
822 | /* initialize the messenger */ | ||
823 | if (client->msgr == NULL) { | ||
824 | if (ceph_test_opt(client, MYIP)) | ||
825 | myaddr = &client->mount_args->my_addr; | ||
826 | client->msgr = ceph_messenger_create(myaddr); | ||
827 | if (IS_ERR(client->msgr)) { | ||
828 | err = PTR_ERR(client->msgr); | ||
829 | client->msgr = NULL; | ||
830 | goto out; | ||
831 | } | ||
832 | client->msgr->nocrc = ceph_test_opt(client, NOCRC); | ||
833 | } | ||
834 | 648 | ||
835 | /* open session, and wait for mon, mds, and osd maps */ | 649 | err = __ceph_open_session(fsc->client, started); |
836 | err = ceph_monc_open_session(&client->monc); | ||
837 | if (err < 0) | 650 | if (err < 0) |
838 | goto out; | 651 | goto out; |
839 | 652 | ||
840 | while (!have_mon_and_osd_map(client)) { | ||
841 | err = -EIO; | ||
842 | if (timeout && time_after_eq(jiffies, started + timeout)) | ||
843 | goto out; | ||
844 | |||
845 | /* wait */ | ||
846 | dout("mount waiting for mon_map\n"); | ||
847 | err = wait_event_interruptible_timeout(client->auth_wq, | ||
848 | have_mon_and_osd_map(client) || (client->auth_err < 0), | ||
849 | timeout); | ||
850 | if (err == -EINTR || err == -ERESTARTSYS) | ||
851 | goto out; | ||
852 | if (client->auth_err < 0) { | ||
853 | err = client->auth_err; | ||
854 | goto out; | ||
855 | } | ||
856 | } | ||
857 | |||
858 | dout("mount opening root\n"); | 653 | dout("mount opening root\n"); |
859 | root = open_root_dentry(client, "", started); | 654 | root = open_root_dentry(fsc, "", started); |
860 | if (IS_ERR(root)) { | 655 | if (IS_ERR(root)) { |
861 | err = PTR_ERR(root); | 656 | err = PTR_ERR(root); |
862 | goto out; | 657 | goto out; |
863 | } | 658 | } |
864 | if (client->sb->s_root) | 659 | if (fsc->sb->s_root) { |
865 | dput(root); | 660 | dput(root); |
866 | else | 661 | } else { |
867 | client->sb->s_root = root; | 662 | fsc->sb->s_root = root; |
663 | first = 1; | ||
664 | |||
665 | err = ceph_fs_debugfs_init(fsc); | ||
666 | if (err < 0) | ||
667 | goto fail; | ||
668 | } | ||
868 | 669 | ||
869 | if (path[0] == 0) { | 670 | if (path[0] == 0) { |
870 | dget(root); | 671 | dget(root); |
871 | } else { | 672 | } else { |
872 | dout("mount opening base mountpoint\n"); | 673 | dout("mount opening base mountpoint\n"); |
873 | root = open_root_dentry(client, path, started); | 674 | root = open_root_dentry(fsc, path, started); |
874 | if (IS_ERR(root)) { | 675 | if (IS_ERR(root)) { |
875 | err = PTR_ERR(root); | 676 | err = PTR_ERR(root); |
876 | dput(client->sb->s_root); | 677 | goto fail; |
877 | client->sb->s_root = NULL; | ||
878 | goto out; | ||
879 | } | 678 | } |
880 | } | 679 | } |
881 | 680 | ||
882 | mnt->mnt_root = root; | 681 | mnt->mnt_root = root; |
883 | mnt->mnt_sb = client->sb; | 682 | mnt->mnt_sb = fsc->sb; |
884 | 683 | ||
885 | client->mount_state = CEPH_MOUNT_MOUNTED; | 684 | fsc->mount_state = CEPH_MOUNT_MOUNTED; |
886 | dout("mount success\n"); | 685 | dout("mount success\n"); |
887 | err = 0; | 686 | err = 0; |
888 | 687 | ||
889 | out: | 688 | out: |
890 | mutex_unlock(&client->mount_mutex); | 689 | mutex_unlock(&fsc->client->mount_mutex); |
891 | return err; | 690 | return err; |
691 | |||
692 | fail: | ||
693 | if (first) { | ||
694 | dput(fsc->sb->s_root); | ||
695 | fsc->sb->s_root = NULL; | ||
696 | } | ||
697 | goto out; | ||
892 | } | 698 | } |
893 | 699 | ||
894 | static int ceph_set_super(struct super_block *s, void *data) | 700 | static int ceph_set_super(struct super_block *s, void *data) |
895 | { | 701 | { |
896 | struct ceph_client *client = data; | 702 | struct ceph_fs_client *fsc = data; |
897 | int ret; | 703 | int ret; |
898 | 704 | ||
899 | dout("set_super %p data %p\n", s, data); | 705 | dout("set_super %p data %p\n", s, data); |
900 | 706 | ||
901 | s->s_flags = client->mount_args->sb_flags; | 707 | s->s_flags = fsc->mount_options->sb_flags; |
902 | s->s_maxbytes = 1ULL << 40; /* temp value until we get mdsmap */ | 708 | s->s_maxbytes = 1ULL << 40; /* temp value until we get mdsmap */ |
903 | 709 | ||
904 | s->s_fs_info = client; | 710 | s->s_fs_info = fsc; |
905 | client->sb = s; | 711 | fsc->sb = s; |
906 | 712 | ||
907 | s->s_op = &ceph_super_ops; | 713 | s->s_op = &ceph_super_ops; |
908 | s->s_export_op = &ceph_export_ops; | 714 | s->s_export_op = &ceph_export_ops; |
@@ -917,7 +723,7 @@ static int ceph_set_super(struct super_block *s, void *data) | |||
917 | 723 | ||
918 | fail: | 724 | fail: |
919 | s->s_fs_info = NULL; | 725 | s->s_fs_info = NULL; |
920 | client->sb = NULL; | 726 | fsc->sb = NULL; |
921 | return ret; | 727 | return ret; |
922 | } | 728 | } |
923 | 729 | ||
@@ -926,30 +732,23 @@ fail: | |||
926 | */ | 732 | */ |
927 | static int ceph_compare_super(struct super_block *sb, void *data) | 733 | static int ceph_compare_super(struct super_block *sb, void *data) |
928 | { | 734 | { |
929 | struct ceph_client *new = data; | 735 | struct ceph_fs_client *new = data; |
930 | struct ceph_mount_args *args = new->mount_args; | 736 | struct ceph_mount_options *fsopt = new->mount_options; |
931 | struct ceph_client *other = ceph_sb_to_client(sb); | 737 | struct ceph_options *opt = new->client->options; |
932 | int i; | 738 | struct ceph_fs_client *other = ceph_sb_to_client(sb); |
933 | 739 | ||
934 | dout("ceph_compare_super %p\n", sb); | 740 | dout("ceph_compare_super %p\n", sb); |
935 | if (args->flags & CEPH_OPT_FSID) { | 741 | |
936 | if (ceph_fsid_compare(&args->fsid, &other->fsid)) { | 742 | if (compare_mount_options(fsopt, opt, other)) { |
937 | dout("fsid doesn't match\n"); | 743 | dout("monitor(s)/mount options don't match\n"); |
938 | return 0; | 744 | return 0; |
939 | } | ||
940 | } else { | ||
941 | /* do we share (a) monitor? */ | ||
942 | for (i = 0; i < new->monc.monmap->num_mon; i++) | ||
943 | if (ceph_monmap_contains(other->monc.monmap, | ||
944 | &new->monc.monmap->mon_inst[i].addr)) | ||
945 | break; | ||
946 | if (i == new->monc.monmap->num_mon) { | ||
947 | dout("mon ip not part of monmap\n"); | ||
948 | return 0; | ||
949 | } | ||
950 | dout("mon ip matches existing sb %p\n", sb); | ||
951 | } | 745 | } |
952 | if (args->sb_flags != other->mount_args->sb_flags) { | 746 | if ((opt->flags & CEPH_OPT_FSID) && |
747 | ceph_fsid_compare(&opt->fsid, &other->client->fsid)) { | ||
748 | dout("fsid doesn't match\n"); | ||
749 | return 0; | ||
750 | } | ||
751 | if (fsopt->sb_flags != other->mount_options->sb_flags) { | ||
953 | dout("flags differ\n"); | 752 | dout("flags differ\n"); |
954 | return 0; | 753 | return 0; |
955 | } | 754 | } |
@@ -961,19 +760,20 @@ static int ceph_compare_super(struct super_block *sb, void *data) | |||
961 | */ | 760 | */ |
962 | static atomic_long_t bdi_seq = ATOMIC_LONG_INIT(0); | 761 | static atomic_long_t bdi_seq = ATOMIC_LONG_INIT(0); |
963 | 762 | ||
964 | static int ceph_register_bdi(struct super_block *sb, struct ceph_client *client) | 763 | static int ceph_register_bdi(struct super_block *sb, |
764 | struct ceph_fs_client *fsc) | ||
965 | { | 765 | { |
966 | int err; | 766 | int err; |
967 | 767 | ||
968 | /* set ra_pages based on rsize mount option? */ | 768 | /* set ra_pages based on rsize mount option? */ |
969 | if (client->mount_args->rsize >= PAGE_CACHE_SIZE) | 769 | if (fsc->mount_options->rsize >= PAGE_CACHE_SIZE) |
970 | client->backing_dev_info.ra_pages = | 770 | fsc->backing_dev_info.ra_pages = |
971 | (client->mount_args->rsize + PAGE_CACHE_SIZE - 1) | 771 | (fsc->mount_options->rsize + PAGE_CACHE_SIZE - 1) |
972 | >> PAGE_SHIFT; | 772 | >> PAGE_SHIFT; |
973 | err = bdi_register(&client->backing_dev_info, NULL, "ceph-%d", | 773 | err = bdi_register(&fsc->backing_dev_info, NULL, "ceph-%d", |
974 | atomic_long_inc_return(&bdi_seq)); | 774 | atomic_long_inc_return(&bdi_seq)); |
975 | if (!err) | 775 | if (!err) |
976 | sb->s_bdi = &client->backing_dev_info; | 776 | sb->s_bdi = &fsc->backing_dev_info; |
977 | return err; | 777 | return err; |
978 | } | 778 | } |
979 | 779 | ||
@@ -982,46 +782,52 @@ static int ceph_get_sb(struct file_system_type *fs_type, | |||
982 | struct vfsmount *mnt) | 782 | struct vfsmount *mnt) |
983 | { | 783 | { |
984 | struct super_block *sb; | 784 | struct super_block *sb; |
985 | struct ceph_client *client; | 785 | struct ceph_fs_client *fsc; |
986 | int err; | 786 | int err; |
987 | int (*compare_super)(struct super_block *, void *) = ceph_compare_super; | 787 | int (*compare_super)(struct super_block *, void *) = ceph_compare_super; |
988 | const char *path = NULL; | 788 | const char *path = NULL; |
989 | struct ceph_mount_args *args; | 789 | struct ceph_mount_options *fsopt = NULL; |
790 | struct ceph_options *opt = NULL; | ||
990 | 791 | ||
991 | dout("ceph_get_sb\n"); | 792 | dout("ceph_get_sb\n"); |
992 | args = parse_mount_args(flags, data, dev_name, &path); | 793 | err = parse_mount_options(&fsopt, &opt, flags, data, dev_name, &path); |
993 | if (IS_ERR(args)) { | 794 | if (err < 0) |
994 | err = PTR_ERR(args); | ||
995 | goto out_final; | 795 | goto out_final; |
996 | } | ||
997 | 796 | ||
998 | /* create client (which we may/may not use) */ | 797 | /* create client (which we may/may not use) */ |
999 | client = ceph_create_client(args); | 798 | fsc = create_fs_client(fsopt, opt); |
1000 | if (IS_ERR(client)) { | 799 | if (IS_ERR(fsc)) { |
1001 | err = PTR_ERR(client); | 800 | err = PTR_ERR(fsc); |
801 | kfree(fsopt); | ||
802 | kfree(opt); | ||
1002 | goto out_final; | 803 | goto out_final; |
1003 | } | 804 | } |
1004 | 805 | ||
1005 | if (client->mount_args->flags & CEPH_OPT_NOSHARE) | 806 | err = ceph_mdsc_init(fsc); |
807 | if (err < 0) | ||
808 | goto out; | ||
809 | |||
810 | if (ceph_test_opt(fsc->client, NOSHARE)) | ||
1006 | compare_super = NULL; | 811 | compare_super = NULL; |
1007 | sb = sget(fs_type, compare_super, ceph_set_super, client); | 812 | sb = sget(fs_type, compare_super, ceph_set_super, fsc); |
1008 | if (IS_ERR(sb)) { | 813 | if (IS_ERR(sb)) { |
1009 | err = PTR_ERR(sb); | 814 | err = PTR_ERR(sb); |
1010 | goto out; | 815 | goto out; |
1011 | } | 816 | } |
1012 | 817 | ||
1013 | if (ceph_sb_to_client(sb) != client) { | 818 | if (ceph_sb_to_client(sb) != fsc) { |
1014 | ceph_destroy_client(client); | 819 | ceph_mdsc_destroy(fsc); |
1015 | client = ceph_sb_to_client(sb); | 820 | destroy_fs_client(fsc); |
1016 | dout("get_sb got existing client %p\n", client); | 821 | fsc = ceph_sb_to_client(sb); |
822 | dout("get_sb got existing client %p\n", fsc); | ||
1017 | } else { | 823 | } else { |
1018 | dout("get_sb using new client %p\n", client); | 824 | dout("get_sb using new client %p\n", fsc); |
1019 | err = ceph_register_bdi(sb, client); | 825 | err = ceph_register_bdi(sb, fsc); |
1020 | if (err < 0) | 826 | if (err < 0) |
1021 | goto out_splat; | 827 | goto out_splat; |
1022 | } | 828 | } |
1023 | 829 | ||
1024 | err = ceph_mount(client, mnt, path); | 830 | err = ceph_mount(fsc, mnt, path); |
1025 | if (err < 0) | 831 | if (err < 0) |
1026 | goto out_splat; | 832 | goto out_splat; |
1027 | dout("root %p inode %p ino %llx.%llx\n", mnt->mnt_root, | 833 | dout("root %p inode %p ino %llx.%llx\n", mnt->mnt_root, |
@@ -1029,12 +835,13 @@ static int ceph_get_sb(struct file_system_type *fs_type, | |||
1029 | return 0; | 835 | return 0; |
1030 | 836 | ||
1031 | out_splat: | 837 | out_splat: |
1032 | ceph_mdsc_close_sessions(&client->mdsc); | 838 | ceph_mdsc_close_sessions(fsc->mdsc); |
1033 | deactivate_locked_super(sb); | 839 | deactivate_locked_super(sb); |
1034 | goto out_final; | 840 | goto out_final; |
1035 | 841 | ||
1036 | out: | 842 | out: |
1037 | ceph_destroy_client(client); | 843 | ceph_mdsc_destroy(fsc); |
844 | destroy_fs_client(fsc); | ||
1038 | out_final: | 845 | out_final: |
1039 | dout("ceph_get_sb fail %d\n", err); | 846 | dout("ceph_get_sb fail %d\n", err); |
1040 | return err; | 847 | return err; |
@@ -1042,11 +849,12 @@ out_final: | |||
1042 | 849 | ||
1043 | static void ceph_kill_sb(struct super_block *s) | 850 | static void ceph_kill_sb(struct super_block *s) |
1044 | { | 851 | { |
1045 | struct ceph_client *client = ceph_sb_to_client(s); | 852 | struct ceph_fs_client *fsc = ceph_sb_to_client(s); |
1046 | dout("kill_sb %p\n", s); | 853 | dout("kill_sb %p\n", s); |
1047 | ceph_mdsc_pre_umount(&client->mdsc); | 854 | ceph_mdsc_pre_umount(fsc->mdsc); |
1048 | kill_anon_super(s); /* will call put_super after sb is r/o */ | 855 | kill_anon_super(s); /* will call put_super after sb is r/o */ |
1049 | ceph_destroy_client(client); | 856 | ceph_mdsc_destroy(fsc); |
857 | destroy_fs_client(fsc); | ||
1050 | } | 858 | } |
1051 | 859 | ||
1052 | static struct file_system_type ceph_fs_type = { | 860 | static struct file_system_type ceph_fs_type = { |
@@ -1062,36 +870,20 @@ static struct file_system_type ceph_fs_type = { | |||
1062 | 870 | ||
1063 | static int __init init_ceph(void) | 871 | static int __init init_ceph(void) |
1064 | { | 872 | { |
1065 | int ret = 0; | 873 | int ret = init_caches(); |
1066 | |||
1067 | ret = ceph_debugfs_init(); | ||
1068 | if (ret < 0) | ||
1069 | goto out; | ||
1070 | |||
1071 | ret = ceph_msgr_init(); | ||
1072 | if (ret < 0) | ||
1073 | goto out_debugfs; | ||
1074 | |||
1075 | ret = init_caches(); | ||
1076 | if (ret) | 874 | if (ret) |
1077 | goto out_msgr; | 875 | goto out; |
1078 | 876 | ||
1079 | ret = register_filesystem(&ceph_fs_type); | 877 | ret = register_filesystem(&ceph_fs_type); |
1080 | if (ret) | 878 | if (ret) |
1081 | goto out_icache; | 879 | goto out_icache; |
1082 | 880 | ||
1083 | pr_info("loaded (mon/mds/osd proto %d/%d/%d, osdmap %d/%d %d/%d)\n", | 881 | pr_info("loaded (mds proto %d)\n", CEPH_MDSC_PROTOCOL); |
1084 | CEPH_MONC_PROTOCOL, CEPH_MDSC_PROTOCOL, CEPH_OSDC_PROTOCOL, | 882 | |
1085 | CEPH_OSDMAP_VERSION, CEPH_OSDMAP_VERSION_EXT, | ||
1086 | CEPH_OSDMAP_INC_VERSION, CEPH_OSDMAP_INC_VERSION_EXT); | ||
1087 | return 0; | 883 | return 0; |
1088 | 884 | ||
1089 | out_icache: | 885 | out_icache: |
1090 | destroy_caches(); | 886 | destroy_caches(); |
1091 | out_msgr: | ||
1092 | ceph_msgr_exit(); | ||
1093 | out_debugfs: | ||
1094 | ceph_debugfs_cleanup(); | ||
1095 | out: | 887 | out: |
1096 | return ret; | 888 | return ret; |
1097 | } | 889 | } |
@@ -1101,8 +893,6 @@ static void __exit exit_ceph(void) | |||
1101 | dout("exit_ceph\n"); | 893 | dout("exit_ceph\n"); |
1102 | unregister_filesystem(&ceph_fs_type); | 894 | unregister_filesystem(&ceph_fs_type); |
1103 | destroy_caches(); | 895 | destroy_caches(); |
1104 | ceph_msgr_exit(); | ||
1105 | ceph_debugfs_cleanup(); | ||
1106 | } | 896 | } |
1107 | 897 | ||
1108 | module_init(init_ceph); | 898 | module_init(init_ceph); |
diff --git a/fs/ceph/super.h b/fs/ceph/super.h index b87638e84c4b..e2e904442ce2 100644 --- a/fs/ceph/super.h +++ b/fs/ceph/super.h | |||
@@ -1,7 +1,7 @@ | |||
1 | #ifndef _FS_CEPH_SUPER_H | 1 | #ifndef _FS_CEPH_SUPER_H |
2 | #define _FS_CEPH_SUPER_H | 2 | #define _FS_CEPH_SUPER_H |
3 | 3 | ||
4 | #include "ceph_debug.h" | 4 | #include <linux/ceph/ceph_debug.h> |
5 | 5 | ||
6 | #include <asm/unaligned.h> | 6 | #include <asm/unaligned.h> |
7 | #include <linux/backing-dev.h> | 7 | #include <linux/backing-dev.h> |
@@ -14,13 +14,7 @@ | |||
14 | #include <linux/writeback.h> | 14 | #include <linux/writeback.h> |
15 | #include <linux/slab.h> | 15 | #include <linux/slab.h> |
16 | 16 | ||
17 | #include "types.h" | 17 | #include <linux/ceph/libceph.h> |
18 | #include "messenger.h" | ||
19 | #include "msgpool.h" | ||
20 | #include "mon_client.h" | ||
21 | #include "mds_client.h" | ||
22 | #include "osd_client.h" | ||
23 | #include "ceph_fs.h" | ||
24 | 18 | ||
25 | /* f_type in struct statfs */ | 19 | /* f_type in struct statfs */ |
26 | #define CEPH_SUPER_MAGIC 0x00c36400 | 20 | #define CEPH_SUPER_MAGIC 0x00c36400 |
@@ -30,42 +24,25 @@ | |||
30 | #define CEPH_BLOCK_SHIFT 20 /* 1 MB */ | 24 | #define CEPH_BLOCK_SHIFT 20 /* 1 MB */ |
31 | #define CEPH_BLOCK (1 << CEPH_BLOCK_SHIFT) | 25 | #define CEPH_BLOCK (1 << CEPH_BLOCK_SHIFT) |
32 | 26 | ||
33 | /* | 27 | #define CEPH_MOUNT_OPT_DIRSTAT (1<<4) /* `cat dirname` for stats */ |
34 | * Supported features | 28 | #define CEPH_MOUNT_OPT_RBYTES (1<<5) /* dir st_bytes = rbytes */ |
35 | */ | 29 | #define CEPH_MOUNT_OPT_NOASYNCREADDIR (1<<7) /* no dcache readdir */ |
36 | #define CEPH_FEATURE_SUPPORTED CEPH_FEATURE_NOSRCADDR | CEPH_FEATURE_FLOCK | ||
37 | #define CEPH_FEATURE_REQUIRED CEPH_FEATURE_NOSRCADDR | ||
38 | 30 | ||
39 | /* | 31 | #define CEPH_MOUNT_OPT_DEFAULT (CEPH_MOUNT_OPT_RBYTES) |
40 | * mount options | ||
41 | */ | ||
42 | #define CEPH_OPT_FSID (1<<0) | ||
43 | #define CEPH_OPT_NOSHARE (1<<1) /* don't share client with other sbs */ | ||
44 | #define CEPH_OPT_MYIP (1<<2) /* specified my ip */ | ||
45 | #define CEPH_OPT_DIRSTAT (1<<4) /* funky `cat dirname` for stats */ | ||
46 | #define CEPH_OPT_RBYTES (1<<5) /* dir st_bytes = rbytes */ | ||
47 | #define CEPH_OPT_NOCRC (1<<6) /* no data crc on writes */ | ||
48 | #define CEPH_OPT_NOASYNCREADDIR (1<<7) /* no dcache readdir */ | ||
49 | 32 | ||
50 | #define CEPH_OPT_DEFAULT (CEPH_OPT_RBYTES) | 33 | #define ceph_set_mount_opt(fsc, opt) \ |
34 | (fsc)->mount_options->flags |= CEPH_MOUNT_OPT_##opt; | ||
35 | #define ceph_test_mount_opt(fsc, opt) \ | ||
36 | (!!((fsc)->mount_options->flags & CEPH_MOUNT_OPT_##opt)) | ||
51 | 37 | ||
52 | #define ceph_set_opt(client, opt) \ | 38 | #define CEPH_MAX_READDIR_DEFAULT 1024 |
53 | (client)->mount_args->flags |= CEPH_OPT_##opt; | 39 | #define CEPH_MAX_READDIR_BYTES_DEFAULT (512*1024) |
54 | #define ceph_test_opt(client, opt) \ | 40 | #define CEPH_SNAPDIRNAME_DEFAULT ".snap" |
55 | (!!((client)->mount_args->flags & CEPH_OPT_##opt)) | ||
56 | 41 | ||
57 | 42 | struct ceph_mount_options { | |
58 | struct ceph_mount_args { | ||
59 | int sb_flags; | ||
60 | int flags; | 43 | int flags; |
61 | struct ceph_fsid fsid; | 44 | int sb_flags; |
62 | struct ceph_entity_addr my_addr; | 45 | |
63 | int num_mon; | ||
64 | struct ceph_entity_addr *mon_addr; | ||
65 | int mount_timeout; | ||
66 | int osd_idle_ttl; | ||
67 | int osd_timeout; | ||
68 | int osd_keepalive_timeout; | ||
69 | int wsize; | 46 | int wsize; |
70 | int rsize; /* max readahead */ | 47 | int rsize; /* max readahead */ |
71 | int congestion_kb; /* max writeback in flight */ | 48 | int congestion_kb; /* max writeback in flight */ |
@@ -73,82 +50,25 @@ struct ceph_mount_args { | |||
73 | int cap_release_safety; | 50 | int cap_release_safety; |
74 | int max_readdir; /* max readdir result (entires) */ | 51 | int max_readdir; /* max readdir result (entires) */ |
75 | int max_readdir_bytes; /* max readdir result (bytes) */ | 52 | int max_readdir_bytes; /* max readdir result (bytes) */ |
76 | char *snapdir_name; /* default ".snap" */ | ||
77 | char *name; | ||
78 | char *secret; | ||
79 | }; | ||
80 | |||
81 | /* | ||
82 | * defaults | ||
83 | */ | ||
84 | #define CEPH_MOUNT_TIMEOUT_DEFAULT 60 | ||
85 | #define CEPH_OSD_TIMEOUT_DEFAULT 60 /* seconds */ | ||
86 | #define CEPH_OSD_KEEPALIVE_DEFAULT 5 | ||
87 | #define CEPH_OSD_IDLE_TTL_DEFAULT 60 | ||
88 | #define CEPH_MOUNT_RSIZE_DEFAULT (512*1024) /* readahead */ | ||
89 | #define CEPH_MAX_READDIR_DEFAULT 1024 | ||
90 | #define CEPH_MAX_READDIR_BYTES_DEFAULT (512*1024) | ||
91 | |||
92 | #define CEPH_MSG_MAX_FRONT_LEN (16*1024*1024) | ||
93 | #define CEPH_MSG_MAX_DATA_LEN (16*1024*1024) | ||
94 | |||
95 | #define CEPH_SNAPDIRNAME_DEFAULT ".snap" | ||
96 | #define CEPH_AUTH_NAME_DEFAULT "guest" | ||
97 | /* | ||
98 | * Delay telling the MDS we no longer want caps, in case we reopen | ||
99 | * the file. Delay a minimum amount of time, even if we send a cap | ||
100 | * message for some other reason. Otherwise, take the oppotunity to | ||
101 | * update the mds to avoid sending another message later. | ||
102 | */ | ||
103 | #define CEPH_CAPS_WANTED_DELAY_MIN_DEFAULT 5 /* cap release delay */ | ||
104 | #define CEPH_CAPS_WANTED_DELAY_MAX_DEFAULT 60 /* cap release delay */ | ||
105 | |||
106 | #define CEPH_CAP_RELEASE_SAFETY_DEFAULT (CEPH_CAPS_PER_RELEASE * 4) | ||
107 | |||
108 | /* mount state */ | ||
109 | enum { | ||
110 | CEPH_MOUNT_MOUNTING, | ||
111 | CEPH_MOUNT_MOUNTED, | ||
112 | CEPH_MOUNT_UNMOUNTING, | ||
113 | CEPH_MOUNT_UNMOUNTED, | ||
114 | CEPH_MOUNT_SHUTDOWN, | ||
115 | }; | ||
116 | 53 | ||
117 | /* | 54 | /* |
118 | * subtract jiffies | 55 | * everything above this point can be memcmp'd; everything below |
119 | */ | 56 | * is handled in compare_mount_options() |
120 | static inline unsigned long time_sub(unsigned long a, unsigned long b) | 57 | */ |
121 | { | ||
122 | BUG_ON(time_after(b, a)); | ||
123 | return (long)a - (long)b; | ||
124 | } | ||
125 | |||
126 | /* | ||
127 | * per-filesystem client state | ||
128 | * | ||
129 | * possibly shared by multiple mount points, if they are | ||
130 | * mounting the same ceph filesystem/cluster. | ||
131 | */ | ||
132 | struct ceph_client { | ||
133 | struct ceph_fsid fsid; | ||
134 | bool have_fsid; | ||
135 | 58 | ||
136 | struct mutex mount_mutex; /* serialize mount attempts */ | 59 | char *snapdir_name; /* default ".snap" */ |
137 | struct ceph_mount_args *mount_args; | 60 | }; |
138 | 61 | ||
62 | struct ceph_fs_client { | ||
139 | struct super_block *sb; | 63 | struct super_block *sb; |
140 | 64 | ||
141 | unsigned long mount_state; | 65 | struct ceph_mount_options *mount_options; |
142 | wait_queue_head_t auth_wq; | 66 | struct ceph_client *client; |
143 | |||
144 | int auth_err; | ||
145 | 67 | ||
68 | unsigned long mount_state; | ||
146 | int min_caps; /* min caps i added */ | 69 | int min_caps; /* min caps i added */ |
147 | 70 | ||
148 | struct ceph_messenger *msgr; /* messenger instance */ | 71 | struct ceph_mds_client *mdsc; |
149 | struct ceph_mon_client monc; | ||
150 | struct ceph_mds_client mdsc; | ||
151 | struct ceph_osd_client osdc; | ||
152 | 72 | ||
153 | /* writeback */ | 73 | /* writeback */ |
154 | mempool_t *wb_pagevec_pool; | 74 | mempool_t *wb_pagevec_pool; |
@@ -160,14 +80,14 @@ struct ceph_client { | |||
160 | struct backing_dev_info backing_dev_info; | 80 | struct backing_dev_info backing_dev_info; |
161 | 81 | ||
162 | #ifdef CONFIG_DEBUG_FS | 82 | #ifdef CONFIG_DEBUG_FS |
163 | struct dentry *debugfs_monmap; | 83 | struct dentry *debugfs_dentry_lru, *debugfs_caps; |
164 | struct dentry *debugfs_mdsmap, *debugfs_osdmap; | ||
165 | struct dentry *debugfs_dir, *debugfs_dentry_lru, *debugfs_caps; | ||
166 | struct dentry *debugfs_congestion_kb; | 84 | struct dentry *debugfs_congestion_kb; |
167 | struct dentry *debugfs_bdi; | 85 | struct dentry *debugfs_bdi; |
86 | struct dentry *debugfs_mdsc, *debugfs_mdsmap; | ||
168 | #endif | 87 | #endif |
169 | }; | 88 | }; |
170 | 89 | ||
90 | |||
171 | /* | 91 | /* |
172 | * File i/o capability. This tracks shared state with the metadata | 92 | * File i/o capability. This tracks shared state with the metadata |
173 | * server that allows us to cache or writeback attributes or to read | 93 | * server that allows us to cache or writeback attributes or to read |
@@ -275,6 +195,20 @@ struct ceph_inode_xattr { | |||
275 | int should_free_val; | 195 | int should_free_val; |
276 | }; | 196 | }; |
277 | 197 | ||
198 | /* | ||
199 | * Ceph dentry state | ||
200 | */ | ||
201 | struct ceph_dentry_info { | ||
202 | struct ceph_mds_session *lease_session; | ||
203 | u32 lease_gen, lease_shared_gen; | ||
204 | u32 lease_seq; | ||
205 | unsigned long lease_renew_after, lease_renew_from; | ||
206 | struct list_head lru; | ||
207 | struct dentry *dentry; | ||
208 | u64 time; | ||
209 | u64 offset; | ||
210 | }; | ||
211 | |||
278 | struct ceph_inode_xattrs_info { | 212 | struct ceph_inode_xattrs_info { |
279 | /* | 213 | /* |
280 | * (still encoded) xattr blob. we avoid the overhead of parsing | 214 | * (still encoded) xattr blob. we avoid the overhead of parsing |
@@ -296,11 +230,6 @@ struct ceph_inode_xattrs_info { | |||
296 | /* | 230 | /* |
297 | * Ceph inode. | 231 | * Ceph inode. |
298 | */ | 232 | */ |
299 | #define CEPH_I_COMPLETE 1 /* we have complete directory cached */ | ||
300 | #define CEPH_I_NODELAY 4 /* do not delay cap release */ | ||
301 | #define CEPH_I_FLUSH 8 /* do not delay flush of dirty metadata */ | ||
302 | #define CEPH_I_NOFLUSH 16 /* do not flush dirty caps */ | ||
303 | |||
304 | struct ceph_inode_info { | 233 | struct ceph_inode_info { |
305 | struct ceph_vino i_vino; /* ceph ino + snap */ | 234 | struct ceph_vino i_vino; /* ceph ino + snap */ |
306 | 235 | ||
@@ -391,6 +320,63 @@ static inline struct ceph_inode_info *ceph_inode(struct inode *inode) | |||
391 | return container_of(inode, struct ceph_inode_info, vfs_inode); | 320 | return container_of(inode, struct ceph_inode_info, vfs_inode); |
392 | } | 321 | } |
393 | 322 | ||
323 | static inline struct ceph_vino ceph_vino(struct inode *inode) | ||
324 | { | ||
325 | return ceph_inode(inode)->i_vino; | ||
326 | } | ||
327 | |||
328 | /* | ||
329 | * ino_t is <64 bits on many architectures, blech. | ||
330 | * | ||
331 | * don't include snap in ino hash, at least for now. | ||
332 | */ | ||
333 | static inline ino_t ceph_vino_to_ino(struct ceph_vino vino) | ||
334 | { | ||
335 | ino_t ino = (ino_t)vino.ino; /* ^ (vino.snap << 20); */ | ||
336 | #if BITS_PER_LONG == 32 | ||
337 | ino ^= vino.ino >> (sizeof(u64)-sizeof(ino_t)) * 8; | ||
338 | if (!ino) | ||
339 | ino = 1; | ||
340 | #endif | ||
341 | return ino; | ||
342 | } | ||
343 | |||
344 | /* for printf-style formatting */ | ||
345 | #define ceph_vinop(i) ceph_inode(i)->i_vino.ino, ceph_inode(i)->i_vino.snap | ||
346 | |||
347 | static inline u64 ceph_ino(struct inode *inode) | ||
348 | { | ||
349 | return ceph_inode(inode)->i_vino.ino; | ||
350 | } | ||
351 | static inline u64 ceph_snap(struct inode *inode) | ||
352 | { | ||
353 | return ceph_inode(inode)->i_vino.snap; | ||
354 | } | ||
355 | |||
356 | static inline int ceph_ino_compare(struct inode *inode, void *data) | ||
357 | { | ||
358 | struct ceph_vino *pvino = (struct ceph_vino *)data; | ||
359 | struct ceph_inode_info *ci = ceph_inode(inode); | ||
360 | return ci->i_vino.ino == pvino->ino && | ||
361 | ci->i_vino.snap == pvino->snap; | ||
362 | } | ||
363 | |||
364 | static inline struct inode *ceph_find_inode(struct super_block *sb, | ||
365 | struct ceph_vino vino) | ||
366 | { | ||
367 | ino_t t = ceph_vino_to_ino(vino); | ||
368 | return ilookup5(sb, t, ceph_ino_compare, &vino); | ||
369 | } | ||
370 | |||
371 | |||
372 | /* | ||
373 | * Ceph inode. | ||
374 | */ | ||
375 | #define CEPH_I_COMPLETE 1 /* we have complete directory cached */ | ||
376 | #define CEPH_I_NODELAY 4 /* do not delay cap release */ | ||
377 | #define CEPH_I_FLUSH 8 /* do not delay flush of dirty metadata */ | ||
378 | #define CEPH_I_NOFLUSH 16 /* do not flush dirty caps */ | ||
379 | |||
394 | static inline void ceph_i_clear(struct inode *inode, unsigned mask) | 380 | static inline void ceph_i_clear(struct inode *inode, unsigned mask) |
395 | { | 381 | { |
396 | struct ceph_inode_info *ci = ceph_inode(inode); | 382 | struct ceph_inode_info *ci = ceph_inode(inode); |
@@ -432,20 +418,6 @@ extern u32 ceph_choose_frag(struct ceph_inode_info *ci, u32 v, | |||
432 | struct ceph_inode_frag *pfrag, | 418 | struct ceph_inode_frag *pfrag, |
433 | int *found); | 419 | int *found); |
434 | 420 | ||
435 | /* | ||
436 | * Ceph dentry state | ||
437 | */ | ||
438 | struct ceph_dentry_info { | ||
439 | struct ceph_mds_session *lease_session; | ||
440 | u32 lease_gen, lease_shared_gen; | ||
441 | u32 lease_seq; | ||
442 | unsigned long lease_renew_after, lease_renew_from; | ||
443 | struct list_head lru; | ||
444 | struct dentry *dentry; | ||
445 | u64 time; | ||
446 | u64 offset; | ||
447 | }; | ||
448 | |||
449 | static inline struct ceph_dentry_info *ceph_dentry(struct dentry *dentry) | 421 | static inline struct ceph_dentry_info *ceph_dentry(struct dentry *dentry) |
450 | { | 422 | { |
451 | return (struct ceph_dentry_info *)dentry->d_fsdata; | 423 | return (struct ceph_dentry_info *)dentry->d_fsdata; |
@@ -456,22 +428,6 @@ static inline loff_t ceph_make_fpos(unsigned frag, unsigned off) | |||
456 | return ((loff_t)frag << 32) | (loff_t)off; | 428 | return ((loff_t)frag << 32) | (loff_t)off; |
457 | } | 429 | } |
458 | 430 | ||
459 | /* | ||
460 | * ino_t is <64 bits on many architectures, blech. | ||
461 | * | ||
462 | * don't include snap in ino hash, at least for now. | ||
463 | */ | ||
464 | static inline ino_t ceph_vino_to_ino(struct ceph_vino vino) | ||
465 | { | ||
466 | ino_t ino = (ino_t)vino.ino; /* ^ (vino.snap << 20); */ | ||
467 | #if BITS_PER_LONG == 32 | ||
468 | ino ^= vino.ino >> (sizeof(u64)-sizeof(ino_t)) * 8; | ||
469 | if (!ino) | ||
470 | ino = 1; | ||
471 | #endif | ||
472 | return ino; | ||
473 | } | ||
474 | |||
475 | static inline int ceph_set_ino_cb(struct inode *inode, void *data) | 431 | static inline int ceph_set_ino_cb(struct inode *inode, void *data) |
476 | { | 432 | { |
477 | ceph_inode(inode)->i_vino = *(struct ceph_vino *)data; | 433 | ceph_inode(inode)->i_vino = *(struct ceph_vino *)data; |
@@ -479,39 +435,6 @@ static inline int ceph_set_ino_cb(struct inode *inode, void *data) | |||
479 | return 0; | 435 | return 0; |
480 | } | 436 | } |
481 | 437 | ||
482 | static inline struct ceph_vino ceph_vino(struct inode *inode) | ||
483 | { | ||
484 | return ceph_inode(inode)->i_vino; | ||
485 | } | ||
486 | |||
487 | /* for printf-style formatting */ | ||
488 | #define ceph_vinop(i) ceph_inode(i)->i_vino.ino, ceph_inode(i)->i_vino.snap | ||
489 | |||
490 | static inline u64 ceph_ino(struct inode *inode) | ||
491 | { | ||
492 | return ceph_inode(inode)->i_vino.ino; | ||
493 | } | ||
494 | static inline u64 ceph_snap(struct inode *inode) | ||
495 | { | ||
496 | return ceph_inode(inode)->i_vino.snap; | ||
497 | } | ||
498 | |||
499 | static inline int ceph_ino_compare(struct inode *inode, void *data) | ||
500 | { | ||
501 | struct ceph_vino *pvino = (struct ceph_vino *)data; | ||
502 | struct ceph_inode_info *ci = ceph_inode(inode); | ||
503 | return ci->i_vino.ino == pvino->ino && | ||
504 | ci->i_vino.snap == pvino->snap; | ||
505 | } | ||
506 | |||
507 | static inline struct inode *ceph_find_inode(struct super_block *sb, | ||
508 | struct ceph_vino vino) | ||
509 | { | ||
510 | ino_t t = ceph_vino_to_ino(vino); | ||
511 | return ilookup5(sb, t, ceph_ino_compare, &vino); | ||
512 | } | ||
513 | |||
514 | |||
515 | /* | 438 | /* |
516 | * caps helpers | 439 | * caps helpers |
517 | */ | 440 | */ |
@@ -576,18 +499,18 @@ extern int ceph_reserve_caps(struct ceph_mds_client *mdsc, | |||
576 | struct ceph_cap_reservation *ctx, int need); | 499 | struct ceph_cap_reservation *ctx, int need); |
577 | extern int ceph_unreserve_caps(struct ceph_mds_client *mdsc, | 500 | extern int ceph_unreserve_caps(struct ceph_mds_client *mdsc, |
578 | struct ceph_cap_reservation *ctx); | 501 | struct ceph_cap_reservation *ctx); |
579 | extern void ceph_reservation_status(struct ceph_client *client, | 502 | extern void ceph_reservation_status(struct ceph_fs_client *client, |
580 | int *total, int *avail, int *used, | 503 | int *total, int *avail, int *used, |
581 | int *reserved, int *min); | 504 | int *reserved, int *min); |
582 | 505 | ||
583 | static inline struct ceph_client *ceph_inode_to_client(struct inode *inode) | 506 | static inline struct ceph_fs_client *ceph_inode_to_client(struct inode *inode) |
584 | { | 507 | { |
585 | return (struct ceph_client *)inode->i_sb->s_fs_info; | 508 | return (struct ceph_fs_client *)inode->i_sb->s_fs_info; |
586 | } | 509 | } |
587 | 510 | ||
588 | static inline struct ceph_client *ceph_sb_to_client(struct super_block *sb) | 511 | static inline struct ceph_fs_client *ceph_sb_to_client(struct super_block *sb) |
589 | { | 512 | { |
590 | return (struct ceph_client *)sb->s_fs_info; | 513 | return (struct ceph_fs_client *)sb->s_fs_info; |
591 | } | 514 | } |
592 | 515 | ||
593 | 516 | ||
@@ -617,51 +540,6 @@ struct ceph_file_info { | |||
617 | 540 | ||
618 | 541 | ||
619 | /* | 542 | /* |
620 | * snapshots | ||
621 | */ | ||
622 | |||
623 | /* | ||
624 | * A "snap context" is the set of existing snapshots when we | ||
625 | * write data. It is used by the OSD to guide its COW behavior. | ||
626 | * | ||
627 | * The ceph_snap_context is refcounted, and attached to each dirty | ||
628 | * page, indicating which context the dirty data belonged when it was | ||
629 | * dirtied. | ||
630 | */ | ||
631 | struct ceph_snap_context { | ||
632 | atomic_t nref; | ||
633 | u64 seq; | ||
634 | int num_snaps; | ||
635 | u64 snaps[]; | ||
636 | }; | ||
637 | |||
638 | static inline struct ceph_snap_context * | ||
639 | ceph_get_snap_context(struct ceph_snap_context *sc) | ||
640 | { | ||
641 | /* | ||
642 | printk("get_snap_context %p %d -> %d\n", sc, atomic_read(&sc->nref), | ||
643 | atomic_read(&sc->nref)+1); | ||
644 | */ | ||
645 | if (sc) | ||
646 | atomic_inc(&sc->nref); | ||
647 | return sc; | ||
648 | } | ||
649 | |||
650 | static inline void ceph_put_snap_context(struct ceph_snap_context *sc) | ||
651 | { | ||
652 | if (!sc) | ||
653 | return; | ||
654 | /* | ||
655 | printk("put_snap_context %p %d -> %d\n", sc, atomic_read(&sc->nref), | ||
656 | atomic_read(&sc->nref)-1); | ||
657 | */ | ||
658 | if (atomic_dec_and_test(&sc->nref)) { | ||
659 | /*printk(" deleting snap_context %p\n", sc);*/ | ||
660 | kfree(sc); | ||
661 | } | ||
662 | } | ||
663 | |||
664 | /* | ||
665 | * A "snap realm" describes a subset of the file hierarchy sharing | 543 | * A "snap realm" describes a subset of the file hierarchy sharing |
666 | * the same set of snapshots that apply to it. The realms themselves | 544 | * the same set of snapshots that apply to it. The realms themselves |
667 | * are organized into a hierarchy, such that children inherit (some of) | 545 | * are organized into a hierarchy, such that children inherit (some of) |
@@ -699,16 +577,33 @@ struct ceph_snap_realm { | |||
699 | spinlock_t inodes_with_caps_lock; | 577 | spinlock_t inodes_with_caps_lock; |
700 | }; | 578 | }; |
701 | 579 | ||
702 | 580 | static inline int default_congestion_kb(void) | |
703 | |||
704 | /* | ||
705 | * calculate the number of pages a given length and offset map onto, | ||
706 | * if we align the data. | ||
707 | */ | ||
708 | static inline int calc_pages_for(u64 off, u64 len) | ||
709 | { | 581 | { |
710 | return ((off+len+PAGE_CACHE_SIZE-1) >> PAGE_CACHE_SHIFT) - | 582 | int congestion_kb; |
711 | (off >> PAGE_CACHE_SHIFT); | 583 | |
584 | /* | ||
585 | * Copied from NFS | ||
586 | * | ||
587 | * congestion size, scale with available memory. | ||
588 | * | ||
589 | * 64MB: 8192k | ||
590 | * 128MB: 11585k | ||
591 | * 256MB: 16384k | ||
592 | * 512MB: 23170k | ||
593 | * 1GB: 32768k | ||
594 | * 2GB: 46340k | ||
595 | * 4GB: 65536k | ||
596 | * 8GB: 92681k | ||
597 | * 16GB: 131072k | ||
598 | * | ||
599 | * This allows larger machines to have larger/more transfers. | ||
600 | * Limit the default to 256M | ||
601 | */ | ||
602 | congestion_kb = (16*int_sqrt(totalram_pages)) << (PAGE_SHIFT-10); | ||
603 | if (congestion_kb > 256*1024) | ||
604 | congestion_kb = 256*1024; | ||
605 | |||
606 | return congestion_kb; | ||
712 | } | 607 | } |
713 | 608 | ||
714 | 609 | ||
@@ -741,16 +636,6 @@ static inline bool __ceph_have_pending_cap_snap(struct ceph_inode_info *ci) | |||
741 | ci_item)->writing; | 636 | ci_item)->writing; |
742 | } | 637 | } |
743 | 638 | ||
744 | |||
745 | /* super.c */ | ||
746 | extern struct kmem_cache *ceph_inode_cachep; | ||
747 | extern struct kmem_cache *ceph_cap_cachep; | ||
748 | extern struct kmem_cache *ceph_dentry_cachep; | ||
749 | extern struct kmem_cache *ceph_file_cachep; | ||
750 | |||
751 | extern const char *ceph_msg_type_name(int type); | ||
752 | extern int ceph_check_fsid(struct ceph_client *client, struct ceph_fsid *fsid); | ||
753 | |||
754 | /* inode.c */ | 639 | /* inode.c */ |
755 | extern const struct inode_operations ceph_file_iops; | 640 | extern const struct inode_operations ceph_file_iops; |
756 | 641 | ||
@@ -857,12 +742,18 @@ extern int ceph_mmap(struct file *file, struct vm_area_struct *vma); | |||
857 | /* file.c */ | 742 | /* file.c */ |
858 | extern const struct file_operations ceph_file_fops; | 743 | extern const struct file_operations ceph_file_fops; |
859 | extern const struct address_space_operations ceph_aops; | 744 | extern const struct address_space_operations ceph_aops; |
745 | extern int ceph_copy_to_page_vector(struct page **pages, | ||
746 | const char *data, | ||
747 | loff_t off, size_t len); | ||
748 | extern int ceph_copy_from_page_vector(struct page **pages, | ||
749 | char *data, | ||
750 | loff_t off, size_t len); | ||
751 | extern struct page **ceph_alloc_page_vector(int num_pages, gfp_t flags); | ||
860 | extern int ceph_open(struct inode *inode, struct file *file); | 752 | extern int ceph_open(struct inode *inode, struct file *file); |
861 | extern struct dentry *ceph_lookup_open(struct inode *dir, struct dentry *dentry, | 753 | extern struct dentry *ceph_lookup_open(struct inode *dir, struct dentry *dentry, |
862 | struct nameidata *nd, int mode, | 754 | struct nameidata *nd, int mode, |
863 | int locked_dir); | 755 | int locked_dir); |
864 | extern int ceph_release(struct inode *inode, struct file *filp); | 756 | extern int ceph_release(struct inode *inode, struct file *filp); |
865 | extern void ceph_release_page_vector(struct page **pages, int num_pages); | ||
866 | 757 | ||
867 | /* dir.c */ | 758 | /* dir.c */ |
868 | extern const struct file_operations ceph_dir_fops; | 759 | extern const struct file_operations ceph_dir_fops; |
@@ -892,12 +783,6 @@ extern long ceph_ioctl(struct file *file, unsigned int cmd, unsigned long arg); | |||
892 | /* export.c */ | 783 | /* export.c */ |
893 | extern const struct export_operations ceph_export_ops; | 784 | extern const struct export_operations ceph_export_ops; |
894 | 785 | ||
895 | /* debugfs.c */ | ||
896 | extern int ceph_debugfs_init(void); | ||
897 | extern void ceph_debugfs_cleanup(void); | ||
898 | extern int ceph_debugfs_client_init(struct ceph_client *client); | ||
899 | extern void ceph_debugfs_client_cleanup(struct ceph_client *client); | ||
900 | |||
901 | /* locks.c */ | 786 | /* locks.c */ |
902 | extern int ceph_lock(struct file *file, int cmd, struct file_lock *fl); | 787 | extern int ceph_lock(struct file *file, int cmd, struct file_lock *fl); |
903 | extern int ceph_flock(struct file *file, int cmd, struct file_lock *fl); | 788 | extern int ceph_flock(struct file *file, int cmd, struct file_lock *fl); |
@@ -914,4 +799,8 @@ static inline struct inode *get_dentry_parent_inode(struct dentry *dentry) | |||
914 | return NULL; | 799 | return NULL; |
915 | } | 800 | } |
916 | 801 | ||
802 | /* debugfs.c */ | ||
803 | extern int ceph_fs_debugfs_init(struct ceph_fs_client *client); | ||
804 | extern void ceph_fs_debugfs_cleanup(struct ceph_fs_client *client); | ||
805 | |||
917 | #endif /* _FS_CEPH_SUPER_H */ | 806 | #endif /* _FS_CEPH_SUPER_H */ |
diff --git a/fs/ceph/xattr.c b/fs/ceph/xattr.c index 9578af610b73..70e919960acb 100644 --- a/fs/ceph/xattr.c +++ b/fs/ceph/xattr.c | |||
@@ -1,6 +1,9 @@ | |||
1 | #include "ceph_debug.h" | 1 | #include <linux/ceph/ceph_debug.h> |
2 | |||
2 | #include "super.h" | 3 | #include "super.h" |
3 | #include "decode.h" | 4 | #include "mds_client.h" |
5 | |||
6 | #include <linux/ceph/decode.h> | ||
4 | 7 | ||
5 | #include <linux/xattr.h> | 8 | #include <linux/xattr.h> |
6 | #include <linux/slab.h> | 9 | #include <linux/slab.h> |
@@ -620,12 +623,12 @@ out: | |||
620 | static int ceph_sync_setxattr(struct dentry *dentry, const char *name, | 623 | static int ceph_sync_setxattr(struct dentry *dentry, const char *name, |
621 | const char *value, size_t size, int flags) | 624 | const char *value, size_t size, int flags) |
622 | { | 625 | { |
623 | struct ceph_client *client = ceph_sb_to_client(dentry->d_sb); | 626 | struct ceph_fs_client *fsc = ceph_sb_to_client(dentry->d_sb); |
624 | struct inode *inode = dentry->d_inode; | 627 | struct inode *inode = dentry->d_inode; |
625 | struct ceph_inode_info *ci = ceph_inode(inode); | 628 | struct ceph_inode_info *ci = ceph_inode(inode); |
626 | struct inode *parent_inode = dentry->d_parent->d_inode; | 629 | struct inode *parent_inode = dentry->d_parent->d_inode; |
627 | struct ceph_mds_request *req; | 630 | struct ceph_mds_request *req; |
628 | struct ceph_mds_client *mdsc = &client->mdsc; | 631 | struct ceph_mds_client *mdsc = fsc->mdsc; |
629 | int err; | 632 | int err; |
630 | int i, nr_pages; | 633 | int i, nr_pages; |
631 | struct page **pages = NULL; | 634 | struct page **pages = NULL; |
@@ -777,8 +780,8 @@ out: | |||
777 | 780 | ||
778 | static int ceph_send_removexattr(struct dentry *dentry, const char *name) | 781 | static int ceph_send_removexattr(struct dentry *dentry, const char *name) |
779 | { | 782 | { |
780 | struct ceph_client *client = ceph_sb_to_client(dentry->d_sb); | 783 | struct ceph_fs_client *fsc = ceph_sb_to_client(dentry->d_sb); |
781 | struct ceph_mds_client *mdsc = &client->mdsc; | 784 | struct ceph_mds_client *mdsc = fsc->mdsc; |
782 | struct inode *inode = dentry->d_inode; | 785 | struct inode *inode = dentry->d_inode; |
783 | struct inode *parent_inode = dentry->d_parent->d_inode; | 786 | struct inode *parent_inode = dentry->d_parent->d_inode; |
784 | struct ceph_mds_request *req; | 787 | struct ceph_mds_request *req; |
diff --git a/fs/ceph/auth.h b/include/linux/ceph/auth.h index d38a2fb4a137..7fff521d7eb5 100644 --- a/fs/ceph/auth.h +++ b/include/linux/ceph/auth.h | |||
@@ -1,8 +1,8 @@ | |||
1 | #ifndef _FS_CEPH_AUTH_H | 1 | #ifndef _FS_CEPH_AUTH_H |
2 | #define _FS_CEPH_AUTH_H | 2 | #define _FS_CEPH_AUTH_H |
3 | 3 | ||
4 | #include "types.h" | 4 | #include <linux/ceph/types.h> |
5 | #include "buffer.h" | 5 | #include <linux/ceph/buffer.h> |
6 | 6 | ||
7 | /* | 7 | /* |
8 | * Abstract interface for communicating with the authenticate module. | 8 | * Abstract interface for communicating with the authenticate module. |
diff --git a/fs/ceph/buffer.h b/include/linux/ceph/buffer.h index 58d19014068f..58d19014068f 100644 --- a/fs/ceph/buffer.h +++ b/include/linux/ceph/buffer.h | |||
diff --git a/fs/ceph/ceph_debug.h b/include/linux/ceph/ceph_debug.h index 1818c2305610..aa2e19182d99 100644 --- a/fs/ceph/ceph_debug.h +++ b/include/linux/ceph/ceph_debug.h | |||
@@ -3,7 +3,7 @@ | |||
3 | 3 | ||
4 | #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt | 4 | #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt |
5 | 5 | ||
6 | #ifdef CONFIG_CEPH_FS_PRETTYDEBUG | 6 | #ifdef CONFIG_CEPH_LIB_PRETTYDEBUG |
7 | 7 | ||
8 | /* | 8 | /* |
9 | * wrap pr_debug to include a filename:lineno prefix on each line. | 9 | * wrap pr_debug to include a filename:lineno prefix on each line. |
@@ -14,7 +14,8 @@ | |||
14 | # if defined(DEBUG) || defined(CONFIG_DYNAMIC_DEBUG) | 14 | # if defined(DEBUG) || defined(CONFIG_DYNAMIC_DEBUG) |
15 | extern const char *ceph_file_part(const char *s, int len); | 15 | extern const char *ceph_file_part(const char *s, int len); |
16 | # define dout(fmt, ...) \ | 16 | # define dout(fmt, ...) \ |
17 | pr_debug(" %12.12s:%-4d : " fmt, \ | 17 | pr_debug("%.*s %12.12s:%-4d : " fmt, \ |
18 | 8 - (int)sizeof(KBUILD_MODNAME), " ", \ | ||
18 | ceph_file_part(__FILE__, sizeof(__FILE__)), \ | 19 | ceph_file_part(__FILE__, sizeof(__FILE__)), \ |
19 | __LINE__, ##__VA_ARGS__) | 20 | __LINE__, ##__VA_ARGS__) |
20 | # else | 21 | # else |
diff --git a/fs/ceph/ceph_frag.h b/include/linux/ceph/ceph_frag.h index 5babb8e95352..5babb8e95352 100644 --- a/fs/ceph/ceph_frag.h +++ b/include/linux/ceph/ceph_frag.h | |||
diff --git a/fs/ceph/ceph_fs.h b/include/linux/ceph/ceph_fs.h index d5619ac86711..d5619ac86711 100644 --- a/fs/ceph/ceph_fs.h +++ b/include/linux/ceph/ceph_fs.h | |||
diff --git a/fs/ceph/ceph_hash.h b/include/linux/ceph/ceph_hash.h index d099c3f90236..d099c3f90236 100644 --- a/fs/ceph/ceph_hash.h +++ b/include/linux/ceph/ceph_hash.h | |||
diff --git a/include/linux/ceph/debugfs.h b/include/linux/ceph/debugfs.h new file mode 100644 index 000000000000..2a79702e092b --- /dev/null +++ b/include/linux/ceph/debugfs.h | |||
@@ -0,0 +1,33 @@ | |||
1 | #ifndef _FS_CEPH_DEBUGFS_H | ||
2 | #define _FS_CEPH_DEBUGFS_H | ||
3 | |||
4 | #include "ceph_debug.h" | ||
5 | #include "types.h" | ||
6 | |||
7 | #define CEPH_DEFINE_SHOW_FUNC(name) \ | ||
8 | static int name##_open(struct inode *inode, struct file *file) \ | ||
9 | { \ | ||
10 | struct seq_file *sf; \ | ||
11 | int ret; \ | ||
12 | \ | ||
13 | ret = single_open(file, name, NULL); \ | ||
14 | sf = file->private_data; \ | ||
15 | sf->private = inode->i_private; \ | ||
16 | return ret; \ | ||
17 | } \ | ||
18 | \ | ||
19 | static const struct file_operations name##_fops = { \ | ||
20 | .open = name##_open, \ | ||
21 | .read = seq_read, \ | ||
22 | .llseek = seq_lseek, \ | ||
23 | .release = single_release, \ | ||
24 | }; | ||
25 | |||
26 | /* debugfs.c */ | ||
27 | extern int ceph_debugfs_init(void); | ||
28 | extern void ceph_debugfs_cleanup(void); | ||
29 | extern int ceph_debugfs_client_init(struct ceph_client *client); | ||
30 | extern void ceph_debugfs_client_cleanup(struct ceph_client *client); | ||
31 | |||
32 | #endif | ||
33 | |||
diff --git a/fs/ceph/decode.h b/include/linux/ceph/decode.h index c5b6939fb32a..c5b6939fb32a 100644 --- a/fs/ceph/decode.h +++ b/include/linux/ceph/decode.h | |||
diff --git a/include/linux/ceph/libceph.h b/include/linux/ceph/libceph.h new file mode 100644 index 000000000000..f22b2e941686 --- /dev/null +++ b/include/linux/ceph/libceph.h | |||
@@ -0,0 +1,249 @@ | |||
1 | #ifndef _FS_CEPH_LIBCEPH_H | ||
2 | #define _FS_CEPH_LIBCEPH_H | ||
3 | |||
4 | #include "ceph_debug.h" | ||
5 | |||
6 | #include <asm/unaligned.h> | ||
7 | #include <linux/backing-dev.h> | ||
8 | #include <linux/completion.h> | ||
9 | #include <linux/exportfs.h> | ||
10 | #include <linux/fs.h> | ||
11 | #include <linux/mempool.h> | ||
12 | #include <linux/pagemap.h> | ||
13 | #include <linux/wait.h> | ||
14 | #include <linux/writeback.h> | ||
15 | #include <linux/slab.h> | ||
16 | |||
17 | #include "types.h" | ||
18 | #include "messenger.h" | ||
19 | #include "msgpool.h" | ||
20 | #include "mon_client.h" | ||
21 | #include "osd_client.h" | ||
22 | #include "ceph_fs.h" | ||
23 | |||
24 | /* | ||
25 | * Supported features | ||
26 | */ | ||
27 | #define CEPH_FEATURE_SUPPORTED_DEFAULT CEPH_FEATURE_NOSRCADDR | ||
28 | #define CEPH_FEATURE_REQUIRED_DEFAULT CEPH_FEATURE_NOSRCADDR | ||
29 | |||
30 | /* | ||
31 | * mount options | ||
32 | */ | ||
33 | #define CEPH_OPT_FSID (1<<0) | ||
34 | #define CEPH_OPT_NOSHARE (1<<1) /* don't share client with other sbs */ | ||
35 | #define CEPH_OPT_MYIP (1<<2) /* specified my ip */ | ||
36 | #define CEPH_OPT_NOCRC (1<<3) /* no data crc on writes */ | ||
37 | |||
38 | #define CEPH_OPT_DEFAULT (0); | ||
39 | |||
40 | #define ceph_set_opt(client, opt) \ | ||
41 | (client)->options->flags |= CEPH_OPT_##opt; | ||
42 | #define ceph_test_opt(client, opt) \ | ||
43 | (!!((client)->options->flags & CEPH_OPT_##opt)) | ||
44 | |||
45 | struct ceph_options { | ||
46 | int flags; | ||
47 | struct ceph_fsid fsid; | ||
48 | struct ceph_entity_addr my_addr; | ||
49 | int mount_timeout; | ||
50 | int osd_idle_ttl; | ||
51 | int osd_timeout; | ||
52 | int osd_keepalive_timeout; | ||
53 | |||
54 | /* | ||
55 | * any type that can't be simply compared or doesn't need need | ||
56 | * to be compared should go beyond this point, | ||
57 | * ceph_compare_options() should be updated accordingly | ||
58 | */ | ||
59 | |||
60 | struct ceph_entity_addr *mon_addr; /* should be the first | ||
61 | pointer type of args */ | ||
62 | int num_mon; | ||
63 | char *name; | ||
64 | char *secret; | ||
65 | }; | ||
66 | |||
67 | /* | ||
68 | * defaults | ||
69 | */ | ||
70 | #define CEPH_MOUNT_TIMEOUT_DEFAULT 60 | ||
71 | #define CEPH_OSD_TIMEOUT_DEFAULT 60 /* seconds */ | ||
72 | #define CEPH_OSD_KEEPALIVE_DEFAULT 5 | ||
73 | #define CEPH_OSD_IDLE_TTL_DEFAULT 60 | ||
74 | #define CEPH_MOUNT_RSIZE_DEFAULT (512*1024) /* readahead */ | ||
75 | |||
76 | #define CEPH_MSG_MAX_FRONT_LEN (16*1024*1024) | ||
77 | #define CEPH_MSG_MAX_DATA_LEN (16*1024*1024) | ||
78 | |||
79 | #define CEPH_AUTH_NAME_DEFAULT "guest" | ||
80 | |||
81 | /* | ||
82 | * Delay telling the MDS we no longer want caps, in case we reopen | ||
83 | * the file. Delay a minimum amount of time, even if we send a cap | ||
84 | * message for some other reason. Otherwise, take the oppotunity to | ||
85 | * update the mds to avoid sending another message later. | ||
86 | */ | ||
87 | #define CEPH_CAPS_WANTED_DELAY_MIN_DEFAULT 5 /* cap release delay */ | ||
88 | #define CEPH_CAPS_WANTED_DELAY_MAX_DEFAULT 60 /* cap release delay */ | ||
89 | |||
90 | #define CEPH_CAP_RELEASE_SAFETY_DEFAULT (CEPH_CAPS_PER_RELEASE * 4) | ||
91 | |||
92 | /* mount state */ | ||
93 | enum { | ||
94 | CEPH_MOUNT_MOUNTING, | ||
95 | CEPH_MOUNT_MOUNTED, | ||
96 | CEPH_MOUNT_UNMOUNTING, | ||
97 | CEPH_MOUNT_UNMOUNTED, | ||
98 | CEPH_MOUNT_SHUTDOWN, | ||
99 | }; | ||
100 | |||
101 | /* | ||
102 | * subtract jiffies | ||
103 | */ | ||
104 | static inline unsigned long time_sub(unsigned long a, unsigned long b) | ||
105 | { | ||
106 | BUG_ON(time_after(b, a)); | ||
107 | return (long)a - (long)b; | ||
108 | } | ||
109 | |||
110 | struct ceph_mds_client; | ||
111 | |||
112 | /* | ||
113 | * per client state | ||
114 | * | ||
115 | * possibly shared by multiple mount points, if they are | ||
116 | * mounting the same ceph filesystem/cluster. | ||
117 | */ | ||
118 | struct ceph_client { | ||
119 | struct ceph_fsid fsid; | ||
120 | bool have_fsid; | ||
121 | |||
122 | void *private; | ||
123 | |||
124 | struct ceph_options *options; | ||
125 | |||
126 | struct mutex mount_mutex; /* serialize mount attempts */ | ||
127 | wait_queue_head_t auth_wq; | ||
128 | int auth_err; | ||
129 | |||
130 | int (*extra_mon_dispatch)(struct ceph_client *, struct ceph_msg *); | ||
131 | |||
132 | u32 supported_features; | ||
133 | u32 required_features; | ||
134 | |||
135 | struct ceph_messenger *msgr; /* messenger instance */ | ||
136 | struct ceph_mon_client monc; | ||
137 | struct ceph_osd_client osdc; | ||
138 | |||
139 | #ifdef CONFIG_DEBUG_FS | ||
140 | struct dentry *debugfs_dir; | ||
141 | struct dentry *debugfs_monmap; | ||
142 | struct dentry *debugfs_osdmap; | ||
143 | #endif | ||
144 | }; | ||
145 | |||
146 | |||
147 | |||
148 | /* | ||
149 | * snapshots | ||
150 | */ | ||
151 | |||
152 | /* | ||
153 | * A "snap context" is the set of existing snapshots when we | ||
154 | * write data. It is used by the OSD to guide its COW behavior. | ||
155 | * | ||
156 | * The ceph_snap_context is refcounted, and attached to each dirty | ||
157 | * page, indicating which context the dirty data belonged when it was | ||
158 | * dirtied. | ||
159 | */ | ||
160 | struct ceph_snap_context { | ||
161 | atomic_t nref; | ||
162 | u64 seq; | ||
163 | int num_snaps; | ||
164 | u64 snaps[]; | ||
165 | }; | ||
166 | |||
167 | static inline struct ceph_snap_context * | ||
168 | ceph_get_snap_context(struct ceph_snap_context *sc) | ||
169 | { | ||
170 | /* | ||
171 | printk("get_snap_context %p %d -> %d\n", sc, atomic_read(&sc->nref), | ||
172 | atomic_read(&sc->nref)+1); | ||
173 | */ | ||
174 | if (sc) | ||
175 | atomic_inc(&sc->nref); | ||
176 | return sc; | ||
177 | } | ||
178 | |||
179 | static inline void ceph_put_snap_context(struct ceph_snap_context *sc) | ||
180 | { | ||
181 | if (!sc) | ||
182 | return; | ||
183 | /* | ||
184 | printk("put_snap_context %p %d -> %d\n", sc, atomic_read(&sc->nref), | ||
185 | atomic_read(&sc->nref)-1); | ||
186 | */ | ||
187 | if (atomic_dec_and_test(&sc->nref)) { | ||
188 | /*printk(" deleting snap_context %p\n", sc);*/ | ||
189 | kfree(sc); | ||
190 | } | ||
191 | } | ||
192 | |||
193 | /* | ||
194 | * calculate the number of pages a given length and offset map onto, | ||
195 | * if we align the data. | ||
196 | */ | ||
197 | static inline int calc_pages_for(u64 off, u64 len) | ||
198 | { | ||
199 | return ((off+len+PAGE_CACHE_SIZE-1) >> PAGE_CACHE_SHIFT) - | ||
200 | (off >> PAGE_CACHE_SHIFT); | ||
201 | } | ||
202 | |||
203 | /* ceph_common.c */ | ||
204 | extern const char *ceph_msg_type_name(int type); | ||
205 | extern int ceph_check_fsid(struct ceph_client *client, struct ceph_fsid *fsid); | ||
206 | extern struct kmem_cache *ceph_inode_cachep; | ||
207 | extern struct kmem_cache *ceph_cap_cachep; | ||
208 | extern struct kmem_cache *ceph_dentry_cachep; | ||
209 | extern struct kmem_cache *ceph_file_cachep; | ||
210 | |||
211 | extern int ceph_parse_options(struct ceph_options **popt, char *options, | ||
212 | const char *dev_name, const char *dev_name_end, | ||
213 | int (*parse_extra_token)(char *c, void *private), | ||
214 | void *private); | ||
215 | extern void ceph_destroy_options(struct ceph_options *opt); | ||
216 | extern int ceph_compare_options(struct ceph_options *new_opt, | ||
217 | struct ceph_client *client); | ||
218 | extern struct ceph_client *ceph_create_client(struct ceph_options *opt, | ||
219 | void *private); | ||
220 | extern u64 ceph_client_id(struct ceph_client *client); | ||
221 | extern void ceph_destroy_client(struct ceph_client *client); | ||
222 | extern int __ceph_open_session(struct ceph_client *client, | ||
223 | unsigned long started); | ||
224 | extern int ceph_open_session(struct ceph_client *client); | ||
225 | |||
226 | /* pagevec.c */ | ||
227 | extern void ceph_release_page_vector(struct page **pages, int num_pages); | ||
228 | |||
229 | extern struct page **ceph_get_direct_page_vector(const char __user *data, | ||
230 | int num_pages, | ||
231 | loff_t off, size_t len); | ||
232 | extern void ceph_put_page_vector(struct page **pages, int num_pages); | ||
233 | extern void ceph_release_page_vector(struct page **pages, int num_pages); | ||
234 | extern struct page **ceph_alloc_page_vector(int num_pages, gfp_t flags); | ||
235 | extern int ceph_copy_user_to_page_vector(struct page **pages, | ||
236 | const char __user *data, | ||
237 | loff_t off, size_t len); | ||
238 | extern int ceph_copy_to_page_vector(struct page **pages, | ||
239 | const char *data, | ||
240 | loff_t off, size_t len); | ||
241 | extern int ceph_copy_from_page_vector(struct page **pages, | ||
242 | char *data, | ||
243 | loff_t off, size_t len); | ||
244 | extern int ceph_copy_page_vector_to_user(struct page **pages, char __user *data, | ||
245 | loff_t off, size_t len); | ||
246 | extern void ceph_zero_page_vector_range(int off, int len, struct page **pages); | ||
247 | |||
248 | |||
249 | #endif /* _FS_CEPH_SUPER_H */ | ||
diff --git a/fs/ceph/mdsmap.h b/include/linux/ceph/mdsmap.h index 4c5cb0880bba..4c5cb0880bba 100644 --- a/fs/ceph/mdsmap.h +++ b/include/linux/ceph/mdsmap.h | |||
diff --git a/fs/ceph/messenger.h b/include/linux/ceph/messenger.h index 5a79450604ef..5956d62c3057 100644 --- a/fs/ceph/messenger.h +++ b/include/linux/ceph/messenger.h | |||
@@ -65,6 +65,9 @@ struct ceph_messenger { | |||
65 | */ | 65 | */ |
66 | u32 global_seq; | 66 | u32 global_seq; |
67 | spinlock_t global_seq_lock; | 67 | spinlock_t global_seq_lock; |
68 | |||
69 | u32 supported_features; | ||
70 | u32 required_features; | ||
68 | }; | 71 | }; |
69 | 72 | ||
70 | /* | 73 | /* |
@@ -209,7 +212,7 @@ struct ceph_connection { | |||
209 | }; | 212 | }; |
210 | 213 | ||
211 | 214 | ||
212 | extern const char *pr_addr(const struct sockaddr_storage *ss); | 215 | extern const char *ceph_pr_addr(const struct sockaddr_storage *ss); |
213 | extern int ceph_parse_ips(const char *c, const char *end, | 216 | extern int ceph_parse_ips(const char *c, const char *end, |
214 | struct ceph_entity_addr *addr, | 217 | struct ceph_entity_addr *addr, |
215 | int max_count, int *count); | 218 | int max_count, int *count); |
@@ -220,7 +223,8 @@ extern void ceph_msgr_exit(void); | |||
220 | extern void ceph_msgr_flush(void); | 223 | extern void ceph_msgr_flush(void); |
221 | 224 | ||
222 | extern struct ceph_messenger *ceph_messenger_create( | 225 | extern struct ceph_messenger *ceph_messenger_create( |
223 | struct ceph_entity_addr *myaddr); | 226 | struct ceph_entity_addr *myaddr, |
227 | u32 features, u32 required); | ||
224 | extern void ceph_messenger_destroy(struct ceph_messenger *); | 228 | extern void ceph_messenger_destroy(struct ceph_messenger *); |
225 | 229 | ||
226 | extern void ceph_con_init(struct ceph_messenger *msgr, | 230 | extern void ceph_con_init(struct ceph_messenger *msgr, |
diff --git a/fs/ceph/mon_client.h b/include/linux/ceph/mon_client.h index 8e396f2c0963..545f85917780 100644 --- a/fs/ceph/mon_client.h +++ b/include/linux/ceph/mon_client.h | |||
@@ -79,6 +79,7 @@ struct ceph_mon_client { | |||
79 | u64 last_tid; | 79 | u64 last_tid; |
80 | 80 | ||
81 | /* mds/osd map */ | 81 | /* mds/osd map */ |
82 | int want_mdsmap; | ||
82 | int want_next_osdmap; /* 1 = want, 2 = want+asked */ | 83 | int want_next_osdmap; /* 1 = want, 2 = want+asked */ |
83 | u32 have_osdmap, have_mdsmap; | 84 | u32 have_osdmap, have_mdsmap; |
84 | 85 | ||
diff --git a/fs/ceph/msgpool.h b/include/linux/ceph/msgpool.h index a362605f9368..a362605f9368 100644 --- a/fs/ceph/msgpool.h +++ b/include/linux/ceph/msgpool.h | |||
diff --git a/fs/ceph/msgr.h b/include/linux/ceph/msgr.h index 680d3d648cac..680d3d648cac 100644 --- a/fs/ceph/msgr.h +++ b/include/linux/ceph/msgr.h | |||
diff --git a/fs/ceph/osd_client.h b/include/linux/ceph/osd_client.h index 65c9c560f1ac..6c91fb032c39 100644 --- a/fs/ceph/osd_client.h +++ b/include/linux/ceph/osd_client.h | |||
@@ -69,6 +69,7 @@ struct ceph_osd_request { | |||
69 | struct list_head r_unsafe_item; | 69 | struct list_head r_unsafe_item; |
70 | 70 | ||
71 | struct inode *r_inode; /* for use by callbacks */ | 71 | struct inode *r_inode; /* for use by callbacks */ |
72 | void *r_priv; /* ditto */ | ||
72 | 73 | ||
73 | char r_oid[40]; /* object name */ | 74 | char r_oid[40]; /* object name */ |
74 | int r_oid_len; | 75 | int r_oid_len; |
diff --git a/fs/ceph/osdmap.h b/include/linux/ceph/osdmap.h index a592b211be39..ba4c205cbb01 100644 --- a/fs/ceph/osdmap.h +++ b/include/linux/ceph/osdmap.h | |||
@@ -4,7 +4,7 @@ | |||
4 | #include <linux/rbtree.h> | 4 | #include <linux/rbtree.h> |
5 | #include "types.h" | 5 | #include "types.h" |
6 | #include "ceph_fs.h" | 6 | #include "ceph_fs.h" |
7 | #include "crush/crush.h" | 7 | #include <linux/crush/crush.h> |
8 | 8 | ||
9 | /* | 9 | /* |
10 | * The osd map describes the current membership of the osd cluster and | 10 | * The osd map describes the current membership of the osd cluster and |
diff --git a/fs/ceph/pagelist.h b/include/linux/ceph/pagelist.h index cc9327aa1c98..cc9327aa1c98 100644 --- a/fs/ceph/pagelist.h +++ b/include/linux/ceph/pagelist.h | |||
diff --git a/fs/ceph/rados.h b/include/linux/ceph/rados.h index 6d5247f2e81b..6d5247f2e81b 100644 --- a/fs/ceph/rados.h +++ b/include/linux/ceph/rados.h | |||
diff --git a/fs/ceph/types.h b/include/linux/ceph/types.h index 28b35a005ec2..28b35a005ec2 100644 --- a/fs/ceph/types.h +++ b/include/linux/ceph/types.h | |||
diff --git a/fs/ceph/crush/crush.h b/include/linux/crush/crush.h index 97e435b191f4..97e435b191f4 100644 --- a/fs/ceph/crush/crush.h +++ b/include/linux/crush/crush.h | |||
diff --git a/fs/ceph/crush/hash.h b/include/linux/crush/hash.h index 91e884230d5d..91e884230d5d 100644 --- a/fs/ceph/crush/hash.h +++ b/include/linux/crush/hash.h | |||
diff --git a/fs/ceph/crush/mapper.h b/include/linux/crush/mapper.h index c46b99c18bb0..c46b99c18bb0 100644 --- a/fs/ceph/crush/mapper.h +++ b/include/linux/crush/mapper.h | |||
diff --git a/net/Kconfig b/net/Kconfig index e926884c1675..55fd82e9ffd9 100644 --- a/net/Kconfig +++ b/net/Kconfig | |||
@@ -293,6 +293,7 @@ source "net/wimax/Kconfig" | |||
293 | source "net/rfkill/Kconfig" | 293 | source "net/rfkill/Kconfig" |
294 | source "net/9p/Kconfig" | 294 | source "net/9p/Kconfig" |
295 | source "net/caif/Kconfig" | 295 | source "net/caif/Kconfig" |
296 | source "net/ceph/Kconfig" | ||
296 | 297 | ||
297 | 298 | ||
298 | endif # if NET | 299 | endif # if NET |
diff --git a/net/Makefile b/net/Makefile index ea60fbce9b1b..6b7bfd7f1416 100644 --- a/net/Makefile +++ b/net/Makefile | |||
@@ -68,3 +68,4 @@ obj-$(CONFIG_SYSCTL) += sysctl_net.o | |||
68 | endif | 68 | endif |
69 | obj-$(CONFIG_WIMAX) += wimax/ | 69 | obj-$(CONFIG_WIMAX) += wimax/ |
70 | obj-$(CONFIG_DNS_RESOLVER) += dns_resolver/ | 70 | obj-$(CONFIG_DNS_RESOLVER) += dns_resolver/ |
71 | obj-$(CONFIG_CEPH_LIB) += ceph/ | ||
diff --git a/net/ceph/Kconfig b/net/ceph/Kconfig new file mode 100644 index 000000000000..ad424049b0cf --- /dev/null +++ b/net/ceph/Kconfig | |||
@@ -0,0 +1,28 @@ | |||
1 | config CEPH_LIB | ||
2 | tristate "Ceph core library (EXPERIMENTAL)" | ||
3 | depends on INET && EXPERIMENTAL | ||
4 | select LIBCRC32C | ||
5 | select CRYPTO_AES | ||
6 | select CRYPTO | ||
7 | default n | ||
8 | help | ||
9 | Choose Y or M here to include cephlib, which provides the | ||
10 | common functionality to both the Ceph filesystem and | ||
11 | to the rados block device (rbd). | ||
12 | |||
13 | More information at http://ceph.newdream.net/. | ||
14 | |||
15 | If unsure, say N. | ||
16 | |||
17 | config CEPH_LIB_PRETTYDEBUG | ||
18 | bool "Include file:line in ceph debug output" | ||
19 | depends on CEPH_LIB | ||
20 | default n | ||
21 | help | ||
22 | If you say Y here, debug output will include a filename and | ||
23 | line to aid debugging. This increases kernel size and slows | ||
24 | execution slightly when debug call sites are enabled (e.g., | ||
25 | via CONFIG_DYNAMIC_DEBUG). | ||
26 | |||
27 | If unsure, say N. | ||
28 | |||
diff --git a/net/ceph/Makefile b/net/ceph/Makefile new file mode 100644 index 000000000000..aab1cabb8035 --- /dev/null +++ b/net/ceph/Makefile | |||
@@ -0,0 +1,37 @@ | |||
1 | # | ||
2 | # Makefile for CEPH filesystem. | ||
3 | # | ||
4 | |||
5 | ifneq ($(KERNELRELEASE),) | ||
6 | |||
7 | obj-$(CONFIG_CEPH_LIB) += libceph.o | ||
8 | |||
9 | libceph-objs := ceph_common.o messenger.o msgpool.o buffer.o pagelist.o \ | ||
10 | mon_client.o \ | ||
11 | osd_client.o osdmap.o crush/crush.o crush/mapper.o crush/hash.o \ | ||
12 | debugfs.o \ | ||
13 | auth.o auth_none.o \ | ||
14 | crypto.o armor.o \ | ||
15 | auth_x.o \ | ||
16 | ceph_fs.o ceph_strings.o ceph_hash.o \ | ||
17 | pagevec.o | ||
18 | |||
19 | else | ||
20 | #Otherwise we were called directly from the command | ||
21 | # line; invoke the kernel build system. | ||
22 | |||
23 | KERNELDIR ?= /lib/modules/$(shell uname -r)/build | ||
24 | PWD := $(shell pwd) | ||
25 | |||
26 | default: all | ||
27 | |||
28 | all: | ||
29 | $(MAKE) -C $(KERNELDIR) M=$(PWD) CONFIG_CEPH_LIB=m modules | ||
30 | |||
31 | modules_install: | ||
32 | $(MAKE) -C $(KERNELDIR) M=$(PWD) CONFIG_CEPH_LIB=m modules_install | ||
33 | |||
34 | clean: | ||
35 | $(MAKE) -C $(KERNELDIR) M=$(PWD) clean | ||
36 | |||
37 | endif | ||
diff --git a/fs/ceph/armor.c b/net/ceph/armor.c index eb2a666b0be7..eb2a666b0be7 100644 --- a/fs/ceph/armor.c +++ b/net/ceph/armor.c | |||
diff --git a/fs/ceph/auth.c b/net/ceph/auth.c index 6d2e30600627..549c1f43e1d5 100644 --- a/fs/ceph/auth.c +++ b/net/ceph/auth.c | |||
@@ -1,16 +1,16 @@ | |||
1 | #include "ceph_debug.h" | 1 | #include <linux/ceph/ceph_debug.h> |
2 | 2 | ||
3 | #include <linux/module.h> | 3 | #include <linux/module.h> |
4 | #include <linux/err.h> | 4 | #include <linux/err.h> |
5 | #include <linux/slab.h> | 5 | #include <linux/slab.h> |
6 | 6 | ||
7 | #include "types.h" | 7 | #include <linux/ceph/types.h> |
8 | #include <linux/ceph/decode.h> | ||
9 | #include <linux/ceph/libceph.h> | ||
10 | #include <linux/ceph/messenger.h> | ||
8 | #include "auth_none.h" | 11 | #include "auth_none.h" |
9 | #include "auth_x.h" | 12 | #include "auth_x.h" |
10 | #include "decode.h" | ||
11 | #include "super.h" | ||
12 | 13 | ||
13 | #include "messenger.h" | ||
14 | 14 | ||
15 | /* | 15 | /* |
16 | * get protocol handler | 16 | * get protocol handler |
diff --git a/fs/ceph/auth_none.c b/net/ceph/auth_none.c index ad1dc21286c7..214c2bb43d62 100644 --- a/fs/ceph/auth_none.c +++ b/net/ceph/auth_none.c | |||
@@ -1,14 +1,15 @@ | |||
1 | 1 | ||
2 | #include "ceph_debug.h" | 2 | #include <linux/ceph/ceph_debug.h> |
3 | 3 | ||
4 | #include <linux/err.h> | 4 | #include <linux/err.h> |
5 | #include <linux/module.h> | 5 | #include <linux/module.h> |
6 | #include <linux/random.h> | 6 | #include <linux/random.h> |
7 | #include <linux/slab.h> | 7 | #include <linux/slab.h> |
8 | 8 | ||
9 | #include <linux/ceph/decode.h> | ||
10 | #include <linux/ceph/auth.h> | ||
11 | |||
9 | #include "auth_none.h" | 12 | #include "auth_none.h" |
10 | #include "auth.h" | ||
11 | #include "decode.h" | ||
12 | 13 | ||
13 | static void reset(struct ceph_auth_client *ac) | 14 | static void reset(struct ceph_auth_client *ac) |
14 | { | 15 | { |
diff --git a/fs/ceph/auth_none.h b/net/ceph/auth_none.h index 8164df1a08be..ed7d088b1bc9 100644 --- a/fs/ceph/auth_none.h +++ b/net/ceph/auth_none.h | |||
@@ -2,8 +2,7 @@ | |||
2 | #define _FS_CEPH_AUTH_NONE_H | 2 | #define _FS_CEPH_AUTH_NONE_H |
3 | 3 | ||
4 | #include <linux/slab.h> | 4 | #include <linux/slab.h> |
5 | 5 | #include <linux/ceph/auth.h> | |
6 | #include "auth.h" | ||
7 | 6 | ||
8 | /* | 7 | /* |
9 | * null security mode. | 8 | * null security mode. |
diff --git a/fs/ceph/auth_x.c b/net/ceph/auth_x.c index a2d002cbdec2..7fd5dfcf6e18 100644 --- a/fs/ceph/auth_x.c +++ b/net/ceph/auth_x.c | |||
@@ -1,16 +1,17 @@ | |||
1 | 1 | ||
2 | #include "ceph_debug.h" | 2 | #include <linux/ceph/ceph_debug.h> |
3 | 3 | ||
4 | #include <linux/err.h> | 4 | #include <linux/err.h> |
5 | #include <linux/module.h> | 5 | #include <linux/module.h> |
6 | #include <linux/random.h> | 6 | #include <linux/random.h> |
7 | #include <linux/slab.h> | 7 | #include <linux/slab.h> |
8 | 8 | ||
9 | #include <linux/ceph/decode.h> | ||
10 | #include <linux/ceph/auth.h> | ||
11 | |||
12 | #include "crypto.h" | ||
9 | #include "auth_x.h" | 13 | #include "auth_x.h" |
10 | #include "auth_x_protocol.h" | 14 | #include "auth_x_protocol.h" |
11 | #include "crypto.h" | ||
12 | #include "auth.h" | ||
13 | #include "decode.h" | ||
14 | 15 | ||
15 | #define TEMP_TICKET_BUF_LEN 256 | 16 | #define TEMP_TICKET_BUF_LEN 256 |
16 | 17 | ||
diff --git a/fs/ceph/auth_x.h b/net/ceph/auth_x.h index ff6f8180e681..e02da7a5c5a1 100644 --- a/fs/ceph/auth_x.h +++ b/net/ceph/auth_x.h | |||
@@ -3,8 +3,9 @@ | |||
3 | 3 | ||
4 | #include <linux/rbtree.h> | 4 | #include <linux/rbtree.h> |
5 | 5 | ||
6 | #include <linux/ceph/auth.h> | ||
7 | |||
6 | #include "crypto.h" | 8 | #include "crypto.h" |
7 | #include "auth.h" | ||
8 | #include "auth_x_protocol.h" | 9 | #include "auth_x_protocol.h" |
9 | 10 | ||
10 | /* | 11 | /* |
diff --git a/fs/ceph/auth_x_protocol.h b/net/ceph/auth_x_protocol.h index 671d30576c4f..671d30576c4f 100644 --- a/fs/ceph/auth_x_protocol.h +++ b/net/ceph/auth_x_protocol.h | |||
diff --git a/fs/ceph/buffer.c b/net/ceph/buffer.c index cd39f17021de..53d8abfa25d5 100644 --- a/fs/ceph/buffer.c +++ b/net/ceph/buffer.c | |||
@@ -1,10 +1,11 @@ | |||
1 | 1 | ||
2 | #include "ceph_debug.h" | 2 | #include <linux/ceph/ceph_debug.h> |
3 | 3 | ||
4 | #include <linux/module.h> | ||
4 | #include <linux/slab.h> | 5 | #include <linux/slab.h> |
5 | 6 | ||
6 | #include "buffer.h" | 7 | #include <linux/ceph/buffer.h> |
7 | #include "decode.h" | 8 | #include <linux/ceph/decode.h> |
8 | 9 | ||
9 | struct ceph_buffer *ceph_buffer_new(size_t len, gfp_t gfp) | 10 | struct ceph_buffer *ceph_buffer_new(size_t len, gfp_t gfp) |
10 | { | 11 | { |
@@ -32,6 +33,7 @@ struct ceph_buffer *ceph_buffer_new(size_t len, gfp_t gfp) | |||
32 | dout("buffer_new %p\n", b); | 33 | dout("buffer_new %p\n", b); |
33 | return b; | 34 | return b; |
34 | } | 35 | } |
36 | EXPORT_SYMBOL(ceph_buffer_new); | ||
35 | 37 | ||
36 | void ceph_buffer_release(struct kref *kref) | 38 | void ceph_buffer_release(struct kref *kref) |
37 | { | 39 | { |
@@ -46,6 +48,7 @@ void ceph_buffer_release(struct kref *kref) | |||
46 | } | 48 | } |
47 | kfree(b); | 49 | kfree(b); |
48 | } | 50 | } |
51 | EXPORT_SYMBOL(ceph_buffer_release); | ||
49 | 52 | ||
50 | int ceph_decode_buffer(struct ceph_buffer **b, void **p, void *end) | 53 | int ceph_decode_buffer(struct ceph_buffer **b, void **p, void *end) |
51 | { | 54 | { |
diff --git a/net/ceph/ceph_common.c b/net/ceph/ceph_common.c new file mode 100644 index 000000000000..f6f2eebc0767 --- /dev/null +++ b/net/ceph/ceph_common.c | |||
@@ -0,0 +1,529 @@ | |||
1 | |||
2 | #include <linux/ceph/ceph_debug.h> | ||
3 | #include <linux/backing-dev.h> | ||
4 | #include <linux/ctype.h> | ||
5 | #include <linux/fs.h> | ||
6 | #include <linux/inet.h> | ||
7 | #include <linux/in6.h> | ||
8 | #include <linux/module.h> | ||
9 | #include <linux/mount.h> | ||
10 | #include <linux/parser.h> | ||
11 | #include <linux/sched.h> | ||
12 | #include <linux/seq_file.h> | ||
13 | #include <linux/slab.h> | ||
14 | #include <linux/statfs.h> | ||
15 | #include <linux/string.h> | ||
16 | |||
17 | |||
18 | #include <linux/ceph/libceph.h> | ||
19 | #include <linux/ceph/debugfs.h> | ||
20 | #include <linux/ceph/decode.h> | ||
21 | #include <linux/ceph/mon_client.h> | ||
22 | #include <linux/ceph/auth.h> | ||
23 | |||
24 | |||
25 | |||
26 | /* | ||
27 | * find filename portion of a path (/foo/bar/baz -> baz) | ||
28 | */ | ||
29 | const char *ceph_file_part(const char *s, int len) | ||
30 | { | ||
31 | const char *e = s + len; | ||
32 | |||
33 | while (e != s && *(e-1) != '/') | ||
34 | e--; | ||
35 | return e; | ||
36 | } | ||
37 | EXPORT_SYMBOL(ceph_file_part); | ||
38 | |||
39 | const char *ceph_msg_type_name(int type) | ||
40 | { | ||
41 | switch (type) { | ||
42 | case CEPH_MSG_SHUTDOWN: return "shutdown"; | ||
43 | case CEPH_MSG_PING: return "ping"; | ||
44 | case CEPH_MSG_AUTH: return "auth"; | ||
45 | case CEPH_MSG_AUTH_REPLY: return "auth_reply"; | ||
46 | case CEPH_MSG_MON_MAP: return "mon_map"; | ||
47 | case CEPH_MSG_MON_GET_MAP: return "mon_get_map"; | ||
48 | case CEPH_MSG_MON_SUBSCRIBE: return "mon_subscribe"; | ||
49 | case CEPH_MSG_MON_SUBSCRIBE_ACK: return "mon_subscribe_ack"; | ||
50 | case CEPH_MSG_STATFS: return "statfs"; | ||
51 | case CEPH_MSG_STATFS_REPLY: return "statfs_reply"; | ||
52 | case CEPH_MSG_MDS_MAP: return "mds_map"; | ||
53 | case CEPH_MSG_CLIENT_SESSION: return "client_session"; | ||
54 | case CEPH_MSG_CLIENT_RECONNECT: return "client_reconnect"; | ||
55 | case CEPH_MSG_CLIENT_REQUEST: return "client_request"; | ||
56 | case CEPH_MSG_CLIENT_REQUEST_FORWARD: return "client_request_forward"; | ||
57 | case CEPH_MSG_CLIENT_REPLY: return "client_reply"; | ||
58 | case CEPH_MSG_CLIENT_CAPS: return "client_caps"; | ||
59 | case CEPH_MSG_CLIENT_CAPRELEASE: return "client_cap_release"; | ||
60 | case CEPH_MSG_CLIENT_SNAP: return "client_snap"; | ||
61 | case CEPH_MSG_CLIENT_LEASE: return "client_lease"; | ||
62 | case CEPH_MSG_OSD_MAP: return "osd_map"; | ||
63 | case CEPH_MSG_OSD_OP: return "osd_op"; | ||
64 | case CEPH_MSG_OSD_OPREPLY: return "osd_opreply"; | ||
65 | default: return "unknown"; | ||
66 | } | ||
67 | } | ||
68 | EXPORT_SYMBOL(ceph_msg_type_name); | ||
69 | |||
70 | /* | ||
71 | * Initially learn our fsid, or verify an fsid matches. | ||
72 | */ | ||
73 | int ceph_check_fsid(struct ceph_client *client, struct ceph_fsid *fsid) | ||
74 | { | ||
75 | if (client->have_fsid) { | ||
76 | if (ceph_fsid_compare(&client->fsid, fsid)) { | ||
77 | pr_err("bad fsid, had %pU got %pU", | ||
78 | &client->fsid, fsid); | ||
79 | return -1; | ||
80 | } | ||
81 | } else { | ||
82 | pr_info("client%lld fsid %pU\n", ceph_client_id(client), fsid); | ||
83 | memcpy(&client->fsid, fsid, sizeof(*fsid)); | ||
84 | ceph_debugfs_client_init(client); | ||
85 | client->have_fsid = true; | ||
86 | } | ||
87 | return 0; | ||
88 | } | ||
89 | EXPORT_SYMBOL(ceph_check_fsid); | ||
90 | |||
91 | static int strcmp_null(const char *s1, const char *s2) | ||
92 | { | ||
93 | if (!s1 && !s2) | ||
94 | return 0; | ||
95 | if (s1 && !s2) | ||
96 | return -1; | ||
97 | if (!s1 && s2) | ||
98 | return 1; | ||
99 | return strcmp(s1, s2); | ||
100 | } | ||
101 | |||
102 | int ceph_compare_options(struct ceph_options *new_opt, | ||
103 | struct ceph_client *client) | ||
104 | { | ||
105 | struct ceph_options *opt1 = new_opt; | ||
106 | struct ceph_options *opt2 = client->options; | ||
107 | int ofs = offsetof(struct ceph_options, mon_addr); | ||
108 | int i; | ||
109 | int ret; | ||
110 | |||
111 | ret = memcmp(opt1, opt2, ofs); | ||
112 | if (ret) | ||
113 | return ret; | ||
114 | |||
115 | ret = strcmp_null(opt1->name, opt2->name); | ||
116 | if (ret) | ||
117 | return ret; | ||
118 | |||
119 | ret = strcmp_null(opt1->secret, opt2->secret); | ||
120 | if (ret) | ||
121 | return ret; | ||
122 | |||
123 | /* any matching mon ip implies a match */ | ||
124 | for (i = 0; i < opt1->num_mon; i++) { | ||
125 | if (ceph_monmap_contains(client->monc.monmap, | ||
126 | &opt1->mon_addr[i])) | ||
127 | return 0; | ||
128 | } | ||
129 | return -1; | ||
130 | } | ||
131 | EXPORT_SYMBOL(ceph_compare_options); | ||
132 | |||
133 | |||
134 | static int parse_fsid(const char *str, struct ceph_fsid *fsid) | ||
135 | { | ||
136 | int i = 0; | ||
137 | char tmp[3]; | ||
138 | int err = -EINVAL; | ||
139 | int d; | ||
140 | |||
141 | dout("parse_fsid '%s'\n", str); | ||
142 | tmp[2] = 0; | ||
143 | while (*str && i < 16) { | ||
144 | if (ispunct(*str)) { | ||
145 | str++; | ||
146 | continue; | ||
147 | } | ||
148 | if (!isxdigit(str[0]) || !isxdigit(str[1])) | ||
149 | break; | ||
150 | tmp[0] = str[0]; | ||
151 | tmp[1] = str[1]; | ||
152 | if (sscanf(tmp, "%x", &d) < 1) | ||
153 | break; | ||
154 | fsid->fsid[i] = d & 0xff; | ||
155 | i++; | ||
156 | str += 2; | ||
157 | } | ||
158 | |||
159 | if (i == 16) | ||
160 | err = 0; | ||
161 | dout("parse_fsid ret %d got fsid %pU", err, fsid); | ||
162 | return err; | ||
163 | } | ||
164 | |||
165 | /* | ||
166 | * ceph options | ||
167 | */ | ||
168 | enum { | ||
169 | Opt_osdtimeout, | ||
170 | Opt_osdkeepalivetimeout, | ||
171 | Opt_mount_timeout, | ||
172 | Opt_osd_idle_ttl, | ||
173 | Opt_last_int, | ||
174 | /* int args above */ | ||
175 | Opt_fsid, | ||
176 | Opt_name, | ||
177 | Opt_secret, | ||
178 | Opt_ip, | ||
179 | Opt_last_string, | ||
180 | /* string args above */ | ||
181 | Opt_noshare, | ||
182 | Opt_nocrc, | ||
183 | }; | ||
184 | |||
185 | static match_table_t opt_tokens = { | ||
186 | {Opt_osdtimeout, "osdtimeout=%d"}, | ||
187 | {Opt_osdkeepalivetimeout, "osdkeepalive=%d"}, | ||
188 | {Opt_mount_timeout, "mount_timeout=%d"}, | ||
189 | {Opt_osd_idle_ttl, "osd_idle_ttl=%d"}, | ||
190 | /* int args above */ | ||
191 | {Opt_fsid, "fsid=%s"}, | ||
192 | {Opt_name, "name=%s"}, | ||
193 | {Opt_secret, "secret=%s"}, | ||
194 | {Opt_ip, "ip=%s"}, | ||
195 | /* string args above */ | ||
196 | {Opt_noshare, "noshare"}, | ||
197 | {Opt_nocrc, "nocrc"}, | ||
198 | {-1, NULL} | ||
199 | }; | ||
200 | |||
201 | void ceph_destroy_options(struct ceph_options *opt) | ||
202 | { | ||
203 | dout("destroy_options %p\n", opt); | ||
204 | kfree(opt->name); | ||
205 | kfree(opt->secret); | ||
206 | kfree(opt); | ||
207 | } | ||
208 | EXPORT_SYMBOL(ceph_destroy_options); | ||
209 | |||
210 | int ceph_parse_options(struct ceph_options **popt, char *options, | ||
211 | const char *dev_name, const char *dev_name_end, | ||
212 | int (*parse_extra_token)(char *c, void *private), | ||
213 | void *private) | ||
214 | { | ||
215 | struct ceph_options *opt; | ||
216 | const char *c; | ||
217 | int err = -ENOMEM; | ||
218 | substring_t argstr[MAX_OPT_ARGS]; | ||
219 | |||
220 | opt = kzalloc(sizeof(*opt), GFP_KERNEL); | ||
221 | if (!opt) | ||
222 | return err; | ||
223 | opt->mon_addr = kcalloc(CEPH_MAX_MON, sizeof(*opt->mon_addr), | ||
224 | GFP_KERNEL); | ||
225 | if (!opt->mon_addr) | ||
226 | goto out; | ||
227 | |||
228 | dout("parse_options %p options '%s' dev_name '%s'\n", opt, options, | ||
229 | dev_name); | ||
230 | |||
231 | /* start with defaults */ | ||
232 | opt->flags = CEPH_OPT_DEFAULT; | ||
233 | opt->osd_timeout = CEPH_OSD_TIMEOUT_DEFAULT; | ||
234 | opt->osd_keepalive_timeout = CEPH_OSD_KEEPALIVE_DEFAULT; | ||
235 | opt->mount_timeout = CEPH_MOUNT_TIMEOUT_DEFAULT; /* seconds */ | ||
236 | opt->osd_idle_ttl = CEPH_OSD_IDLE_TTL_DEFAULT; /* seconds */ | ||
237 | |||
238 | /* get mon ip(s) */ | ||
239 | /* ip1[:port1][,ip2[:port2]...] */ | ||
240 | err = ceph_parse_ips(dev_name, dev_name_end, opt->mon_addr, | ||
241 | CEPH_MAX_MON, &opt->num_mon); | ||
242 | if (err < 0) | ||
243 | goto out; | ||
244 | |||
245 | /* parse mount options */ | ||
246 | while ((c = strsep(&options, ",")) != NULL) { | ||
247 | int token, intval, ret; | ||
248 | if (!*c) | ||
249 | continue; | ||
250 | err = -EINVAL; | ||
251 | token = match_token((char *)c, opt_tokens, argstr); | ||
252 | if (token < 0) { | ||
253 | /* extra? */ | ||
254 | err = parse_extra_token((char *)c, private); | ||
255 | if (err < 0) { | ||
256 | pr_err("bad option at '%s'\n", c); | ||
257 | goto out; | ||
258 | } | ||
259 | continue; | ||
260 | } | ||
261 | if (token < Opt_last_int) { | ||
262 | ret = match_int(&argstr[0], &intval); | ||
263 | if (ret < 0) { | ||
264 | pr_err("bad mount option arg (not int) " | ||
265 | "at '%s'\n", c); | ||
266 | continue; | ||
267 | } | ||
268 | dout("got int token %d val %d\n", token, intval); | ||
269 | } else if (token > Opt_last_int && token < Opt_last_string) { | ||
270 | dout("got string token %d val %s\n", token, | ||
271 | argstr[0].from); | ||
272 | } else { | ||
273 | dout("got token %d\n", token); | ||
274 | } | ||
275 | switch (token) { | ||
276 | case Opt_ip: | ||
277 | err = ceph_parse_ips(argstr[0].from, | ||
278 | argstr[0].to, | ||
279 | &opt->my_addr, | ||
280 | 1, NULL); | ||
281 | if (err < 0) | ||
282 | goto out; | ||
283 | opt->flags |= CEPH_OPT_MYIP; | ||
284 | break; | ||
285 | |||
286 | case Opt_fsid: | ||
287 | err = parse_fsid(argstr[0].from, &opt->fsid); | ||
288 | if (err == 0) | ||
289 | opt->flags |= CEPH_OPT_FSID; | ||
290 | break; | ||
291 | case Opt_name: | ||
292 | opt->name = kstrndup(argstr[0].from, | ||
293 | argstr[0].to-argstr[0].from, | ||
294 | GFP_KERNEL); | ||
295 | break; | ||
296 | case Opt_secret: | ||
297 | opt->secret = kstrndup(argstr[0].from, | ||
298 | argstr[0].to-argstr[0].from, | ||
299 | GFP_KERNEL); | ||
300 | break; | ||
301 | |||
302 | /* misc */ | ||
303 | case Opt_osdtimeout: | ||
304 | opt->osd_timeout = intval; | ||
305 | break; | ||
306 | case Opt_osdkeepalivetimeout: | ||
307 | opt->osd_keepalive_timeout = intval; | ||
308 | break; | ||
309 | case Opt_osd_idle_ttl: | ||
310 | opt->osd_idle_ttl = intval; | ||
311 | break; | ||
312 | case Opt_mount_timeout: | ||
313 | opt->mount_timeout = intval; | ||
314 | break; | ||
315 | |||
316 | case Opt_noshare: | ||
317 | opt->flags |= CEPH_OPT_NOSHARE; | ||
318 | break; | ||
319 | |||
320 | case Opt_nocrc: | ||
321 | opt->flags |= CEPH_OPT_NOCRC; | ||
322 | break; | ||
323 | |||
324 | default: | ||
325 | BUG_ON(token); | ||
326 | } | ||
327 | } | ||
328 | |||
329 | /* success */ | ||
330 | *popt = opt; | ||
331 | return 0; | ||
332 | |||
333 | out: | ||
334 | ceph_destroy_options(opt); | ||
335 | return err; | ||
336 | } | ||
337 | EXPORT_SYMBOL(ceph_parse_options); | ||
338 | |||
339 | u64 ceph_client_id(struct ceph_client *client) | ||
340 | { | ||
341 | return client->monc.auth->global_id; | ||
342 | } | ||
343 | EXPORT_SYMBOL(ceph_client_id); | ||
344 | |||
345 | /* | ||
346 | * create a fresh client instance | ||
347 | */ | ||
348 | struct ceph_client *ceph_create_client(struct ceph_options *opt, void *private) | ||
349 | { | ||
350 | struct ceph_client *client; | ||
351 | int err = -ENOMEM; | ||
352 | |||
353 | client = kzalloc(sizeof(*client), GFP_KERNEL); | ||
354 | if (client == NULL) | ||
355 | return ERR_PTR(-ENOMEM); | ||
356 | |||
357 | client->private = private; | ||
358 | client->options = opt; | ||
359 | |||
360 | mutex_init(&client->mount_mutex); | ||
361 | init_waitqueue_head(&client->auth_wq); | ||
362 | client->auth_err = 0; | ||
363 | |||
364 | client->extra_mon_dispatch = NULL; | ||
365 | client->supported_features = CEPH_FEATURE_SUPPORTED_DEFAULT; | ||
366 | client->required_features = CEPH_FEATURE_REQUIRED_DEFAULT; | ||
367 | |||
368 | client->msgr = NULL; | ||
369 | |||
370 | /* subsystems */ | ||
371 | err = ceph_monc_init(&client->monc, client); | ||
372 | if (err < 0) | ||
373 | goto fail; | ||
374 | err = ceph_osdc_init(&client->osdc, client); | ||
375 | if (err < 0) | ||
376 | goto fail_monc; | ||
377 | |||
378 | return client; | ||
379 | |||
380 | fail_monc: | ||
381 | ceph_monc_stop(&client->monc); | ||
382 | fail: | ||
383 | kfree(client); | ||
384 | return ERR_PTR(err); | ||
385 | } | ||
386 | EXPORT_SYMBOL(ceph_create_client); | ||
387 | |||
388 | void ceph_destroy_client(struct ceph_client *client) | ||
389 | { | ||
390 | dout("destroy_client %p\n", client); | ||
391 | |||
392 | /* unmount */ | ||
393 | ceph_osdc_stop(&client->osdc); | ||
394 | |||
395 | /* | ||
396 | * make sure mds and osd connections close out before destroying | ||
397 | * the auth module, which is needed to free those connections' | ||
398 | * ceph_authorizers. | ||
399 | */ | ||
400 | ceph_msgr_flush(); | ||
401 | |||
402 | ceph_monc_stop(&client->monc); | ||
403 | |||
404 | ceph_debugfs_client_cleanup(client); | ||
405 | |||
406 | if (client->msgr) | ||
407 | ceph_messenger_destroy(client->msgr); | ||
408 | |||
409 | ceph_destroy_options(client->options); | ||
410 | |||
411 | kfree(client); | ||
412 | dout("destroy_client %p done\n", client); | ||
413 | } | ||
414 | EXPORT_SYMBOL(ceph_destroy_client); | ||
415 | |||
416 | /* | ||
417 | * true if we have the mon map (and have thus joined the cluster) | ||
418 | */ | ||
419 | static int have_mon_and_osd_map(struct ceph_client *client) | ||
420 | { | ||
421 | return client->monc.monmap && client->monc.monmap->epoch && | ||
422 | client->osdc.osdmap && client->osdc.osdmap->epoch; | ||
423 | } | ||
424 | |||
425 | /* | ||
426 | * mount: join the ceph cluster, and open root directory. | ||
427 | */ | ||
428 | int __ceph_open_session(struct ceph_client *client, unsigned long started) | ||
429 | { | ||
430 | struct ceph_entity_addr *myaddr = NULL; | ||
431 | int err; | ||
432 | unsigned long timeout = client->options->mount_timeout * HZ; | ||
433 | |||
434 | /* initialize the messenger */ | ||
435 | if (client->msgr == NULL) { | ||
436 | if (ceph_test_opt(client, MYIP)) | ||
437 | myaddr = &client->options->my_addr; | ||
438 | client->msgr = ceph_messenger_create(myaddr, | ||
439 | client->supported_features, | ||
440 | client->required_features); | ||
441 | if (IS_ERR(client->msgr)) { | ||
442 | client->msgr = NULL; | ||
443 | return PTR_ERR(client->msgr); | ||
444 | } | ||
445 | client->msgr->nocrc = ceph_test_opt(client, NOCRC); | ||
446 | } | ||
447 | |||
448 | /* open session, and wait for mon and osd maps */ | ||
449 | err = ceph_monc_open_session(&client->monc); | ||
450 | if (err < 0) | ||
451 | return err; | ||
452 | |||
453 | while (!have_mon_and_osd_map(client)) { | ||
454 | err = -EIO; | ||
455 | if (timeout && time_after_eq(jiffies, started + timeout)) | ||
456 | return err; | ||
457 | |||
458 | /* wait */ | ||
459 | dout("mount waiting for mon_map\n"); | ||
460 | err = wait_event_interruptible_timeout(client->auth_wq, | ||
461 | have_mon_and_osd_map(client) || (client->auth_err < 0), | ||
462 | timeout); | ||
463 | if (err == -EINTR || err == -ERESTARTSYS) | ||
464 | return err; | ||
465 | if (client->auth_err < 0) | ||
466 | return client->auth_err; | ||
467 | } | ||
468 | |||
469 | return 0; | ||
470 | } | ||
471 | EXPORT_SYMBOL(__ceph_open_session); | ||
472 | |||
473 | |||
474 | int ceph_open_session(struct ceph_client *client) | ||
475 | { | ||
476 | int ret; | ||
477 | unsigned long started = jiffies; /* note the start time */ | ||
478 | |||
479 | dout("open_session start\n"); | ||
480 | mutex_lock(&client->mount_mutex); | ||
481 | |||
482 | ret = __ceph_open_session(client, started); | ||
483 | |||
484 | mutex_unlock(&client->mount_mutex); | ||
485 | return ret; | ||
486 | } | ||
487 | EXPORT_SYMBOL(ceph_open_session); | ||
488 | |||
489 | |||
490 | static int __init init_ceph_lib(void) | ||
491 | { | ||
492 | int ret = 0; | ||
493 | |||
494 | ret = ceph_debugfs_init(); | ||
495 | if (ret < 0) | ||
496 | goto out; | ||
497 | |||
498 | ret = ceph_msgr_init(); | ||
499 | if (ret < 0) | ||
500 | goto out_debugfs; | ||
501 | |||
502 | pr_info("loaded (mon/osd proto %d/%d, osdmap %d/%d %d/%d)\n", | ||
503 | CEPH_MONC_PROTOCOL, CEPH_OSDC_PROTOCOL, | ||
504 | CEPH_OSDMAP_VERSION, CEPH_OSDMAP_VERSION_EXT, | ||
505 | CEPH_OSDMAP_INC_VERSION, CEPH_OSDMAP_INC_VERSION_EXT); | ||
506 | |||
507 | return 0; | ||
508 | |||
509 | out_debugfs: | ||
510 | ceph_debugfs_cleanup(); | ||
511 | out: | ||
512 | return ret; | ||
513 | } | ||
514 | |||
515 | static void __exit exit_ceph_lib(void) | ||
516 | { | ||
517 | dout("exit_ceph_lib\n"); | ||
518 | ceph_msgr_exit(); | ||
519 | ceph_debugfs_cleanup(); | ||
520 | } | ||
521 | |||
522 | module_init(init_ceph_lib); | ||
523 | module_exit(exit_ceph_lib); | ||
524 | |||
525 | MODULE_AUTHOR("Sage Weil <sage@newdream.net>"); | ||
526 | MODULE_AUTHOR("Yehuda Sadeh <yehuda@hq.newdream.net>"); | ||
527 | MODULE_AUTHOR("Patience Warnick <patience@newdream.net>"); | ||
528 | MODULE_DESCRIPTION("Ceph filesystem for Linux"); | ||
529 | MODULE_LICENSE("GPL"); | ||
diff --git a/fs/ceph/ceph_fs.c b/net/ceph/ceph_fs.c index 3ac6cc7c1156..a3a3a31d3c37 100644 --- a/fs/ceph/ceph_fs.c +++ b/net/ceph/ceph_fs.c | |||
@@ -1,7 +1,8 @@ | |||
1 | /* | 1 | /* |
2 | * Some non-inline ceph helpers | 2 | * Some non-inline ceph helpers |
3 | */ | 3 | */ |
4 | #include "types.h" | 4 | #include <linux/module.h> |
5 | #include <linux/ceph/types.h> | ||
5 | 6 | ||
6 | /* | 7 | /* |
7 | * return true if @layout appears to be valid | 8 | * return true if @layout appears to be valid |
@@ -52,6 +53,7 @@ int ceph_flags_to_mode(int flags) | |||
52 | 53 | ||
53 | return mode; | 54 | return mode; |
54 | } | 55 | } |
56 | EXPORT_SYMBOL(ceph_flags_to_mode); | ||
55 | 57 | ||
56 | int ceph_caps_for_mode(int mode) | 58 | int ceph_caps_for_mode(int mode) |
57 | { | 59 | { |
@@ -70,3 +72,4 @@ int ceph_caps_for_mode(int mode) | |||
70 | 72 | ||
71 | return caps; | 73 | return caps; |
72 | } | 74 | } |
75 | EXPORT_SYMBOL(ceph_caps_for_mode); | ||
diff --git a/fs/ceph/ceph_hash.c b/net/ceph/ceph_hash.c index bd570015d147..815ef8826796 100644 --- a/fs/ceph/ceph_hash.c +++ b/net/ceph/ceph_hash.c | |||
@@ -1,5 +1,5 @@ | |||
1 | 1 | ||
2 | #include "types.h" | 2 | #include <linux/ceph/types.h> |
3 | 3 | ||
4 | /* | 4 | /* |
5 | * Robert Jenkin's hash function. | 5 | * Robert Jenkin's hash function. |
diff --git a/net/ceph/ceph_strings.c b/net/ceph/ceph_strings.c new file mode 100644 index 000000000000..3fbda04de29c --- /dev/null +++ b/net/ceph/ceph_strings.c | |||
@@ -0,0 +1,84 @@ | |||
1 | /* | ||
2 | * Ceph string constants | ||
3 | */ | ||
4 | #include <linux/module.h> | ||
5 | #include <linux/ceph/types.h> | ||
6 | |||
7 | const char *ceph_entity_type_name(int type) | ||
8 | { | ||
9 | switch (type) { | ||
10 | case CEPH_ENTITY_TYPE_MDS: return "mds"; | ||
11 | case CEPH_ENTITY_TYPE_OSD: return "osd"; | ||
12 | case CEPH_ENTITY_TYPE_MON: return "mon"; | ||
13 | case CEPH_ENTITY_TYPE_CLIENT: return "client"; | ||
14 | case CEPH_ENTITY_TYPE_AUTH: return "auth"; | ||
15 | default: return "unknown"; | ||
16 | } | ||
17 | } | ||
18 | |||
19 | const char *ceph_osd_op_name(int op) | ||
20 | { | ||
21 | switch (op) { | ||
22 | case CEPH_OSD_OP_READ: return "read"; | ||
23 | case CEPH_OSD_OP_STAT: return "stat"; | ||
24 | |||
25 | case CEPH_OSD_OP_MASKTRUNC: return "masktrunc"; | ||
26 | |||
27 | case CEPH_OSD_OP_WRITE: return "write"; | ||
28 | case CEPH_OSD_OP_DELETE: return "delete"; | ||
29 | case CEPH_OSD_OP_TRUNCATE: return "truncate"; | ||
30 | case CEPH_OSD_OP_ZERO: return "zero"; | ||
31 | case CEPH_OSD_OP_WRITEFULL: return "writefull"; | ||
32 | case CEPH_OSD_OP_ROLLBACK: return "rollback"; | ||
33 | |||
34 | case CEPH_OSD_OP_APPEND: return "append"; | ||
35 | case CEPH_OSD_OP_STARTSYNC: return "startsync"; | ||
36 | case CEPH_OSD_OP_SETTRUNC: return "settrunc"; | ||
37 | case CEPH_OSD_OP_TRIMTRUNC: return "trimtrunc"; | ||
38 | |||
39 | case CEPH_OSD_OP_TMAPUP: return "tmapup"; | ||
40 | case CEPH_OSD_OP_TMAPGET: return "tmapget"; | ||
41 | case CEPH_OSD_OP_TMAPPUT: return "tmapput"; | ||
42 | |||
43 | case CEPH_OSD_OP_GETXATTR: return "getxattr"; | ||
44 | case CEPH_OSD_OP_GETXATTRS: return "getxattrs"; | ||
45 | case CEPH_OSD_OP_SETXATTR: return "setxattr"; | ||
46 | case CEPH_OSD_OP_SETXATTRS: return "setxattrs"; | ||
47 | case CEPH_OSD_OP_RESETXATTRS: return "resetxattrs"; | ||
48 | case CEPH_OSD_OP_RMXATTR: return "rmxattr"; | ||
49 | case CEPH_OSD_OP_CMPXATTR: return "cmpxattr"; | ||
50 | |||
51 | case CEPH_OSD_OP_PULL: return "pull"; | ||
52 | case CEPH_OSD_OP_PUSH: return "push"; | ||
53 | case CEPH_OSD_OP_BALANCEREADS: return "balance-reads"; | ||
54 | case CEPH_OSD_OP_UNBALANCEREADS: return "unbalance-reads"; | ||
55 | case CEPH_OSD_OP_SCRUB: return "scrub"; | ||
56 | |||
57 | case CEPH_OSD_OP_WRLOCK: return "wrlock"; | ||
58 | case CEPH_OSD_OP_WRUNLOCK: return "wrunlock"; | ||
59 | case CEPH_OSD_OP_RDLOCK: return "rdlock"; | ||
60 | case CEPH_OSD_OP_RDUNLOCK: return "rdunlock"; | ||
61 | case CEPH_OSD_OP_UPLOCK: return "uplock"; | ||
62 | case CEPH_OSD_OP_DNLOCK: return "dnlock"; | ||
63 | |||
64 | case CEPH_OSD_OP_CALL: return "call"; | ||
65 | |||
66 | case CEPH_OSD_OP_PGLS: return "pgls"; | ||
67 | } | ||
68 | return "???"; | ||
69 | } | ||
70 | |||
71 | |||
72 | const char *ceph_pool_op_name(int op) | ||
73 | { | ||
74 | switch (op) { | ||
75 | case POOL_OP_CREATE: return "create"; | ||
76 | case POOL_OP_DELETE: return "delete"; | ||
77 | case POOL_OP_AUID_CHANGE: return "auid change"; | ||
78 | case POOL_OP_CREATE_SNAP: return "create snap"; | ||
79 | case POOL_OP_DELETE_SNAP: return "delete snap"; | ||
80 | case POOL_OP_CREATE_UNMANAGED_SNAP: return "create unmanaged snap"; | ||
81 | case POOL_OP_DELETE_UNMANAGED_SNAP: return "delete unmanaged snap"; | ||
82 | } | ||
83 | return "???"; | ||
84 | } | ||
diff --git a/fs/ceph/crush/crush.c b/net/ceph/crush/crush.c index fabd302e5779..d6ebb13a18a4 100644 --- a/fs/ceph/crush/crush.c +++ b/net/ceph/crush/crush.c | |||
@@ -8,7 +8,7 @@ | |||
8 | # define BUG_ON(x) assert(!(x)) | 8 | # define BUG_ON(x) assert(!(x)) |
9 | #endif | 9 | #endif |
10 | 10 | ||
11 | #include "crush.h" | 11 | #include <linux/crush/crush.h> |
12 | 12 | ||
13 | const char *crush_bucket_alg_name(int alg) | 13 | const char *crush_bucket_alg_name(int alg) |
14 | { | 14 | { |
diff --git a/fs/ceph/crush/hash.c b/net/ceph/crush/hash.c index 5873aed694bf..5bb63e37a8a1 100644 --- a/fs/ceph/crush/hash.c +++ b/net/ceph/crush/hash.c | |||
@@ -1,6 +1,6 @@ | |||
1 | 1 | ||
2 | #include <linux/types.h> | 2 | #include <linux/types.h> |
3 | #include "hash.h" | 3 | #include <linux/crush/hash.h> |
4 | 4 | ||
5 | /* | 5 | /* |
6 | * Robert Jenkins' function for mixing 32-bit values | 6 | * Robert Jenkins' function for mixing 32-bit values |
diff --git a/fs/ceph/crush/mapper.c b/net/ceph/crush/mapper.c index a4eec133258e..42599e31dcad 100644 --- a/fs/ceph/crush/mapper.c +++ b/net/ceph/crush/mapper.c | |||
@@ -18,8 +18,8 @@ | |||
18 | # define kfree(x) free(x) | 18 | # define kfree(x) free(x) |
19 | #endif | 19 | #endif |
20 | 20 | ||
21 | #include "crush.h" | 21 | #include <linux/crush/crush.h> |
22 | #include "hash.h" | 22 | #include <linux/crush/hash.h> |
23 | 23 | ||
24 | /* | 24 | /* |
25 | * Implement the core CRUSH mapping algorithm. | 25 | * Implement the core CRUSH mapping algorithm. |
diff --git a/fs/ceph/crypto.c b/net/ceph/crypto.c index a3e627f63293..7b505b0c983f 100644 --- a/fs/ceph/crypto.c +++ b/net/ceph/crypto.c | |||
@@ -1,13 +1,13 @@ | |||
1 | 1 | ||
2 | #include "ceph_debug.h" | 2 | #include <linux/ceph/ceph_debug.h> |
3 | 3 | ||
4 | #include <linux/err.h> | 4 | #include <linux/err.h> |
5 | #include <linux/scatterlist.h> | 5 | #include <linux/scatterlist.h> |
6 | #include <linux/slab.h> | 6 | #include <linux/slab.h> |
7 | #include <crypto/hash.h> | 7 | #include <crypto/hash.h> |
8 | 8 | ||
9 | #include <linux/ceph/decode.h> | ||
9 | #include "crypto.h" | 10 | #include "crypto.h" |
10 | #include "decode.h" | ||
11 | 11 | ||
12 | int ceph_crypto_key_encode(struct ceph_crypto_key *key, void **p, void *end) | 12 | int ceph_crypto_key_encode(struct ceph_crypto_key *key, void **p, void *end) |
13 | { | 13 | { |
diff --git a/fs/ceph/crypto.h b/net/ceph/crypto.h index bdf38607323c..f9eccace592b 100644 --- a/fs/ceph/crypto.h +++ b/net/ceph/crypto.h | |||
@@ -1,8 +1,8 @@ | |||
1 | #ifndef _FS_CEPH_CRYPTO_H | 1 | #ifndef _FS_CEPH_CRYPTO_H |
2 | #define _FS_CEPH_CRYPTO_H | 2 | #define _FS_CEPH_CRYPTO_H |
3 | 3 | ||
4 | #include "types.h" | 4 | #include <linux/ceph/types.h> |
5 | #include "buffer.h" | 5 | #include <linux/ceph/buffer.h> |
6 | 6 | ||
7 | /* | 7 | /* |
8 | * cryptographic secret | 8 | * cryptographic secret |
diff --git a/net/ceph/debugfs.c b/net/ceph/debugfs.c new file mode 100644 index 000000000000..33d04999f4f2 --- /dev/null +++ b/net/ceph/debugfs.c | |||
@@ -0,0 +1,268 @@ | |||
1 | #include <linux/ceph/ceph_debug.h> | ||
2 | |||
3 | #include <linux/device.h> | ||
4 | #include <linux/slab.h> | ||
5 | #include <linux/module.h> | ||
6 | #include <linux/ctype.h> | ||
7 | #include <linux/debugfs.h> | ||
8 | #include <linux/seq_file.h> | ||
9 | |||
10 | #include <linux/ceph/libceph.h> | ||
11 | #include <linux/ceph/mon_client.h> | ||
12 | #include <linux/ceph/auth.h> | ||
13 | #include <linux/ceph/debugfs.h> | ||
14 | |||
15 | #ifdef CONFIG_DEBUG_FS | ||
16 | |||
17 | /* | ||
18 | * Implement /sys/kernel/debug/ceph fun | ||
19 | * | ||
20 | * /sys/kernel/debug/ceph/client* - an instance of the ceph client | ||
21 | * .../osdmap - current osdmap | ||
22 | * .../monmap - current monmap | ||
23 | * .../osdc - active osd requests | ||
24 | * .../monc - mon client state | ||
25 | * .../dentry_lru - dump contents of dentry lru | ||
26 | * .../caps - expose cap (reservation) stats | ||
27 | * .../bdi - symlink to ../../bdi/something | ||
28 | */ | ||
29 | |||
30 | static struct dentry *ceph_debugfs_dir; | ||
31 | |||
32 | static int monmap_show(struct seq_file *s, void *p) | ||
33 | { | ||
34 | int i; | ||
35 | struct ceph_client *client = s->private; | ||
36 | |||
37 | if (client->monc.monmap == NULL) | ||
38 | return 0; | ||
39 | |||
40 | seq_printf(s, "epoch %d\n", client->monc.monmap->epoch); | ||
41 | for (i = 0; i < client->monc.monmap->num_mon; i++) { | ||
42 | struct ceph_entity_inst *inst = | ||
43 | &client->monc.monmap->mon_inst[i]; | ||
44 | |||
45 | seq_printf(s, "\t%s%lld\t%s\n", | ||
46 | ENTITY_NAME(inst->name), | ||
47 | ceph_pr_addr(&inst->addr.in_addr)); | ||
48 | } | ||
49 | return 0; | ||
50 | } | ||
51 | |||
52 | static int osdmap_show(struct seq_file *s, void *p) | ||
53 | { | ||
54 | int i; | ||
55 | struct ceph_client *client = s->private; | ||
56 | struct rb_node *n; | ||
57 | |||
58 | if (client->osdc.osdmap == NULL) | ||
59 | return 0; | ||
60 | seq_printf(s, "epoch %d\n", client->osdc.osdmap->epoch); | ||
61 | seq_printf(s, "flags%s%s\n", | ||
62 | (client->osdc.osdmap->flags & CEPH_OSDMAP_NEARFULL) ? | ||
63 | " NEARFULL" : "", | ||
64 | (client->osdc.osdmap->flags & CEPH_OSDMAP_FULL) ? | ||
65 | " FULL" : ""); | ||
66 | for (n = rb_first(&client->osdc.osdmap->pg_pools); n; n = rb_next(n)) { | ||
67 | struct ceph_pg_pool_info *pool = | ||
68 | rb_entry(n, struct ceph_pg_pool_info, node); | ||
69 | seq_printf(s, "pg_pool %d pg_num %d / %d, lpg_num %d / %d\n", | ||
70 | pool->id, pool->v.pg_num, pool->pg_num_mask, | ||
71 | pool->v.lpg_num, pool->lpg_num_mask); | ||
72 | } | ||
73 | for (i = 0; i < client->osdc.osdmap->max_osd; i++) { | ||
74 | struct ceph_entity_addr *addr = | ||
75 | &client->osdc.osdmap->osd_addr[i]; | ||
76 | int state = client->osdc.osdmap->osd_state[i]; | ||
77 | char sb[64]; | ||
78 | |||
79 | seq_printf(s, "\tosd%d\t%s\t%3d%%\t(%s)\n", | ||
80 | i, ceph_pr_addr(&addr->in_addr), | ||
81 | ((client->osdc.osdmap->osd_weight[i]*100) >> 16), | ||
82 | ceph_osdmap_state_str(sb, sizeof(sb), state)); | ||
83 | } | ||
84 | return 0; | ||
85 | } | ||
86 | |||
87 | static int monc_show(struct seq_file *s, void *p) | ||
88 | { | ||
89 | struct ceph_client *client = s->private; | ||
90 | struct ceph_mon_generic_request *req; | ||
91 | struct ceph_mon_client *monc = &client->monc; | ||
92 | struct rb_node *rp; | ||
93 | |||
94 | mutex_lock(&monc->mutex); | ||
95 | |||
96 | if (monc->have_mdsmap) | ||
97 | seq_printf(s, "have mdsmap %u\n", (unsigned)monc->have_mdsmap); | ||
98 | if (monc->have_osdmap) | ||
99 | seq_printf(s, "have osdmap %u\n", (unsigned)monc->have_osdmap); | ||
100 | if (monc->want_next_osdmap) | ||
101 | seq_printf(s, "want next osdmap\n"); | ||
102 | |||
103 | for (rp = rb_first(&monc->generic_request_tree); rp; rp = rb_next(rp)) { | ||
104 | __u16 op; | ||
105 | req = rb_entry(rp, struct ceph_mon_generic_request, node); | ||
106 | op = le16_to_cpu(req->request->hdr.type); | ||
107 | if (op == CEPH_MSG_STATFS) | ||
108 | seq_printf(s, "%lld statfs\n", req->tid); | ||
109 | else | ||
110 | seq_printf(s, "%lld unknown\n", req->tid); | ||
111 | } | ||
112 | |||
113 | mutex_unlock(&monc->mutex); | ||
114 | return 0; | ||
115 | } | ||
116 | |||
117 | static int osdc_show(struct seq_file *s, void *pp) | ||
118 | { | ||
119 | struct ceph_client *client = s->private; | ||
120 | struct ceph_osd_client *osdc = &client->osdc; | ||
121 | struct rb_node *p; | ||
122 | |||
123 | mutex_lock(&osdc->request_mutex); | ||
124 | for (p = rb_first(&osdc->requests); p; p = rb_next(p)) { | ||
125 | struct ceph_osd_request *req; | ||
126 | struct ceph_osd_request_head *head; | ||
127 | struct ceph_osd_op *op; | ||
128 | int num_ops; | ||
129 | int opcode, olen; | ||
130 | int i; | ||
131 | |||
132 | req = rb_entry(p, struct ceph_osd_request, r_node); | ||
133 | |||
134 | seq_printf(s, "%lld\tosd%d\t%d.%x\t", req->r_tid, | ||
135 | req->r_osd ? req->r_osd->o_osd : -1, | ||
136 | le32_to_cpu(req->r_pgid.pool), | ||
137 | le16_to_cpu(req->r_pgid.ps)); | ||
138 | |||
139 | head = req->r_request->front.iov_base; | ||
140 | op = (void *)(head + 1); | ||
141 | |||
142 | num_ops = le16_to_cpu(head->num_ops); | ||
143 | olen = le32_to_cpu(head->object_len); | ||
144 | seq_printf(s, "%.*s", olen, | ||
145 | (const char *)(head->ops + num_ops)); | ||
146 | |||
147 | if (req->r_reassert_version.epoch) | ||
148 | seq_printf(s, "\t%u'%llu", | ||
149 | (unsigned)le32_to_cpu(req->r_reassert_version.epoch), | ||
150 | le64_to_cpu(req->r_reassert_version.version)); | ||
151 | else | ||
152 | seq_printf(s, "\t"); | ||
153 | |||
154 | for (i = 0; i < num_ops; i++) { | ||
155 | opcode = le16_to_cpu(op->op); | ||
156 | seq_printf(s, "\t%s", ceph_osd_op_name(opcode)); | ||
157 | op++; | ||
158 | } | ||
159 | |||
160 | seq_printf(s, "\n"); | ||
161 | } | ||
162 | mutex_unlock(&osdc->request_mutex); | ||
163 | return 0; | ||
164 | } | ||
165 | |||
166 | CEPH_DEFINE_SHOW_FUNC(monmap_show) | ||
167 | CEPH_DEFINE_SHOW_FUNC(osdmap_show) | ||
168 | CEPH_DEFINE_SHOW_FUNC(monc_show) | ||
169 | CEPH_DEFINE_SHOW_FUNC(osdc_show) | ||
170 | |||
171 | int ceph_debugfs_init(void) | ||
172 | { | ||
173 | ceph_debugfs_dir = debugfs_create_dir("ceph", NULL); | ||
174 | if (!ceph_debugfs_dir) | ||
175 | return -ENOMEM; | ||
176 | return 0; | ||
177 | } | ||
178 | |||
179 | void ceph_debugfs_cleanup(void) | ||
180 | { | ||
181 | debugfs_remove(ceph_debugfs_dir); | ||
182 | } | ||
183 | |||
184 | int ceph_debugfs_client_init(struct ceph_client *client) | ||
185 | { | ||
186 | int ret = -ENOMEM; | ||
187 | char name[80]; | ||
188 | |||
189 | snprintf(name, sizeof(name), "%pU.client%lld", &client->fsid, | ||
190 | client->monc.auth->global_id); | ||
191 | |||
192 | client->debugfs_dir = debugfs_create_dir(name, ceph_debugfs_dir); | ||
193 | if (!client->debugfs_dir) | ||
194 | goto out; | ||
195 | |||
196 | client->monc.debugfs_file = debugfs_create_file("monc", | ||
197 | 0600, | ||
198 | client->debugfs_dir, | ||
199 | client, | ||
200 | &monc_show_fops); | ||
201 | if (!client->monc.debugfs_file) | ||
202 | goto out; | ||
203 | |||
204 | client->osdc.debugfs_file = debugfs_create_file("osdc", | ||
205 | 0600, | ||
206 | client->debugfs_dir, | ||
207 | client, | ||
208 | &osdc_show_fops); | ||
209 | if (!client->osdc.debugfs_file) | ||
210 | goto out; | ||
211 | |||
212 | client->debugfs_monmap = debugfs_create_file("monmap", | ||
213 | 0600, | ||
214 | client->debugfs_dir, | ||
215 | client, | ||
216 | &monmap_show_fops); | ||
217 | if (!client->debugfs_monmap) | ||
218 | goto out; | ||
219 | |||
220 | client->debugfs_osdmap = debugfs_create_file("osdmap", | ||
221 | 0600, | ||
222 | client->debugfs_dir, | ||
223 | client, | ||
224 | &osdmap_show_fops); | ||
225 | if (!client->debugfs_osdmap) | ||
226 | goto out; | ||
227 | |||
228 | return 0; | ||
229 | |||
230 | out: | ||
231 | ceph_debugfs_client_cleanup(client); | ||
232 | return ret; | ||
233 | } | ||
234 | |||
235 | void ceph_debugfs_client_cleanup(struct ceph_client *client) | ||
236 | { | ||
237 | debugfs_remove(client->debugfs_osdmap); | ||
238 | debugfs_remove(client->debugfs_monmap); | ||
239 | debugfs_remove(client->osdc.debugfs_file); | ||
240 | debugfs_remove(client->monc.debugfs_file); | ||
241 | debugfs_remove(client->debugfs_dir); | ||
242 | } | ||
243 | |||
244 | #else /* CONFIG_DEBUG_FS */ | ||
245 | |||
246 | int ceph_debugfs_init(void) | ||
247 | { | ||
248 | return 0; | ||
249 | } | ||
250 | |||
251 | void ceph_debugfs_cleanup(void) | ||
252 | { | ||
253 | } | ||
254 | |||
255 | int ceph_debugfs_client_init(struct ceph_client *client, | ||
256 | int (*module_debugfs_init)(struct ceph_client *)) | ||
257 | { | ||
258 | return 0; | ||
259 | } | ||
260 | |||
261 | void ceph_debugfs_client_cleanup(struct ceph_client *client) | ||
262 | { | ||
263 | } | ||
264 | |||
265 | #endif /* CONFIG_DEBUG_FS */ | ||
266 | |||
267 | EXPORT_SYMBOL(ceph_debugfs_init); | ||
268 | EXPORT_SYMBOL(ceph_debugfs_cleanup); | ||
diff --git a/fs/ceph/messenger.c b/net/ceph/messenger.c index 17a09b32a591..0e8157ee5d43 100644 --- a/fs/ceph/messenger.c +++ b/net/ceph/messenger.c | |||
@@ -1,4 +1,4 @@ | |||
1 | #include "ceph_debug.h" | 1 | #include <linux/ceph/ceph_debug.h> |
2 | 2 | ||
3 | #include <linux/crc32c.h> | 3 | #include <linux/crc32c.h> |
4 | #include <linux/ctype.h> | 4 | #include <linux/ctype.h> |
@@ -13,10 +13,10 @@ | |||
13 | #include <linux/blkdev.h> | 13 | #include <linux/blkdev.h> |
14 | #include <net/tcp.h> | 14 | #include <net/tcp.h> |
15 | 15 | ||
16 | #include "super.h" | 16 | #include <linux/ceph/libceph.h> |
17 | #include "messenger.h" | 17 | #include <linux/ceph/messenger.h> |
18 | #include "decode.h" | 18 | #include <linux/ceph/decode.h> |
19 | #include "pagelist.h" | 19 | #include <linux/ceph/pagelist.h> |
20 | 20 | ||
21 | /* | 21 | /* |
22 | * Ceph uses the messenger to exchange ceph_msg messages with other | 22 | * Ceph uses the messenger to exchange ceph_msg messages with other |
@@ -50,7 +50,7 @@ static char addr_str[MAX_ADDR_STR][MAX_ADDR_STR_LEN]; | |||
50 | static DEFINE_SPINLOCK(addr_str_lock); | 50 | static DEFINE_SPINLOCK(addr_str_lock); |
51 | static int last_addr_str; | 51 | static int last_addr_str; |
52 | 52 | ||
53 | const char *pr_addr(const struct sockaddr_storage *ss) | 53 | const char *ceph_pr_addr(const struct sockaddr_storage *ss) |
54 | { | 54 | { |
55 | int i; | 55 | int i; |
56 | char *s; | 56 | char *s; |
@@ -81,6 +81,7 @@ const char *pr_addr(const struct sockaddr_storage *ss) | |||
81 | 81 | ||
82 | return s; | 82 | return s; |
83 | } | 83 | } |
84 | EXPORT_SYMBOL(ceph_pr_addr); | ||
84 | 85 | ||
85 | static void encode_my_addr(struct ceph_messenger *msgr) | 86 | static void encode_my_addr(struct ceph_messenger *msgr) |
86 | { | 87 | { |
@@ -93,7 +94,7 @@ static void encode_my_addr(struct ceph_messenger *msgr) | |||
93 | */ | 94 | */ |
94 | struct workqueue_struct *ceph_msgr_wq; | 95 | struct workqueue_struct *ceph_msgr_wq; |
95 | 96 | ||
96 | int __init ceph_msgr_init(void) | 97 | int ceph_msgr_init(void) |
97 | { | 98 | { |
98 | ceph_msgr_wq = create_workqueue("ceph-msgr"); | 99 | ceph_msgr_wq = create_workqueue("ceph-msgr"); |
99 | if (IS_ERR(ceph_msgr_wq)) { | 100 | if (IS_ERR(ceph_msgr_wq)) { |
@@ -104,16 +105,19 @@ int __init ceph_msgr_init(void) | |||
104 | } | 105 | } |
105 | return 0; | 106 | return 0; |
106 | } | 107 | } |
108 | EXPORT_SYMBOL(ceph_msgr_init); | ||
107 | 109 | ||
108 | void ceph_msgr_exit(void) | 110 | void ceph_msgr_exit(void) |
109 | { | 111 | { |
110 | destroy_workqueue(ceph_msgr_wq); | 112 | destroy_workqueue(ceph_msgr_wq); |
111 | } | 113 | } |
114 | EXPORT_SYMBOL(ceph_msgr_exit); | ||
112 | 115 | ||
113 | void ceph_msgr_flush(void) | 116 | void ceph_msgr_flush(void) |
114 | { | 117 | { |
115 | flush_workqueue(ceph_msgr_wq); | 118 | flush_workqueue(ceph_msgr_wq); |
116 | } | 119 | } |
120 | EXPORT_SYMBOL(ceph_msgr_flush); | ||
117 | 121 | ||
118 | 122 | ||
119 | /* | 123 | /* |
@@ -223,19 +227,19 @@ static struct socket *ceph_tcp_connect(struct ceph_connection *con) | |||
223 | 227 | ||
224 | set_sock_callbacks(sock, con); | 228 | set_sock_callbacks(sock, con); |
225 | 229 | ||
226 | dout("connect %s\n", pr_addr(&con->peer_addr.in_addr)); | 230 | dout("connect %s\n", ceph_pr_addr(&con->peer_addr.in_addr)); |
227 | 231 | ||
228 | ret = sock->ops->connect(sock, (struct sockaddr *)paddr, sizeof(*paddr), | 232 | ret = sock->ops->connect(sock, (struct sockaddr *)paddr, sizeof(*paddr), |
229 | O_NONBLOCK); | 233 | O_NONBLOCK); |
230 | if (ret == -EINPROGRESS) { | 234 | if (ret == -EINPROGRESS) { |
231 | dout("connect %s EINPROGRESS sk_state = %u\n", | 235 | dout("connect %s EINPROGRESS sk_state = %u\n", |
232 | pr_addr(&con->peer_addr.in_addr), | 236 | ceph_pr_addr(&con->peer_addr.in_addr), |
233 | sock->sk->sk_state); | 237 | sock->sk->sk_state); |
234 | ret = 0; | 238 | ret = 0; |
235 | } | 239 | } |
236 | if (ret < 0) { | 240 | if (ret < 0) { |
237 | pr_err("connect %s error %d\n", | 241 | pr_err("connect %s error %d\n", |
238 | pr_addr(&con->peer_addr.in_addr), ret); | 242 | ceph_pr_addr(&con->peer_addr.in_addr), ret); |
239 | sock_release(sock); | 243 | sock_release(sock); |
240 | con->sock = NULL; | 244 | con->sock = NULL; |
241 | con->error_msg = "connect error"; | 245 | con->error_msg = "connect error"; |
@@ -336,7 +340,8 @@ static void reset_connection(struct ceph_connection *con) | |||
336 | */ | 340 | */ |
337 | void ceph_con_close(struct ceph_connection *con) | 341 | void ceph_con_close(struct ceph_connection *con) |
338 | { | 342 | { |
339 | dout("con_close %p peer %s\n", con, pr_addr(&con->peer_addr.in_addr)); | 343 | dout("con_close %p peer %s\n", con, |
344 | ceph_pr_addr(&con->peer_addr.in_addr)); | ||
340 | set_bit(CLOSED, &con->state); /* in case there's queued work */ | 345 | set_bit(CLOSED, &con->state); /* in case there's queued work */ |
341 | clear_bit(STANDBY, &con->state); /* avoid connect_seq bump */ | 346 | clear_bit(STANDBY, &con->state); /* avoid connect_seq bump */ |
342 | clear_bit(LOSSYTX, &con->state); /* so we retry next connect */ | 347 | clear_bit(LOSSYTX, &con->state); /* so we retry next connect */ |
@@ -349,19 +354,21 @@ void ceph_con_close(struct ceph_connection *con) | |||
349 | mutex_unlock(&con->mutex); | 354 | mutex_unlock(&con->mutex); |
350 | queue_con(con); | 355 | queue_con(con); |
351 | } | 356 | } |
357 | EXPORT_SYMBOL(ceph_con_close); | ||
352 | 358 | ||
353 | /* | 359 | /* |
354 | * Reopen a closed connection, with a new peer address. | 360 | * Reopen a closed connection, with a new peer address. |
355 | */ | 361 | */ |
356 | void ceph_con_open(struct ceph_connection *con, struct ceph_entity_addr *addr) | 362 | void ceph_con_open(struct ceph_connection *con, struct ceph_entity_addr *addr) |
357 | { | 363 | { |
358 | dout("con_open %p %s\n", con, pr_addr(&addr->in_addr)); | 364 | dout("con_open %p %s\n", con, ceph_pr_addr(&addr->in_addr)); |
359 | set_bit(OPENING, &con->state); | 365 | set_bit(OPENING, &con->state); |
360 | clear_bit(CLOSED, &con->state); | 366 | clear_bit(CLOSED, &con->state); |
361 | memcpy(&con->peer_addr, addr, sizeof(*addr)); | 367 | memcpy(&con->peer_addr, addr, sizeof(*addr)); |
362 | con->delay = 0; /* reset backoff memory */ | 368 | con->delay = 0; /* reset backoff memory */ |
363 | queue_con(con); | 369 | queue_con(con); |
364 | } | 370 | } |
371 | EXPORT_SYMBOL(ceph_con_open); | ||
365 | 372 | ||
366 | /* | 373 | /* |
367 | * return true if this connection ever successfully opened | 374 | * return true if this connection ever successfully opened |
@@ -408,6 +415,7 @@ void ceph_con_init(struct ceph_messenger *msgr, struct ceph_connection *con) | |||
408 | INIT_LIST_HEAD(&con->out_sent); | 415 | INIT_LIST_HEAD(&con->out_sent); |
409 | INIT_DELAYED_WORK(&con->work, con_work); | 416 | INIT_DELAYED_WORK(&con->work, con_work); |
410 | } | 417 | } |
418 | EXPORT_SYMBOL(ceph_con_init); | ||
411 | 419 | ||
412 | 420 | ||
413 | /* | 421 | /* |
@@ -652,7 +660,7 @@ static void prepare_write_connect(struct ceph_messenger *msgr, | |||
652 | dout("prepare_write_connect %p cseq=%d gseq=%d proto=%d\n", con, | 660 | dout("prepare_write_connect %p cseq=%d gseq=%d proto=%d\n", con, |
653 | con->connect_seq, global_seq, proto); | 661 | con->connect_seq, global_seq, proto); |
654 | 662 | ||
655 | con->out_connect.features = cpu_to_le64(CEPH_FEATURE_SUPPORTED); | 663 | con->out_connect.features = cpu_to_le64(msgr->supported_features); |
656 | con->out_connect.host_type = cpu_to_le32(CEPH_ENTITY_TYPE_CLIENT); | 664 | con->out_connect.host_type = cpu_to_le32(CEPH_ENTITY_TYPE_CLIENT); |
657 | con->out_connect.connect_seq = cpu_to_le32(con->connect_seq); | 665 | con->out_connect.connect_seq = cpu_to_le32(con->connect_seq); |
658 | con->out_connect.global_seq = cpu_to_le32(global_seq); | 666 | con->out_connect.global_seq = cpu_to_le32(global_seq); |
@@ -1013,7 +1021,7 @@ static int verify_hello(struct ceph_connection *con) | |||
1013 | { | 1021 | { |
1014 | if (memcmp(con->in_banner, CEPH_BANNER, strlen(CEPH_BANNER))) { | 1022 | if (memcmp(con->in_banner, CEPH_BANNER, strlen(CEPH_BANNER))) { |
1015 | pr_err("connect to %s got bad banner\n", | 1023 | pr_err("connect to %s got bad banner\n", |
1016 | pr_addr(&con->peer_addr.in_addr)); | 1024 | ceph_pr_addr(&con->peer_addr.in_addr)); |
1017 | con->error_msg = "protocol error, bad banner"; | 1025 | con->error_msg = "protocol error, bad banner"; |
1018 | return -1; | 1026 | return -1; |
1019 | } | 1027 | } |
@@ -1116,7 +1124,7 @@ int ceph_parse_ips(const char *c, const char *end, | |||
1116 | 1124 | ||
1117 | addr_set_port(ss, port); | 1125 | addr_set_port(ss, port); |
1118 | 1126 | ||
1119 | dout("parse_ips got %s\n", pr_addr(ss)); | 1127 | dout("parse_ips got %s\n", ceph_pr_addr(ss)); |
1120 | 1128 | ||
1121 | if (p == end) | 1129 | if (p == end) |
1122 | break; | 1130 | break; |
@@ -1136,6 +1144,7 @@ bad: | |||
1136 | pr_err("parse_ips bad ip '%.*s'\n", (int)(end - c), c); | 1144 | pr_err("parse_ips bad ip '%.*s'\n", (int)(end - c), c); |
1137 | return -EINVAL; | 1145 | return -EINVAL; |
1138 | } | 1146 | } |
1147 | EXPORT_SYMBOL(ceph_parse_ips); | ||
1139 | 1148 | ||
1140 | static int process_banner(struct ceph_connection *con) | 1149 | static int process_banner(struct ceph_connection *con) |
1141 | { | 1150 | { |
@@ -1157,9 +1166,9 @@ static int process_banner(struct ceph_connection *con) | |||
1157 | !(addr_is_blank(&con->actual_peer_addr.in_addr) && | 1166 | !(addr_is_blank(&con->actual_peer_addr.in_addr) && |
1158 | con->actual_peer_addr.nonce == con->peer_addr.nonce)) { | 1167 | con->actual_peer_addr.nonce == con->peer_addr.nonce)) { |
1159 | pr_warning("wrong peer, want %s/%d, got %s/%d\n", | 1168 | pr_warning("wrong peer, want %s/%d, got %s/%d\n", |
1160 | pr_addr(&con->peer_addr.in_addr), | 1169 | ceph_pr_addr(&con->peer_addr.in_addr), |
1161 | (int)le32_to_cpu(con->peer_addr.nonce), | 1170 | (int)le32_to_cpu(con->peer_addr.nonce), |
1162 | pr_addr(&con->actual_peer_addr.in_addr), | 1171 | ceph_pr_addr(&con->actual_peer_addr.in_addr), |
1163 | (int)le32_to_cpu(con->actual_peer_addr.nonce)); | 1172 | (int)le32_to_cpu(con->actual_peer_addr.nonce)); |
1164 | con->error_msg = "wrong peer at address"; | 1173 | con->error_msg = "wrong peer at address"; |
1165 | return -1; | 1174 | return -1; |
@@ -1177,7 +1186,7 @@ static int process_banner(struct ceph_connection *con) | |||
1177 | addr_set_port(&con->msgr->inst.addr.in_addr, port); | 1186 | addr_set_port(&con->msgr->inst.addr.in_addr, port); |
1178 | encode_my_addr(con->msgr); | 1187 | encode_my_addr(con->msgr); |
1179 | dout("process_banner learned my addr is %s\n", | 1188 | dout("process_banner learned my addr is %s\n", |
1180 | pr_addr(&con->msgr->inst.addr.in_addr)); | 1189 | ceph_pr_addr(&con->msgr->inst.addr.in_addr)); |
1181 | } | 1190 | } |
1182 | 1191 | ||
1183 | set_bit(NEGOTIATING, &con->state); | 1192 | set_bit(NEGOTIATING, &con->state); |
@@ -1198,8 +1207,8 @@ static void fail_protocol(struct ceph_connection *con) | |||
1198 | 1207 | ||
1199 | static int process_connect(struct ceph_connection *con) | 1208 | static int process_connect(struct ceph_connection *con) |
1200 | { | 1209 | { |
1201 | u64 sup_feat = CEPH_FEATURE_SUPPORTED; | 1210 | u64 sup_feat = con->msgr->supported_features; |
1202 | u64 req_feat = CEPH_FEATURE_REQUIRED; | 1211 | u64 req_feat = con->msgr->required_features; |
1203 | u64 server_feat = le64_to_cpu(con->in_reply.features); | 1212 | u64 server_feat = le64_to_cpu(con->in_reply.features); |
1204 | 1213 | ||
1205 | dout("process_connect on %p tag %d\n", con, (int)con->in_tag); | 1214 | dout("process_connect on %p tag %d\n", con, (int)con->in_tag); |
@@ -1209,7 +1218,7 @@ static int process_connect(struct ceph_connection *con) | |||
1209 | pr_err("%s%lld %s feature set mismatch," | 1218 | pr_err("%s%lld %s feature set mismatch," |
1210 | " my %llx < server's %llx, missing %llx\n", | 1219 | " my %llx < server's %llx, missing %llx\n", |
1211 | ENTITY_NAME(con->peer_name), | 1220 | ENTITY_NAME(con->peer_name), |
1212 | pr_addr(&con->peer_addr.in_addr), | 1221 | ceph_pr_addr(&con->peer_addr.in_addr), |
1213 | sup_feat, server_feat, server_feat & ~sup_feat); | 1222 | sup_feat, server_feat, server_feat & ~sup_feat); |
1214 | con->error_msg = "missing required protocol features"; | 1223 | con->error_msg = "missing required protocol features"; |
1215 | fail_protocol(con); | 1224 | fail_protocol(con); |
@@ -1219,7 +1228,7 @@ static int process_connect(struct ceph_connection *con) | |||
1219 | pr_err("%s%lld %s protocol version mismatch," | 1228 | pr_err("%s%lld %s protocol version mismatch," |
1220 | " my %d != server's %d\n", | 1229 | " my %d != server's %d\n", |
1221 | ENTITY_NAME(con->peer_name), | 1230 | ENTITY_NAME(con->peer_name), |
1222 | pr_addr(&con->peer_addr.in_addr), | 1231 | ceph_pr_addr(&con->peer_addr.in_addr), |
1223 | le32_to_cpu(con->out_connect.protocol_version), | 1232 | le32_to_cpu(con->out_connect.protocol_version), |
1224 | le32_to_cpu(con->in_reply.protocol_version)); | 1233 | le32_to_cpu(con->in_reply.protocol_version)); |
1225 | con->error_msg = "protocol version mismatch"; | 1234 | con->error_msg = "protocol version mismatch"; |
@@ -1253,7 +1262,7 @@ static int process_connect(struct ceph_connection *con) | |||
1253 | le32_to_cpu(con->in_connect.connect_seq)); | 1262 | le32_to_cpu(con->in_connect.connect_seq)); |
1254 | pr_err("%s%lld %s connection reset\n", | 1263 | pr_err("%s%lld %s connection reset\n", |
1255 | ENTITY_NAME(con->peer_name), | 1264 | ENTITY_NAME(con->peer_name), |
1256 | pr_addr(&con->peer_addr.in_addr)); | 1265 | ceph_pr_addr(&con->peer_addr.in_addr)); |
1257 | reset_connection(con); | 1266 | reset_connection(con); |
1258 | prepare_write_connect(con->msgr, con, 0); | 1267 | prepare_write_connect(con->msgr, con, 0); |
1259 | prepare_read_connect(con); | 1268 | prepare_read_connect(con); |
@@ -1298,7 +1307,7 @@ static int process_connect(struct ceph_connection *con) | |||
1298 | pr_err("%s%lld %s protocol feature mismatch," | 1307 | pr_err("%s%lld %s protocol feature mismatch," |
1299 | " my required %llx > server's %llx, need %llx\n", | 1308 | " my required %llx > server's %llx, need %llx\n", |
1300 | ENTITY_NAME(con->peer_name), | 1309 | ENTITY_NAME(con->peer_name), |
1301 | pr_addr(&con->peer_addr.in_addr), | 1310 | ceph_pr_addr(&con->peer_addr.in_addr), |
1302 | req_feat, server_feat, req_feat & ~server_feat); | 1311 | req_feat, server_feat, req_feat & ~server_feat); |
1303 | con->error_msg = "missing required protocol features"; | 1312 | con->error_msg = "missing required protocol features"; |
1304 | fail_protocol(con); | 1313 | fail_protocol(con); |
@@ -1525,7 +1534,7 @@ static int read_partial_message(struct ceph_connection *con) | |||
1525 | if ((s64)seq - (s64)con->in_seq < 1) { | 1534 | if ((s64)seq - (s64)con->in_seq < 1) { |
1526 | pr_info("skipping %s%lld %s seq %lld, expected %lld\n", | 1535 | pr_info("skipping %s%lld %s seq %lld, expected %lld\n", |
1527 | ENTITY_NAME(con->peer_name), | 1536 | ENTITY_NAME(con->peer_name), |
1528 | pr_addr(&con->peer_addr.in_addr), | 1537 | ceph_pr_addr(&con->peer_addr.in_addr), |
1529 | seq, con->in_seq + 1); | 1538 | seq, con->in_seq + 1); |
1530 | con->in_base_pos = -front_len - middle_len - data_len - | 1539 | con->in_base_pos = -front_len - middle_len - data_len - |
1531 | sizeof(m->footer); | 1540 | sizeof(m->footer); |
@@ -2023,9 +2032,9 @@ out: | |||
2023 | static void ceph_fault(struct ceph_connection *con) | 2032 | static void ceph_fault(struct ceph_connection *con) |
2024 | { | 2033 | { |
2025 | pr_err("%s%lld %s %s\n", ENTITY_NAME(con->peer_name), | 2034 | pr_err("%s%lld %s %s\n", ENTITY_NAME(con->peer_name), |
2026 | pr_addr(&con->peer_addr.in_addr), con->error_msg); | 2035 | ceph_pr_addr(&con->peer_addr.in_addr), con->error_msg); |
2027 | dout("fault %p state %lu to peer %s\n", | 2036 | dout("fault %p state %lu to peer %s\n", |
2028 | con, con->state, pr_addr(&con->peer_addr.in_addr)); | 2037 | con, con->state, ceph_pr_addr(&con->peer_addr.in_addr)); |
2029 | 2038 | ||
2030 | if (test_bit(LOSSYTX, &con->state)) { | 2039 | if (test_bit(LOSSYTX, &con->state)) { |
2031 | dout("fault on LOSSYTX channel\n"); | 2040 | dout("fault on LOSSYTX channel\n"); |
@@ -2085,7 +2094,9 @@ out: | |||
2085 | /* | 2094 | /* |
2086 | * create a new messenger instance | 2095 | * create a new messenger instance |
2087 | */ | 2096 | */ |
2088 | struct ceph_messenger *ceph_messenger_create(struct ceph_entity_addr *myaddr) | 2097 | struct ceph_messenger *ceph_messenger_create(struct ceph_entity_addr *myaddr, |
2098 | u32 supported_features, | ||
2099 | u32 required_features) | ||
2089 | { | 2100 | { |
2090 | struct ceph_messenger *msgr; | 2101 | struct ceph_messenger *msgr; |
2091 | 2102 | ||
@@ -2093,6 +2104,9 @@ struct ceph_messenger *ceph_messenger_create(struct ceph_entity_addr *myaddr) | |||
2093 | if (msgr == NULL) | 2104 | if (msgr == NULL) |
2094 | return ERR_PTR(-ENOMEM); | 2105 | return ERR_PTR(-ENOMEM); |
2095 | 2106 | ||
2107 | msgr->supported_features = supported_features; | ||
2108 | msgr->required_features = required_features; | ||
2109 | |||
2096 | spin_lock_init(&msgr->global_seq_lock); | 2110 | spin_lock_init(&msgr->global_seq_lock); |
2097 | 2111 | ||
2098 | /* the zero page is needed if a request is "canceled" while the message | 2112 | /* the zero page is needed if a request is "canceled" while the message |
@@ -2115,6 +2129,7 @@ struct ceph_messenger *ceph_messenger_create(struct ceph_entity_addr *myaddr) | |||
2115 | dout("messenger_create %p\n", msgr); | 2129 | dout("messenger_create %p\n", msgr); |
2116 | return msgr; | 2130 | return msgr; |
2117 | } | 2131 | } |
2132 | EXPORT_SYMBOL(ceph_messenger_create); | ||
2118 | 2133 | ||
2119 | void ceph_messenger_destroy(struct ceph_messenger *msgr) | 2134 | void ceph_messenger_destroy(struct ceph_messenger *msgr) |
2120 | { | 2135 | { |
@@ -2124,6 +2139,7 @@ void ceph_messenger_destroy(struct ceph_messenger *msgr) | |||
2124 | kfree(msgr); | 2139 | kfree(msgr); |
2125 | dout("destroyed messenger %p\n", msgr); | 2140 | dout("destroyed messenger %p\n", msgr); |
2126 | } | 2141 | } |
2142 | EXPORT_SYMBOL(ceph_messenger_destroy); | ||
2127 | 2143 | ||
2128 | /* | 2144 | /* |
2129 | * Queue up an outgoing message on the given connection. | 2145 | * Queue up an outgoing message on the given connection. |
@@ -2160,6 +2176,7 @@ void ceph_con_send(struct ceph_connection *con, struct ceph_msg *msg) | |||
2160 | if (test_and_set_bit(WRITE_PENDING, &con->state) == 0) | 2176 | if (test_and_set_bit(WRITE_PENDING, &con->state) == 0) |
2161 | queue_con(con); | 2177 | queue_con(con); |
2162 | } | 2178 | } |
2179 | EXPORT_SYMBOL(ceph_con_send); | ||
2163 | 2180 | ||
2164 | /* | 2181 | /* |
2165 | * Revoke a message that was previously queued for send | 2182 | * Revoke a message that was previously queued for send |
@@ -2225,6 +2242,7 @@ void ceph_con_keepalive(struct ceph_connection *con) | |||
2225 | test_and_set_bit(WRITE_PENDING, &con->state) == 0) | 2242 | test_and_set_bit(WRITE_PENDING, &con->state) == 0) |
2226 | queue_con(con); | 2243 | queue_con(con); |
2227 | } | 2244 | } |
2245 | EXPORT_SYMBOL(ceph_con_keepalive); | ||
2228 | 2246 | ||
2229 | 2247 | ||
2230 | /* | 2248 | /* |
@@ -2299,6 +2317,7 @@ out: | |||
2299 | pr_err("msg_new can't create type %d front %d\n", type, front_len); | 2317 | pr_err("msg_new can't create type %d front %d\n", type, front_len); |
2300 | return NULL; | 2318 | return NULL; |
2301 | } | 2319 | } |
2320 | EXPORT_SYMBOL(ceph_msg_new); | ||
2302 | 2321 | ||
2303 | /* | 2322 | /* |
2304 | * Allocate "middle" portion of a message, if it is needed and wasn't | 2323 | * Allocate "middle" portion of a message, if it is needed and wasn't |
@@ -2410,6 +2429,7 @@ void ceph_msg_last_put(struct kref *kref) | |||
2410 | else | 2429 | else |
2411 | ceph_msg_kfree(m); | 2430 | ceph_msg_kfree(m); |
2412 | } | 2431 | } |
2432 | EXPORT_SYMBOL(ceph_msg_last_put); | ||
2413 | 2433 | ||
2414 | void ceph_msg_dump(struct ceph_msg *msg) | 2434 | void ceph_msg_dump(struct ceph_msg *msg) |
2415 | { | 2435 | { |
@@ -2430,3 +2450,4 @@ void ceph_msg_dump(struct ceph_msg *msg) | |||
2430 | DUMP_PREFIX_OFFSET, 16, 1, | 2450 | DUMP_PREFIX_OFFSET, 16, 1, |
2431 | &msg->footer, sizeof(msg->footer), true); | 2451 | &msg->footer, sizeof(msg->footer), true); |
2432 | } | 2452 | } |
2453 | EXPORT_SYMBOL(ceph_msg_dump); | ||
diff --git a/fs/ceph/mon_client.c b/net/ceph/mon_client.c index b2a5a3e4a671..8a079399174a 100644 --- a/fs/ceph/mon_client.c +++ b/net/ceph/mon_client.c | |||
@@ -1,14 +1,16 @@ | |||
1 | #include "ceph_debug.h" | 1 | #include <linux/ceph/ceph_debug.h> |
2 | 2 | ||
3 | #include <linux/module.h> | ||
3 | #include <linux/types.h> | 4 | #include <linux/types.h> |
4 | #include <linux/slab.h> | 5 | #include <linux/slab.h> |
5 | #include <linux/random.h> | 6 | #include <linux/random.h> |
6 | #include <linux/sched.h> | 7 | #include <linux/sched.h> |
7 | 8 | ||
8 | #include "mon_client.h" | 9 | #include <linux/ceph/mon_client.h> |
9 | #include "super.h" | 10 | #include <linux/ceph/libceph.h> |
10 | #include "auth.h" | 11 | #include <linux/ceph/decode.h> |
11 | #include "decode.h" | 12 | |
13 | #include <linux/ceph/auth.h> | ||
12 | 14 | ||
13 | /* | 15 | /* |
14 | * Interact with Ceph monitor cluster. Handle requests for new map | 16 | * Interact with Ceph monitor cluster. Handle requests for new map |
@@ -74,7 +76,7 @@ struct ceph_monmap *ceph_monmap_decode(void *p, void *end) | |||
74 | m->num_mon); | 76 | m->num_mon); |
75 | for (i = 0; i < m->num_mon; i++) | 77 | for (i = 0; i < m->num_mon; i++) |
76 | dout("monmap_decode mon%d is %s\n", i, | 78 | dout("monmap_decode mon%d is %s\n", i, |
77 | pr_addr(&m->mon_inst[i].addr.in_addr)); | 79 | ceph_pr_addr(&m->mon_inst[i].addr.in_addr)); |
78 | return m; | 80 | return m; |
79 | 81 | ||
80 | bad: | 82 | bad: |
@@ -191,30 +193,33 @@ static void __send_subscribe(struct ceph_mon_client *monc) | |||
191 | struct ceph_msg *msg = monc->m_subscribe; | 193 | struct ceph_msg *msg = monc->m_subscribe; |
192 | struct ceph_mon_subscribe_item *i; | 194 | struct ceph_mon_subscribe_item *i; |
193 | void *p, *end; | 195 | void *p, *end; |
196 | int num; | ||
194 | 197 | ||
195 | p = msg->front.iov_base; | 198 | p = msg->front.iov_base; |
196 | end = p + msg->front_max; | 199 | end = p + msg->front_max; |
197 | 200 | ||
198 | dout("__send_subscribe to 'mdsmap' %u+\n", | 201 | num = 1 + !!monc->want_next_osdmap + !!monc->want_mdsmap; |
199 | (unsigned)monc->have_mdsmap); | 202 | ceph_encode_32(&p, num); |
203 | |||
200 | if (monc->want_next_osdmap) { | 204 | if (monc->want_next_osdmap) { |
201 | dout("__send_subscribe to 'osdmap' %u\n", | 205 | dout("__send_subscribe to 'osdmap' %u\n", |
202 | (unsigned)monc->have_osdmap); | 206 | (unsigned)monc->have_osdmap); |
203 | ceph_encode_32(&p, 3); | ||
204 | ceph_encode_string(&p, end, "osdmap", 6); | 207 | ceph_encode_string(&p, end, "osdmap", 6); |
205 | i = p; | 208 | i = p; |
206 | i->have = cpu_to_le64(monc->have_osdmap); | 209 | i->have = cpu_to_le64(monc->have_osdmap); |
207 | i->onetime = 1; | 210 | i->onetime = 1; |
208 | p += sizeof(*i); | 211 | p += sizeof(*i); |
209 | monc->want_next_osdmap = 2; /* requested */ | 212 | monc->want_next_osdmap = 2; /* requested */ |
210 | } else { | ||
211 | ceph_encode_32(&p, 2); | ||
212 | } | 213 | } |
213 | ceph_encode_string(&p, end, "mdsmap", 6); | 214 | if (monc->want_mdsmap) { |
214 | i = p; | 215 | dout("__send_subscribe to 'mdsmap' %u+\n", |
215 | i->have = cpu_to_le64(monc->have_mdsmap); | 216 | (unsigned)monc->have_mdsmap); |
216 | i->onetime = 0; | 217 | ceph_encode_string(&p, end, "mdsmap", 6); |
217 | p += sizeof(*i); | 218 | i = p; |
219 | i->have = cpu_to_le64(monc->have_mdsmap); | ||
220 | i->onetime = 0; | ||
221 | p += sizeof(*i); | ||
222 | } | ||
218 | ceph_encode_string(&p, end, "monmap", 6); | 223 | ceph_encode_string(&p, end, "monmap", 6); |
219 | i = p; | 224 | i = p; |
220 | i->have = 0; | 225 | i->have = 0; |
@@ -243,7 +248,8 @@ static void handle_subscribe_ack(struct ceph_mon_client *monc, | |||
243 | mutex_lock(&monc->mutex); | 248 | mutex_lock(&monc->mutex); |
244 | if (monc->hunting) { | 249 | if (monc->hunting) { |
245 | pr_info("mon%d %s session established\n", | 250 | pr_info("mon%d %s session established\n", |
246 | monc->cur_mon, pr_addr(&monc->con->peer_addr.in_addr)); | 251 | monc->cur_mon, |
252 | ceph_pr_addr(&monc->con->peer_addr.in_addr)); | ||
247 | monc->hunting = false; | 253 | monc->hunting = false; |
248 | } | 254 | } |
249 | dout("handle_subscribe_ack after %d seconds\n", seconds); | 255 | dout("handle_subscribe_ack after %d seconds\n", seconds); |
@@ -266,6 +272,7 @@ int ceph_monc_got_mdsmap(struct ceph_mon_client *monc, u32 got) | |||
266 | mutex_unlock(&monc->mutex); | 272 | mutex_unlock(&monc->mutex); |
267 | return 0; | 273 | return 0; |
268 | } | 274 | } |
275 | EXPORT_SYMBOL(ceph_monc_got_mdsmap); | ||
269 | 276 | ||
270 | int ceph_monc_got_osdmap(struct ceph_mon_client *monc, u32 got) | 277 | int ceph_monc_got_osdmap(struct ceph_mon_client *monc, u32 got) |
271 | { | 278 | { |
@@ -310,6 +317,7 @@ int ceph_monc_open_session(struct ceph_mon_client *monc) | |||
310 | mutex_unlock(&monc->mutex); | 317 | mutex_unlock(&monc->mutex); |
311 | return 0; | 318 | return 0; |
312 | } | 319 | } |
320 | EXPORT_SYMBOL(ceph_monc_open_session); | ||
313 | 321 | ||
314 | /* | 322 | /* |
315 | * The monitor responds with mount ack indicate mount success. The | 323 | * The monitor responds with mount ack indicate mount success. The |
@@ -540,6 +548,7 @@ out: | |||
540 | kref_put(&req->kref, release_generic_request); | 548 | kref_put(&req->kref, release_generic_request); |
541 | return err; | 549 | return err; |
542 | } | 550 | } |
551 | EXPORT_SYMBOL(ceph_monc_do_statfs); | ||
543 | 552 | ||
544 | /* | 553 | /* |
545 | * pool ops | 554 | * pool ops |
@@ -651,6 +660,7 @@ int ceph_monc_create_snapid(struct ceph_mon_client *monc, | |||
651 | pool, 0, (char *)snapid, sizeof(*snapid)); | 660 | pool, 0, (char *)snapid, sizeof(*snapid)); |
652 | 661 | ||
653 | } | 662 | } |
663 | EXPORT_SYMBOL(ceph_monc_create_snapid); | ||
654 | 664 | ||
655 | int ceph_monc_delete_snapid(struct ceph_mon_client *monc, | 665 | int ceph_monc_delete_snapid(struct ceph_mon_client *monc, |
656 | u32 pool, u64 snapid) | 666 | u32 pool, u64 snapid) |
@@ -708,9 +718,9 @@ static void delayed_work(struct work_struct *work) | |||
708 | */ | 718 | */ |
709 | static int build_initial_monmap(struct ceph_mon_client *monc) | 719 | static int build_initial_monmap(struct ceph_mon_client *monc) |
710 | { | 720 | { |
711 | struct ceph_mount_args *args = monc->client->mount_args; | 721 | struct ceph_options *opt = monc->client->options; |
712 | struct ceph_entity_addr *mon_addr = args->mon_addr; | 722 | struct ceph_entity_addr *mon_addr = opt->mon_addr; |
713 | int num_mon = args->num_mon; | 723 | int num_mon = opt->num_mon; |
714 | int i; | 724 | int i; |
715 | 725 | ||
716 | /* build initial monmap */ | 726 | /* build initial monmap */ |
@@ -728,11 +738,6 @@ static int build_initial_monmap(struct ceph_mon_client *monc) | |||
728 | } | 738 | } |
729 | monc->monmap->num_mon = num_mon; | 739 | monc->monmap->num_mon = num_mon; |
730 | monc->have_fsid = false; | 740 | monc->have_fsid = false; |
731 | |||
732 | /* release addr memory */ | ||
733 | kfree(args->mon_addr); | ||
734 | args->mon_addr = NULL; | ||
735 | args->num_mon = 0; | ||
736 | return 0; | 741 | return 0; |
737 | } | 742 | } |
738 | 743 | ||
@@ -753,8 +758,8 @@ int ceph_monc_init(struct ceph_mon_client *monc, struct ceph_client *cl) | |||
753 | monc->con = NULL; | 758 | monc->con = NULL; |
754 | 759 | ||
755 | /* authentication */ | 760 | /* authentication */ |
756 | monc->auth = ceph_auth_init(cl->mount_args->name, | 761 | monc->auth = ceph_auth_init(cl->options->name, |
757 | cl->mount_args->secret); | 762 | cl->options->secret); |
758 | if (IS_ERR(monc->auth)) | 763 | if (IS_ERR(monc->auth)) |
759 | return PTR_ERR(monc->auth); | 764 | return PTR_ERR(monc->auth); |
760 | monc->auth->want_keys = | 765 | monc->auth->want_keys = |
@@ -808,6 +813,7 @@ out_monmap: | |||
808 | out: | 813 | out: |
809 | return err; | 814 | return err; |
810 | } | 815 | } |
816 | EXPORT_SYMBOL(ceph_monc_init); | ||
811 | 817 | ||
812 | void ceph_monc_stop(struct ceph_mon_client *monc) | 818 | void ceph_monc_stop(struct ceph_mon_client *monc) |
813 | { | 819 | { |
@@ -832,6 +838,7 @@ void ceph_monc_stop(struct ceph_mon_client *monc) | |||
832 | 838 | ||
833 | kfree(monc->monmap); | 839 | kfree(monc->monmap); |
834 | } | 840 | } |
841 | EXPORT_SYMBOL(ceph_monc_stop); | ||
835 | 842 | ||
836 | static void handle_auth_reply(struct ceph_mon_client *monc, | 843 | static void handle_auth_reply(struct ceph_mon_client *monc, |
837 | struct ceph_msg *msg) | 844 | struct ceph_msg *msg) |
@@ -889,6 +896,7 @@ int ceph_monc_validate_auth(struct ceph_mon_client *monc) | |||
889 | mutex_unlock(&monc->mutex); | 896 | mutex_unlock(&monc->mutex); |
890 | return ret; | 897 | return ret; |
891 | } | 898 | } |
899 | EXPORT_SYMBOL(ceph_monc_validate_auth); | ||
892 | 900 | ||
893 | /* | 901 | /* |
894 | * handle incoming message | 902 | * handle incoming message |
@@ -922,15 +930,16 @@ static void dispatch(struct ceph_connection *con, struct ceph_msg *msg) | |||
922 | ceph_monc_handle_map(monc, msg); | 930 | ceph_monc_handle_map(monc, msg); |
923 | break; | 931 | break; |
924 | 932 | ||
925 | case CEPH_MSG_MDS_MAP: | ||
926 | ceph_mdsc_handle_map(&monc->client->mdsc, msg); | ||
927 | break; | ||
928 | |||
929 | case CEPH_MSG_OSD_MAP: | 933 | case CEPH_MSG_OSD_MAP: |
930 | ceph_osdc_handle_map(&monc->client->osdc, msg); | 934 | ceph_osdc_handle_map(&monc->client->osdc, msg); |
931 | break; | 935 | break; |
932 | 936 | ||
933 | default: | 937 | default: |
938 | /* can the chained handler handle it? */ | ||
939 | if (monc->client->extra_mon_dispatch && | ||
940 | monc->client->extra_mon_dispatch(monc->client, msg) == 0) | ||
941 | break; | ||
942 | |||
934 | pr_err("received unknown message type %d %s\n", type, | 943 | pr_err("received unknown message type %d %s\n", type, |
935 | ceph_msg_type_name(type)); | 944 | ceph_msg_type_name(type)); |
936 | } | 945 | } |
@@ -994,7 +1003,7 @@ static void mon_fault(struct ceph_connection *con) | |||
994 | if (monc->con && !monc->hunting) | 1003 | if (monc->con && !monc->hunting) |
995 | pr_info("mon%d %s session lost, " | 1004 | pr_info("mon%d %s session lost, " |
996 | "hunting for new mon\n", monc->cur_mon, | 1005 | "hunting for new mon\n", monc->cur_mon, |
997 | pr_addr(&monc->con->peer_addr.in_addr)); | 1006 | ceph_pr_addr(&monc->con->peer_addr.in_addr)); |
998 | 1007 | ||
999 | __close_session(monc); | 1008 | __close_session(monc); |
1000 | if (!monc->hunting) { | 1009 | if (!monc->hunting) { |
diff --git a/fs/ceph/msgpool.c b/net/ceph/msgpool.c index dd65a6438131..d5f2d97ac05c 100644 --- a/fs/ceph/msgpool.c +++ b/net/ceph/msgpool.c | |||
@@ -1,11 +1,11 @@ | |||
1 | #include "ceph_debug.h" | 1 | #include <linux/ceph/ceph_debug.h> |
2 | 2 | ||
3 | #include <linux/err.h> | 3 | #include <linux/err.h> |
4 | #include <linux/sched.h> | 4 | #include <linux/sched.h> |
5 | #include <linux/types.h> | 5 | #include <linux/types.h> |
6 | #include <linux/vmalloc.h> | 6 | #include <linux/vmalloc.h> |
7 | 7 | ||
8 | #include "msgpool.h" | 8 | #include <linux/ceph/msgpool.h> |
9 | 9 | ||
10 | static void *alloc_fn(gfp_t gfp_mask, void *arg) | 10 | static void *alloc_fn(gfp_t gfp_mask, void *arg) |
11 | { | 11 | { |
diff --git a/fs/ceph/osd_client.c b/net/ceph/osd_client.c index 0edb43f1ef26..79391994b3ed 100644 --- a/fs/ceph/osd_client.c +++ b/net/ceph/osd_client.c | |||
@@ -1,5 +1,6 @@ | |||
1 | #include "ceph_debug.h" | 1 | #include <linux/ceph/ceph_debug.h> |
2 | 2 | ||
3 | #include <linux/module.h> | ||
3 | #include <linux/err.h> | 4 | #include <linux/err.h> |
4 | #include <linux/highmem.h> | 5 | #include <linux/highmem.h> |
5 | #include <linux/mm.h> | 6 | #include <linux/mm.h> |
@@ -10,12 +11,12 @@ | |||
10 | #include <linux/bio.h> | 11 | #include <linux/bio.h> |
11 | #endif | 12 | #endif |
12 | 13 | ||
13 | #include "super.h" | 14 | #include <linux/ceph/libceph.h> |
14 | #include "osd_client.h" | 15 | #include <linux/ceph/osd_client.h> |
15 | #include "messenger.h" | 16 | #include <linux/ceph/messenger.h> |
16 | #include "decode.h" | 17 | #include <linux/ceph/decode.h> |
17 | #include "auth.h" | 18 | #include <linux/ceph/auth.h> |
18 | #include "pagelist.h" | 19 | #include <linux/ceph/pagelist.h> |
19 | 20 | ||
20 | #define OSD_OP_FRONT_LEN 4096 | 21 | #define OSD_OP_FRONT_LEN 4096 |
21 | #define OSD_OPREPLY_FRONT_LEN 512 | 22 | #define OSD_OPREPLY_FRONT_LEN 512 |
@@ -70,11 +71,14 @@ void ceph_calc_raw_layout(struct ceph_osd_client *osdc, | |||
70 | op->extent.length = objlen; | 71 | op->extent.length = objlen; |
71 | } | 72 | } |
72 | req->r_num_pages = calc_pages_for(off, *plen); | 73 | req->r_num_pages = calc_pages_for(off, *plen); |
74 | if (op->op == CEPH_OSD_OP_WRITE) | ||
75 | op->payload_len = *plen; | ||
73 | 76 | ||
74 | dout("calc_layout bno=%llx %llu~%llu (%d pages)\n", | 77 | dout("calc_layout bno=%llx %llu~%llu (%d pages)\n", |
75 | *bno, objoff, objlen, req->r_num_pages); | 78 | *bno, objoff, objlen, req->r_num_pages); |
76 | 79 | ||
77 | } | 80 | } |
81 | EXPORT_SYMBOL(ceph_calc_raw_layout); | ||
78 | 82 | ||
79 | /* | 83 | /* |
80 | * Implement client access to distributed object storage cluster. | 84 | * Implement client access to distributed object storage cluster. |
@@ -154,19 +158,7 @@ void ceph_osdc_release_request(struct kref *kref) | |||
154 | else | 158 | else |
155 | kfree(req); | 159 | kfree(req); |
156 | } | 160 | } |
157 | 161 | EXPORT_SYMBOL(ceph_osdc_release_request); | |
158 | static int op_needs_trail(int op) | ||
159 | { | ||
160 | switch (op) { | ||
161 | case CEPH_OSD_OP_GETXATTR: | ||
162 | case CEPH_OSD_OP_SETXATTR: | ||
163 | case CEPH_OSD_OP_CMPXATTR: | ||
164 | case CEPH_OSD_OP_CALL: | ||
165 | return 1; | ||
166 | default: | ||
167 | return 0; | ||
168 | } | ||
169 | } | ||
170 | 162 | ||
171 | static int get_num_ops(struct ceph_osd_req_op *ops, int *needs_trail) | 163 | static int get_num_ops(struct ceph_osd_req_op *ops, int *needs_trail) |
172 | { | 164 | { |
@@ -268,6 +260,7 @@ struct ceph_osd_request *ceph_osdc_alloc_request(struct ceph_osd_client *osdc, | |||
268 | 260 | ||
269 | return req; | 261 | return req; |
270 | } | 262 | } |
263 | EXPORT_SYMBOL(ceph_osdc_alloc_request); | ||
271 | 264 | ||
272 | static void osd_req_encode_op(struct ceph_osd_request *req, | 265 | static void osd_req_encode_op(struct ceph_osd_request *req, |
273 | struct ceph_osd_op *dst, | 266 | struct ceph_osd_op *dst, |
@@ -403,6 +396,7 @@ void ceph_osdc_build_request(struct ceph_osd_request *req, | |||
403 | msg->hdr.front_len = cpu_to_le32(msg_size); | 396 | msg->hdr.front_len = cpu_to_le32(msg_size); |
404 | return; | 397 | return; |
405 | } | 398 | } |
399 | EXPORT_SYMBOL(ceph_osdc_build_request); | ||
406 | 400 | ||
407 | /* | 401 | /* |
408 | * build new request AND message, calculate layout, and adjust file | 402 | * build new request AND message, calculate layout, and adjust file |
@@ -460,6 +454,7 @@ struct ceph_osd_request *ceph_osdc_new_request(struct ceph_osd_client *osdc, | |||
460 | 454 | ||
461 | return req; | 455 | return req; |
462 | } | 456 | } |
457 | EXPORT_SYMBOL(ceph_osdc_new_request); | ||
463 | 458 | ||
464 | /* | 459 | /* |
465 | * We keep osd requests in an rbtree, sorted by ->r_tid. | 460 | * We keep osd requests in an rbtree, sorted by ->r_tid. |
@@ -614,7 +609,7 @@ static void __move_osd_to_lru(struct ceph_osd_client *osdc, | |||
614 | dout("__move_osd_to_lru %p\n", osd); | 609 | dout("__move_osd_to_lru %p\n", osd); |
615 | BUG_ON(!list_empty(&osd->o_osd_lru)); | 610 | BUG_ON(!list_empty(&osd->o_osd_lru)); |
616 | list_add_tail(&osd->o_osd_lru, &osdc->osd_lru); | 611 | list_add_tail(&osd->o_osd_lru, &osdc->osd_lru); |
617 | osd->lru_ttl = jiffies + osdc->client->mount_args->osd_idle_ttl * HZ; | 612 | osd->lru_ttl = jiffies + osdc->client->options->osd_idle_ttl * HZ; |
618 | } | 613 | } |
619 | 614 | ||
620 | static void __remove_osd_from_lru(struct ceph_osd *osd) | 615 | static void __remove_osd_from_lru(struct ceph_osd *osd) |
@@ -708,7 +703,7 @@ static struct ceph_osd *__lookup_osd(struct ceph_osd_client *osdc, int o) | |||
708 | static void __schedule_osd_timeout(struct ceph_osd_client *osdc) | 703 | static void __schedule_osd_timeout(struct ceph_osd_client *osdc) |
709 | { | 704 | { |
710 | schedule_delayed_work(&osdc->timeout_work, | 705 | schedule_delayed_work(&osdc->timeout_work, |
711 | osdc->client->mount_args->osd_keepalive_timeout * HZ); | 706 | osdc->client->options->osd_keepalive_timeout * HZ); |
712 | } | 707 | } |
713 | 708 | ||
714 | static void __cancel_osd_timeout(struct ceph_osd_client *osdc) | 709 | static void __cancel_osd_timeout(struct ceph_osd_client *osdc) |
@@ -909,9 +904,9 @@ static void handle_timeout(struct work_struct *work) | |||
909 | container_of(work, struct ceph_osd_client, timeout_work.work); | 904 | container_of(work, struct ceph_osd_client, timeout_work.work); |
910 | struct ceph_osd_request *req, *last_req = NULL; | 905 | struct ceph_osd_request *req, *last_req = NULL; |
911 | struct ceph_osd *osd; | 906 | struct ceph_osd *osd; |
912 | unsigned long timeout = osdc->client->mount_args->osd_timeout * HZ; | 907 | unsigned long timeout = osdc->client->options->osd_timeout * HZ; |
913 | unsigned long keepalive = | 908 | unsigned long keepalive = |
914 | osdc->client->mount_args->osd_keepalive_timeout * HZ; | 909 | osdc->client->options->osd_keepalive_timeout * HZ; |
915 | unsigned long last_stamp = 0; | 910 | unsigned long last_stamp = 0; |
916 | struct rb_node *p; | 911 | struct rb_node *p; |
917 | struct list_head slow_osds; | 912 | struct list_head slow_osds; |
@@ -998,7 +993,7 @@ static void handle_osds_timeout(struct work_struct *work) | |||
998 | container_of(work, struct ceph_osd_client, | 993 | container_of(work, struct ceph_osd_client, |
999 | osds_timeout_work.work); | 994 | osds_timeout_work.work); |
1000 | unsigned long delay = | 995 | unsigned long delay = |
1001 | osdc->client->mount_args->osd_idle_ttl * HZ >> 2; | 996 | osdc->client->options->osd_idle_ttl * HZ >> 2; |
1002 | 997 | ||
1003 | dout("osds timeout\n"); | 998 | dout("osds timeout\n"); |
1004 | down_read(&osdc->map_sem); | 999 | down_read(&osdc->map_sem); |
@@ -1360,6 +1355,7 @@ int ceph_osdc_start_request(struct ceph_osd_client *osdc, | |||
1360 | up_read(&osdc->map_sem); | 1355 | up_read(&osdc->map_sem); |
1361 | return rc; | 1356 | return rc; |
1362 | } | 1357 | } |
1358 | EXPORT_SYMBOL(ceph_osdc_start_request); | ||
1363 | 1359 | ||
1364 | /* | 1360 | /* |
1365 | * wait for a request to complete | 1361 | * wait for a request to complete |
@@ -1382,6 +1378,7 @@ int ceph_osdc_wait_request(struct ceph_osd_client *osdc, | |||
1382 | dout("wait_request tid %llu result %d\n", req->r_tid, req->r_result); | 1378 | dout("wait_request tid %llu result %d\n", req->r_tid, req->r_result); |
1383 | return req->r_result; | 1379 | return req->r_result; |
1384 | } | 1380 | } |
1381 | EXPORT_SYMBOL(ceph_osdc_wait_request); | ||
1385 | 1382 | ||
1386 | /* | 1383 | /* |
1387 | * sync - wait for all in-flight requests to flush. avoid starvation. | 1384 | * sync - wait for all in-flight requests to flush. avoid starvation. |
@@ -1415,6 +1412,7 @@ void ceph_osdc_sync(struct ceph_osd_client *osdc) | |||
1415 | mutex_unlock(&osdc->request_mutex); | 1412 | mutex_unlock(&osdc->request_mutex); |
1416 | dout("sync done (thru tid %llu)\n", last_tid); | 1413 | dout("sync done (thru tid %llu)\n", last_tid); |
1417 | } | 1414 | } |
1415 | EXPORT_SYMBOL(ceph_osdc_sync); | ||
1418 | 1416 | ||
1419 | /* | 1417 | /* |
1420 | * init, shutdown | 1418 | * init, shutdown |
@@ -1440,7 +1438,7 @@ int ceph_osdc_init(struct ceph_osd_client *osdc, struct ceph_client *client) | |||
1440 | INIT_DELAYED_WORK(&osdc->osds_timeout_work, handle_osds_timeout); | 1438 | INIT_DELAYED_WORK(&osdc->osds_timeout_work, handle_osds_timeout); |
1441 | 1439 | ||
1442 | schedule_delayed_work(&osdc->osds_timeout_work, | 1440 | schedule_delayed_work(&osdc->osds_timeout_work, |
1443 | round_jiffies_relative(osdc->client->mount_args->osd_idle_ttl * HZ)); | 1441 | round_jiffies_relative(osdc->client->options->osd_idle_ttl * HZ)); |
1444 | 1442 | ||
1445 | err = -ENOMEM; | 1443 | err = -ENOMEM; |
1446 | osdc->req_mempool = mempool_create_kmalloc_pool(10, | 1444 | osdc->req_mempool = mempool_create_kmalloc_pool(10, |
@@ -1466,6 +1464,7 @@ out_mempool: | |||
1466 | out: | 1464 | out: |
1467 | return err; | 1465 | return err; |
1468 | } | 1466 | } |
1467 | EXPORT_SYMBOL(ceph_osdc_init); | ||
1469 | 1468 | ||
1470 | void ceph_osdc_stop(struct ceph_osd_client *osdc) | 1469 | void ceph_osdc_stop(struct ceph_osd_client *osdc) |
1471 | { | 1470 | { |
@@ -1480,6 +1479,7 @@ void ceph_osdc_stop(struct ceph_osd_client *osdc) | |||
1480 | ceph_msgpool_destroy(&osdc->msgpool_op); | 1479 | ceph_msgpool_destroy(&osdc->msgpool_op); |
1481 | ceph_msgpool_destroy(&osdc->msgpool_op_reply); | 1480 | ceph_msgpool_destroy(&osdc->msgpool_op_reply); |
1482 | } | 1481 | } |
1482 | EXPORT_SYMBOL(ceph_osdc_stop); | ||
1483 | 1483 | ||
1484 | /* | 1484 | /* |
1485 | * Read some contiguous pages. If we cross a stripe boundary, shorten | 1485 | * Read some contiguous pages. If we cross a stripe boundary, shorten |
@@ -1517,6 +1517,7 @@ int ceph_osdc_readpages(struct ceph_osd_client *osdc, | |||
1517 | dout("readpages result %d\n", rc); | 1517 | dout("readpages result %d\n", rc); |
1518 | return rc; | 1518 | return rc; |
1519 | } | 1519 | } |
1520 | EXPORT_SYMBOL(ceph_osdc_readpages); | ||
1520 | 1521 | ||
1521 | /* | 1522 | /* |
1522 | * do a synchronous write on N pages | 1523 | * do a synchronous write on N pages |
@@ -1559,6 +1560,7 @@ int ceph_osdc_writepages(struct ceph_osd_client *osdc, struct ceph_vino vino, | |||
1559 | dout("writepages result %d\n", rc); | 1560 | dout("writepages result %d\n", rc); |
1560 | return rc; | 1561 | return rc; |
1561 | } | 1562 | } |
1563 | EXPORT_SYMBOL(ceph_osdc_writepages); | ||
1562 | 1564 | ||
1563 | /* | 1565 | /* |
1564 | * handle incoming message | 1566 | * handle incoming message |
diff --git a/fs/ceph/osdmap.c b/net/ceph/osdmap.c index 3ccd11761cb6..d73f3f6efa36 100644 --- a/fs/ceph/osdmap.c +++ b/net/ceph/osdmap.c | |||
@@ -1,14 +1,15 @@ | |||
1 | 1 | ||
2 | #include "ceph_debug.h" | 2 | #include <linux/ceph/ceph_debug.h> |
3 | 3 | ||
4 | #include <linux/module.h> | ||
4 | #include <linux/slab.h> | 5 | #include <linux/slab.h> |
5 | #include <asm/div64.h> | 6 | #include <asm/div64.h> |
6 | 7 | ||
7 | #include "super.h" | 8 | #include <linux/ceph/libceph.h> |
8 | #include "osdmap.h" | 9 | #include <linux/ceph/osdmap.h> |
9 | #include "crush/hash.h" | 10 | #include <linux/ceph/decode.h> |
10 | #include "crush/mapper.h" | 11 | #include <linux/crush/hash.h> |
11 | #include "decode.h" | 12 | #include <linux/crush/mapper.h> |
12 | 13 | ||
13 | char *ceph_osdmap_state_str(char *str, int len, int state) | 14 | char *ceph_osdmap_state_str(char *str, int len, int state) |
14 | { | 15 | { |
@@ -429,6 +430,7 @@ int ceph_pg_poolid_by_name(struct ceph_osdmap *map, const char *name) | |||
429 | } | 430 | } |
430 | return -ENOENT; | 431 | return -ENOENT; |
431 | } | 432 | } |
433 | EXPORT_SYMBOL(ceph_pg_poolid_by_name); | ||
432 | 434 | ||
433 | static void __remove_pg_pool(struct rb_root *root, struct ceph_pg_pool_info *pi) | 435 | static void __remove_pg_pool(struct rb_root *root, struct ceph_pg_pool_info *pi) |
434 | { | 436 | { |
@@ -979,6 +981,7 @@ void ceph_calc_file_object_mapping(struct ceph_file_layout *layout, | |||
979 | 981 | ||
980 | dout(" obj extent %llu~%llu\n", *oxoff, *oxlen); | 982 | dout(" obj extent %llu~%llu\n", *oxoff, *oxlen); |
981 | } | 983 | } |
984 | EXPORT_SYMBOL(ceph_calc_file_object_mapping); | ||
982 | 985 | ||
983 | /* | 986 | /* |
984 | * calculate an object layout (i.e. pgid) from an oid, | 987 | * calculate an object layout (i.e. pgid) from an oid, |
@@ -1024,6 +1027,7 @@ int ceph_calc_object_layout(struct ceph_object_layout *ol, | |||
1024 | ol->ol_stripe_unit = fl->fl_object_stripe_unit; | 1027 | ol->ol_stripe_unit = fl->fl_object_stripe_unit; |
1025 | return 0; | 1028 | return 0; |
1026 | } | 1029 | } |
1030 | EXPORT_SYMBOL(ceph_calc_object_layout); | ||
1027 | 1031 | ||
1028 | /* | 1032 | /* |
1029 | * Calculate raw osd vector for the given pgid. Return pointer to osd | 1033 | * Calculate raw osd vector for the given pgid. Return pointer to osd |
@@ -1121,3 +1125,4 @@ int ceph_calc_pg_primary(struct ceph_osdmap *osdmap, struct ceph_pg pgid) | |||
1121 | return osds[i]; | 1125 | return osds[i]; |
1122 | return -1; | 1126 | return -1; |
1123 | } | 1127 | } |
1128 | EXPORT_SYMBOL(ceph_calc_pg_primary); | ||
diff --git a/fs/ceph/pagelist.c b/net/ceph/pagelist.c index 326e1c04176f..3b146cfac182 100644 --- a/fs/ceph/pagelist.c +++ b/net/ceph/pagelist.c | |||
@@ -1,9 +1,9 @@ | |||
1 | 1 | ||
2 | #include <linux/module.h> | ||
2 | #include <linux/gfp.h> | 3 | #include <linux/gfp.h> |
3 | #include <linux/pagemap.h> | 4 | #include <linux/pagemap.h> |
4 | #include <linux/highmem.h> | 5 | #include <linux/highmem.h> |
5 | 6 | #include <linux/ceph/pagelist.h> | |
6 | #include "pagelist.h" | ||
7 | 7 | ||
8 | static void ceph_pagelist_unmap_tail(struct ceph_pagelist *pl) | 8 | static void ceph_pagelist_unmap_tail(struct ceph_pagelist *pl) |
9 | { | 9 | { |
@@ -25,6 +25,7 @@ int ceph_pagelist_release(struct ceph_pagelist *pl) | |||
25 | } | 25 | } |
26 | return 0; | 26 | return 0; |
27 | } | 27 | } |
28 | EXPORT_SYMBOL(ceph_pagelist_release); | ||
28 | 29 | ||
29 | static int ceph_pagelist_addpage(struct ceph_pagelist *pl) | 30 | static int ceph_pagelist_addpage(struct ceph_pagelist *pl) |
30 | { | 31 | { |
@@ -61,3 +62,4 @@ int ceph_pagelist_append(struct ceph_pagelist *pl, const void *buf, size_t len) | |||
61 | pl->room -= len; | 62 | pl->room -= len; |
62 | return 0; | 63 | return 0; |
63 | } | 64 | } |
65 | EXPORT_SYMBOL(ceph_pagelist_append); | ||
diff --git a/net/ceph/pagevec.c b/net/ceph/pagevec.c new file mode 100644 index 000000000000..54caf0687155 --- /dev/null +++ b/net/ceph/pagevec.c | |||
@@ -0,0 +1,223 @@ | |||
1 | #include <linux/ceph/ceph_debug.h> | ||
2 | |||
3 | #include <linux/module.h> | ||
4 | #include <linux/sched.h> | ||
5 | #include <linux/slab.h> | ||
6 | #include <linux/file.h> | ||
7 | #include <linux/namei.h> | ||
8 | #include <linux/writeback.h> | ||
9 | |||
10 | #include <linux/ceph/libceph.h> | ||
11 | |||
12 | /* | ||
13 | * build a vector of user pages | ||
14 | */ | ||
15 | struct page **ceph_get_direct_page_vector(const char __user *data, | ||
16 | int num_pages, | ||
17 | loff_t off, size_t len) | ||
18 | { | ||
19 | struct page **pages; | ||
20 | int rc; | ||
21 | |||
22 | pages = kmalloc(sizeof(*pages) * num_pages, GFP_NOFS); | ||
23 | if (!pages) | ||
24 | return ERR_PTR(-ENOMEM); | ||
25 | |||
26 | down_read(¤t->mm->mmap_sem); | ||
27 | rc = get_user_pages(current, current->mm, (unsigned long)data, | ||
28 | num_pages, 0, 0, pages, NULL); | ||
29 | up_read(¤t->mm->mmap_sem); | ||
30 | if (rc < 0) | ||
31 | goto fail; | ||
32 | return pages; | ||
33 | |||
34 | fail: | ||
35 | kfree(pages); | ||
36 | return ERR_PTR(rc); | ||
37 | } | ||
38 | EXPORT_SYMBOL(ceph_get_direct_page_vector); | ||
39 | |||
40 | void ceph_put_page_vector(struct page **pages, int num_pages) | ||
41 | { | ||
42 | int i; | ||
43 | |||
44 | for (i = 0; i < num_pages; i++) | ||
45 | put_page(pages[i]); | ||
46 | kfree(pages); | ||
47 | } | ||
48 | EXPORT_SYMBOL(ceph_put_page_vector); | ||
49 | |||
50 | void ceph_release_page_vector(struct page **pages, int num_pages) | ||
51 | { | ||
52 | int i; | ||
53 | |||
54 | for (i = 0; i < num_pages; i++) | ||
55 | __free_pages(pages[i], 0); | ||
56 | kfree(pages); | ||
57 | } | ||
58 | EXPORT_SYMBOL(ceph_release_page_vector); | ||
59 | |||
60 | /* | ||
61 | * allocate a vector new pages | ||
62 | */ | ||
63 | struct page **ceph_alloc_page_vector(int num_pages, gfp_t flags) | ||
64 | { | ||
65 | struct page **pages; | ||
66 | int i; | ||
67 | |||
68 | pages = kmalloc(sizeof(*pages) * num_pages, flags); | ||
69 | if (!pages) | ||
70 | return ERR_PTR(-ENOMEM); | ||
71 | for (i = 0; i < num_pages; i++) { | ||
72 | pages[i] = __page_cache_alloc(flags); | ||
73 | if (pages[i] == NULL) { | ||
74 | ceph_release_page_vector(pages, i); | ||
75 | return ERR_PTR(-ENOMEM); | ||
76 | } | ||
77 | } | ||
78 | return pages; | ||
79 | } | ||
80 | EXPORT_SYMBOL(ceph_alloc_page_vector); | ||
81 | |||
82 | /* | ||
83 | * copy user data into a page vector | ||
84 | */ | ||
85 | int ceph_copy_user_to_page_vector(struct page **pages, | ||
86 | const char __user *data, | ||
87 | loff_t off, size_t len) | ||
88 | { | ||
89 | int i = 0; | ||
90 | int po = off & ~PAGE_CACHE_MASK; | ||
91 | int left = len; | ||
92 | int l, bad; | ||
93 | |||
94 | while (left > 0) { | ||
95 | l = min_t(int, PAGE_CACHE_SIZE-po, left); | ||
96 | bad = copy_from_user(page_address(pages[i]) + po, data, l); | ||
97 | if (bad == l) | ||
98 | return -EFAULT; | ||
99 | data += l - bad; | ||
100 | left -= l - bad; | ||
101 | po += l - bad; | ||
102 | if (po == PAGE_CACHE_SIZE) { | ||
103 | po = 0; | ||
104 | i++; | ||
105 | } | ||
106 | } | ||
107 | return len; | ||
108 | } | ||
109 | EXPORT_SYMBOL(ceph_copy_user_to_page_vector); | ||
110 | |||
111 | int ceph_copy_to_page_vector(struct page **pages, | ||
112 | const char *data, | ||
113 | loff_t off, size_t len) | ||
114 | { | ||
115 | int i = 0; | ||
116 | size_t po = off & ~PAGE_CACHE_MASK; | ||
117 | size_t left = len; | ||
118 | size_t l; | ||
119 | |||
120 | while (left > 0) { | ||
121 | l = min_t(size_t, PAGE_CACHE_SIZE-po, left); | ||
122 | memcpy(page_address(pages[i]) + po, data, l); | ||
123 | data += l; | ||
124 | left -= l; | ||
125 | po += l; | ||
126 | if (po == PAGE_CACHE_SIZE) { | ||
127 | po = 0; | ||
128 | i++; | ||
129 | } | ||
130 | } | ||
131 | return len; | ||
132 | } | ||
133 | EXPORT_SYMBOL(ceph_copy_to_page_vector); | ||
134 | |||
135 | int ceph_copy_from_page_vector(struct page **pages, | ||
136 | char *data, | ||
137 | loff_t off, size_t len) | ||
138 | { | ||
139 | int i = 0; | ||
140 | size_t po = off & ~PAGE_CACHE_MASK; | ||
141 | size_t left = len; | ||
142 | size_t l; | ||
143 | |||
144 | while (left > 0) { | ||
145 | l = min_t(size_t, PAGE_CACHE_SIZE-po, left); | ||
146 | memcpy(data, page_address(pages[i]) + po, l); | ||
147 | data += l; | ||
148 | left -= l; | ||
149 | po += l; | ||
150 | if (po == PAGE_CACHE_SIZE) { | ||
151 | po = 0; | ||
152 | i++; | ||
153 | } | ||
154 | } | ||
155 | return len; | ||
156 | } | ||
157 | EXPORT_SYMBOL(ceph_copy_from_page_vector); | ||
158 | |||
159 | /* | ||
160 | * copy user data from a page vector into a user pointer | ||
161 | */ | ||
162 | int ceph_copy_page_vector_to_user(struct page **pages, | ||
163 | char __user *data, | ||
164 | loff_t off, size_t len) | ||
165 | { | ||
166 | int i = 0; | ||
167 | int po = off & ~PAGE_CACHE_MASK; | ||
168 | int left = len; | ||
169 | int l, bad; | ||
170 | |||
171 | while (left > 0) { | ||
172 | l = min_t(int, left, PAGE_CACHE_SIZE-po); | ||
173 | bad = copy_to_user(data, page_address(pages[i]) + po, l); | ||
174 | if (bad == l) | ||
175 | return -EFAULT; | ||
176 | data += l - bad; | ||
177 | left -= l - bad; | ||
178 | if (po) { | ||
179 | po += l - bad; | ||
180 | if (po == PAGE_CACHE_SIZE) | ||
181 | po = 0; | ||
182 | } | ||
183 | i++; | ||
184 | } | ||
185 | return len; | ||
186 | } | ||
187 | EXPORT_SYMBOL(ceph_copy_page_vector_to_user); | ||
188 | |||
189 | /* | ||
190 | * Zero an extent within a page vector. Offset is relative to the | ||
191 | * start of the first page. | ||
192 | */ | ||
193 | void ceph_zero_page_vector_range(int off, int len, struct page **pages) | ||
194 | { | ||
195 | int i = off >> PAGE_CACHE_SHIFT; | ||
196 | |||
197 | off &= ~PAGE_CACHE_MASK; | ||
198 | |||
199 | dout("zero_page_vector_page %u~%u\n", off, len); | ||
200 | |||
201 | /* leading partial page? */ | ||
202 | if (off) { | ||
203 | int end = min((int)PAGE_CACHE_SIZE, off + len); | ||
204 | dout("zeroing %d %p head from %d\n", i, pages[i], | ||
205 | (int)off); | ||
206 | zero_user_segment(pages[i], off, end); | ||
207 | len -= (end - off); | ||
208 | i++; | ||
209 | } | ||
210 | while (len >= PAGE_CACHE_SIZE) { | ||
211 | dout("zeroing %d %p len=%d\n", i, pages[i], len); | ||
212 | zero_user_segment(pages[i], 0, PAGE_CACHE_SIZE); | ||
213 | len -= PAGE_CACHE_SIZE; | ||
214 | i++; | ||
215 | } | ||
216 | /* trailing partial page? */ | ||
217 | if (len) { | ||
218 | dout("zeroing %d %p tail to %d\n", i, pages[i], (int)len); | ||
219 | zero_user_segment(pages[i], 0, len); | ||
220 | } | ||
221 | } | ||
222 | EXPORT_SYMBOL(ceph_zero_page_vector_range); | ||
223 | |||