diff options
Diffstat (limited to 'fs/xfs/linux-2.6/xfs_buf.c')
-rw-r--r-- | fs/xfs/linux-2.6/xfs_buf.c | 117 |
1 files changed, 59 insertions, 58 deletions
diff --git a/fs/xfs/linux-2.6/xfs_buf.c b/fs/xfs/linux-2.6/xfs_buf.c index df0cba239dd5..655bf4a78afe 100644 --- a/fs/xfs/linux-2.6/xfs_buf.c +++ b/fs/xfs/linux-2.6/xfs_buf.c | |||
@@ -1,5 +1,5 @@ | |||
1 | /* | 1 | /* |
2 | * Copyright (c) 2000-2004 Silicon Graphics, Inc. All Rights Reserved. | 2 | * Copyright (c) 2000-2005 Silicon Graphics, Inc. All Rights Reserved. |
3 | * | 3 | * |
4 | * This program is free software; you can redistribute it and/or modify it | 4 | * This program is free software; you can redistribute it and/or modify it |
5 | * under the terms of version 2 of the GNU General Public License as | 5 | * under the terms of version 2 of the GNU General Public License as |
@@ -54,6 +54,7 @@ | |||
54 | #include <linux/percpu.h> | 54 | #include <linux/percpu.h> |
55 | #include <linux/blkdev.h> | 55 | #include <linux/blkdev.h> |
56 | #include <linux/hash.h> | 56 | #include <linux/hash.h> |
57 | #include <linux/kthread.h> | ||
57 | 58 | ||
58 | #include "xfs_linux.h" | 59 | #include "xfs_linux.h" |
59 | 60 | ||
@@ -67,7 +68,7 @@ STATIC int xfsbufd_wakeup(int, unsigned int); | |||
67 | STATIC void pagebuf_delwri_queue(xfs_buf_t *, int); | 68 | STATIC void pagebuf_delwri_queue(xfs_buf_t *, int); |
68 | 69 | ||
69 | STATIC struct workqueue_struct *xfslogd_workqueue; | 70 | STATIC struct workqueue_struct *xfslogd_workqueue; |
70 | STATIC struct workqueue_struct *xfsdatad_workqueue; | 71 | struct workqueue_struct *xfsdatad_workqueue; |
71 | 72 | ||
72 | /* | 73 | /* |
73 | * Pagebuf debugging | 74 | * Pagebuf debugging |
@@ -590,8 +591,10 @@ found: | |||
590 | PB_SET_OWNER(pb); | 591 | PB_SET_OWNER(pb); |
591 | } | 592 | } |
592 | 593 | ||
593 | if (pb->pb_flags & PBF_STALE) | 594 | if (pb->pb_flags & PBF_STALE) { |
595 | ASSERT((pb->pb_flags & _PBF_DELWRI_Q) == 0); | ||
594 | pb->pb_flags &= PBF_MAPPED; | 596 | pb->pb_flags &= PBF_MAPPED; |
597 | } | ||
595 | PB_TRACE(pb, "got_lock", 0); | 598 | PB_TRACE(pb, "got_lock", 0); |
596 | XFS_STATS_INC(pb_get_locked); | 599 | XFS_STATS_INC(pb_get_locked); |
597 | return (pb); | 600 | return (pb); |
@@ -700,25 +703,6 @@ xfs_buf_read_flags( | |||
700 | } | 703 | } |
701 | 704 | ||
702 | /* | 705 | /* |
703 | * Create a skeletal pagebuf (no pages associated with it). | ||
704 | */ | ||
705 | xfs_buf_t * | ||
706 | pagebuf_lookup( | ||
707 | xfs_buftarg_t *target, | ||
708 | loff_t ioff, | ||
709 | size_t isize, | ||
710 | page_buf_flags_t flags) | ||
711 | { | ||
712 | xfs_buf_t *pb; | ||
713 | |||
714 | pb = pagebuf_allocate(flags); | ||
715 | if (pb) { | ||
716 | _pagebuf_initialize(pb, target, ioff, isize, flags); | ||
717 | } | ||
718 | return pb; | ||
719 | } | ||
720 | |||
721 | /* | ||
722 | * If we are not low on memory then do the readahead in a deadlock | 706 | * If we are not low on memory then do the readahead in a deadlock |
723 | * safe manner. | 707 | * safe manner. |
724 | */ | 708 | */ |
@@ -913,22 +897,23 @@ pagebuf_rele( | |||
913 | do_free = 0; | 897 | do_free = 0; |
914 | } | 898 | } |
915 | 899 | ||
916 | if (pb->pb_flags & PBF_DELWRI) { | 900 | if (pb->pb_flags & PBF_FS_MANAGED) { |
917 | pb->pb_flags |= PBF_ASYNC; | ||
918 | atomic_inc(&pb->pb_hold); | ||
919 | pagebuf_delwri_queue(pb, 0); | ||
920 | do_free = 0; | ||
921 | } else if (pb->pb_flags & PBF_FS_MANAGED) { | ||
922 | do_free = 0; | 901 | do_free = 0; |
923 | } | 902 | } |
924 | 903 | ||
925 | if (do_free) { | 904 | if (do_free) { |
905 | ASSERT((pb->pb_flags & (PBF_DELWRI|_PBF_DELWRI_Q)) == 0); | ||
926 | list_del_init(&pb->pb_hash_list); | 906 | list_del_init(&pb->pb_hash_list); |
927 | spin_unlock(&hash->bh_lock); | 907 | spin_unlock(&hash->bh_lock); |
928 | pagebuf_free(pb); | 908 | pagebuf_free(pb); |
929 | } else { | 909 | } else { |
930 | spin_unlock(&hash->bh_lock); | 910 | spin_unlock(&hash->bh_lock); |
931 | } | 911 | } |
912 | } else { | ||
913 | /* | ||
914 | * Catch reference count leaks | ||
915 | */ | ||
916 | ASSERT(atomic_read(&pb->pb_hold) >= 0); | ||
932 | } | 917 | } |
933 | } | 918 | } |
934 | 919 | ||
@@ -1006,13 +991,24 @@ pagebuf_lock( | |||
1006 | * pagebuf_unlock | 991 | * pagebuf_unlock |
1007 | * | 992 | * |
1008 | * pagebuf_unlock releases the lock on the buffer object created by | 993 | * pagebuf_unlock releases the lock on the buffer object created by |
1009 | * pagebuf_lock or pagebuf_cond_lock (not any | 994 | * pagebuf_lock or pagebuf_cond_lock (not any pinning of underlying pages |
1010 | * pinning of underlying pages created by pagebuf_pin). | 995 | * created by pagebuf_pin). |
996 | * | ||
997 | * If the buffer is marked delwri but is not queued, do so before we | ||
998 | * unlock the buffer as we need to set flags correctly. We also need to | ||
999 | * take a reference for the delwri queue because the unlocker is going to | ||
1000 | * drop their's and they don't know we just queued it. | ||
1011 | */ | 1001 | */ |
1012 | void | 1002 | void |
1013 | pagebuf_unlock( /* unlock buffer */ | 1003 | pagebuf_unlock( /* unlock buffer */ |
1014 | xfs_buf_t *pb) /* buffer to unlock */ | 1004 | xfs_buf_t *pb) /* buffer to unlock */ |
1015 | { | 1005 | { |
1006 | if ((pb->pb_flags & (PBF_DELWRI|_PBF_DELWRI_Q)) == PBF_DELWRI) { | ||
1007 | atomic_inc(&pb->pb_hold); | ||
1008 | pb->pb_flags |= PBF_ASYNC; | ||
1009 | pagebuf_delwri_queue(pb, 0); | ||
1010 | } | ||
1011 | |||
1016 | PB_CLEAR_OWNER(pb); | 1012 | PB_CLEAR_OWNER(pb); |
1017 | up(&pb->pb_sema); | 1013 | up(&pb->pb_sema); |
1018 | PB_TRACE(pb, "unlock", 0); | 1014 | PB_TRACE(pb, "unlock", 0); |
@@ -1249,8 +1245,8 @@ bio_end_io_pagebuf( | |||
1249 | int error) | 1245 | int error) |
1250 | { | 1246 | { |
1251 | xfs_buf_t *pb = (xfs_buf_t *)bio->bi_private; | 1247 | xfs_buf_t *pb = (xfs_buf_t *)bio->bi_private; |
1252 | unsigned int i, blocksize = pb->pb_target->pbr_bsize; | 1248 | unsigned int blocksize = pb->pb_target->pbr_bsize; |
1253 | struct bio_vec *bvec = bio->bi_io_vec; | 1249 | struct bio_vec *bvec = bio->bi_io_vec + bio->bi_vcnt - 1; |
1254 | 1250 | ||
1255 | if (bio->bi_size) | 1251 | if (bio->bi_size) |
1256 | return 1; | 1252 | return 1; |
@@ -1258,10 +1254,12 @@ bio_end_io_pagebuf( | |||
1258 | if (!test_bit(BIO_UPTODATE, &bio->bi_flags)) | 1254 | if (!test_bit(BIO_UPTODATE, &bio->bi_flags)) |
1259 | pb->pb_error = EIO; | 1255 | pb->pb_error = EIO; |
1260 | 1256 | ||
1261 | for (i = 0; i < bio->bi_vcnt; i++, bvec++) { | 1257 | do { |
1262 | struct page *page = bvec->bv_page; | 1258 | struct page *page = bvec->bv_page; |
1263 | 1259 | ||
1264 | if (pb->pb_error) { | 1260 | if (unlikely(pb->pb_error)) { |
1261 | if (pb->pb_flags & PBF_READ) | ||
1262 | ClearPageUptodate(page); | ||
1265 | SetPageError(page); | 1263 | SetPageError(page); |
1266 | } else if (blocksize == PAGE_CACHE_SIZE) { | 1264 | } else if (blocksize == PAGE_CACHE_SIZE) { |
1267 | SetPageUptodate(page); | 1265 | SetPageUptodate(page); |
@@ -1270,10 +1268,13 @@ bio_end_io_pagebuf( | |||
1270 | set_page_region(page, bvec->bv_offset, bvec->bv_len); | 1268 | set_page_region(page, bvec->bv_offset, bvec->bv_len); |
1271 | } | 1269 | } |
1272 | 1270 | ||
1271 | if (--bvec >= bio->bi_io_vec) | ||
1272 | prefetchw(&bvec->bv_page->flags); | ||
1273 | |||
1273 | if (_pagebuf_iolocked(pb)) { | 1274 | if (_pagebuf_iolocked(pb)) { |
1274 | unlock_page(page); | 1275 | unlock_page(page); |
1275 | } | 1276 | } |
1276 | } | 1277 | } while (bvec >= bio->bi_io_vec); |
1277 | 1278 | ||
1278 | _pagebuf_iodone(pb, 1); | 1279 | _pagebuf_iodone(pb, 1); |
1279 | bio_put(bio); | 1280 | bio_put(bio); |
@@ -1511,6 +1512,11 @@ again: | |||
1511 | ASSERT(btp == bp->pb_target); | 1512 | ASSERT(btp == bp->pb_target); |
1512 | if (!(bp->pb_flags & PBF_FS_MANAGED)) { | 1513 | if (!(bp->pb_flags & PBF_FS_MANAGED)) { |
1513 | spin_unlock(&hash->bh_lock); | 1514 | spin_unlock(&hash->bh_lock); |
1515 | /* | ||
1516 | * Catch superblock reference count leaks | ||
1517 | * immediately | ||
1518 | */ | ||
1519 | BUG_ON(bp->pb_bn == 0); | ||
1514 | delay(100); | 1520 | delay(100); |
1515 | goto again; | 1521 | goto again; |
1516 | } | 1522 | } |
@@ -1686,17 +1692,20 @@ pagebuf_delwri_queue( | |||
1686 | int unlock) | 1692 | int unlock) |
1687 | { | 1693 | { |
1688 | PB_TRACE(pb, "delwri_q", (long)unlock); | 1694 | PB_TRACE(pb, "delwri_q", (long)unlock); |
1689 | ASSERT(pb->pb_flags & PBF_DELWRI); | 1695 | ASSERT((pb->pb_flags & (PBF_DELWRI|PBF_ASYNC)) == |
1696 | (PBF_DELWRI|PBF_ASYNC)); | ||
1690 | 1697 | ||
1691 | spin_lock(&pbd_delwrite_lock); | 1698 | spin_lock(&pbd_delwrite_lock); |
1692 | /* If already in the queue, dequeue and place at tail */ | 1699 | /* If already in the queue, dequeue and place at tail */ |
1693 | if (!list_empty(&pb->pb_list)) { | 1700 | if (!list_empty(&pb->pb_list)) { |
1701 | ASSERT(pb->pb_flags & _PBF_DELWRI_Q); | ||
1694 | if (unlock) { | 1702 | if (unlock) { |
1695 | atomic_dec(&pb->pb_hold); | 1703 | atomic_dec(&pb->pb_hold); |
1696 | } | 1704 | } |
1697 | list_del(&pb->pb_list); | 1705 | list_del(&pb->pb_list); |
1698 | } | 1706 | } |
1699 | 1707 | ||
1708 | pb->pb_flags |= _PBF_DELWRI_Q; | ||
1700 | list_add_tail(&pb->pb_list, &pbd_delwrite_queue); | 1709 | list_add_tail(&pb->pb_list, &pbd_delwrite_queue); |
1701 | pb->pb_queuetime = jiffies; | 1710 | pb->pb_queuetime = jiffies; |
1702 | spin_unlock(&pbd_delwrite_lock); | 1711 | spin_unlock(&pbd_delwrite_lock); |
@@ -1713,10 +1722,11 @@ pagebuf_delwri_dequeue( | |||
1713 | 1722 | ||
1714 | spin_lock(&pbd_delwrite_lock); | 1723 | spin_lock(&pbd_delwrite_lock); |
1715 | if ((pb->pb_flags & PBF_DELWRI) && !list_empty(&pb->pb_list)) { | 1724 | if ((pb->pb_flags & PBF_DELWRI) && !list_empty(&pb->pb_list)) { |
1725 | ASSERT(pb->pb_flags & _PBF_DELWRI_Q); | ||
1716 | list_del_init(&pb->pb_list); | 1726 | list_del_init(&pb->pb_list); |
1717 | dequeued = 1; | 1727 | dequeued = 1; |
1718 | } | 1728 | } |
1719 | pb->pb_flags &= ~PBF_DELWRI; | 1729 | pb->pb_flags &= ~(PBF_DELWRI|_PBF_DELWRI_Q); |
1720 | spin_unlock(&pbd_delwrite_lock); | 1730 | spin_unlock(&pbd_delwrite_lock); |
1721 | 1731 | ||
1722 | if (dequeued) | 1732 | if (dequeued) |
@@ -1733,9 +1743,7 @@ pagebuf_runall_queues( | |||
1733 | } | 1743 | } |
1734 | 1744 | ||
1735 | /* Defines for pagebuf daemon */ | 1745 | /* Defines for pagebuf daemon */ |
1736 | STATIC DECLARE_COMPLETION(xfsbufd_done); | ||
1737 | STATIC struct task_struct *xfsbufd_task; | 1746 | STATIC struct task_struct *xfsbufd_task; |
1738 | STATIC int xfsbufd_active; | ||
1739 | STATIC int xfsbufd_force_flush; | 1747 | STATIC int xfsbufd_force_flush; |
1740 | STATIC int xfsbufd_force_sleep; | 1748 | STATIC int xfsbufd_force_sleep; |
1741 | 1749 | ||
@@ -1761,14 +1769,8 @@ xfsbufd( | |||
1761 | xfs_buftarg_t *target; | 1769 | xfs_buftarg_t *target; |
1762 | xfs_buf_t *pb, *n; | 1770 | xfs_buf_t *pb, *n; |
1763 | 1771 | ||
1764 | /* Set up the thread */ | ||
1765 | daemonize("xfsbufd"); | ||
1766 | current->flags |= PF_MEMALLOC; | 1772 | current->flags |= PF_MEMALLOC; |
1767 | 1773 | ||
1768 | xfsbufd_task = current; | ||
1769 | xfsbufd_active = 1; | ||
1770 | barrier(); | ||
1771 | |||
1772 | INIT_LIST_HEAD(&tmp); | 1774 | INIT_LIST_HEAD(&tmp); |
1773 | do { | 1775 | do { |
1774 | if (unlikely(freezing(current))) { | 1776 | if (unlikely(freezing(current))) { |
@@ -1795,7 +1797,7 @@ xfsbufd( | |||
1795 | break; | 1797 | break; |
1796 | } | 1798 | } |
1797 | 1799 | ||
1798 | pb->pb_flags &= ~PBF_DELWRI; | 1800 | pb->pb_flags &= ~(PBF_DELWRI|_PBF_DELWRI_Q); |
1799 | pb->pb_flags |= PBF_WRITE; | 1801 | pb->pb_flags |= PBF_WRITE; |
1800 | list_move(&pb->pb_list, &tmp); | 1802 | list_move(&pb->pb_list, &tmp); |
1801 | } | 1803 | } |
@@ -1816,9 +1818,9 @@ xfsbufd( | |||
1816 | purge_addresses(); | 1818 | purge_addresses(); |
1817 | 1819 | ||
1818 | xfsbufd_force_flush = 0; | 1820 | xfsbufd_force_flush = 0; |
1819 | } while (xfsbufd_active); | 1821 | } while (!kthread_should_stop()); |
1820 | 1822 | ||
1821 | complete_and_exit(&xfsbufd_done, 0); | 1823 | return 0; |
1822 | } | 1824 | } |
1823 | 1825 | ||
1824 | /* | 1826 | /* |
@@ -1845,15 +1847,13 @@ xfs_flush_buftarg( | |||
1845 | if (pb->pb_target != target) | 1847 | if (pb->pb_target != target) |
1846 | continue; | 1848 | continue; |
1847 | 1849 | ||
1848 | ASSERT(pb->pb_flags & PBF_DELWRI); | 1850 | ASSERT(pb->pb_flags & (PBF_DELWRI|_PBF_DELWRI_Q)); |
1849 | PB_TRACE(pb, "walkq2", (long)pagebuf_ispin(pb)); | 1851 | PB_TRACE(pb, "walkq2", (long)pagebuf_ispin(pb)); |
1850 | if (pagebuf_ispin(pb)) { | 1852 | if (pagebuf_ispin(pb)) { |
1851 | pincount++; | 1853 | pincount++; |
1852 | continue; | 1854 | continue; |
1853 | } | 1855 | } |
1854 | 1856 | ||
1855 | pb->pb_flags &= ~PBF_DELWRI; | ||
1856 | pb->pb_flags |= PBF_WRITE; | ||
1857 | list_move(&pb->pb_list, &tmp); | 1857 | list_move(&pb->pb_list, &tmp); |
1858 | } | 1858 | } |
1859 | spin_unlock(&pbd_delwrite_lock); | 1859 | spin_unlock(&pbd_delwrite_lock); |
@@ -1862,12 +1862,14 @@ xfs_flush_buftarg( | |||
1862 | * Dropped the delayed write list lock, now walk the temporary list | 1862 | * Dropped the delayed write list lock, now walk the temporary list |
1863 | */ | 1863 | */ |
1864 | list_for_each_entry_safe(pb, n, &tmp, pb_list) { | 1864 | list_for_each_entry_safe(pb, n, &tmp, pb_list) { |
1865 | pagebuf_lock(pb); | ||
1866 | pb->pb_flags &= ~(PBF_DELWRI|_PBF_DELWRI_Q); | ||
1867 | pb->pb_flags |= PBF_WRITE; | ||
1865 | if (wait) | 1868 | if (wait) |
1866 | pb->pb_flags &= ~PBF_ASYNC; | 1869 | pb->pb_flags &= ~PBF_ASYNC; |
1867 | else | 1870 | else |
1868 | list_del_init(&pb->pb_list); | 1871 | list_del_init(&pb->pb_list); |
1869 | 1872 | ||
1870 | pagebuf_lock(pb); | ||
1871 | pagebuf_iostrategy(pb); | 1873 | pagebuf_iostrategy(pb); |
1872 | } | 1874 | } |
1873 | 1875 | ||
@@ -1901,9 +1903,11 @@ xfs_buf_daemons_start(void) | |||
1901 | if (!xfsdatad_workqueue) | 1903 | if (!xfsdatad_workqueue) |
1902 | goto out_destroy_xfslogd_workqueue; | 1904 | goto out_destroy_xfslogd_workqueue; |
1903 | 1905 | ||
1904 | error = kernel_thread(xfsbufd, NULL, CLONE_FS|CLONE_FILES); | 1906 | xfsbufd_task = kthread_run(xfsbufd, NULL, "xfsbufd"); |
1905 | if (error < 0) | 1907 | if (IS_ERR(xfsbufd_task)) { |
1908 | error = PTR_ERR(xfsbufd_task); | ||
1906 | goto out_destroy_xfsdatad_workqueue; | 1909 | goto out_destroy_xfsdatad_workqueue; |
1910 | } | ||
1907 | return 0; | 1911 | return 0; |
1908 | 1912 | ||
1909 | out_destroy_xfsdatad_workqueue: | 1913 | out_destroy_xfsdatad_workqueue: |
@@ -1920,10 +1924,7 @@ xfs_buf_daemons_start(void) | |||
1920 | STATIC void | 1924 | STATIC void |
1921 | xfs_buf_daemons_stop(void) | 1925 | xfs_buf_daemons_stop(void) |
1922 | { | 1926 | { |
1923 | xfsbufd_active = 0; | 1927 | kthread_stop(xfsbufd_task); |
1924 | barrier(); | ||
1925 | wait_for_completion(&xfsbufd_done); | ||
1926 | |||
1927 | destroy_workqueue(xfslogd_workqueue); | 1928 | destroy_workqueue(xfslogd_workqueue); |
1928 | destroy_workqueue(xfsdatad_workqueue); | 1929 | destroy_workqueue(xfsdatad_workqueue); |
1929 | } | 1930 | } |