diff options
Diffstat (limited to 'fs/ocfs2/journal.c')
-rw-r--r-- | fs/ocfs2/journal.c | 111 |
1 files changed, 111 insertions, 0 deletions
diff --git a/fs/ocfs2/journal.c b/fs/ocfs2/journal.c index a20a0f1e37fd..4a3b9e6b31ad 100644 --- a/fs/ocfs2/journal.c +++ b/fs/ocfs2/journal.c | |||
@@ -28,6 +28,8 @@ | |||
28 | #include <linux/slab.h> | 28 | #include <linux/slab.h> |
29 | #include <linux/highmem.h> | 29 | #include <linux/highmem.h> |
30 | #include <linux/kthread.h> | 30 | #include <linux/kthread.h> |
31 | #include <linux/time.h> | ||
32 | #include <linux/random.h> | ||
31 | 33 | ||
32 | #define MLOG_MASK_PREFIX ML_JOURNAL | 34 | #define MLOG_MASK_PREFIX ML_JOURNAL |
33 | #include <cluster/masklog.h> | 35 | #include <cluster/masklog.h> |
@@ -52,6 +54,8 @@ | |||
52 | 54 | ||
53 | DEFINE_SPINLOCK(trans_inc_lock); | 55 | DEFINE_SPINLOCK(trans_inc_lock); |
54 | 56 | ||
57 | #define ORPHAN_SCAN_SCHEDULE_TIMEOUT 300000 | ||
58 | |||
55 | static int ocfs2_force_read_journal(struct inode *inode); | 59 | static int ocfs2_force_read_journal(struct inode *inode); |
56 | static int ocfs2_recover_node(struct ocfs2_super *osb, | 60 | static int ocfs2_recover_node(struct ocfs2_super *osb, |
57 | int node_num, int slot_num); | 61 | int node_num, int slot_num); |
@@ -1841,6 +1845,113 @@ bail: | |||
1841 | return status; | 1845 | return status; |
1842 | } | 1846 | } |
1843 | 1847 | ||
1848 | /* | ||
1849 | * Scan timer should get fired every ORPHAN_SCAN_SCHEDULE_TIMEOUT. Add some | ||
1850 | * randomness to the timeout to minimize multple nodes firing the timer at the | ||
1851 | * same time. | ||
1852 | */ | ||
1853 | static inline unsigned long ocfs2_orphan_scan_timeout(void) | ||
1854 | { | ||
1855 | unsigned long time; | ||
1856 | |||
1857 | get_random_bytes(&time, sizeof(time)); | ||
1858 | time = ORPHAN_SCAN_SCHEDULE_TIMEOUT + (time % 5000); | ||
1859 | return msecs_to_jiffies(time); | ||
1860 | } | ||
1861 | |||
1862 | /* | ||
1863 | * ocfs2_queue_orphan_scan calls ocfs2_queue_recovery_completion for | ||
1864 | * every slot, queuing a recovery of the slot on the ocfs2_wq thread. This | ||
1865 | * is done to catch any orphans that are left over in orphan directories. | ||
1866 | * | ||
1867 | * ocfs2_queue_orphan_scan gets called every ORPHAN_SCAN_SCHEDULE_TIMEOUT | ||
1868 | * seconds. It gets an EX lock on os_lockres and checks sequence number | ||
1869 | * stored in LVB. If the sequence number has changed, it means some other | ||
1870 | * node has done the scan. This node skips the scan and tracks the | ||
1871 | * sequence number. If the sequence number didn't change, it means a scan | ||
1872 | * hasn't happened. The node queues a scan and increments the | ||
1873 | * sequence number in the LVB. | ||
1874 | */ | ||
1875 | void ocfs2_queue_orphan_scan(struct ocfs2_super *osb) | ||
1876 | { | ||
1877 | struct ocfs2_orphan_scan *os; | ||
1878 | int status, i; | ||
1879 | u32 seqno = 0; | ||
1880 | |||
1881 | os = &osb->osb_orphan_scan; | ||
1882 | |||
1883 | status = ocfs2_orphan_scan_lock(osb, &seqno, DLM_LOCK_EX); | ||
1884 | if (status < 0) { | ||
1885 | if (status != -EAGAIN) | ||
1886 | mlog_errno(status); | ||
1887 | goto out; | ||
1888 | } | ||
1889 | |||
1890 | if (os->os_seqno != seqno) { | ||
1891 | os->os_seqno = seqno; | ||
1892 | goto unlock; | ||
1893 | } | ||
1894 | |||
1895 | for (i = 0; i < osb->max_slots; i++) | ||
1896 | ocfs2_queue_recovery_completion(osb->journal, i, NULL, NULL, | ||
1897 | NULL); | ||
1898 | /* | ||
1899 | * We queued a recovery on orphan slots, increment the sequence | ||
1900 | * number and update LVB so other node will skip the scan for a while | ||
1901 | */ | ||
1902 | seqno++; | ||
1903 | os->os_count++; | ||
1904 | os->os_scantime = CURRENT_TIME; | ||
1905 | unlock: | ||
1906 | ocfs2_orphan_scan_unlock(osb, seqno, DLM_LOCK_EX); | ||
1907 | out: | ||
1908 | return; | ||
1909 | } | ||
1910 | |||
1911 | /* Worker task that gets fired every ORPHAN_SCAN_SCHEDULE_TIMEOUT millsec */ | ||
1912 | void ocfs2_orphan_scan_work(struct work_struct *work) | ||
1913 | { | ||
1914 | struct ocfs2_orphan_scan *os; | ||
1915 | struct ocfs2_super *osb; | ||
1916 | |||
1917 | os = container_of(work, struct ocfs2_orphan_scan, | ||
1918 | os_orphan_scan_work.work); | ||
1919 | osb = os->os_osb; | ||
1920 | |||
1921 | mutex_lock(&os->os_lock); | ||
1922 | ocfs2_queue_orphan_scan(osb); | ||
1923 | schedule_delayed_work(&os->os_orphan_scan_work, | ||
1924 | ocfs2_orphan_scan_timeout()); | ||
1925 | mutex_unlock(&os->os_lock); | ||
1926 | } | ||
1927 | |||
1928 | void ocfs2_orphan_scan_stop(struct ocfs2_super *osb) | ||
1929 | { | ||
1930 | struct ocfs2_orphan_scan *os; | ||
1931 | |||
1932 | os = &osb->osb_orphan_scan; | ||
1933 | mutex_lock(&os->os_lock); | ||
1934 | cancel_delayed_work(&os->os_orphan_scan_work); | ||
1935 | mutex_unlock(&os->os_lock); | ||
1936 | } | ||
1937 | |||
1938 | int ocfs2_orphan_scan_init(struct ocfs2_super *osb) | ||
1939 | { | ||
1940 | struct ocfs2_orphan_scan *os; | ||
1941 | |||
1942 | os = &osb->osb_orphan_scan; | ||
1943 | os->os_osb = osb; | ||
1944 | os->os_count = 0; | ||
1945 | os->os_scantime = CURRENT_TIME; | ||
1946 | mutex_init(&os->os_lock); | ||
1947 | |||
1948 | INIT_DELAYED_WORK(&os->os_orphan_scan_work, | ||
1949 | ocfs2_orphan_scan_work); | ||
1950 | schedule_delayed_work(&os->os_orphan_scan_work, | ||
1951 | ocfs2_orphan_scan_timeout()); | ||
1952 | return 0; | ||
1953 | } | ||
1954 | |||
1844 | struct ocfs2_orphan_filldir_priv { | 1955 | struct ocfs2_orphan_filldir_priv { |
1845 | struct inode *head; | 1956 | struct inode *head; |
1846 | struct ocfs2_super *osb; | 1957 | struct ocfs2_super *osb; |