diff options
Diffstat (limited to 'fs/xfs/xfs_super.c')
-rw-r--r-- | fs/xfs/xfs_super.c | 1773 |
1 files changed, 1773 insertions, 0 deletions
diff --git a/fs/xfs/xfs_super.c b/fs/xfs/xfs_super.c new file mode 100644 index 000000000000..9a72dda58bd0 --- /dev/null +++ b/fs/xfs/xfs_super.c | |||
@@ -0,0 +1,1773 @@ | |||
1 | /* | ||
2 | * Copyright (c) 2000-2006 Silicon Graphics, Inc. | ||
3 | * All Rights Reserved. | ||
4 | * | ||
5 | * This program is free software; you can redistribute it and/or | ||
6 | * modify it under the terms of the GNU General Public License as | ||
7 | * published by the Free Software Foundation. | ||
8 | * | ||
9 | * This program is distributed in the hope that it would be useful, | ||
10 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
11 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | ||
12 | * GNU General Public License for more details. | ||
13 | * | ||
14 | * You should have received a copy of the GNU General Public License | ||
15 | * along with this program; if not, write the Free Software Foundation, | ||
16 | * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA | ||
17 | */ | ||
18 | |||
19 | #include "xfs.h" | ||
20 | #include "xfs_bit.h" | ||
21 | #include "xfs_log.h" | ||
22 | #include "xfs_inum.h" | ||
23 | #include "xfs_trans.h" | ||
24 | #include "xfs_sb.h" | ||
25 | #include "xfs_ag.h" | ||
26 | #include "xfs_dir2.h" | ||
27 | #include "xfs_alloc.h" | ||
28 | #include "xfs_quota.h" | ||
29 | #include "xfs_mount.h" | ||
30 | #include "xfs_bmap_btree.h" | ||
31 | #include "xfs_alloc_btree.h" | ||
32 | #include "xfs_ialloc_btree.h" | ||
33 | #include "xfs_dinode.h" | ||
34 | #include "xfs_inode.h" | ||
35 | #include "xfs_btree.h" | ||
36 | #include "xfs_ialloc.h" | ||
37 | #include "xfs_bmap.h" | ||
38 | #include "xfs_rtalloc.h" | ||
39 | #include "xfs_error.h" | ||
40 | #include "xfs_itable.h" | ||
41 | #include "xfs_fsops.h" | ||
42 | #include "xfs_attr.h" | ||
43 | #include "xfs_buf_item.h" | ||
44 | #include "xfs_utils.h" | ||
45 | #include "xfs_vnodeops.h" | ||
46 | #include "xfs_log_priv.h" | ||
47 | #include "xfs_trans_priv.h" | ||
48 | #include "xfs_filestream.h" | ||
49 | #include "xfs_da_btree.h" | ||
50 | #include "xfs_extfree_item.h" | ||
51 | #include "xfs_mru_cache.h" | ||
52 | #include "xfs_inode_item.h" | ||
53 | #include "xfs_sync.h" | ||
54 | #include "xfs_trace.h" | ||
55 | |||
56 | #include <linux/namei.h> | ||
57 | #include <linux/init.h> | ||
58 | #include <linux/slab.h> | ||
59 | #include <linux/mount.h> | ||
60 | #include <linux/mempool.h> | ||
61 | #include <linux/writeback.h> | ||
62 | #include <linux/kthread.h> | ||
63 | #include <linux/freezer.h> | ||
64 | #include <linux/parser.h> | ||
65 | |||
66 | static const struct super_operations xfs_super_operations; | ||
67 | static kmem_zone_t *xfs_ioend_zone; | ||
68 | mempool_t *xfs_ioend_pool; | ||
69 | |||
70 | #define MNTOPT_LOGBUFS "logbufs" /* number of XFS log buffers */ | ||
71 | #define MNTOPT_LOGBSIZE "logbsize" /* size of XFS log buffers */ | ||
72 | #define MNTOPT_LOGDEV "logdev" /* log device */ | ||
73 | #define MNTOPT_RTDEV "rtdev" /* realtime I/O device */ | ||
74 | #define MNTOPT_BIOSIZE "biosize" /* log2 of preferred buffered io size */ | ||
75 | #define MNTOPT_WSYNC "wsync" /* safe-mode nfs compatible mount */ | ||
76 | #define MNTOPT_NOALIGN "noalign" /* turn off stripe alignment */ | ||
77 | #define MNTOPT_SWALLOC "swalloc" /* turn on stripe width allocation */ | ||
78 | #define MNTOPT_SUNIT "sunit" /* data volume stripe unit */ | ||
79 | #define MNTOPT_SWIDTH "swidth" /* data volume stripe width */ | ||
80 | #define MNTOPT_NOUUID "nouuid" /* ignore filesystem UUID */ | ||
81 | #define MNTOPT_MTPT "mtpt" /* filesystem mount point */ | ||
82 | #define MNTOPT_GRPID "grpid" /* group-ID from parent directory */ | ||
83 | #define MNTOPT_NOGRPID "nogrpid" /* group-ID from current process */ | ||
84 | #define MNTOPT_BSDGROUPS "bsdgroups" /* group-ID from parent directory */ | ||
85 | #define MNTOPT_SYSVGROUPS "sysvgroups" /* group-ID from current process */ | ||
86 | #define MNTOPT_ALLOCSIZE "allocsize" /* preferred allocation size */ | ||
87 | #define MNTOPT_NORECOVERY "norecovery" /* don't run XFS recovery */ | ||
88 | #define MNTOPT_BARRIER "barrier" /* use writer barriers for log write and | ||
89 | * unwritten extent conversion */ | ||
90 | #define MNTOPT_NOBARRIER "nobarrier" /* .. disable */ | ||
91 | #define MNTOPT_64BITINODE "inode64" /* inodes can be allocated anywhere */ | ||
92 | #define MNTOPT_IKEEP "ikeep" /* do not free empty inode clusters */ | ||
93 | #define MNTOPT_NOIKEEP "noikeep" /* free empty inode clusters */ | ||
94 | #define MNTOPT_LARGEIO "largeio" /* report large I/O sizes in stat() */ | ||
95 | #define MNTOPT_NOLARGEIO "nolargeio" /* do not report large I/O sizes | ||
96 | * in stat(). */ | ||
97 | #define MNTOPT_ATTR2 "attr2" /* do use attr2 attribute format */ | ||
98 | #define MNTOPT_NOATTR2 "noattr2" /* do not use attr2 attribute format */ | ||
99 | #define MNTOPT_FILESTREAM "filestreams" /* use filestreams allocator */ | ||
100 | #define MNTOPT_QUOTA "quota" /* disk quotas (user) */ | ||
101 | #define MNTOPT_NOQUOTA "noquota" /* no quotas */ | ||
102 | #define MNTOPT_USRQUOTA "usrquota" /* user quota enabled */ | ||
103 | #define MNTOPT_GRPQUOTA "grpquota" /* group quota enabled */ | ||
104 | #define MNTOPT_PRJQUOTA "prjquota" /* project quota enabled */ | ||
105 | #define MNTOPT_UQUOTA "uquota" /* user quota (IRIX variant) */ | ||
106 | #define MNTOPT_GQUOTA "gquota" /* group quota (IRIX variant) */ | ||
107 | #define MNTOPT_PQUOTA "pquota" /* project quota (IRIX variant) */ | ||
108 | #define MNTOPT_UQUOTANOENF "uqnoenforce"/* user quota limit enforcement */ | ||
109 | #define MNTOPT_GQUOTANOENF "gqnoenforce"/* group quota limit enforcement */ | ||
110 | #define MNTOPT_PQUOTANOENF "pqnoenforce"/* project quota limit enforcement */ | ||
111 | #define MNTOPT_QUOTANOENF "qnoenforce" /* same as uqnoenforce */ | ||
112 | #define MNTOPT_DELAYLOG "delaylog" /* Delayed logging enabled */ | ||
113 | #define MNTOPT_NODELAYLOG "nodelaylog" /* Delayed logging disabled */ | ||
114 | #define MNTOPT_DISCARD "discard" /* Discard unused blocks */ | ||
115 | #define MNTOPT_NODISCARD "nodiscard" /* Do not discard unused blocks */ | ||
116 | |||
117 | /* | ||
118 | * Table driven mount option parser. | ||
119 | * | ||
120 | * Currently only used for remount, but it will be used for mount | ||
121 | * in the future, too. | ||
122 | */ | ||
123 | enum { | ||
124 | Opt_barrier, Opt_nobarrier, Opt_err | ||
125 | }; | ||
126 | |||
127 | static const match_table_t tokens = { | ||
128 | {Opt_barrier, "barrier"}, | ||
129 | {Opt_nobarrier, "nobarrier"}, | ||
130 | {Opt_err, NULL} | ||
131 | }; | ||
132 | |||
133 | |||
134 | STATIC unsigned long | ||
135 | suffix_strtoul(char *s, char **endp, unsigned int base) | ||
136 | { | ||
137 | int last, shift_left_factor = 0; | ||
138 | char *value = s; | ||
139 | |||
140 | last = strlen(value) - 1; | ||
141 | if (value[last] == 'K' || value[last] == 'k') { | ||
142 | shift_left_factor = 10; | ||
143 | value[last] = '\0'; | ||
144 | } | ||
145 | if (value[last] == 'M' || value[last] == 'm') { | ||
146 | shift_left_factor = 20; | ||
147 | value[last] = '\0'; | ||
148 | } | ||
149 | if (value[last] == 'G' || value[last] == 'g') { | ||
150 | shift_left_factor = 30; | ||
151 | value[last] = '\0'; | ||
152 | } | ||
153 | |||
154 | return simple_strtoul((const char *)s, endp, base) << shift_left_factor; | ||
155 | } | ||
156 | |||
157 | /* | ||
158 | * This function fills in xfs_mount_t fields based on mount args. | ||
159 | * Note: the superblock has _not_ yet been read in. | ||
160 | * | ||
161 | * Note that this function leaks the various device name allocations on | ||
162 | * failure. The caller takes care of them. | ||
163 | */ | ||
164 | STATIC int | ||
165 | xfs_parseargs( | ||
166 | struct xfs_mount *mp, | ||
167 | char *options) | ||
168 | { | ||
169 | struct super_block *sb = mp->m_super; | ||
170 | char *this_char, *value, *eov; | ||
171 | int dsunit = 0; | ||
172 | int dswidth = 0; | ||
173 | int iosize = 0; | ||
174 | __uint8_t iosizelog = 0; | ||
175 | |||
176 | /* | ||
177 | * set up the mount name first so all the errors will refer to the | ||
178 | * correct device. | ||
179 | */ | ||
180 | mp->m_fsname = kstrndup(sb->s_id, MAXNAMELEN, GFP_KERNEL); | ||
181 | if (!mp->m_fsname) | ||
182 | return ENOMEM; | ||
183 | mp->m_fsname_len = strlen(mp->m_fsname) + 1; | ||
184 | |||
185 | /* | ||
186 | * Copy binary VFS mount flags we are interested in. | ||
187 | */ | ||
188 | if (sb->s_flags & MS_RDONLY) | ||
189 | mp->m_flags |= XFS_MOUNT_RDONLY; | ||
190 | if (sb->s_flags & MS_DIRSYNC) | ||
191 | mp->m_flags |= XFS_MOUNT_DIRSYNC; | ||
192 | if (sb->s_flags & MS_SYNCHRONOUS) | ||
193 | mp->m_flags |= XFS_MOUNT_WSYNC; | ||
194 | |||
195 | /* | ||
196 | * Set some default flags that could be cleared by the mount option | ||
197 | * parsing. | ||
198 | */ | ||
199 | mp->m_flags |= XFS_MOUNT_BARRIER; | ||
200 | mp->m_flags |= XFS_MOUNT_COMPAT_IOSIZE; | ||
201 | mp->m_flags |= XFS_MOUNT_SMALL_INUMS; | ||
202 | mp->m_flags |= XFS_MOUNT_DELAYLOG; | ||
203 | |||
204 | /* | ||
205 | * These can be overridden by the mount option parsing. | ||
206 | */ | ||
207 | mp->m_logbufs = -1; | ||
208 | mp->m_logbsize = -1; | ||
209 | |||
210 | if (!options) | ||
211 | goto done; | ||
212 | |||
213 | while ((this_char = strsep(&options, ",")) != NULL) { | ||
214 | if (!*this_char) | ||
215 | continue; | ||
216 | if ((value = strchr(this_char, '=')) != NULL) | ||
217 | *value++ = 0; | ||
218 | |||
219 | if (!strcmp(this_char, MNTOPT_LOGBUFS)) { | ||
220 | if (!value || !*value) { | ||
221 | xfs_warn(mp, "%s option requires an argument", | ||
222 | this_char); | ||
223 | return EINVAL; | ||
224 | } | ||
225 | mp->m_logbufs = simple_strtoul(value, &eov, 10); | ||
226 | } else if (!strcmp(this_char, MNTOPT_LOGBSIZE)) { | ||
227 | if (!value || !*value) { | ||
228 | xfs_warn(mp, "%s option requires an argument", | ||
229 | this_char); | ||
230 | return EINVAL; | ||
231 | } | ||
232 | mp->m_logbsize = suffix_strtoul(value, &eov, 10); | ||
233 | } else if (!strcmp(this_char, MNTOPT_LOGDEV)) { | ||
234 | if (!value || !*value) { | ||
235 | xfs_warn(mp, "%s option requires an argument", | ||
236 | this_char); | ||
237 | return EINVAL; | ||
238 | } | ||
239 | mp->m_logname = kstrndup(value, MAXNAMELEN, GFP_KERNEL); | ||
240 | if (!mp->m_logname) | ||
241 | return ENOMEM; | ||
242 | } else if (!strcmp(this_char, MNTOPT_MTPT)) { | ||
243 | xfs_warn(mp, "%s option not allowed on this system", | ||
244 | this_char); | ||
245 | return EINVAL; | ||
246 | } else if (!strcmp(this_char, MNTOPT_RTDEV)) { | ||
247 | if (!value || !*value) { | ||
248 | xfs_warn(mp, "%s option requires an argument", | ||
249 | this_char); | ||
250 | return EINVAL; | ||
251 | } | ||
252 | mp->m_rtname = kstrndup(value, MAXNAMELEN, GFP_KERNEL); | ||
253 | if (!mp->m_rtname) | ||
254 | return ENOMEM; | ||
255 | } else if (!strcmp(this_char, MNTOPT_BIOSIZE)) { | ||
256 | if (!value || !*value) { | ||
257 | xfs_warn(mp, "%s option requires an argument", | ||
258 | this_char); | ||
259 | return EINVAL; | ||
260 | } | ||
261 | iosize = simple_strtoul(value, &eov, 10); | ||
262 | iosizelog = ffs(iosize) - 1; | ||
263 | } else if (!strcmp(this_char, MNTOPT_ALLOCSIZE)) { | ||
264 | if (!value || !*value) { | ||
265 | xfs_warn(mp, "%s option requires an argument", | ||
266 | this_char); | ||
267 | return EINVAL; | ||
268 | } | ||
269 | iosize = suffix_strtoul(value, &eov, 10); | ||
270 | iosizelog = ffs(iosize) - 1; | ||
271 | } else if (!strcmp(this_char, MNTOPT_GRPID) || | ||
272 | !strcmp(this_char, MNTOPT_BSDGROUPS)) { | ||
273 | mp->m_flags |= XFS_MOUNT_GRPID; | ||
274 | } else if (!strcmp(this_char, MNTOPT_NOGRPID) || | ||
275 | !strcmp(this_char, MNTOPT_SYSVGROUPS)) { | ||
276 | mp->m_flags &= ~XFS_MOUNT_GRPID; | ||
277 | } else if (!strcmp(this_char, MNTOPT_WSYNC)) { | ||
278 | mp->m_flags |= XFS_MOUNT_WSYNC; | ||
279 | } else if (!strcmp(this_char, MNTOPT_NORECOVERY)) { | ||
280 | mp->m_flags |= XFS_MOUNT_NORECOVERY; | ||
281 | } else if (!strcmp(this_char, MNTOPT_NOALIGN)) { | ||
282 | mp->m_flags |= XFS_MOUNT_NOALIGN; | ||
283 | } else if (!strcmp(this_char, MNTOPT_SWALLOC)) { | ||
284 | mp->m_flags |= XFS_MOUNT_SWALLOC; | ||
285 | } else if (!strcmp(this_char, MNTOPT_SUNIT)) { | ||
286 | if (!value || !*value) { | ||
287 | xfs_warn(mp, "%s option requires an argument", | ||
288 | this_char); | ||
289 | return EINVAL; | ||
290 | } | ||
291 | dsunit = simple_strtoul(value, &eov, 10); | ||
292 | } else if (!strcmp(this_char, MNTOPT_SWIDTH)) { | ||
293 | if (!value || !*value) { | ||
294 | xfs_warn(mp, "%s option requires an argument", | ||
295 | this_char); | ||
296 | return EINVAL; | ||
297 | } | ||
298 | dswidth = simple_strtoul(value, &eov, 10); | ||
299 | } else if (!strcmp(this_char, MNTOPT_64BITINODE)) { | ||
300 | mp->m_flags &= ~XFS_MOUNT_SMALL_INUMS; | ||
301 | #if !XFS_BIG_INUMS | ||
302 | xfs_warn(mp, "%s option not allowed on this system", | ||
303 | this_char); | ||
304 | return EINVAL; | ||
305 | #endif | ||
306 | } else if (!strcmp(this_char, MNTOPT_NOUUID)) { | ||
307 | mp->m_flags |= XFS_MOUNT_NOUUID; | ||
308 | } else if (!strcmp(this_char, MNTOPT_BARRIER)) { | ||
309 | mp->m_flags |= XFS_MOUNT_BARRIER; | ||
310 | } else if (!strcmp(this_char, MNTOPT_NOBARRIER)) { | ||
311 | mp->m_flags &= ~XFS_MOUNT_BARRIER; | ||
312 | } else if (!strcmp(this_char, MNTOPT_IKEEP)) { | ||
313 | mp->m_flags |= XFS_MOUNT_IKEEP; | ||
314 | } else if (!strcmp(this_char, MNTOPT_NOIKEEP)) { | ||
315 | mp->m_flags &= ~XFS_MOUNT_IKEEP; | ||
316 | } else if (!strcmp(this_char, MNTOPT_LARGEIO)) { | ||
317 | mp->m_flags &= ~XFS_MOUNT_COMPAT_IOSIZE; | ||
318 | } else if (!strcmp(this_char, MNTOPT_NOLARGEIO)) { | ||
319 | mp->m_flags |= XFS_MOUNT_COMPAT_IOSIZE; | ||
320 | } else if (!strcmp(this_char, MNTOPT_ATTR2)) { | ||
321 | mp->m_flags |= XFS_MOUNT_ATTR2; | ||
322 | } else if (!strcmp(this_char, MNTOPT_NOATTR2)) { | ||
323 | mp->m_flags &= ~XFS_MOUNT_ATTR2; | ||
324 | mp->m_flags |= XFS_MOUNT_NOATTR2; | ||
325 | } else if (!strcmp(this_char, MNTOPT_FILESTREAM)) { | ||
326 | mp->m_flags |= XFS_MOUNT_FILESTREAMS; | ||
327 | } else if (!strcmp(this_char, MNTOPT_NOQUOTA)) { | ||
328 | mp->m_qflags &= ~(XFS_UQUOTA_ACCT | XFS_UQUOTA_ACTIVE | | ||
329 | XFS_GQUOTA_ACCT | XFS_GQUOTA_ACTIVE | | ||
330 | XFS_PQUOTA_ACCT | XFS_PQUOTA_ACTIVE | | ||
331 | XFS_UQUOTA_ENFD | XFS_OQUOTA_ENFD); | ||
332 | } else if (!strcmp(this_char, MNTOPT_QUOTA) || | ||
333 | !strcmp(this_char, MNTOPT_UQUOTA) || | ||
334 | !strcmp(this_char, MNTOPT_USRQUOTA)) { | ||
335 | mp->m_qflags |= (XFS_UQUOTA_ACCT | XFS_UQUOTA_ACTIVE | | ||
336 | XFS_UQUOTA_ENFD); | ||
337 | } else if (!strcmp(this_char, MNTOPT_QUOTANOENF) || | ||
338 | !strcmp(this_char, MNTOPT_UQUOTANOENF)) { | ||
339 | mp->m_qflags |= (XFS_UQUOTA_ACCT | XFS_UQUOTA_ACTIVE); | ||
340 | mp->m_qflags &= ~XFS_UQUOTA_ENFD; | ||
341 | } else if (!strcmp(this_char, MNTOPT_PQUOTA) || | ||
342 | !strcmp(this_char, MNTOPT_PRJQUOTA)) { | ||
343 | mp->m_qflags |= (XFS_PQUOTA_ACCT | XFS_PQUOTA_ACTIVE | | ||
344 | XFS_OQUOTA_ENFD); | ||
345 | } else if (!strcmp(this_char, MNTOPT_PQUOTANOENF)) { | ||
346 | mp->m_qflags |= (XFS_PQUOTA_ACCT | XFS_PQUOTA_ACTIVE); | ||
347 | mp->m_qflags &= ~XFS_OQUOTA_ENFD; | ||
348 | } else if (!strcmp(this_char, MNTOPT_GQUOTA) || | ||
349 | !strcmp(this_char, MNTOPT_GRPQUOTA)) { | ||
350 | mp->m_qflags |= (XFS_GQUOTA_ACCT | XFS_GQUOTA_ACTIVE | | ||
351 | XFS_OQUOTA_ENFD); | ||
352 | } else if (!strcmp(this_char, MNTOPT_GQUOTANOENF)) { | ||
353 | mp->m_qflags |= (XFS_GQUOTA_ACCT | XFS_GQUOTA_ACTIVE); | ||
354 | mp->m_qflags &= ~XFS_OQUOTA_ENFD; | ||
355 | } else if (!strcmp(this_char, MNTOPT_DELAYLOG)) { | ||
356 | mp->m_flags |= XFS_MOUNT_DELAYLOG; | ||
357 | } else if (!strcmp(this_char, MNTOPT_NODELAYLOG)) { | ||
358 | mp->m_flags &= ~XFS_MOUNT_DELAYLOG; | ||
359 | } else if (!strcmp(this_char, MNTOPT_DISCARD)) { | ||
360 | mp->m_flags |= XFS_MOUNT_DISCARD; | ||
361 | } else if (!strcmp(this_char, MNTOPT_NODISCARD)) { | ||
362 | mp->m_flags &= ~XFS_MOUNT_DISCARD; | ||
363 | } else if (!strcmp(this_char, "ihashsize")) { | ||
364 | xfs_warn(mp, | ||
365 | "ihashsize no longer used, option is deprecated."); | ||
366 | } else if (!strcmp(this_char, "osyncisdsync")) { | ||
367 | xfs_warn(mp, | ||
368 | "osyncisdsync has no effect, option is deprecated."); | ||
369 | } else if (!strcmp(this_char, "osyncisosync")) { | ||
370 | xfs_warn(mp, | ||
371 | "osyncisosync has no effect, option is deprecated."); | ||
372 | } else if (!strcmp(this_char, "irixsgid")) { | ||
373 | xfs_warn(mp, | ||
374 | "irixsgid is now a sysctl(2) variable, option is deprecated."); | ||
375 | } else { | ||
376 | xfs_warn(mp, "unknown mount option [%s].", this_char); | ||
377 | return EINVAL; | ||
378 | } | ||
379 | } | ||
380 | |||
381 | /* | ||
382 | * no recovery flag requires a read-only mount | ||
383 | */ | ||
384 | if ((mp->m_flags & XFS_MOUNT_NORECOVERY) && | ||
385 | !(mp->m_flags & XFS_MOUNT_RDONLY)) { | ||
386 | xfs_warn(mp, "no-recovery mounts must be read-only."); | ||
387 | return EINVAL; | ||
388 | } | ||
389 | |||
390 | if ((mp->m_flags & XFS_MOUNT_NOALIGN) && (dsunit || dswidth)) { | ||
391 | xfs_warn(mp, | ||
392 | "sunit and swidth options incompatible with the noalign option"); | ||
393 | return EINVAL; | ||
394 | } | ||
395 | |||
396 | if ((mp->m_flags & XFS_MOUNT_DISCARD) && | ||
397 | !(mp->m_flags & XFS_MOUNT_DELAYLOG)) { | ||
398 | xfs_warn(mp, | ||
399 | "the discard option is incompatible with the nodelaylog option"); | ||
400 | return EINVAL; | ||
401 | } | ||
402 | |||
403 | #ifndef CONFIG_XFS_QUOTA | ||
404 | if (XFS_IS_QUOTA_RUNNING(mp)) { | ||
405 | xfs_warn(mp, "quota support not available in this kernel."); | ||
406 | return EINVAL; | ||
407 | } | ||
408 | #endif | ||
409 | |||
410 | if ((mp->m_qflags & (XFS_GQUOTA_ACCT | XFS_GQUOTA_ACTIVE)) && | ||
411 | (mp->m_qflags & (XFS_PQUOTA_ACCT | XFS_PQUOTA_ACTIVE))) { | ||
412 | xfs_warn(mp, "cannot mount with both project and group quota"); | ||
413 | return EINVAL; | ||
414 | } | ||
415 | |||
416 | if ((dsunit && !dswidth) || (!dsunit && dswidth)) { | ||
417 | xfs_warn(mp, "sunit and swidth must be specified together"); | ||
418 | return EINVAL; | ||
419 | } | ||
420 | |||
421 | if (dsunit && (dswidth % dsunit != 0)) { | ||
422 | xfs_warn(mp, | ||
423 | "stripe width (%d) must be a multiple of the stripe unit (%d)", | ||
424 | dswidth, dsunit); | ||
425 | return EINVAL; | ||
426 | } | ||
427 | |||
428 | done: | ||
429 | if (!(mp->m_flags & XFS_MOUNT_NOALIGN)) { | ||
430 | /* | ||
431 | * At this point the superblock has not been read | ||
432 | * in, therefore we do not know the block size. | ||
433 | * Before the mount call ends we will convert | ||
434 | * these to FSBs. | ||
435 | */ | ||
436 | if (dsunit) { | ||
437 | mp->m_dalign = dsunit; | ||
438 | mp->m_flags |= XFS_MOUNT_RETERR; | ||
439 | } | ||
440 | |||
441 | if (dswidth) | ||
442 | mp->m_swidth = dswidth; | ||
443 | } | ||
444 | |||
445 | if (mp->m_logbufs != -1 && | ||
446 | mp->m_logbufs != 0 && | ||
447 | (mp->m_logbufs < XLOG_MIN_ICLOGS || | ||
448 | mp->m_logbufs > XLOG_MAX_ICLOGS)) { | ||
449 | xfs_warn(mp, "invalid logbufs value: %d [not %d-%d]", | ||
450 | mp->m_logbufs, XLOG_MIN_ICLOGS, XLOG_MAX_ICLOGS); | ||
451 | return XFS_ERROR(EINVAL); | ||
452 | } | ||
453 | if (mp->m_logbsize != -1 && | ||
454 | mp->m_logbsize != 0 && | ||
455 | (mp->m_logbsize < XLOG_MIN_RECORD_BSIZE || | ||
456 | mp->m_logbsize > XLOG_MAX_RECORD_BSIZE || | ||
457 | !is_power_of_2(mp->m_logbsize))) { | ||
458 | xfs_warn(mp, | ||
459 | "invalid logbufsize: %d [not 16k,32k,64k,128k or 256k]", | ||
460 | mp->m_logbsize); | ||
461 | return XFS_ERROR(EINVAL); | ||
462 | } | ||
463 | |||
464 | if (iosizelog) { | ||
465 | if (iosizelog > XFS_MAX_IO_LOG || | ||
466 | iosizelog < XFS_MIN_IO_LOG) { | ||
467 | xfs_warn(mp, "invalid log iosize: %d [not %d-%d]", | ||
468 | iosizelog, XFS_MIN_IO_LOG, | ||
469 | XFS_MAX_IO_LOG); | ||
470 | return XFS_ERROR(EINVAL); | ||
471 | } | ||
472 | |||
473 | mp->m_flags |= XFS_MOUNT_DFLT_IOSIZE; | ||
474 | mp->m_readio_log = iosizelog; | ||
475 | mp->m_writeio_log = iosizelog; | ||
476 | } | ||
477 | |||
478 | return 0; | ||
479 | } | ||
480 | |||
481 | struct proc_xfs_info { | ||
482 | int flag; | ||
483 | char *str; | ||
484 | }; | ||
485 | |||
486 | STATIC int | ||
487 | xfs_showargs( | ||
488 | struct xfs_mount *mp, | ||
489 | struct seq_file *m) | ||
490 | { | ||
491 | static struct proc_xfs_info xfs_info_set[] = { | ||
492 | /* the few simple ones we can get from the mount struct */ | ||
493 | { XFS_MOUNT_IKEEP, "," MNTOPT_IKEEP }, | ||
494 | { XFS_MOUNT_WSYNC, "," MNTOPT_WSYNC }, | ||
495 | { XFS_MOUNT_NOALIGN, "," MNTOPT_NOALIGN }, | ||
496 | { XFS_MOUNT_SWALLOC, "," MNTOPT_SWALLOC }, | ||
497 | { XFS_MOUNT_NOUUID, "," MNTOPT_NOUUID }, | ||
498 | { XFS_MOUNT_NORECOVERY, "," MNTOPT_NORECOVERY }, | ||
499 | { XFS_MOUNT_ATTR2, "," MNTOPT_ATTR2 }, | ||
500 | { XFS_MOUNT_FILESTREAMS, "," MNTOPT_FILESTREAM }, | ||
501 | { XFS_MOUNT_GRPID, "," MNTOPT_GRPID }, | ||
502 | { XFS_MOUNT_DELAYLOG, "," MNTOPT_DELAYLOG }, | ||
503 | { XFS_MOUNT_DISCARD, "," MNTOPT_DISCARD }, | ||
504 | { 0, NULL } | ||
505 | }; | ||
506 | static struct proc_xfs_info xfs_info_unset[] = { | ||
507 | /* the few simple ones we can get from the mount struct */ | ||
508 | { XFS_MOUNT_COMPAT_IOSIZE, "," MNTOPT_LARGEIO }, | ||
509 | { XFS_MOUNT_BARRIER, "," MNTOPT_NOBARRIER }, | ||
510 | { XFS_MOUNT_SMALL_INUMS, "," MNTOPT_64BITINODE }, | ||
511 | { 0, NULL } | ||
512 | }; | ||
513 | struct proc_xfs_info *xfs_infop; | ||
514 | |||
515 | for (xfs_infop = xfs_info_set; xfs_infop->flag; xfs_infop++) { | ||
516 | if (mp->m_flags & xfs_infop->flag) | ||
517 | seq_puts(m, xfs_infop->str); | ||
518 | } | ||
519 | for (xfs_infop = xfs_info_unset; xfs_infop->flag; xfs_infop++) { | ||
520 | if (!(mp->m_flags & xfs_infop->flag)) | ||
521 | seq_puts(m, xfs_infop->str); | ||
522 | } | ||
523 | |||
524 | if (mp->m_flags & XFS_MOUNT_DFLT_IOSIZE) | ||
525 | seq_printf(m, "," MNTOPT_ALLOCSIZE "=%dk", | ||
526 | (int)(1 << mp->m_writeio_log) >> 10); | ||
527 | |||
528 | if (mp->m_logbufs > 0) | ||
529 | seq_printf(m, "," MNTOPT_LOGBUFS "=%d", mp->m_logbufs); | ||
530 | if (mp->m_logbsize > 0) | ||
531 | seq_printf(m, "," MNTOPT_LOGBSIZE "=%dk", mp->m_logbsize >> 10); | ||
532 | |||
533 | if (mp->m_logname) | ||
534 | seq_printf(m, "," MNTOPT_LOGDEV "=%s", mp->m_logname); | ||
535 | if (mp->m_rtname) | ||
536 | seq_printf(m, "," MNTOPT_RTDEV "=%s", mp->m_rtname); | ||
537 | |||
538 | if (mp->m_dalign > 0) | ||
539 | seq_printf(m, "," MNTOPT_SUNIT "=%d", | ||
540 | (int)XFS_FSB_TO_BB(mp, mp->m_dalign)); | ||
541 | if (mp->m_swidth > 0) | ||
542 | seq_printf(m, "," MNTOPT_SWIDTH "=%d", | ||
543 | (int)XFS_FSB_TO_BB(mp, mp->m_swidth)); | ||
544 | |||
545 | if (mp->m_qflags & (XFS_UQUOTA_ACCT|XFS_UQUOTA_ENFD)) | ||
546 | seq_puts(m, "," MNTOPT_USRQUOTA); | ||
547 | else if (mp->m_qflags & XFS_UQUOTA_ACCT) | ||
548 | seq_puts(m, "," MNTOPT_UQUOTANOENF); | ||
549 | |||
550 | /* Either project or group quotas can be active, not both */ | ||
551 | |||
552 | if (mp->m_qflags & XFS_PQUOTA_ACCT) { | ||
553 | if (mp->m_qflags & XFS_OQUOTA_ENFD) | ||
554 | seq_puts(m, "," MNTOPT_PRJQUOTA); | ||
555 | else | ||
556 | seq_puts(m, "," MNTOPT_PQUOTANOENF); | ||
557 | } else if (mp->m_qflags & XFS_GQUOTA_ACCT) { | ||
558 | if (mp->m_qflags & XFS_OQUOTA_ENFD) | ||
559 | seq_puts(m, "," MNTOPT_GRPQUOTA); | ||
560 | else | ||
561 | seq_puts(m, "," MNTOPT_GQUOTANOENF); | ||
562 | } | ||
563 | |||
564 | if (!(mp->m_qflags & XFS_ALL_QUOTA_ACCT)) | ||
565 | seq_puts(m, "," MNTOPT_NOQUOTA); | ||
566 | |||
567 | return 0; | ||
568 | } | ||
569 | __uint64_t | ||
570 | xfs_max_file_offset( | ||
571 | unsigned int blockshift) | ||
572 | { | ||
573 | unsigned int pagefactor = 1; | ||
574 | unsigned int bitshift = BITS_PER_LONG - 1; | ||
575 | |||
576 | /* Figure out maximum filesize, on Linux this can depend on | ||
577 | * the filesystem blocksize (on 32 bit platforms). | ||
578 | * __block_write_begin does this in an [unsigned] long... | ||
579 | * page->index << (PAGE_CACHE_SHIFT - bbits) | ||
580 | * So, for page sized blocks (4K on 32 bit platforms), | ||
581 | * this wraps at around 8Tb (hence MAX_LFS_FILESIZE which is | ||
582 | * (((u64)PAGE_CACHE_SIZE << (BITS_PER_LONG-1))-1) | ||
583 | * but for smaller blocksizes it is less (bbits = log2 bsize). | ||
584 | * Note1: get_block_t takes a long (implicit cast from above) | ||
585 | * Note2: The Large Block Device (LBD and HAVE_SECTOR_T) patch | ||
586 | * can optionally convert the [unsigned] long from above into | ||
587 | * an [unsigned] long long. | ||
588 | */ | ||
589 | |||
590 | #if BITS_PER_LONG == 32 | ||
591 | # if defined(CONFIG_LBDAF) | ||
592 | ASSERT(sizeof(sector_t) == 8); | ||
593 | pagefactor = PAGE_CACHE_SIZE; | ||
594 | bitshift = BITS_PER_LONG; | ||
595 | # else | ||
596 | pagefactor = PAGE_CACHE_SIZE >> (PAGE_CACHE_SHIFT - blockshift); | ||
597 | # endif | ||
598 | #endif | ||
599 | |||
600 | return (((__uint64_t)pagefactor) << bitshift) - 1; | ||
601 | } | ||
602 | |||
603 | STATIC int | ||
604 | xfs_blkdev_get( | ||
605 | xfs_mount_t *mp, | ||
606 | const char *name, | ||
607 | struct block_device **bdevp) | ||
608 | { | ||
609 | int error = 0; | ||
610 | |||
611 | *bdevp = blkdev_get_by_path(name, FMODE_READ|FMODE_WRITE|FMODE_EXCL, | ||
612 | mp); | ||
613 | if (IS_ERR(*bdevp)) { | ||
614 | error = PTR_ERR(*bdevp); | ||
615 | xfs_warn(mp, "Invalid device [%s], error=%d\n", name, error); | ||
616 | } | ||
617 | |||
618 | return -error; | ||
619 | } | ||
620 | |||
621 | STATIC void | ||
622 | xfs_blkdev_put( | ||
623 | struct block_device *bdev) | ||
624 | { | ||
625 | if (bdev) | ||
626 | blkdev_put(bdev, FMODE_READ|FMODE_WRITE|FMODE_EXCL); | ||
627 | } | ||
628 | |||
629 | void | ||
630 | xfs_blkdev_issue_flush( | ||
631 | xfs_buftarg_t *buftarg) | ||
632 | { | ||
633 | blkdev_issue_flush(buftarg->bt_bdev, GFP_KERNEL, NULL); | ||
634 | } | ||
635 | |||
636 | STATIC void | ||
637 | xfs_close_devices( | ||
638 | struct xfs_mount *mp) | ||
639 | { | ||
640 | if (mp->m_logdev_targp && mp->m_logdev_targp != mp->m_ddev_targp) { | ||
641 | struct block_device *logdev = mp->m_logdev_targp->bt_bdev; | ||
642 | xfs_free_buftarg(mp, mp->m_logdev_targp); | ||
643 | xfs_blkdev_put(logdev); | ||
644 | } | ||
645 | if (mp->m_rtdev_targp) { | ||
646 | struct block_device *rtdev = mp->m_rtdev_targp->bt_bdev; | ||
647 | xfs_free_buftarg(mp, mp->m_rtdev_targp); | ||
648 | xfs_blkdev_put(rtdev); | ||
649 | } | ||
650 | xfs_free_buftarg(mp, mp->m_ddev_targp); | ||
651 | } | ||
652 | |||
653 | /* | ||
654 | * The file system configurations are: | ||
655 | * (1) device (partition) with data and internal log | ||
656 | * (2) logical volume with data and log subvolumes. | ||
657 | * (3) logical volume with data, log, and realtime subvolumes. | ||
658 | * | ||
659 | * We only have to handle opening the log and realtime volumes here if | ||
660 | * they are present. The data subvolume has already been opened by | ||
661 | * get_sb_bdev() and is stored in sb->s_bdev. | ||
662 | */ | ||
663 | STATIC int | ||
664 | xfs_open_devices( | ||
665 | struct xfs_mount *mp) | ||
666 | { | ||
667 | struct block_device *ddev = mp->m_super->s_bdev; | ||
668 | struct block_device *logdev = NULL, *rtdev = NULL; | ||
669 | int error; | ||
670 | |||
671 | /* | ||
672 | * Open real time and log devices - order is important. | ||
673 | */ | ||
674 | if (mp->m_logname) { | ||
675 | error = xfs_blkdev_get(mp, mp->m_logname, &logdev); | ||
676 | if (error) | ||
677 | goto out; | ||
678 | } | ||
679 | |||
680 | if (mp->m_rtname) { | ||
681 | error = xfs_blkdev_get(mp, mp->m_rtname, &rtdev); | ||
682 | if (error) | ||
683 | goto out_close_logdev; | ||
684 | |||
685 | if (rtdev == ddev || rtdev == logdev) { | ||
686 | xfs_warn(mp, | ||
687 | "Cannot mount filesystem with identical rtdev and ddev/logdev."); | ||
688 | error = EINVAL; | ||
689 | goto out_close_rtdev; | ||
690 | } | ||
691 | } | ||
692 | |||
693 | /* | ||
694 | * Setup xfs_mount buffer target pointers | ||
695 | */ | ||
696 | error = ENOMEM; | ||
697 | mp->m_ddev_targp = xfs_alloc_buftarg(mp, ddev, 0, mp->m_fsname); | ||
698 | if (!mp->m_ddev_targp) | ||
699 | goto out_close_rtdev; | ||
700 | |||
701 | if (rtdev) { | ||
702 | mp->m_rtdev_targp = xfs_alloc_buftarg(mp, rtdev, 1, | ||
703 | mp->m_fsname); | ||
704 | if (!mp->m_rtdev_targp) | ||
705 | goto out_free_ddev_targ; | ||
706 | } | ||
707 | |||
708 | if (logdev && logdev != ddev) { | ||
709 | mp->m_logdev_targp = xfs_alloc_buftarg(mp, logdev, 1, | ||
710 | mp->m_fsname); | ||
711 | if (!mp->m_logdev_targp) | ||
712 | goto out_free_rtdev_targ; | ||
713 | } else { | ||
714 | mp->m_logdev_targp = mp->m_ddev_targp; | ||
715 | } | ||
716 | |||
717 | return 0; | ||
718 | |||
719 | out_free_rtdev_targ: | ||
720 | if (mp->m_rtdev_targp) | ||
721 | xfs_free_buftarg(mp, mp->m_rtdev_targp); | ||
722 | out_free_ddev_targ: | ||
723 | xfs_free_buftarg(mp, mp->m_ddev_targp); | ||
724 | out_close_rtdev: | ||
725 | if (rtdev) | ||
726 | xfs_blkdev_put(rtdev); | ||
727 | out_close_logdev: | ||
728 | if (logdev && logdev != ddev) | ||
729 | xfs_blkdev_put(logdev); | ||
730 | out: | ||
731 | return error; | ||
732 | } | ||
733 | |||
734 | /* | ||
735 | * Setup xfs_mount buffer target pointers based on superblock | ||
736 | */ | ||
737 | STATIC int | ||
738 | xfs_setup_devices( | ||
739 | struct xfs_mount *mp) | ||
740 | { | ||
741 | int error; | ||
742 | |||
743 | error = xfs_setsize_buftarg(mp->m_ddev_targp, mp->m_sb.sb_blocksize, | ||
744 | mp->m_sb.sb_sectsize); | ||
745 | if (error) | ||
746 | return error; | ||
747 | |||
748 | if (mp->m_logdev_targp && mp->m_logdev_targp != mp->m_ddev_targp) { | ||
749 | unsigned int log_sector_size = BBSIZE; | ||
750 | |||
751 | if (xfs_sb_version_hassector(&mp->m_sb)) | ||
752 | log_sector_size = mp->m_sb.sb_logsectsize; | ||
753 | error = xfs_setsize_buftarg(mp->m_logdev_targp, | ||
754 | mp->m_sb.sb_blocksize, | ||
755 | log_sector_size); | ||
756 | if (error) | ||
757 | return error; | ||
758 | } | ||
759 | if (mp->m_rtdev_targp) { | ||
760 | error = xfs_setsize_buftarg(mp->m_rtdev_targp, | ||
761 | mp->m_sb.sb_blocksize, | ||
762 | mp->m_sb.sb_sectsize); | ||
763 | if (error) | ||
764 | return error; | ||
765 | } | ||
766 | |||
767 | return 0; | ||
768 | } | ||
769 | |||
770 | /* Catch misguided souls that try to use this interface on XFS */ | ||
771 | STATIC struct inode * | ||
772 | xfs_fs_alloc_inode( | ||
773 | struct super_block *sb) | ||
774 | { | ||
775 | BUG(); | ||
776 | return NULL; | ||
777 | } | ||
778 | |||
779 | /* | ||
780 | * Now that the generic code is guaranteed not to be accessing | ||
781 | * the linux inode, we can reclaim the inode. | ||
782 | */ | ||
783 | STATIC void | ||
784 | xfs_fs_destroy_inode( | ||
785 | struct inode *inode) | ||
786 | { | ||
787 | struct xfs_inode *ip = XFS_I(inode); | ||
788 | |||
789 | trace_xfs_destroy_inode(ip); | ||
790 | |||
791 | XFS_STATS_INC(vn_reclaim); | ||
792 | |||
793 | /* bad inode, get out here ASAP */ | ||
794 | if (is_bad_inode(inode)) | ||
795 | goto out_reclaim; | ||
796 | |||
797 | xfs_ioend_wait(ip); | ||
798 | |||
799 | ASSERT(XFS_FORCED_SHUTDOWN(ip->i_mount) || ip->i_delayed_blks == 0); | ||
800 | |||
801 | /* | ||
802 | * We should never get here with one of the reclaim flags already set. | ||
803 | */ | ||
804 | ASSERT_ALWAYS(!xfs_iflags_test(ip, XFS_IRECLAIMABLE)); | ||
805 | ASSERT_ALWAYS(!xfs_iflags_test(ip, XFS_IRECLAIM)); | ||
806 | |||
807 | /* | ||
808 | * We always use background reclaim here because even if the | ||
809 | * inode is clean, it still may be under IO and hence we have | ||
810 | * to take the flush lock. The background reclaim path handles | ||
811 | * this more efficiently than we can here, so simply let background | ||
812 | * reclaim tear down all inodes. | ||
813 | */ | ||
814 | out_reclaim: | ||
815 | xfs_inode_set_reclaim_tag(ip); | ||
816 | } | ||
817 | |||
818 | /* | ||
819 | * Slab object creation initialisation for the XFS inode. | ||
820 | * This covers only the idempotent fields in the XFS inode; | ||
821 | * all other fields need to be initialised on allocation | ||
822 | * from the slab. This avoids the need to repeatedly initialise | ||
823 | * fields in the xfs inode that left in the initialise state | ||
824 | * when freeing the inode. | ||
825 | */ | ||
826 | STATIC void | ||
827 | xfs_fs_inode_init_once( | ||
828 | void *inode) | ||
829 | { | ||
830 | struct xfs_inode *ip = inode; | ||
831 | |||
832 | memset(ip, 0, sizeof(struct xfs_inode)); | ||
833 | |||
834 | /* vfs inode */ | ||
835 | inode_init_once(VFS_I(ip)); | ||
836 | |||
837 | /* xfs inode */ | ||
838 | atomic_set(&ip->i_iocount, 0); | ||
839 | atomic_set(&ip->i_pincount, 0); | ||
840 | spin_lock_init(&ip->i_flags_lock); | ||
841 | init_waitqueue_head(&ip->i_ipin_wait); | ||
842 | /* | ||
843 | * Because we want to use a counting completion, complete | ||
844 | * the flush completion once to allow a single access to | ||
845 | * the flush completion without blocking. | ||
846 | */ | ||
847 | init_completion(&ip->i_flush); | ||
848 | complete(&ip->i_flush); | ||
849 | |||
850 | mrlock_init(&ip->i_lock, MRLOCK_ALLOW_EQUAL_PRI|MRLOCK_BARRIER, | ||
851 | "xfsino", ip->i_ino); | ||
852 | } | ||
853 | |||
854 | /* | ||
855 | * Dirty the XFS inode when mark_inode_dirty_sync() is called so that | ||
856 | * we catch unlogged VFS level updates to the inode. | ||
857 | * | ||
858 | * We need the barrier() to maintain correct ordering between unlogged | ||
859 | * updates and the transaction commit code that clears the i_update_core | ||
860 | * field. This requires all updates to be completed before marking the | ||
861 | * inode dirty. | ||
862 | */ | ||
863 | STATIC void | ||
864 | xfs_fs_dirty_inode( | ||
865 | struct inode *inode, | ||
866 | int flags) | ||
867 | { | ||
868 | barrier(); | ||
869 | XFS_I(inode)->i_update_core = 1; | ||
870 | } | ||
871 | |||
872 | STATIC int | ||
873 | xfs_log_inode( | ||
874 | struct xfs_inode *ip) | ||
875 | { | ||
876 | struct xfs_mount *mp = ip->i_mount; | ||
877 | struct xfs_trans *tp; | ||
878 | int error; | ||
879 | |||
880 | xfs_iunlock(ip, XFS_ILOCK_SHARED); | ||
881 | tp = xfs_trans_alloc(mp, XFS_TRANS_FSYNC_TS); | ||
882 | error = xfs_trans_reserve(tp, 0, XFS_FSYNC_TS_LOG_RES(mp), 0, 0, 0); | ||
883 | |||
884 | if (error) { | ||
885 | xfs_trans_cancel(tp, 0); | ||
886 | /* we need to return with the lock hold shared */ | ||
887 | xfs_ilock(ip, XFS_ILOCK_SHARED); | ||
888 | return error; | ||
889 | } | ||
890 | |||
891 | xfs_ilock(ip, XFS_ILOCK_EXCL); | ||
892 | |||
893 | /* | ||
894 | * Note - it's possible that we might have pushed ourselves out of the | ||
895 | * way during trans_reserve which would flush the inode. But there's | ||
896 | * no guarantee that the inode buffer has actually gone out yet (it's | ||
897 | * delwri). Plus the buffer could be pinned anyway if it's part of | ||
898 | * an inode in another recent transaction. So we play it safe and | ||
899 | * fire off the transaction anyway. | ||
900 | */ | ||
901 | xfs_trans_ijoin(tp, ip); | ||
902 | xfs_trans_log_inode(tp, ip, XFS_ILOG_CORE); | ||
903 | error = xfs_trans_commit(tp, 0); | ||
904 | xfs_ilock_demote(ip, XFS_ILOCK_EXCL); | ||
905 | |||
906 | return error; | ||
907 | } | ||
908 | |||
909 | STATIC int | ||
910 | xfs_fs_write_inode( | ||
911 | struct inode *inode, | ||
912 | struct writeback_control *wbc) | ||
913 | { | ||
914 | struct xfs_inode *ip = XFS_I(inode); | ||
915 | struct xfs_mount *mp = ip->i_mount; | ||
916 | int error = EAGAIN; | ||
917 | |||
918 | trace_xfs_write_inode(ip); | ||
919 | |||
920 | if (XFS_FORCED_SHUTDOWN(mp)) | ||
921 | return XFS_ERROR(EIO); | ||
922 | |||
923 | if (wbc->sync_mode == WB_SYNC_ALL) { | ||
924 | /* | ||
925 | * Make sure the inode has made it it into the log. Instead | ||
926 | * of forcing it all the way to stable storage using a | ||
927 | * synchronous transaction we let the log force inside the | ||
928 | * ->sync_fs call do that for thus, which reduces the number | ||
929 | * of synchronous log foces dramatically. | ||
930 | */ | ||
931 | xfs_ioend_wait(ip); | ||
932 | xfs_ilock(ip, XFS_ILOCK_SHARED); | ||
933 | if (ip->i_update_core) { | ||
934 | error = xfs_log_inode(ip); | ||
935 | if (error) | ||
936 | goto out_unlock; | ||
937 | } | ||
938 | } else { | ||
939 | /* | ||
940 | * We make this non-blocking if the inode is contended, return | ||
941 | * EAGAIN to indicate to the caller that they did not succeed. | ||
942 | * This prevents the flush path from blocking on inodes inside | ||
943 | * another operation right now, they get caught later by | ||
944 | * xfs_sync. | ||
945 | */ | ||
946 | if (!xfs_ilock_nowait(ip, XFS_ILOCK_SHARED)) | ||
947 | goto out; | ||
948 | |||
949 | if (xfs_ipincount(ip) || !xfs_iflock_nowait(ip)) | ||
950 | goto out_unlock; | ||
951 | |||
952 | /* | ||
953 | * Now we have the flush lock and the inode is not pinned, we | ||
954 | * can check if the inode is really clean as we know that | ||
955 | * there are no pending transaction completions, it is not | ||
956 | * waiting on the delayed write queue and there is no IO in | ||
957 | * progress. | ||
958 | */ | ||
959 | if (xfs_inode_clean(ip)) { | ||
960 | xfs_ifunlock(ip); | ||
961 | error = 0; | ||
962 | goto out_unlock; | ||
963 | } | ||
964 | error = xfs_iflush(ip, SYNC_TRYLOCK); | ||
965 | } | ||
966 | |||
967 | out_unlock: | ||
968 | xfs_iunlock(ip, XFS_ILOCK_SHARED); | ||
969 | out: | ||
970 | /* | ||
971 | * if we failed to write out the inode then mark | ||
972 | * it dirty again so we'll try again later. | ||
973 | */ | ||
974 | if (error) | ||
975 | xfs_mark_inode_dirty_sync(ip); | ||
976 | return -error; | ||
977 | } | ||
978 | |||
979 | STATIC void | ||
980 | xfs_fs_evict_inode( | ||
981 | struct inode *inode) | ||
982 | { | ||
983 | xfs_inode_t *ip = XFS_I(inode); | ||
984 | |||
985 | trace_xfs_evict_inode(ip); | ||
986 | |||
987 | truncate_inode_pages(&inode->i_data, 0); | ||
988 | end_writeback(inode); | ||
989 | XFS_STATS_INC(vn_rele); | ||
990 | XFS_STATS_INC(vn_remove); | ||
991 | XFS_STATS_DEC(vn_active); | ||
992 | |||
993 | /* | ||
994 | * The iolock is used by the file system to coordinate reads, | ||
995 | * writes, and block truncates. Up to this point the lock | ||
996 | * protected concurrent accesses by users of the inode. But | ||
997 | * from here forward we're doing some final processing of the | ||
998 | * inode because we're done with it, and although we reuse the | ||
999 | * iolock for protection it is really a distinct lock class | ||
1000 | * (in the lockdep sense) from before. To keep lockdep happy | ||
1001 | * (and basically indicate what we are doing), we explicitly | ||
1002 | * re-init the iolock here. | ||
1003 | */ | ||
1004 | ASSERT(!rwsem_is_locked(&ip->i_iolock.mr_lock)); | ||
1005 | mrlock_init(&ip->i_iolock, MRLOCK_BARRIER, "xfsio", ip->i_ino); | ||
1006 | lockdep_set_class_and_name(&ip->i_iolock.mr_lock, | ||
1007 | &xfs_iolock_reclaimable, "xfs_iolock_reclaimable"); | ||
1008 | |||
1009 | xfs_inactive(ip); | ||
1010 | } | ||
1011 | |||
1012 | STATIC void | ||
1013 | xfs_free_fsname( | ||
1014 | struct xfs_mount *mp) | ||
1015 | { | ||
1016 | kfree(mp->m_fsname); | ||
1017 | kfree(mp->m_rtname); | ||
1018 | kfree(mp->m_logname); | ||
1019 | } | ||
1020 | |||
1021 | STATIC void | ||
1022 | xfs_fs_put_super( | ||
1023 | struct super_block *sb) | ||
1024 | { | ||
1025 | struct xfs_mount *mp = XFS_M(sb); | ||
1026 | |||
1027 | xfs_syncd_stop(mp); | ||
1028 | |||
1029 | /* | ||
1030 | * Blow away any referenced inode in the filestreams cache. | ||
1031 | * This can and will cause log traffic as inodes go inactive | ||
1032 | * here. | ||
1033 | */ | ||
1034 | xfs_filestream_unmount(mp); | ||
1035 | |||
1036 | XFS_bflush(mp->m_ddev_targp); | ||
1037 | |||
1038 | xfs_unmountfs(mp); | ||
1039 | xfs_freesb(mp); | ||
1040 | xfs_icsb_destroy_counters(mp); | ||
1041 | xfs_close_devices(mp); | ||
1042 | xfs_free_fsname(mp); | ||
1043 | kfree(mp); | ||
1044 | } | ||
1045 | |||
1046 | STATIC int | ||
1047 | xfs_fs_sync_fs( | ||
1048 | struct super_block *sb, | ||
1049 | int wait) | ||
1050 | { | ||
1051 | struct xfs_mount *mp = XFS_M(sb); | ||
1052 | int error; | ||
1053 | |||
1054 | /* | ||
1055 | * Not much we can do for the first async pass. Writing out the | ||
1056 | * superblock would be counter-productive as we are going to redirty | ||
1057 | * when writing out other data and metadata (and writing out a single | ||
1058 | * block is quite fast anyway). | ||
1059 | * | ||
1060 | * Try to asynchronously kick off quota syncing at least. | ||
1061 | */ | ||
1062 | if (!wait) { | ||
1063 | xfs_qm_sync(mp, SYNC_TRYLOCK); | ||
1064 | return 0; | ||
1065 | } | ||
1066 | |||
1067 | error = xfs_quiesce_data(mp); | ||
1068 | if (error) | ||
1069 | return -error; | ||
1070 | |||
1071 | if (laptop_mode) { | ||
1072 | /* | ||
1073 | * The disk must be active because we're syncing. | ||
1074 | * We schedule xfssyncd now (now that the disk is | ||
1075 | * active) instead of later (when it might not be). | ||
1076 | */ | ||
1077 | flush_delayed_work_sync(&mp->m_sync_work); | ||
1078 | } | ||
1079 | |||
1080 | return 0; | ||
1081 | } | ||
1082 | |||
1083 | STATIC int | ||
1084 | xfs_fs_statfs( | ||
1085 | struct dentry *dentry, | ||
1086 | struct kstatfs *statp) | ||
1087 | { | ||
1088 | struct xfs_mount *mp = XFS_M(dentry->d_sb); | ||
1089 | xfs_sb_t *sbp = &mp->m_sb; | ||
1090 | struct xfs_inode *ip = XFS_I(dentry->d_inode); | ||
1091 | __uint64_t fakeinos, id; | ||
1092 | xfs_extlen_t lsize; | ||
1093 | __int64_t ffree; | ||
1094 | |||
1095 | statp->f_type = XFS_SB_MAGIC; | ||
1096 | statp->f_namelen = MAXNAMELEN - 1; | ||
1097 | |||
1098 | id = huge_encode_dev(mp->m_ddev_targp->bt_dev); | ||
1099 | statp->f_fsid.val[0] = (u32)id; | ||
1100 | statp->f_fsid.val[1] = (u32)(id >> 32); | ||
1101 | |||
1102 | xfs_icsb_sync_counters(mp, XFS_ICSB_LAZY_COUNT); | ||
1103 | |||
1104 | spin_lock(&mp->m_sb_lock); | ||
1105 | statp->f_bsize = sbp->sb_blocksize; | ||
1106 | lsize = sbp->sb_logstart ? sbp->sb_logblocks : 0; | ||
1107 | statp->f_blocks = sbp->sb_dblocks - lsize; | ||
1108 | statp->f_bfree = statp->f_bavail = | ||
1109 | sbp->sb_fdblocks - XFS_ALLOC_SET_ASIDE(mp); | ||
1110 | fakeinos = statp->f_bfree << sbp->sb_inopblog; | ||
1111 | statp->f_files = | ||
1112 | MIN(sbp->sb_icount + fakeinos, (__uint64_t)XFS_MAXINUMBER); | ||
1113 | if (mp->m_maxicount) | ||
1114 | statp->f_files = min_t(typeof(statp->f_files), | ||
1115 | statp->f_files, | ||
1116 | mp->m_maxicount); | ||
1117 | |||
1118 | /* make sure statp->f_ffree does not underflow */ | ||
1119 | ffree = statp->f_files - (sbp->sb_icount - sbp->sb_ifree); | ||
1120 | statp->f_ffree = max_t(__int64_t, ffree, 0); | ||
1121 | |||
1122 | spin_unlock(&mp->m_sb_lock); | ||
1123 | |||
1124 | if ((ip->i_d.di_flags & XFS_DIFLAG_PROJINHERIT) || | ||
1125 | ((mp->m_qflags & (XFS_PQUOTA_ACCT|XFS_OQUOTA_ENFD))) == | ||
1126 | (XFS_PQUOTA_ACCT|XFS_OQUOTA_ENFD)) | ||
1127 | xfs_qm_statvfs(ip, statp); | ||
1128 | return 0; | ||
1129 | } | ||
1130 | |||
1131 | STATIC void | ||
1132 | xfs_save_resvblks(struct xfs_mount *mp) | ||
1133 | { | ||
1134 | __uint64_t resblks = 0; | ||
1135 | |||
1136 | mp->m_resblks_save = mp->m_resblks; | ||
1137 | xfs_reserve_blocks(mp, &resblks, NULL); | ||
1138 | } | ||
1139 | |||
1140 | STATIC void | ||
1141 | xfs_restore_resvblks(struct xfs_mount *mp) | ||
1142 | { | ||
1143 | __uint64_t resblks; | ||
1144 | |||
1145 | if (mp->m_resblks_save) { | ||
1146 | resblks = mp->m_resblks_save; | ||
1147 | mp->m_resblks_save = 0; | ||
1148 | } else | ||
1149 | resblks = xfs_default_resblks(mp); | ||
1150 | |||
1151 | xfs_reserve_blocks(mp, &resblks, NULL); | ||
1152 | } | ||
1153 | |||
1154 | STATIC int | ||
1155 | xfs_fs_remount( | ||
1156 | struct super_block *sb, | ||
1157 | int *flags, | ||
1158 | char *options) | ||
1159 | { | ||
1160 | struct xfs_mount *mp = XFS_M(sb); | ||
1161 | substring_t args[MAX_OPT_ARGS]; | ||
1162 | char *p; | ||
1163 | int error; | ||
1164 | |||
1165 | while ((p = strsep(&options, ",")) != NULL) { | ||
1166 | int token; | ||
1167 | |||
1168 | if (!*p) | ||
1169 | continue; | ||
1170 | |||
1171 | token = match_token(p, tokens, args); | ||
1172 | switch (token) { | ||
1173 | case Opt_barrier: | ||
1174 | mp->m_flags |= XFS_MOUNT_BARRIER; | ||
1175 | break; | ||
1176 | case Opt_nobarrier: | ||
1177 | mp->m_flags &= ~XFS_MOUNT_BARRIER; | ||
1178 | break; | ||
1179 | default: | ||
1180 | /* | ||
1181 | * Logically we would return an error here to prevent | ||
1182 | * users from believing they might have changed | ||
1183 | * mount options using remount which can't be changed. | ||
1184 | * | ||
1185 | * But unfortunately mount(8) adds all options from | ||
1186 | * mtab and fstab to the mount arguments in some cases | ||
1187 | * so we can't blindly reject options, but have to | ||
1188 | * check for each specified option if it actually | ||
1189 | * differs from the currently set option and only | ||
1190 | * reject it if that's the case. | ||
1191 | * | ||
1192 | * Until that is implemented we return success for | ||
1193 | * every remount request, and silently ignore all | ||
1194 | * options that we can't actually change. | ||
1195 | */ | ||
1196 | #if 0 | ||
1197 | xfs_info(mp, | ||
1198 | "mount option \"%s\" not supported for remount\n", p); | ||
1199 | return -EINVAL; | ||
1200 | #else | ||
1201 | break; | ||
1202 | #endif | ||
1203 | } | ||
1204 | } | ||
1205 | |||
1206 | /* ro -> rw */ | ||
1207 | if ((mp->m_flags & XFS_MOUNT_RDONLY) && !(*flags & MS_RDONLY)) { | ||
1208 | mp->m_flags &= ~XFS_MOUNT_RDONLY; | ||
1209 | |||
1210 | /* | ||
1211 | * If this is the first remount to writeable state we | ||
1212 | * might have some superblock changes to update. | ||
1213 | */ | ||
1214 | if (mp->m_update_flags) { | ||
1215 | error = xfs_mount_log_sb(mp, mp->m_update_flags); | ||
1216 | if (error) { | ||
1217 | xfs_warn(mp, "failed to write sb changes"); | ||
1218 | return error; | ||
1219 | } | ||
1220 | mp->m_update_flags = 0; | ||
1221 | } | ||
1222 | |||
1223 | /* | ||
1224 | * Fill out the reserve pool if it is empty. Use the stashed | ||
1225 | * value if it is non-zero, otherwise go with the default. | ||
1226 | */ | ||
1227 | xfs_restore_resvblks(mp); | ||
1228 | } | ||
1229 | |||
1230 | /* rw -> ro */ | ||
1231 | if (!(mp->m_flags & XFS_MOUNT_RDONLY) && (*flags & MS_RDONLY)) { | ||
1232 | /* | ||
1233 | * After we have synced the data but before we sync the | ||
1234 | * metadata, we need to free up the reserve block pool so that | ||
1235 | * the used block count in the superblock on disk is correct at | ||
1236 | * the end of the remount. Stash the current reserve pool size | ||
1237 | * so that if we get remounted rw, we can return it to the same | ||
1238 | * size. | ||
1239 | */ | ||
1240 | |||
1241 | xfs_quiesce_data(mp); | ||
1242 | xfs_save_resvblks(mp); | ||
1243 | xfs_quiesce_attr(mp); | ||
1244 | mp->m_flags |= XFS_MOUNT_RDONLY; | ||
1245 | } | ||
1246 | |||
1247 | return 0; | ||
1248 | } | ||
1249 | |||
1250 | /* | ||
1251 | * Second stage of a freeze. The data is already frozen so we only | ||
1252 | * need to take care of the metadata. Once that's done write a dummy | ||
1253 | * record to dirty the log in case of a crash while frozen. | ||
1254 | */ | ||
1255 | STATIC int | ||
1256 | xfs_fs_freeze( | ||
1257 | struct super_block *sb) | ||
1258 | { | ||
1259 | struct xfs_mount *mp = XFS_M(sb); | ||
1260 | |||
1261 | xfs_save_resvblks(mp); | ||
1262 | xfs_quiesce_attr(mp); | ||
1263 | return -xfs_fs_log_dummy(mp); | ||
1264 | } | ||
1265 | |||
1266 | STATIC int | ||
1267 | xfs_fs_unfreeze( | ||
1268 | struct super_block *sb) | ||
1269 | { | ||
1270 | struct xfs_mount *mp = XFS_M(sb); | ||
1271 | |||
1272 | xfs_restore_resvblks(mp); | ||
1273 | return 0; | ||
1274 | } | ||
1275 | |||
1276 | STATIC int | ||
1277 | xfs_fs_show_options( | ||
1278 | struct seq_file *m, | ||
1279 | struct vfsmount *mnt) | ||
1280 | { | ||
1281 | return -xfs_showargs(XFS_M(mnt->mnt_sb), m); | ||
1282 | } | ||
1283 | |||
1284 | /* | ||
1285 | * This function fills in xfs_mount_t fields based on mount args. | ||
1286 | * Note: the superblock _has_ now been read in. | ||
1287 | */ | ||
1288 | STATIC int | ||
1289 | xfs_finish_flags( | ||
1290 | struct xfs_mount *mp) | ||
1291 | { | ||
1292 | int ronly = (mp->m_flags & XFS_MOUNT_RDONLY); | ||
1293 | |||
1294 | /* Fail a mount where the logbuf is smaller than the log stripe */ | ||
1295 | if (xfs_sb_version_haslogv2(&mp->m_sb)) { | ||
1296 | if (mp->m_logbsize <= 0 && | ||
1297 | mp->m_sb.sb_logsunit > XLOG_BIG_RECORD_BSIZE) { | ||
1298 | mp->m_logbsize = mp->m_sb.sb_logsunit; | ||
1299 | } else if (mp->m_logbsize > 0 && | ||
1300 | mp->m_logbsize < mp->m_sb.sb_logsunit) { | ||
1301 | xfs_warn(mp, | ||
1302 | "logbuf size must be greater than or equal to log stripe size"); | ||
1303 | return XFS_ERROR(EINVAL); | ||
1304 | } | ||
1305 | } else { | ||
1306 | /* Fail a mount if the logbuf is larger than 32K */ | ||
1307 | if (mp->m_logbsize > XLOG_BIG_RECORD_BSIZE) { | ||
1308 | xfs_warn(mp, | ||
1309 | "logbuf size for version 1 logs must be 16K or 32K"); | ||
1310 | return XFS_ERROR(EINVAL); | ||
1311 | } | ||
1312 | } | ||
1313 | |||
1314 | /* | ||
1315 | * mkfs'ed attr2 will turn on attr2 mount unless explicitly | ||
1316 | * told by noattr2 to turn it off | ||
1317 | */ | ||
1318 | if (xfs_sb_version_hasattr2(&mp->m_sb) && | ||
1319 | !(mp->m_flags & XFS_MOUNT_NOATTR2)) | ||
1320 | mp->m_flags |= XFS_MOUNT_ATTR2; | ||
1321 | |||
1322 | /* | ||
1323 | * prohibit r/w mounts of read-only filesystems | ||
1324 | */ | ||
1325 | if ((mp->m_sb.sb_flags & XFS_SBF_READONLY) && !ronly) { | ||
1326 | xfs_warn(mp, | ||
1327 | "cannot mount a read-only filesystem as read-write"); | ||
1328 | return XFS_ERROR(EROFS); | ||
1329 | } | ||
1330 | |||
1331 | return 0; | ||
1332 | } | ||
1333 | |||
1334 | STATIC int | ||
1335 | xfs_fs_fill_super( | ||
1336 | struct super_block *sb, | ||
1337 | void *data, | ||
1338 | int silent) | ||
1339 | { | ||
1340 | struct inode *root; | ||
1341 | struct xfs_mount *mp = NULL; | ||
1342 | int flags = 0, error = ENOMEM; | ||
1343 | |||
1344 | mp = kzalloc(sizeof(struct xfs_mount), GFP_KERNEL); | ||
1345 | if (!mp) | ||
1346 | goto out; | ||
1347 | |||
1348 | spin_lock_init(&mp->m_sb_lock); | ||
1349 | mutex_init(&mp->m_growlock); | ||
1350 | atomic_set(&mp->m_active_trans, 0); | ||
1351 | |||
1352 | mp->m_super = sb; | ||
1353 | sb->s_fs_info = mp; | ||
1354 | |||
1355 | error = xfs_parseargs(mp, (char *)data); | ||
1356 | if (error) | ||
1357 | goto out_free_fsname; | ||
1358 | |||
1359 | sb_min_blocksize(sb, BBSIZE); | ||
1360 | sb->s_xattr = xfs_xattr_handlers; | ||
1361 | sb->s_export_op = &xfs_export_operations; | ||
1362 | #ifdef CONFIG_XFS_QUOTA | ||
1363 | sb->s_qcop = &xfs_quotactl_operations; | ||
1364 | #endif | ||
1365 | sb->s_op = &xfs_super_operations; | ||
1366 | |||
1367 | if (silent) | ||
1368 | flags |= XFS_MFSI_QUIET; | ||
1369 | |||
1370 | error = xfs_open_devices(mp); | ||
1371 | if (error) | ||
1372 | goto out_free_fsname; | ||
1373 | |||
1374 | error = xfs_icsb_init_counters(mp); | ||
1375 | if (error) | ||
1376 | goto out_close_devices; | ||
1377 | |||
1378 | error = xfs_readsb(mp, flags); | ||
1379 | if (error) | ||
1380 | goto out_destroy_counters; | ||
1381 | |||
1382 | error = xfs_finish_flags(mp); | ||
1383 | if (error) | ||
1384 | goto out_free_sb; | ||
1385 | |||
1386 | error = xfs_setup_devices(mp); | ||
1387 | if (error) | ||
1388 | goto out_free_sb; | ||
1389 | |||
1390 | error = xfs_filestream_mount(mp); | ||
1391 | if (error) | ||
1392 | goto out_free_sb; | ||
1393 | |||
1394 | /* | ||
1395 | * we must configure the block size in the superblock before we run the | ||
1396 | * full mount process as the mount process can lookup and cache inodes. | ||
1397 | * For the same reason we must also initialise the syncd and register | ||
1398 | * the inode cache shrinker so that inodes can be reclaimed during | ||
1399 | * operations like a quotacheck that iterate all inodes in the | ||
1400 | * filesystem. | ||
1401 | */ | ||
1402 | sb->s_magic = XFS_SB_MAGIC; | ||
1403 | sb->s_blocksize = mp->m_sb.sb_blocksize; | ||
1404 | sb->s_blocksize_bits = ffs(sb->s_blocksize) - 1; | ||
1405 | sb->s_maxbytes = xfs_max_file_offset(sb->s_blocksize_bits); | ||
1406 | sb->s_time_gran = 1; | ||
1407 | set_posix_acl_flag(sb); | ||
1408 | |||
1409 | error = xfs_mountfs(mp); | ||
1410 | if (error) | ||
1411 | goto out_filestream_unmount; | ||
1412 | |||
1413 | error = xfs_syncd_init(mp); | ||
1414 | if (error) | ||
1415 | goto out_unmount; | ||
1416 | |||
1417 | root = igrab(VFS_I(mp->m_rootip)); | ||
1418 | if (!root) { | ||
1419 | error = ENOENT; | ||
1420 | goto out_syncd_stop; | ||
1421 | } | ||
1422 | if (is_bad_inode(root)) { | ||
1423 | error = EINVAL; | ||
1424 | goto out_syncd_stop; | ||
1425 | } | ||
1426 | sb->s_root = d_alloc_root(root); | ||
1427 | if (!sb->s_root) { | ||
1428 | error = ENOMEM; | ||
1429 | goto out_iput; | ||
1430 | } | ||
1431 | |||
1432 | return 0; | ||
1433 | |||
1434 | out_filestream_unmount: | ||
1435 | xfs_filestream_unmount(mp); | ||
1436 | out_free_sb: | ||
1437 | xfs_freesb(mp); | ||
1438 | out_destroy_counters: | ||
1439 | xfs_icsb_destroy_counters(mp); | ||
1440 | out_close_devices: | ||
1441 | xfs_close_devices(mp); | ||
1442 | out_free_fsname: | ||
1443 | xfs_free_fsname(mp); | ||
1444 | kfree(mp); | ||
1445 | out: | ||
1446 | return -error; | ||
1447 | |||
1448 | out_iput: | ||
1449 | iput(root); | ||
1450 | out_syncd_stop: | ||
1451 | xfs_syncd_stop(mp); | ||
1452 | out_unmount: | ||
1453 | /* | ||
1454 | * Blow away any referenced inode in the filestreams cache. | ||
1455 | * This can and will cause log traffic as inodes go inactive | ||
1456 | * here. | ||
1457 | */ | ||
1458 | xfs_filestream_unmount(mp); | ||
1459 | |||
1460 | XFS_bflush(mp->m_ddev_targp); | ||
1461 | |||
1462 | xfs_unmountfs(mp); | ||
1463 | goto out_free_sb; | ||
1464 | } | ||
1465 | |||
1466 | STATIC struct dentry * | ||
1467 | xfs_fs_mount( | ||
1468 | struct file_system_type *fs_type, | ||
1469 | int flags, | ||
1470 | const char *dev_name, | ||
1471 | void *data) | ||
1472 | { | ||
1473 | return mount_bdev(fs_type, flags, dev_name, data, xfs_fs_fill_super); | ||
1474 | } | ||
1475 | |||
1476 | static int | ||
1477 | xfs_fs_nr_cached_objects( | ||
1478 | struct super_block *sb) | ||
1479 | { | ||
1480 | return xfs_reclaim_inodes_count(XFS_M(sb)); | ||
1481 | } | ||
1482 | |||
1483 | static void | ||
1484 | xfs_fs_free_cached_objects( | ||
1485 | struct super_block *sb, | ||
1486 | int nr_to_scan) | ||
1487 | { | ||
1488 | xfs_reclaim_inodes_nr(XFS_M(sb), nr_to_scan); | ||
1489 | } | ||
1490 | |||
1491 | static const struct super_operations xfs_super_operations = { | ||
1492 | .alloc_inode = xfs_fs_alloc_inode, | ||
1493 | .destroy_inode = xfs_fs_destroy_inode, | ||
1494 | .dirty_inode = xfs_fs_dirty_inode, | ||
1495 | .write_inode = xfs_fs_write_inode, | ||
1496 | .evict_inode = xfs_fs_evict_inode, | ||
1497 | .put_super = xfs_fs_put_super, | ||
1498 | .sync_fs = xfs_fs_sync_fs, | ||
1499 | .freeze_fs = xfs_fs_freeze, | ||
1500 | .unfreeze_fs = xfs_fs_unfreeze, | ||
1501 | .statfs = xfs_fs_statfs, | ||
1502 | .remount_fs = xfs_fs_remount, | ||
1503 | .show_options = xfs_fs_show_options, | ||
1504 | .nr_cached_objects = xfs_fs_nr_cached_objects, | ||
1505 | .free_cached_objects = xfs_fs_free_cached_objects, | ||
1506 | }; | ||
1507 | |||
1508 | static struct file_system_type xfs_fs_type = { | ||
1509 | .owner = THIS_MODULE, | ||
1510 | .name = "xfs", | ||
1511 | .mount = xfs_fs_mount, | ||
1512 | .kill_sb = kill_block_super, | ||
1513 | .fs_flags = FS_REQUIRES_DEV, | ||
1514 | }; | ||
1515 | |||
1516 | STATIC int __init | ||
1517 | xfs_init_zones(void) | ||
1518 | { | ||
1519 | |||
1520 | xfs_ioend_zone = kmem_zone_init(sizeof(xfs_ioend_t), "xfs_ioend"); | ||
1521 | if (!xfs_ioend_zone) | ||
1522 | goto out; | ||
1523 | |||
1524 | xfs_ioend_pool = mempool_create_slab_pool(4 * MAX_BUF_PER_PAGE, | ||
1525 | xfs_ioend_zone); | ||
1526 | if (!xfs_ioend_pool) | ||
1527 | goto out_destroy_ioend_zone; | ||
1528 | |||
1529 | xfs_log_ticket_zone = kmem_zone_init(sizeof(xlog_ticket_t), | ||
1530 | "xfs_log_ticket"); | ||
1531 | if (!xfs_log_ticket_zone) | ||
1532 | goto out_destroy_ioend_pool; | ||
1533 | |||
1534 | xfs_bmap_free_item_zone = kmem_zone_init(sizeof(xfs_bmap_free_item_t), | ||
1535 | "xfs_bmap_free_item"); | ||
1536 | if (!xfs_bmap_free_item_zone) | ||
1537 | goto out_destroy_log_ticket_zone; | ||
1538 | |||
1539 | xfs_btree_cur_zone = kmem_zone_init(sizeof(xfs_btree_cur_t), | ||
1540 | "xfs_btree_cur"); | ||
1541 | if (!xfs_btree_cur_zone) | ||
1542 | goto out_destroy_bmap_free_item_zone; | ||
1543 | |||
1544 | xfs_da_state_zone = kmem_zone_init(sizeof(xfs_da_state_t), | ||
1545 | "xfs_da_state"); | ||
1546 | if (!xfs_da_state_zone) | ||
1547 | goto out_destroy_btree_cur_zone; | ||
1548 | |||
1549 | xfs_dabuf_zone = kmem_zone_init(sizeof(xfs_dabuf_t), "xfs_dabuf"); | ||
1550 | if (!xfs_dabuf_zone) | ||
1551 | goto out_destroy_da_state_zone; | ||
1552 | |||
1553 | xfs_ifork_zone = kmem_zone_init(sizeof(xfs_ifork_t), "xfs_ifork"); | ||
1554 | if (!xfs_ifork_zone) | ||
1555 | goto out_destroy_dabuf_zone; | ||
1556 | |||
1557 | xfs_trans_zone = kmem_zone_init(sizeof(xfs_trans_t), "xfs_trans"); | ||
1558 | if (!xfs_trans_zone) | ||
1559 | goto out_destroy_ifork_zone; | ||
1560 | |||
1561 | xfs_log_item_desc_zone = | ||
1562 | kmem_zone_init(sizeof(struct xfs_log_item_desc), | ||
1563 | "xfs_log_item_desc"); | ||
1564 | if (!xfs_log_item_desc_zone) | ||
1565 | goto out_destroy_trans_zone; | ||
1566 | |||
1567 | /* | ||
1568 | * The size of the zone allocated buf log item is the maximum | ||
1569 | * size possible under XFS. This wastes a little bit of memory, | ||
1570 | * but it is much faster. | ||
1571 | */ | ||
1572 | xfs_buf_item_zone = kmem_zone_init((sizeof(xfs_buf_log_item_t) + | ||
1573 | (((XFS_MAX_BLOCKSIZE / XFS_BLF_CHUNK) / | ||
1574 | NBWORD) * sizeof(int))), "xfs_buf_item"); | ||
1575 | if (!xfs_buf_item_zone) | ||
1576 | goto out_destroy_log_item_desc_zone; | ||
1577 | |||
1578 | xfs_efd_zone = kmem_zone_init((sizeof(xfs_efd_log_item_t) + | ||
1579 | ((XFS_EFD_MAX_FAST_EXTENTS - 1) * | ||
1580 | sizeof(xfs_extent_t))), "xfs_efd_item"); | ||
1581 | if (!xfs_efd_zone) | ||
1582 | goto out_destroy_buf_item_zone; | ||
1583 | |||
1584 | xfs_efi_zone = kmem_zone_init((sizeof(xfs_efi_log_item_t) + | ||
1585 | ((XFS_EFI_MAX_FAST_EXTENTS - 1) * | ||
1586 | sizeof(xfs_extent_t))), "xfs_efi_item"); | ||
1587 | if (!xfs_efi_zone) | ||
1588 | goto out_destroy_efd_zone; | ||
1589 | |||
1590 | xfs_inode_zone = | ||
1591 | kmem_zone_init_flags(sizeof(xfs_inode_t), "xfs_inode", | ||
1592 | KM_ZONE_HWALIGN | KM_ZONE_RECLAIM | KM_ZONE_SPREAD, | ||
1593 | xfs_fs_inode_init_once); | ||
1594 | if (!xfs_inode_zone) | ||
1595 | goto out_destroy_efi_zone; | ||
1596 | |||
1597 | xfs_ili_zone = | ||
1598 | kmem_zone_init_flags(sizeof(xfs_inode_log_item_t), "xfs_ili", | ||
1599 | KM_ZONE_SPREAD, NULL); | ||
1600 | if (!xfs_ili_zone) | ||
1601 | goto out_destroy_inode_zone; | ||
1602 | |||
1603 | return 0; | ||
1604 | |||
1605 | out_destroy_inode_zone: | ||
1606 | kmem_zone_destroy(xfs_inode_zone); | ||
1607 | out_destroy_efi_zone: | ||
1608 | kmem_zone_destroy(xfs_efi_zone); | ||
1609 | out_destroy_efd_zone: | ||
1610 | kmem_zone_destroy(xfs_efd_zone); | ||
1611 | out_destroy_buf_item_zone: | ||
1612 | kmem_zone_destroy(xfs_buf_item_zone); | ||
1613 | out_destroy_log_item_desc_zone: | ||
1614 | kmem_zone_destroy(xfs_log_item_desc_zone); | ||
1615 | out_destroy_trans_zone: | ||
1616 | kmem_zone_destroy(xfs_trans_zone); | ||
1617 | out_destroy_ifork_zone: | ||
1618 | kmem_zone_destroy(xfs_ifork_zone); | ||
1619 | out_destroy_dabuf_zone: | ||
1620 | kmem_zone_destroy(xfs_dabuf_zone); | ||
1621 | out_destroy_da_state_zone: | ||
1622 | kmem_zone_destroy(xfs_da_state_zone); | ||
1623 | out_destroy_btree_cur_zone: | ||
1624 | kmem_zone_destroy(xfs_btree_cur_zone); | ||
1625 | out_destroy_bmap_free_item_zone: | ||
1626 | kmem_zone_destroy(xfs_bmap_free_item_zone); | ||
1627 | out_destroy_log_ticket_zone: | ||
1628 | kmem_zone_destroy(xfs_log_ticket_zone); | ||
1629 | out_destroy_ioend_pool: | ||
1630 | mempool_destroy(xfs_ioend_pool); | ||
1631 | out_destroy_ioend_zone: | ||
1632 | kmem_zone_destroy(xfs_ioend_zone); | ||
1633 | out: | ||
1634 | return -ENOMEM; | ||
1635 | } | ||
1636 | |||
1637 | STATIC void | ||
1638 | xfs_destroy_zones(void) | ||
1639 | { | ||
1640 | kmem_zone_destroy(xfs_ili_zone); | ||
1641 | kmem_zone_destroy(xfs_inode_zone); | ||
1642 | kmem_zone_destroy(xfs_efi_zone); | ||
1643 | kmem_zone_destroy(xfs_efd_zone); | ||
1644 | kmem_zone_destroy(xfs_buf_item_zone); | ||
1645 | kmem_zone_destroy(xfs_log_item_desc_zone); | ||
1646 | kmem_zone_destroy(xfs_trans_zone); | ||
1647 | kmem_zone_destroy(xfs_ifork_zone); | ||
1648 | kmem_zone_destroy(xfs_dabuf_zone); | ||
1649 | kmem_zone_destroy(xfs_da_state_zone); | ||
1650 | kmem_zone_destroy(xfs_btree_cur_zone); | ||
1651 | kmem_zone_destroy(xfs_bmap_free_item_zone); | ||
1652 | kmem_zone_destroy(xfs_log_ticket_zone); | ||
1653 | mempool_destroy(xfs_ioend_pool); | ||
1654 | kmem_zone_destroy(xfs_ioend_zone); | ||
1655 | |||
1656 | } | ||
1657 | |||
1658 | STATIC int __init | ||
1659 | xfs_init_workqueues(void) | ||
1660 | { | ||
1661 | /* | ||
1662 | * max_active is set to 8 to give enough concurency to allow | ||
1663 | * multiple work operations on each CPU to run. This allows multiple | ||
1664 | * filesystems to be running sync work concurrently, and scales with | ||
1665 | * the number of CPUs in the system. | ||
1666 | */ | ||
1667 | xfs_syncd_wq = alloc_workqueue("xfssyncd", WQ_CPU_INTENSIVE, 8); | ||
1668 | if (!xfs_syncd_wq) | ||
1669 | goto out; | ||
1670 | |||
1671 | xfs_ail_wq = alloc_workqueue("xfsail", WQ_CPU_INTENSIVE, 8); | ||
1672 | if (!xfs_ail_wq) | ||
1673 | goto out_destroy_syncd; | ||
1674 | |||
1675 | return 0; | ||
1676 | |||
1677 | out_destroy_syncd: | ||
1678 | destroy_workqueue(xfs_syncd_wq); | ||
1679 | out: | ||
1680 | return -ENOMEM; | ||
1681 | } | ||
1682 | |||
1683 | STATIC void | ||
1684 | xfs_destroy_workqueues(void) | ||
1685 | { | ||
1686 | destroy_workqueue(xfs_ail_wq); | ||
1687 | destroy_workqueue(xfs_syncd_wq); | ||
1688 | } | ||
1689 | |||
1690 | STATIC int __init | ||
1691 | init_xfs_fs(void) | ||
1692 | { | ||
1693 | int error; | ||
1694 | |||
1695 | printk(KERN_INFO XFS_VERSION_STRING " with " | ||
1696 | XFS_BUILD_OPTIONS " enabled\n"); | ||
1697 | |||
1698 | xfs_ioend_init(); | ||
1699 | xfs_dir_startup(); | ||
1700 | |||
1701 | error = xfs_init_zones(); | ||
1702 | if (error) | ||
1703 | goto out; | ||
1704 | |||
1705 | error = xfs_init_workqueues(); | ||
1706 | if (error) | ||
1707 | goto out_destroy_zones; | ||
1708 | |||
1709 | error = xfs_mru_cache_init(); | ||
1710 | if (error) | ||
1711 | goto out_destroy_wq; | ||
1712 | |||
1713 | error = xfs_filestream_init(); | ||
1714 | if (error) | ||
1715 | goto out_mru_cache_uninit; | ||
1716 | |||
1717 | error = xfs_buf_init(); | ||
1718 | if (error) | ||
1719 | goto out_filestream_uninit; | ||
1720 | |||
1721 | error = xfs_init_procfs(); | ||
1722 | if (error) | ||
1723 | goto out_buf_terminate; | ||
1724 | |||
1725 | error = xfs_sysctl_register(); | ||
1726 | if (error) | ||
1727 | goto out_cleanup_procfs; | ||
1728 | |||
1729 | vfs_initquota(); | ||
1730 | |||
1731 | error = register_filesystem(&xfs_fs_type); | ||
1732 | if (error) | ||
1733 | goto out_sysctl_unregister; | ||
1734 | return 0; | ||
1735 | |||
1736 | out_sysctl_unregister: | ||
1737 | xfs_sysctl_unregister(); | ||
1738 | out_cleanup_procfs: | ||
1739 | xfs_cleanup_procfs(); | ||
1740 | out_buf_terminate: | ||
1741 | xfs_buf_terminate(); | ||
1742 | out_filestream_uninit: | ||
1743 | xfs_filestream_uninit(); | ||
1744 | out_mru_cache_uninit: | ||
1745 | xfs_mru_cache_uninit(); | ||
1746 | out_destroy_wq: | ||
1747 | xfs_destroy_workqueues(); | ||
1748 | out_destroy_zones: | ||
1749 | xfs_destroy_zones(); | ||
1750 | out: | ||
1751 | return error; | ||
1752 | } | ||
1753 | |||
1754 | STATIC void __exit | ||
1755 | exit_xfs_fs(void) | ||
1756 | { | ||
1757 | vfs_exitquota(); | ||
1758 | unregister_filesystem(&xfs_fs_type); | ||
1759 | xfs_sysctl_unregister(); | ||
1760 | xfs_cleanup_procfs(); | ||
1761 | xfs_buf_terminate(); | ||
1762 | xfs_filestream_uninit(); | ||
1763 | xfs_mru_cache_uninit(); | ||
1764 | xfs_destroy_workqueues(); | ||
1765 | xfs_destroy_zones(); | ||
1766 | } | ||
1767 | |||
1768 | module_init(init_xfs_fs); | ||
1769 | module_exit(exit_xfs_fs); | ||
1770 | |||
1771 | MODULE_AUTHOR("Silicon Graphics, Inc."); | ||
1772 | MODULE_DESCRIPTION(XFS_VERSION_STRING " with " XFS_BUILD_OPTIONS " enabled"); | ||
1773 | MODULE_LICENSE("GPL"); | ||