]> bbs.cooldavid.org Git - net-next-2.6.git/blame - fs/xfs/linux-2.6/xfs_super.c
[XFS] use generic_permission
[net-next-2.6.git] / fs / xfs / linux-2.6 / xfs_super.c
CommitLineData
1da177e4 1/*
a805bad5 2 * Copyright (c) 2000-2006 Silicon Graphics, Inc.
7b718769 3 * All Rights Reserved.
1da177e4 4 *
7b718769
NS
5 * This program is free software; you can redistribute it and/or
6 * modify it under the terms of the GNU General Public License as
1da177e4
LT
7 * published by the Free Software Foundation.
8 *
7b718769
NS
9 * This program is distributed in the hope that it would be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 * GNU General Public License for more details.
1da177e4 13 *
7b718769
NS
14 * You should have received a copy of the GNU General Public License
15 * along with this program; if not, write the Free Software Foundation,
16 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
1da177e4 17 */
1da177e4 18#include "xfs.h"
a844f451 19#include "xfs_bit.h"
1da177e4
LT
20#include "xfs_log.h"
21#include "xfs_clnt.h"
a844f451 22#include "xfs_inum.h"
1da177e4
LT
23#include "xfs_trans.h"
24#include "xfs_sb.h"
a844f451 25#include "xfs_ag.h"
1da177e4
LT
26#include "xfs_dir2.h"
27#include "xfs_alloc.h"
28#include "xfs_dmapi.h"
29#include "xfs_quota.h"
30#include "xfs_mount.h"
1da177e4 31#include "xfs_bmap_btree.h"
a844f451 32#include "xfs_alloc_btree.h"
1da177e4 33#include "xfs_ialloc_btree.h"
1da177e4 34#include "xfs_dir2_sf.h"
a844f451 35#include "xfs_attr_sf.h"
1da177e4
LT
36#include "xfs_dinode.h"
37#include "xfs_inode.h"
a844f451
NS
38#include "xfs_btree.h"
39#include "xfs_ialloc.h"
1da177e4 40#include "xfs_bmap.h"
1da177e4
LT
41#include "xfs_rtalloc.h"
42#include "xfs_error.h"
43#include "xfs_itable.h"
9909c4aa 44#include "xfs_fsops.h"
1da177e4
LT
45#include "xfs_rw.h"
46#include "xfs_acl.h"
1da177e4
LT
47#include "xfs_attr.h"
48#include "xfs_buf_item.h"
49#include "xfs_utils.h"
739bfb2a 50#include "xfs_vnodeops.h"
745f6919 51#include "xfs_vfsops.h"
1da177e4 52#include "xfs_version.h"
a67d7c5f 53#include "xfs_log_priv.h"
1da177e4
LT
54
55#include <linux/namei.h>
56#include <linux/init.h>
57#include <linux/mount.h>
0829c360 58#include <linux/mempool.h>
1da177e4 59#include <linux/writeback.h>
4df08c52 60#include <linux/kthread.h>
7dfb7103 61#include <linux/freezer.h>
1da177e4 62
7989cb8e
DC
63static struct quotactl_ops xfs_quotactl_operations;
64static struct super_operations xfs_super_operations;
65static kmem_zone_t *xfs_vnode_zone;
66static kmem_zone_t *xfs_ioend_zone;
0829c360 67mempool_t *xfs_ioend_pool;
1da177e4
LT
68
69STATIC struct xfs_mount_args *
70xfs_args_allocate(
764d1f89
NS
71 struct super_block *sb,
72 int silent)
1da177e4
LT
73{
74 struct xfs_mount_args *args;
75
76 args = kmem_zalloc(sizeof(struct xfs_mount_args), KM_SLEEP);
77 args->logbufs = args->logbufsize = -1;
78 strncpy(args->fsname, sb->s_id, MAXNAMELEN);
79
80 /* Copy the already-parsed mount(2) flags we're interested in */
1da177e4
LT
81 if (sb->s_flags & MS_DIRSYNC)
82 args->flags |= XFSMNT_DIRSYNC;
83 if (sb->s_flags & MS_SYNCHRONOUS)
84 args->flags |= XFSMNT_WSYNC;
764d1f89
NS
85 if (silent)
86 args->flags |= XFSMNT_QUIET;
1da177e4
LT
87 args->flags |= XFSMNT_32BITINODES;
88
89 return args;
90}
91
a67d7c5f
DC
92#define MNTOPT_LOGBUFS "logbufs" /* number of XFS log buffers */
93#define MNTOPT_LOGBSIZE "logbsize" /* size of XFS log buffers */
94#define MNTOPT_LOGDEV "logdev" /* log device */
95#define MNTOPT_RTDEV "rtdev" /* realtime I/O device */
96#define MNTOPT_BIOSIZE "biosize" /* log2 of preferred buffered io size */
97#define MNTOPT_WSYNC "wsync" /* safe-mode nfs compatible mount */
98#define MNTOPT_INO64 "ino64" /* force inodes into 64-bit range */
99#define MNTOPT_NOALIGN "noalign" /* turn off stripe alignment */
100#define MNTOPT_SWALLOC "swalloc" /* turn on stripe width allocation */
101#define MNTOPT_SUNIT "sunit" /* data volume stripe unit */
102#define MNTOPT_SWIDTH "swidth" /* data volume stripe width */
103#define MNTOPT_NOUUID "nouuid" /* ignore filesystem UUID */
104#define MNTOPT_MTPT "mtpt" /* filesystem mount point */
105#define MNTOPT_GRPID "grpid" /* group-ID from parent directory */
106#define MNTOPT_NOGRPID "nogrpid" /* group-ID from current process */
107#define MNTOPT_BSDGROUPS "bsdgroups" /* group-ID from parent directory */
108#define MNTOPT_SYSVGROUPS "sysvgroups" /* group-ID from current process */
109#define MNTOPT_ALLOCSIZE "allocsize" /* preferred allocation size */
110#define MNTOPT_NORECOVERY "norecovery" /* don't run XFS recovery */
111#define MNTOPT_BARRIER "barrier" /* use writer barriers for log write and
112 * unwritten extent conversion */
113#define MNTOPT_NOBARRIER "nobarrier" /* .. disable */
114#define MNTOPT_OSYNCISOSYNC "osyncisosync" /* o_sync is REALLY o_sync */
115#define MNTOPT_64BITINODE "inode64" /* inodes can be allocated anywhere */
116#define MNTOPT_IKEEP "ikeep" /* do not free empty inode clusters */
117#define MNTOPT_NOIKEEP "noikeep" /* free empty inode clusters */
118#define MNTOPT_LARGEIO "largeio" /* report large I/O sizes in stat() */
119#define MNTOPT_NOLARGEIO "nolargeio" /* do not report large I/O sizes
120 * in stat(). */
121#define MNTOPT_ATTR2 "attr2" /* do use attr2 attribute format */
122#define MNTOPT_NOATTR2 "noattr2" /* do not use attr2 attribute format */
123#define MNTOPT_FILESTREAM "filestreams" /* use filestreams allocator */
124#define MNTOPT_QUOTA "quota" /* disk quotas (user) */
125#define MNTOPT_NOQUOTA "noquota" /* no quotas */
126#define MNTOPT_USRQUOTA "usrquota" /* user quota enabled */
127#define MNTOPT_GRPQUOTA "grpquota" /* group quota enabled */
128#define MNTOPT_PRJQUOTA "prjquota" /* project quota enabled */
129#define MNTOPT_UQUOTA "uquota" /* user quota (IRIX variant) */
130#define MNTOPT_GQUOTA "gquota" /* group quota (IRIX variant) */
131#define MNTOPT_PQUOTA "pquota" /* project quota (IRIX variant) */
132#define MNTOPT_UQUOTANOENF "uqnoenforce"/* user quota limit enforcement */
133#define MNTOPT_GQUOTANOENF "gqnoenforce"/* group quota limit enforcement */
134#define MNTOPT_PQUOTANOENF "pqnoenforce"/* project quota limit enforcement */
135#define MNTOPT_QUOTANOENF "qnoenforce" /* same as uqnoenforce */
136#define MNTOPT_DMAPI "dmapi" /* DMI enabled (DMAPI / XDSM) */
137#define MNTOPT_XDSM "xdsm" /* DMI enabled (DMAPI / XDSM) */
138#define MNTOPT_DMI "dmi" /* DMI enabled (DMAPI / XDSM) */
139
140STATIC unsigned long
141suffix_strtoul(char *s, char **endp, unsigned int base)
142{
143 int last, shift_left_factor = 0;
144 char *value = s;
145
146 last = strlen(value) - 1;
147 if (value[last] == 'K' || value[last] == 'k') {
148 shift_left_factor = 10;
149 value[last] = '\0';
150 }
151 if (value[last] == 'M' || value[last] == 'm') {
152 shift_left_factor = 20;
153 value[last] = '\0';
154 }
155 if (value[last] == 'G' || value[last] == 'g') {
156 shift_left_factor = 30;
157 value[last] = '\0';
158 }
159
160 return simple_strtoul((const char *)s, endp, base) << shift_left_factor;
161}
162
163STATIC int
164xfs_parseargs(
165 struct xfs_mount *mp,
166 char *options,
167 struct xfs_mount_args *args,
168 int update)
169{
170 char *this_char, *value, *eov;
171 int dsunit, dswidth, vol_dsunit, vol_dswidth;
172 int iosize;
173 int ikeep = 0;
174
175 args->flags |= XFSMNT_BARRIER;
176 args->flags2 |= XFSMNT2_COMPAT_IOSIZE;
177
178 if (!options)
179 goto done;
180
181 iosize = dsunit = dswidth = vol_dsunit = vol_dswidth = 0;
182
183 while ((this_char = strsep(&options, ",")) != NULL) {
184 if (!*this_char)
185 continue;
186 if ((value = strchr(this_char, '=')) != NULL)
187 *value++ = 0;
188
189 if (!strcmp(this_char, MNTOPT_LOGBUFS)) {
190 if (!value || !*value) {
191 cmn_err(CE_WARN,
192 "XFS: %s option requires an argument",
193 this_char);
194 return EINVAL;
195 }
196 args->logbufs = simple_strtoul(value, &eov, 10);
197 } else if (!strcmp(this_char, MNTOPT_LOGBSIZE)) {
198 if (!value || !*value) {
199 cmn_err(CE_WARN,
200 "XFS: %s option requires an argument",
201 this_char);
202 return EINVAL;
203 }
204 args->logbufsize = suffix_strtoul(value, &eov, 10);
205 } else if (!strcmp(this_char, MNTOPT_LOGDEV)) {
206 if (!value || !*value) {
207 cmn_err(CE_WARN,
208 "XFS: %s option requires an argument",
209 this_char);
210 return EINVAL;
211 }
212 strncpy(args->logname, value, MAXNAMELEN);
213 } else if (!strcmp(this_char, MNTOPT_MTPT)) {
214 if (!value || !*value) {
215 cmn_err(CE_WARN,
216 "XFS: %s option requires an argument",
217 this_char);
218 return EINVAL;
219 }
220 strncpy(args->mtpt, value, MAXNAMELEN);
221 } else if (!strcmp(this_char, MNTOPT_RTDEV)) {
222 if (!value || !*value) {
223 cmn_err(CE_WARN,
224 "XFS: %s option requires an argument",
225 this_char);
226 return EINVAL;
227 }
228 strncpy(args->rtname, value, MAXNAMELEN);
229 } else if (!strcmp(this_char, MNTOPT_BIOSIZE)) {
230 if (!value || !*value) {
231 cmn_err(CE_WARN,
232 "XFS: %s option requires an argument",
233 this_char);
234 return EINVAL;
235 }
236 iosize = simple_strtoul(value, &eov, 10);
237 args->flags |= XFSMNT_IOSIZE;
238 args->iosizelog = (uint8_t) iosize;
239 } else if (!strcmp(this_char, MNTOPT_ALLOCSIZE)) {
240 if (!value || !*value) {
241 cmn_err(CE_WARN,
242 "XFS: %s option requires an argument",
243 this_char);
244 return EINVAL;
245 }
246 iosize = suffix_strtoul(value, &eov, 10);
247 args->flags |= XFSMNT_IOSIZE;
248 args->iosizelog = ffs(iosize) - 1;
249 } else if (!strcmp(this_char, MNTOPT_GRPID) ||
250 !strcmp(this_char, MNTOPT_BSDGROUPS)) {
251 mp->m_flags |= XFS_MOUNT_GRPID;
252 } else if (!strcmp(this_char, MNTOPT_NOGRPID) ||
253 !strcmp(this_char, MNTOPT_SYSVGROUPS)) {
254 mp->m_flags &= ~XFS_MOUNT_GRPID;
255 } else if (!strcmp(this_char, MNTOPT_WSYNC)) {
256 args->flags |= XFSMNT_WSYNC;
257 } else if (!strcmp(this_char, MNTOPT_OSYNCISOSYNC)) {
258 args->flags |= XFSMNT_OSYNCISOSYNC;
259 } else if (!strcmp(this_char, MNTOPT_NORECOVERY)) {
260 args->flags |= XFSMNT_NORECOVERY;
261 } else if (!strcmp(this_char, MNTOPT_INO64)) {
262 args->flags |= XFSMNT_INO64;
263#if !XFS_BIG_INUMS
264 cmn_err(CE_WARN,
265 "XFS: %s option not allowed on this system",
266 this_char);
267 return EINVAL;
268#endif
269 } else if (!strcmp(this_char, MNTOPT_NOALIGN)) {
270 args->flags |= XFSMNT_NOALIGN;
271 } else if (!strcmp(this_char, MNTOPT_SWALLOC)) {
272 args->flags |= XFSMNT_SWALLOC;
273 } else if (!strcmp(this_char, MNTOPT_SUNIT)) {
274 if (!value || !*value) {
275 cmn_err(CE_WARN,
276 "XFS: %s option requires an argument",
277 this_char);
278 return EINVAL;
279 }
280 dsunit = simple_strtoul(value, &eov, 10);
281 } else if (!strcmp(this_char, MNTOPT_SWIDTH)) {
282 if (!value || !*value) {
283 cmn_err(CE_WARN,
284 "XFS: %s option requires an argument",
285 this_char);
286 return EINVAL;
287 }
288 dswidth = simple_strtoul(value, &eov, 10);
289 } else if (!strcmp(this_char, MNTOPT_64BITINODE)) {
290 args->flags &= ~XFSMNT_32BITINODES;
291#if !XFS_BIG_INUMS
292 cmn_err(CE_WARN,
293 "XFS: %s option not allowed on this system",
294 this_char);
295 return EINVAL;
296#endif
297 } else if (!strcmp(this_char, MNTOPT_NOUUID)) {
298 args->flags |= XFSMNT_NOUUID;
299 } else if (!strcmp(this_char, MNTOPT_BARRIER)) {
300 args->flags |= XFSMNT_BARRIER;
301 } else if (!strcmp(this_char, MNTOPT_NOBARRIER)) {
302 args->flags &= ~XFSMNT_BARRIER;
303 } else if (!strcmp(this_char, MNTOPT_IKEEP)) {
304 ikeep = 1;
305 args->flags &= ~XFSMNT_IDELETE;
306 } else if (!strcmp(this_char, MNTOPT_NOIKEEP)) {
307 args->flags |= XFSMNT_IDELETE;
308 } else if (!strcmp(this_char, MNTOPT_LARGEIO)) {
309 args->flags2 &= ~XFSMNT2_COMPAT_IOSIZE;
310 } else if (!strcmp(this_char, MNTOPT_NOLARGEIO)) {
311 args->flags2 |= XFSMNT2_COMPAT_IOSIZE;
312 } else if (!strcmp(this_char, MNTOPT_ATTR2)) {
313 args->flags |= XFSMNT_ATTR2;
314 } else if (!strcmp(this_char, MNTOPT_NOATTR2)) {
315 args->flags &= ~XFSMNT_ATTR2;
316 } else if (!strcmp(this_char, MNTOPT_FILESTREAM)) {
317 args->flags2 |= XFSMNT2_FILESTREAMS;
318 } else if (!strcmp(this_char, MNTOPT_NOQUOTA)) {
319 args->flags &= ~(XFSMNT_UQUOTAENF|XFSMNT_UQUOTA);
320 args->flags &= ~(XFSMNT_GQUOTAENF|XFSMNT_GQUOTA);
321 } else if (!strcmp(this_char, MNTOPT_QUOTA) ||
322 !strcmp(this_char, MNTOPT_UQUOTA) ||
323 !strcmp(this_char, MNTOPT_USRQUOTA)) {
324 args->flags |= XFSMNT_UQUOTA | XFSMNT_UQUOTAENF;
325 } else if (!strcmp(this_char, MNTOPT_QUOTANOENF) ||
326 !strcmp(this_char, MNTOPT_UQUOTANOENF)) {
327 args->flags |= XFSMNT_UQUOTA;
328 args->flags &= ~XFSMNT_UQUOTAENF;
329 } else if (!strcmp(this_char, MNTOPT_PQUOTA) ||
330 !strcmp(this_char, MNTOPT_PRJQUOTA)) {
331 args->flags |= XFSMNT_PQUOTA | XFSMNT_PQUOTAENF;
332 } else if (!strcmp(this_char, MNTOPT_PQUOTANOENF)) {
333 args->flags |= XFSMNT_PQUOTA;
334 args->flags &= ~XFSMNT_PQUOTAENF;
335 } else if (!strcmp(this_char, MNTOPT_GQUOTA) ||
336 !strcmp(this_char, MNTOPT_GRPQUOTA)) {
337 args->flags |= XFSMNT_GQUOTA | XFSMNT_GQUOTAENF;
338 } else if (!strcmp(this_char, MNTOPT_GQUOTANOENF)) {
339 args->flags |= XFSMNT_GQUOTA;
340 args->flags &= ~XFSMNT_GQUOTAENF;
341 } else if (!strcmp(this_char, MNTOPT_DMAPI)) {
342 args->flags |= XFSMNT_DMAPI;
343 } else if (!strcmp(this_char, MNTOPT_XDSM)) {
344 args->flags |= XFSMNT_DMAPI;
345 } else if (!strcmp(this_char, MNTOPT_DMI)) {
346 args->flags |= XFSMNT_DMAPI;
347 } else if (!strcmp(this_char, "ihashsize")) {
348 cmn_err(CE_WARN,
349 "XFS: ihashsize no longer used, option is deprecated.");
350 } else if (!strcmp(this_char, "osyncisdsync")) {
351 /* no-op, this is now the default */
352 cmn_err(CE_WARN,
353 "XFS: osyncisdsync is now the default, option is deprecated.");
354 } else if (!strcmp(this_char, "irixsgid")) {
355 cmn_err(CE_WARN,
356 "XFS: irixsgid is now a sysctl(2) variable, option is deprecated.");
357 } else {
358 cmn_err(CE_WARN,
359 "XFS: unknown mount option [%s].", this_char);
360 return EINVAL;
361 }
362 }
363
364 if (args->flags & XFSMNT_NORECOVERY) {
365 if ((mp->m_flags & XFS_MOUNT_RDONLY) == 0) {
366 cmn_err(CE_WARN,
367 "XFS: no-recovery mounts must be read-only.");
368 return EINVAL;
369 }
370 }
371
372 if ((args->flags & XFSMNT_NOALIGN) && (dsunit || dswidth)) {
373 cmn_err(CE_WARN,
374 "XFS: sunit and swidth options incompatible with the noalign option");
375 return EINVAL;
376 }
377
378 if ((args->flags & XFSMNT_GQUOTA) && (args->flags & XFSMNT_PQUOTA)) {
379 cmn_err(CE_WARN,
380 "XFS: cannot mount with both project and group quota");
381 return EINVAL;
382 }
383
384 if ((args->flags & XFSMNT_DMAPI) && *args->mtpt == '\0') {
385 printk("XFS: %s option needs the mount point option as well\n",
386 MNTOPT_DMAPI);
387 return EINVAL;
388 }
389
390 if ((dsunit && !dswidth) || (!dsunit && dswidth)) {
391 cmn_err(CE_WARN,
392 "XFS: sunit and swidth must be specified together");
393 return EINVAL;
394 }
395
396 if (dsunit && (dswidth % dsunit != 0)) {
397 cmn_err(CE_WARN,
398 "XFS: stripe width (%d) must be a multiple of the stripe unit (%d)",
399 dswidth, dsunit);
400 return EINVAL;
401 }
402
403 /*
404 * Applications using DMI filesystems often expect the
405 * inode generation number to be monotonically increasing.
406 * If we delete inode chunks we break this assumption, so
407 * keep unused inode chunks on disk for DMI filesystems
408 * until we come up with a better solution.
409 * Note that if "ikeep" or "noikeep" mount options are
410 * supplied, then they are honored.
411 */
412 if (!(args->flags & XFSMNT_DMAPI) && !ikeep)
413 args->flags |= XFSMNT_IDELETE;
414
415 if ((args->flags & XFSMNT_NOALIGN) != XFSMNT_NOALIGN) {
416 if (dsunit) {
417 args->sunit = dsunit;
418 args->flags |= XFSMNT_RETERR;
419 } else {
420 args->sunit = vol_dsunit;
421 }
422 dswidth ? (args->swidth = dswidth) :
423 (args->swidth = vol_dswidth);
424 } else {
425 args->sunit = args->swidth = 0;
426 }
427
428done:
429 if (args->flags & XFSMNT_32BITINODES)
430 mp->m_flags |= XFS_MOUNT_SMALL_INUMS;
431 if (args->flags2)
432 args->flags |= XFSMNT_FLAGS2;
433 return 0;
434}
435
436struct proc_xfs_info {
437 int flag;
438 char *str;
439};
440
441STATIC int
442xfs_showargs(
443 struct xfs_mount *mp,
444 struct seq_file *m)
445{
446 static struct proc_xfs_info xfs_info_set[] = {
447 /* the few simple ones we can get from the mount struct */
448 { XFS_MOUNT_WSYNC, "," MNTOPT_WSYNC },
449 { XFS_MOUNT_INO64, "," MNTOPT_INO64 },
450 { XFS_MOUNT_NOALIGN, "," MNTOPT_NOALIGN },
451 { XFS_MOUNT_SWALLOC, "," MNTOPT_SWALLOC },
452 { XFS_MOUNT_NOUUID, "," MNTOPT_NOUUID },
453 { XFS_MOUNT_NORECOVERY, "," MNTOPT_NORECOVERY },
454 { XFS_MOUNT_OSYNCISOSYNC, "," MNTOPT_OSYNCISOSYNC },
455 { XFS_MOUNT_ATTR2, "," MNTOPT_ATTR2 },
456 { XFS_MOUNT_FILESTREAMS, "," MNTOPT_FILESTREAM },
457 { XFS_MOUNT_DMAPI, "," MNTOPT_DMAPI },
458 { XFS_MOUNT_GRPID, "," MNTOPT_GRPID },
459 { 0, NULL }
460 };
461 static struct proc_xfs_info xfs_info_unset[] = {
462 /* the few simple ones we can get from the mount struct */
463 { XFS_MOUNT_IDELETE, "," MNTOPT_IKEEP },
464 { XFS_MOUNT_COMPAT_IOSIZE, "," MNTOPT_LARGEIO },
465 { XFS_MOUNT_BARRIER, "," MNTOPT_NOBARRIER },
466 { XFS_MOUNT_SMALL_INUMS, "," MNTOPT_64BITINODE },
467 { 0, NULL }
468 };
469 struct proc_xfs_info *xfs_infop;
470
471 for (xfs_infop = xfs_info_set; xfs_infop->flag; xfs_infop++) {
472 if (mp->m_flags & xfs_infop->flag)
473 seq_puts(m, xfs_infop->str);
474 }
475 for (xfs_infop = xfs_info_unset; xfs_infop->flag; xfs_infop++) {
476 if (!(mp->m_flags & xfs_infop->flag))
477 seq_puts(m, xfs_infop->str);
478 }
479
480 if (mp->m_flags & XFS_MOUNT_DFLT_IOSIZE)
481 seq_printf(m, "," MNTOPT_ALLOCSIZE "=%dk",
482 (int)(1 << mp->m_writeio_log) >> 10);
483
484 if (mp->m_logbufs > 0)
485 seq_printf(m, "," MNTOPT_LOGBUFS "=%d", mp->m_logbufs);
486 if (mp->m_logbsize > 0)
487 seq_printf(m, "," MNTOPT_LOGBSIZE "=%dk", mp->m_logbsize >> 10);
488
489 if (mp->m_logname)
490 seq_printf(m, "," MNTOPT_LOGDEV "=%s", mp->m_logname);
491 if (mp->m_rtname)
492 seq_printf(m, "," MNTOPT_RTDEV "=%s", mp->m_rtname);
493
494 if (mp->m_dalign > 0)
495 seq_printf(m, "," MNTOPT_SUNIT "=%d",
496 (int)XFS_FSB_TO_BB(mp, mp->m_dalign));
497 if (mp->m_swidth > 0)
498 seq_printf(m, "," MNTOPT_SWIDTH "=%d",
499 (int)XFS_FSB_TO_BB(mp, mp->m_swidth));
500
501 if (mp->m_qflags & (XFS_UQUOTA_ACCT|XFS_UQUOTA_ENFD))
502 seq_puts(m, "," MNTOPT_USRQUOTA);
503 else if (mp->m_qflags & XFS_UQUOTA_ACCT)
504 seq_puts(m, "," MNTOPT_UQUOTANOENF);
505
506 if (mp->m_qflags & (XFS_PQUOTA_ACCT|XFS_OQUOTA_ENFD))
507 seq_puts(m, "," MNTOPT_PRJQUOTA);
508 else if (mp->m_qflags & XFS_PQUOTA_ACCT)
509 seq_puts(m, "," MNTOPT_PQUOTANOENF);
510
511 if (mp->m_qflags & (XFS_GQUOTA_ACCT|XFS_OQUOTA_ENFD))
512 seq_puts(m, "," MNTOPT_GRPQUOTA);
513 else if (mp->m_qflags & XFS_GQUOTA_ACCT)
514 seq_puts(m, "," MNTOPT_GQUOTANOENF);
515
516 if (!(mp->m_qflags & XFS_ALL_QUOTA_ACCT))
517 seq_puts(m, "," MNTOPT_NOQUOTA);
518
519 return 0;
520}
1da177e4
LT
521__uint64_t
522xfs_max_file_offset(
523 unsigned int blockshift)
524{
525 unsigned int pagefactor = 1;
526 unsigned int bitshift = BITS_PER_LONG - 1;
527
528 /* Figure out maximum filesize, on Linux this can depend on
529 * the filesystem blocksize (on 32 bit platforms).
530 * __block_prepare_write does this in an [unsigned] long...
531 * page->index << (PAGE_CACHE_SHIFT - bbits)
532 * So, for page sized blocks (4K on 32 bit platforms),
533 * this wraps at around 8Tb (hence MAX_LFS_FILESIZE which is
534 * (((u64)PAGE_CACHE_SIZE << (BITS_PER_LONG-1))-1)
535 * but for smaller blocksizes it is less (bbits = log2 bsize).
536 * Note1: get_block_t takes a long (implicit cast from above)
537 * Note2: The Large Block Device (LBD and HAVE_SECTOR_T) patch
538 * can optionally convert the [unsigned] long from above into
539 * an [unsigned] long long.
540 */
541
542#if BITS_PER_LONG == 32
543# if defined(CONFIG_LBD)
544 ASSERT(sizeof(sector_t) == 8);
545 pagefactor = PAGE_CACHE_SIZE;
546 bitshift = BITS_PER_LONG;
547# else
548 pagefactor = PAGE_CACHE_SIZE >> (PAGE_CACHE_SHIFT - blockshift);
549# endif
550#endif
551
552 return (((__uint64_t)pagefactor) << bitshift) - 1;
553}
554
7989cb8e 555STATIC_INLINE void
1da177e4
LT
556xfs_set_inodeops(
557 struct inode *inode)
558{
0432dab2
CH
559 switch (inode->i_mode & S_IFMT) {
560 case S_IFREG:
416c6d5b 561 inode->i_op = &xfs_inode_operations;
3562fd45 562 inode->i_fop = &xfs_file_operations;
e4c573bb 563 inode->i_mapping->a_ops = &xfs_address_space_operations;
0432dab2
CH
564 break;
565 case S_IFDIR:
416c6d5b 566 inode->i_op = &xfs_dir_inode_operations;
3562fd45 567 inode->i_fop = &xfs_dir_file_operations;
0432dab2
CH
568 break;
569 case S_IFLNK:
416c6d5b 570 inode->i_op = &xfs_symlink_inode_operations;
1da177e4 571 if (inode->i_blocks)
e4c573bb 572 inode->i_mapping->a_ops = &xfs_address_space_operations;
0432dab2
CH
573 break;
574 default:
416c6d5b 575 inode->i_op = &xfs_inode_operations;
1da177e4 576 init_special_inode(inode, inode->i_mode, inode->i_rdev);
0432dab2 577 break;
1da177e4
LT
578 }
579}
580
7989cb8e 581STATIC_INLINE void
1da177e4
LT
582xfs_revalidate_inode(
583 xfs_mount_t *mp,
67fcaa73 584 bhv_vnode_t *vp,
1da177e4
LT
585 xfs_inode_t *ip)
586{
ec86dc02 587 struct inode *inode = vn_to_inode(vp);
1da177e4 588
0432dab2 589 inode->i_mode = ip->i_d.di_mode;
1da177e4
LT
590 inode->i_nlink = ip->i_d.di_nlink;
591 inode->i_uid = ip->i_d.di_uid;
592 inode->i_gid = ip->i_d.di_gid;
0432dab2
CH
593
594 switch (inode->i_mode & S_IFMT) {
595 case S_IFBLK:
596 case S_IFCHR:
597 inode->i_rdev =
598 MKDEV(sysv_major(ip->i_df.if_u2.if_rdev) & 0x1ff,
599 sysv_minor(ip->i_df.if_u2.if_rdev));
600 break;
601 default:
1da177e4 602 inode->i_rdev = 0;
0432dab2 603 break;
1da177e4 604 }
0432dab2 605
1da177e4
LT
606 inode->i_generation = ip->i_d.di_gen;
607 i_size_write(inode, ip->i_d.di_size);
608 inode->i_blocks =
609 XFS_FSB_TO_BB(mp, ip->i_d.di_nblocks + ip->i_delayed_blks);
610 inode->i_atime.tv_sec = ip->i_d.di_atime.t_sec;
611 inode->i_atime.tv_nsec = ip->i_d.di_atime.t_nsec;
612 inode->i_mtime.tv_sec = ip->i_d.di_mtime.t_sec;
613 inode->i_mtime.tv_nsec = ip->i_d.di_mtime.t_nsec;
614 inode->i_ctime.tv_sec = ip->i_d.di_ctime.t_sec;
615 inode->i_ctime.tv_nsec = ip->i_d.di_ctime.t_nsec;
616 if (ip->i_d.di_flags & XFS_DIFLAG_IMMUTABLE)
617 inode->i_flags |= S_IMMUTABLE;
618 else
619 inode->i_flags &= ~S_IMMUTABLE;
620 if (ip->i_d.di_flags & XFS_DIFLAG_APPEND)
621 inode->i_flags |= S_APPEND;
622 else
623 inode->i_flags &= ~S_APPEND;
624 if (ip->i_d.di_flags & XFS_DIFLAG_SYNC)
625 inode->i_flags |= S_SYNC;
626 else
627 inode->i_flags &= ~S_SYNC;
628 if (ip->i_d.di_flags & XFS_DIFLAG_NOATIME)
629 inode->i_flags |= S_NOATIME;
630 else
631 inode->i_flags &= ~S_NOATIME;
b3aea4ed 632 xfs_iflags_clear(ip, XFS_IMODIFIED);
1da177e4
LT
633}
634
635void
636xfs_initialize_vnode(
48c872a9 637 struct xfs_mount *mp,
67fcaa73 638 bhv_vnode_t *vp,
745f6919 639 struct xfs_inode *ip)
1da177e4 640{
ec86dc02 641 struct inode *inode = vn_to_inode(vp);
1da177e4 642
739bfb2a 643 if (!ip->i_vnode) {
739bfb2a
CH
644 ip->i_vnode = vp;
645 inode->i_private = ip;
1da177e4
LT
646 }
647
648 /*
649 * We need to set the ops vectors, and unlock the inode, but if
650 * we have been called during the new inode create process, it is
651 * too early to fill in the Linux inode. We will get called a
652 * second time once the inode is properly set up, and then we can
653 * finish our work.
654 */
745f6919 655 if (ip->i_d.di_mode != 0 && (inode->i_state & I_NEW)) {
48c872a9 656 xfs_revalidate_inode(mp, vp, ip);
1da177e4 657 xfs_set_inodeops(inode);
ec86dc02 658
7a18c386 659 xfs_iflags_clear(ip, XFS_INEW);
1da177e4
LT
660 barrier();
661
662 unlock_new_inode(inode);
663 }
664}
665
666int
667xfs_blkdev_get(
668 xfs_mount_t *mp,
669 const char *name,
670 struct block_device **bdevp)
671{
672 int error = 0;
673
674 *bdevp = open_bdev_excl(name, 0, mp);
675 if (IS_ERR(*bdevp)) {
676 error = PTR_ERR(*bdevp);
677 printk("XFS: Invalid device [%s], error=%d\n", name, error);
678 }
679
680 return -error;
681}
682
683void
684xfs_blkdev_put(
685 struct block_device *bdev)
686{
687 if (bdev)
688 close_bdev_excl(bdev);
689}
690
f538d4da
CH
691/*
692 * Try to write out the superblock using barriers.
693 */
694STATIC int
695xfs_barrier_test(
696 xfs_mount_t *mp)
697{
698 xfs_buf_t *sbp = xfs_getsb(mp, 0);
699 int error;
700
701 XFS_BUF_UNDONE(sbp);
702 XFS_BUF_UNREAD(sbp);
703 XFS_BUF_UNDELAYWRITE(sbp);
704 XFS_BUF_WRITE(sbp);
705 XFS_BUF_UNASYNC(sbp);
706 XFS_BUF_ORDERED(sbp);
707
708 xfsbdstrat(mp, sbp);
709 error = xfs_iowait(sbp);
710
711 /*
712 * Clear all the flags we set and possible error state in the
713 * buffer. We only did the write to try out whether barriers
714 * worked and shouldn't leave any traces in the superblock
715 * buffer.
716 */
717 XFS_BUF_DONE(sbp);
718 XFS_BUF_ERROR(sbp, 0);
719 XFS_BUF_UNORDERED(sbp);
720
721 xfs_buf_relse(sbp);
722 return error;
723}
724
725void
726xfs_mountfs_check_barriers(xfs_mount_t *mp)
727{
728 int error;
729
730 if (mp->m_logdev_targp != mp->m_ddev_targp) {
731 xfs_fs_cmn_err(CE_NOTE, mp,
732 "Disabling barriers, not supported with external log device");
733 mp->m_flags &= ~XFS_MOUNT_BARRIER;
4ef19ddd 734 return;
f538d4da
CH
735 }
736
ce8e922c 737 if (mp->m_ddev_targp->bt_bdev->bd_disk->queue->ordered ==
f538d4da
CH
738 QUEUE_ORDERED_NONE) {
739 xfs_fs_cmn_err(CE_NOTE, mp,
740 "Disabling barriers, not supported by the underlying device");
741 mp->m_flags &= ~XFS_MOUNT_BARRIER;
4ef19ddd 742 return;
f538d4da
CH
743 }
744
b2ea401b
NS
745 if (xfs_readonly_buftarg(mp->m_ddev_targp)) {
746 xfs_fs_cmn_err(CE_NOTE, mp,
747 "Disabling barriers, underlying device is readonly");
748 mp->m_flags &= ~XFS_MOUNT_BARRIER;
749 return;
750 }
751
f538d4da
CH
752 error = xfs_barrier_test(mp);
753 if (error) {
754 xfs_fs_cmn_err(CE_NOTE, mp,
755 "Disabling barriers, trial barrier write failed");
756 mp->m_flags &= ~XFS_MOUNT_BARRIER;
4ef19ddd 757 return;
f538d4da
CH
758 }
759}
760
761void
762xfs_blkdev_issue_flush(
763 xfs_buftarg_t *buftarg)
764{
ce8e922c 765 blkdev_issue_flush(buftarg->bt_bdev, NULL);
f538d4da 766}
1da177e4
LT
767
768STATIC struct inode *
a50cd269 769xfs_fs_alloc_inode(
1da177e4
LT
770 struct super_block *sb)
771{
67fcaa73 772 bhv_vnode_t *vp;
1da177e4 773
8758280f
NS
774 vp = kmem_zone_alloc(xfs_vnode_zone, KM_SLEEP);
775 if (unlikely(!vp))
1da177e4 776 return NULL;
ec86dc02 777 return vn_to_inode(vp);
1da177e4
LT
778}
779
780STATIC void
a50cd269 781xfs_fs_destroy_inode(
1da177e4
LT
782 struct inode *inode)
783{
ec86dc02 784 kmem_zone_free(xfs_vnode_zone, vn_from_inode(inode));
1da177e4
LT
785}
786
787STATIC void
a50cd269 788xfs_fs_inode_init_once(
8758280f 789 kmem_zone_t *zonep,
4ba9b9d0 790 void *vnode)
1da177e4 791{
a35afb83 792 inode_init_once(vn_to_inode((bhv_vnode_t *)vnode));
1da177e4
LT
793}
794
795STATIC int
8758280f 796xfs_init_zones(void)
1da177e4 797{
67fcaa73 798 xfs_vnode_zone = kmem_zone_init_flags(sizeof(bhv_vnode_t), "xfs_vnode",
e0cc2325
NS
799 KM_ZONE_HWALIGN | KM_ZONE_RECLAIM |
800 KM_ZONE_SPREAD,
a50cd269 801 xfs_fs_inode_init_once);
0829c360
CH
802 if (!xfs_vnode_zone)
803 goto out;
804
805 xfs_ioend_zone = kmem_zone_init(sizeof(xfs_ioend_t), "xfs_ioend");
806 if (!xfs_ioend_zone)
807 goto out_destroy_vnode_zone;
808
93d2341c
MD
809 xfs_ioend_pool = mempool_create_slab_pool(4 * MAX_BUF_PER_PAGE,
810 xfs_ioend_zone);
0829c360
CH
811 if (!xfs_ioend_pool)
812 goto out_free_ioend_zone;
1da177e4 813 return 0;
0829c360 814
0829c360
CH
815 out_free_ioend_zone:
816 kmem_zone_destroy(xfs_ioend_zone);
817 out_destroy_vnode_zone:
818 kmem_zone_destroy(xfs_vnode_zone);
819 out:
820 return -ENOMEM;
1da177e4
LT
821}
822
823STATIC void
8758280f 824xfs_destroy_zones(void)
1da177e4 825{
0829c360
CH
826 mempool_destroy(xfs_ioend_pool);
827 kmem_zone_destroy(xfs_vnode_zone);
828 kmem_zone_destroy(xfs_ioend_zone);
1da177e4
LT
829}
830
831/*
832 * Attempt to flush the inode, this will actually fail
833 * if the inode is pinned, but we dirty the inode again
834 * at the point when it is unpinned after a log write,
8758280f 835 * since this is when the inode itself becomes flushable.
1da177e4
LT
836 */
837STATIC int
a50cd269 838xfs_fs_write_inode(
1da177e4
LT
839 struct inode *inode,
840 int sync)
841{
1da177e4
LT
842 int error = 0, flags = FLUSH_INODE;
843
cf441eeb 844 xfs_itrace_entry(XFS_I(inode));
739bfb2a
CH
845 if (sync) {
846 filemap_fdatawait(inode->i_mapping);
847 flags |= FLUSH_SYNC;
1da177e4 848 }
739bfb2a 849 error = xfs_inode_flush(XFS_I(inode), flags);
e893bffd
LM
850 /*
851 * if we failed to write out the inode then mark
852 * it dirty again so we'll try again later.
853 */
854 if (error)
855 mark_inode_dirty_sync(inode);
739bfb2a 856
1da177e4
LT
857 return -error;
858}
859
860STATIC void
a50cd269 861xfs_fs_clear_inode(
1da177e4
LT
862 struct inode *inode)
863{
1543d79c 864 xfs_inode_t *ip = XFS_I(inode);
56d433e4 865
02ba71de 866 /*
1543d79c 867 * ip can be null when xfs_iget_core calls xfs_idestroy if we
02ba71de
CH
868 * find an inode with di_mode == 0 but without IGET_CREATE set.
869 */
1543d79c 870 if (ip) {
cf441eeb 871 xfs_itrace_entry(ip);
1543d79c
CH
872 XFS_STATS_INC(vn_rele);
873 XFS_STATS_INC(vn_remove);
874 XFS_STATS_INC(vn_reclaim);
875 XFS_STATS_DEC(vn_active);
876
877 xfs_inactive(ip);
878 xfs_iflags_clear(ip, XFS_IMODIFIED);
879 if (xfs_reclaim(ip))
880 panic("%s: cannot reclaim 0x%p\n", __FUNCTION__, inode);
b3aea4ed 881 }
56d433e4 882
739bfb2a 883 ASSERT(XFS_I(inode) == NULL);
56d433e4 884}
1da177e4
LT
885
886/*
887 * Enqueue a work item to be picked up by the vfs xfssyncd thread.
888 * Doing this has two advantages:
889 * - It saves on stack space, which is tight in certain situations
890 * - It can be used (with care) as a mechanism to avoid deadlocks.
891 * Flushing while allocating in a full filesystem requires both.
892 */
893STATIC void
894xfs_syncd_queue_work(
74394496 895 struct xfs_mount *mp,
1da177e4 896 void *data,
74394496 897 void (*syncer)(struct xfs_mount *, void *))
1da177e4 898{
b83bd138 899 struct bhv_vfs_sync_work *work;
1da177e4 900
b83bd138 901 work = kmem_alloc(sizeof(struct bhv_vfs_sync_work), KM_SLEEP);
1da177e4
LT
902 INIT_LIST_HEAD(&work->w_list);
903 work->w_syncer = syncer;
904 work->w_data = data;
74394496
CH
905 work->w_mount = mp;
906 spin_lock(&mp->m_sync_lock);
907 list_add_tail(&work->w_list, &mp->m_sync_list);
908 spin_unlock(&mp->m_sync_lock);
909 wake_up_process(mp->m_sync_task);
1da177e4
LT
910}
911
912/*
913 * Flush delayed allocate data, attempting to free up reserved space
914 * from existing allocations. At this point a new allocation attempt
915 * has failed with ENOSPC and we are in the process of scratching our
916 * heads, looking about for more room...
917 */
918STATIC void
919xfs_flush_inode_work(
74394496
CH
920 struct xfs_mount *mp,
921 void *arg)
1da177e4 922{
74394496
CH
923 struct inode *inode = arg;
924 filemap_flush(inode->i_mapping);
925 iput(inode);
1da177e4
LT
926}
927
928void
929xfs_flush_inode(
930 xfs_inode_t *ip)
931{
74394496 932 struct inode *inode = ip->i_vnode;
1da177e4
LT
933
934 igrab(inode);
74394496 935 xfs_syncd_queue_work(ip->i_mount, inode, xfs_flush_inode_work);
041e0e3b 936 delay(msecs_to_jiffies(500));
1da177e4
LT
937}
938
939/*
940 * This is the "bigger hammer" version of xfs_flush_inode_work...
941 * (IOW, "If at first you don't succeed, use a Bigger Hammer").
942 */
943STATIC void
944xfs_flush_device_work(
74394496
CH
945 struct xfs_mount *mp,
946 void *arg)
1da177e4 947{
74394496 948 struct inode *inode = arg;
b267ce99 949 sync_blockdev(mp->m_super->s_bdev);
74394496 950 iput(inode);
1da177e4
LT
951}
952
953void
954xfs_flush_device(
955 xfs_inode_t *ip)
956{
ec86dc02 957 struct inode *inode = vn_to_inode(XFS_ITOV(ip));
1da177e4
LT
958
959 igrab(inode);
74394496 960 xfs_syncd_queue_work(ip->i_mount, inode, xfs_flush_device_work);
041e0e3b 961 delay(msecs_to_jiffies(500));
1da177e4
LT
962 xfs_log_force(ip->i_mount, (xfs_lsn_t)0, XFS_LOG_FORCE|XFS_LOG_SYNC);
963}
964
1da177e4 965STATIC void
74394496
CH
966xfs_sync_worker(
967 struct xfs_mount *mp,
1da177e4
LT
968 void *unused)
969{
970 int error;
971
74394496
CH
972 if (!(mp->m_flags & XFS_MOUNT_RDONLY))
973 error = xfs_sync(mp, SYNC_FSDATA | SYNC_BDFLUSH | SYNC_ATTR |
974 SYNC_REFCACHE | SYNC_SUPER);
975 mp->m_sync_seq++;
976 wake_up(&mp->m_wait_single_sync_task);
1da177e4
LT
977}
978
979STATIC int
980xfssyncd(
981 void *arg)
982{
74394496 983 struct xfs_mount *mp = arg;
1da177e4 984 long timeleft;
b83bd138 985 bhv_vfs_sync_work_t *work, *n;
4df08c52 986 LIST_HEAD (tmp);
1da177e4 987
83144186 988 set_freezable();
041e0e3b 989 timeleft = xfs_syncd_centisecs * msecs_to_jiffies(10);
1da177e4 990 for (;;) {
041e0e3b 991 timeleft = schedule_timeout_interruptible(timeleft);
1da177e4 992 /* swsusp */
3e1d1d28 993 try_to_freeze();
74394496 994 if (kthread_should_stop() && list_empty(&mp->m_sync_list))
1da177e4
LT
995 break;
996
74394496 997 spin_lock(&mp->m_sync_lock);
1da177e4
LT
998 /*
999 * We can get woken by laptop mode, to do a sync -
1000 * that's the (only!) case where the list would be
1001 * empty with time remaining.
1002 */
74394496 1003 if (!timeleft || list_empty(&mp->m_sync_list)) {
1da177e4 1004 if (!timeleft)
041e0e3b
NA
1005 timeleft = xfs_syncd_centisecs *
1006 msecs_to_jiffies(10);
74394496
CH
1007 INIT_LIST_HEAD(&mp->m_sync_work.w_list);
1008 list_add_tail(&mp->m_sync_work.w_list,
1009 &mp->m_sync_list);
1da177e4 1010 }
74394496 1011 list_for_each_entry_safe(work, n, &mp->m_sync_list, w_list)
1da177e4 1012 list_move(&work->w_list, &tmp);
74394496 1013 spin_unlock(&mp->m_sync_lock);
1da177e4
LT
1014
1015 list_for_each_entry_safe(work, n, &tmp, w_list) {
74394496 1016 (*work->w_syncer)(mp, work->w_data);
1da177e4 1017 list_del(&work->w_list);
74394496 1018 if (work == &mp->m_sync_work)
1da177e4 1019 continue;
b83bd138 1020 kmem_free(work, sizeof(struct bhv_vfs_sync_work));
1da177e4
LT
1021 }
1022 }
1023
1da177e4
LT
1024 return 0;
1025}
1026
1da177e4 1027STATIC void
a50cd269 1028xfs_fs_put_super(
1da177e4
LT
1029 struct super_block *sb)
1030{
745f6919 1031 struct xfs_mount *mp = XFS_M(sb);
1da177e4
LT
1032 int error;
1033
74394496
CH
1034 kthread_stop(mp->m_sync_task);
1035
745f6919
CH
1036 xfs_sync(mp, SYNC_ATTR | SYNC_DELWRI);
1037 error = xfs_unmount(mp, 0, NULL);
b267ce99 1038 if (error)
b83bd138 1039 printk("XFS: unmount got error=%d\n", error);
1da177e4
LT
1040}
1041
1042STATIC void
a50cd269 1043xfs_fs_write_super(
1da177e4
LT
1044 struct super_block *sb)
1045{
b83bd138 1046 if (!(sb->s_flags & MS_RDONLY))
745f6919 1047 xfs_sync(XFS_M(sb), SYNC_FSDATA);
1da177e4
LT
1048 sb->s_dirt = 0;
1049}
1050
1051STATIC int
a50cd269 1052xfs_fs_sync_super(
1da177e4
LT
1053 struct super_block *sb,
1054 int wait)
1055{
745f6919 1056 struct xfs_mount *mp = XFS_M(sb);
b83bd138
NS
1057 int error;
1058 int flags;
1da177e4 1059
e893bffd
LM
1060 /*
1061 * Treat a sync operation like a freeze. This is to work
1062 * around a race in sync_inodes() which works in two phases
1063 * - an asynchronous flush, which can write out an inode
1064 * without waiting for file size updates to complete, and a
1065 * synchronous flush, which wont do anything because the
1066 * async flush removed the inode's dirty flag. Also
1067 * sync_inodes() will not see any files that just have
1068 * outstanding transactions to be flushed because we don't
1069 * dirty the Linux inode until after the transaction I/O
1070 * completes.
1071 */
1072 if (wait || unlikely(sb->s_frozen == SB_FREEZE_WRITE)) {
2823945f
DC
1073 /*
1074 * First stage of freeze - no more writers will make progress
1075 * now we are here, so we flush delwri and delalloc buffers
1076 * here, then wait for all I/O to complete. Data is frozen at
1077 * that point. Metadata is not frozen, transactions can still
1078 * occur here so don't bother flushing the buftarg (i.e
1079 * SYNC_QUIESCE) because it'll just get dirty again.
1080 */
516b2e7c 1081 flags = SYNC_DATA_QUIESCE;
2823945f 1082 } else
e893bffd 1083 flags = SYNC_FSDATA;
1da177e4 1084
745f6919 1085 error = xfs_sync(mp, flags);
1da177e4
LT
1086 sb->s_dirt = 0;
1087
1088 if (unlikely(laptop_mode)) {
74394496 1089 int prev_sync_seq = mp->m_sync_seq;
1da177e4
LT
1090
1091 /*
1092 * The disk must be active because we're syncing.
1093 * We schedule xfssyncd now (now that the disk is
1094 * active) instead of later (when it might not be).
1095 */
74394496 1096 wake_up_process(mp->m_sync_task);
1da177e4
LT
1097 /*
1098 * We have to wait for the sync iteration to complete.
1099 * If we don't, the disk activity caused by the sync
1100 * will come after the sync is completed, and that
1101 * triggers another sync from laptop mode.
1102 */
74394496
CH
1103 wait_event(mp->m_wait_single_sync_task,
1104 mp->m_sync_seq != prev_sync_seq);
1da177e4
LT
1105 }
1106
1107 return -error;
1108}
1109
1110STATIC int
a50cd269 1111xfs_fs_statfs(
726c3342 1112 struct dentry *dentry,
1da177e4
LT
1113 struct kstatfs *statp)
1114{
4ca488eb
CH
1115 struct xfs_mount *mp = XFS_M(dentry->d_sb);
1116 xfs_sb_t *sbp = &mp->m_sb;
1117 __uint64_t fakeinos, id;
1118 xfs_extlen_t lsize;
1119
1120 statp->f_type = XFS_SB_MAGIC;
1121 statp->f_namelen = MAXNAMELEN - 1;
1122
1123 id = huge_encode_dev(mp->m_ddev_targp->bt_dev);
1124 statp->f_fsid.val[0] = (u32)id;
1125 statp->f_fsid.val[1] = (u32)(id >> 32);
1126
1127 xfs_icsb_sync_counters_flags(mp, XFS_ICSB_LAZY_COUNT);
1128
1129 spin_lock(&mp->m_sb_lock);
1130 statp->f_bsize = sbp->sb_blocksize;
1131 lsize = sbp->sb_logstart ? sbp->sb_logblocks : 0;
1132 statp->f_blocks = sbp->sb_dblocks - lsize;
1133 statp->f_bfree = statp->f_bavail =
1134 sbp->sb_fdblocks - XFS_ALLOC_SET_ASIDE(mp);
1135 fakeinos = statp->f_bfree << sbp->sb_inopblog;
1136#if XFS_BIG_INUMS
1137 fakeinos += mp->m_inoadd;
1138#endif
1139 statp->f_files =
1140 MIN(sbp->sb_icount + fakeinos, (__uint64_t)XFS_MAXINUMBER);
1141 if (mp->m_maxicount)
1142#if XFS_BIG_INUMS
1143 if (!mp->m_inoadd)
1144#endif
1145 statp->f_files = min_t(typeof(statp->f_files),
1146 statp->f_files,
1147 mp->m_maxicount);
1148 statp->f_ffree = statp->f_files - (sbp->sb_icount - sbp->sb_ifree);
1149 spin_unlock(&mp->m_sb_lock);
1150
1151 XFS_QM_DQSTATVFS(XFS_I(dentry->d_inode), statp);
1152 return 0;
1da177e4
LT
1153}
1154
1155STATIC int
a50cd269 1156xfs_fs_remount(
1da177e4
LT
1157 struct super_block *sb,
1158 int *flags,
1159 char *options)
1160{
745f6919 1161 struct xfs_mount *mp = XFS_M(sb);
764d1f89 1162 struct xfs_mount_args *args = xfs_args_allocate(sb, 0);
1da177e4
LT
1163 int error;
1164
745f6919 1165 error = xfs_parseargs(mp, options, args, 1);
1da177e4 1166 if (!error)
745f6919 1167 error = xfs_mntupdate(mp, flags, args);
1da177e4
LT
1168 kmem_free(args, sizeof(*args));
1169 return -error;
1170}
1171
9909c4aa
CH
1172/*
1173 * Second stage of a freeze. The data is already frozen so we only
1174 * need to take care of themetadata. Once that's done write a dummy
1175 * record to dirty the log in case of a crash while frozen.
1176 */
1da177e4 1177STATIC void
a50cd269 1178xfs_fs_lockfs(
1da177e4
LT
1179 struct super_block *sb)
1180{
9909c4aa
CH
1181 struct xfs_mount *mp = XFS_M(sb);
1182
1183 xfs_attr_quiesce(mp);
1184 xfs_fs_log_dummy(mp);
1da177e4
LT
1185}
1186
1187STATIC int
a50cd269 1188xfs_fs_show_options(
1da177e4
LT
1189 struct seq_file *m,
1190 struct vfsmount *mnt)
1191{
745f6919 1192 return -xfs_showargs(XFS_M(mnt->mnt_sb), m);
1da177e4
LT
1193}
1194
ee34807a 1195STATIC int
a50cd269 1196xfs_fs_quotasync(
ee34807a
NS
1197 struct super_block *sb,
1198 int type)
1199{
b09cc771 1200 return -XFS_QM_QUOTACTL(XFS_M(sb), Q_XQUOTASYNC, 0, NULL);
ee34807a
NS
1201}
1202
1da177e4 1203STATIC int
a50cd269 1204xfs_fs_getxstate(
1da177e4
LT
1205 struct super_block *sb,
1206 struct fs_quota_stat *fqs)
1207{
b09cc771 1208 return -XFS_QM_QUOTACTL(XFS_M(sb), Q_XGETQSTAT, 0, (caddr_t)fqs);
1da177e4
LT
1209}
1210
1211STATIC int
a50cd269 1212xfs_fs_setxstate(
1da177e4
LT
1213 struct super_block *sb,
1214 unsigned int flags,
1215 int op)
1216{
b09cc771 1217 return -XFS_QM_QUOTACTL(XFS_M(sb), op, 0, (caddr_t)&flags);
1da177e4
LT
1218}
1219
1220STATIC int
a50cd269 1221xfs_fs_getxquota(
1da177e4
LT
1222 struct super_block *sb,
1223 int type,
1224 qid_t id,
1225 struct fs_disk_quota *fdq)
1226{
b09cc771 1227 return -XFS_QM_QUOTACTL(XFS_M(sb),
b83bd138
NS
1228 (type == USRQUOTA) ? Q_XGETQUOTA :
1229 ((type == GRPQUOTA) ? Q_XGETGQUOTA :
1230 Q_XGETPQUOTA), id, (caddr_t)fdq);
1da177e4
LT
1231}
1232
1233STATIC int
a50cd269 1234xfs_fs_setxquota(
1da177e4
LT
1235 struct super_block *sb,
1236 int type,
1237 qid_t id,
1238 struct fs_disk_quota *fdq)
1239{
b09cc771 1240 return -XFS_QM_QUOTACTL(XFS_M(sb),
b83bd138
NS
1241 (type == USRQUOTA) ? Q_XSETQLIM :
1242 ((type == GRPQUOTA) ? Q_XSETGQLIM :
1243 Q_XSETPQLIM), id, (caddr_t)fdq);
1da177e4
LT
1244}
1245
1246STATIC int
a50cd269 1247xfs_fs_fill_super(
1da177e4
LT
1248 struct super_block *sb,
1249 void *data,
1250 int silent)
1251{
0a74cd19 1252 struct inode *rootvp;
745f6919 1253 struct xfs_mount *mp = NULL;
764d1f89 1254 struct xfs_mount_args *args = xfs_args_allocate(sb, silent);
b83bd138 1255 int error;
1da177e4 1256
745f6919 1257 mp = xfs_mount_init();
1da177e4 1258
74394496
CH
1259 INIT_LIST_HEAD(&mp->m_sync_list);
1260 spin_lock_init(&mp->m_sync_lock);
1261 init_waitqueue_head(&mp->m_wait_single_sync_task);
1262
b267ce99
CH
1263 mp->m_super = sb;
1264 sb->s_fs_info = mp;
1da177e4 1265
bd186aa9
CH
1266 if (sb->s_flags & MS_RDONLY)
1267 mp->m_flags |= XFS_MOUNT_RDONLY;
1268
745f6919
CH
1269 error = xfs_parseargs(mp, (char *)data, args, 0);
1270 if (error)
1da177e4 1271 goto fail_vfsop;
1da177e4
LT
1272
1273 sb_min_blocksize(sb, BBSIZE);
a50cd269 1274 sb->s_export_op = &xfs_export_operations;
a50cd269
NS
1275 sb->s_qcop = &xfs_quotactl_operations;
1276 sb->s_op = &xfs_super_operations;
1da177e4 1277
745f6919
CH
1278 error = xfs_mount(mp, args, NULL);
1279 if (error)
1da177e4 1280 goto fail_vfsop;
1da177e4 1281
1da177e4 1282 sb->s_dirt = 1;
4ca488eb
CH
1283 sb->s_magic = XFS_SB_MAGIC;
1284 sb->s_blocksize = mp->m_sb.sb_blocksize;
1285 sb->s_blocksize_bits = ffs(sb->s_blocksize) - 1;
1da177e4
LT
1286 sb->s_maxbytes = xfs_max_file_offset(sb->s_blocksize_bits);
1287 sb->s_time_gran = 1;
1288 set_posix_acl_flag(sb);
1289
745f6919 1290 error = xfs_root(mp, &rootvp);
1da177e4
LT
1291 if (error)
1292 goto fail_unmount;
1293
ec86dc02 1294 sb->s_root = d_alloc_root(vn_to_inode(rootvp));
1da177e4
LT
1295 if (!sb->s_root) {
1296 error = ENOMEM;
1297 goto fail_vnrele;
1298 }
1299 if (is_bad_inode(sb->s_root->d_inode)) {
1300 error = EINVAL;
1301 goto fail_vnrele;
1302 }
74394496
CH
1303
1304 mp->m_sync_work.w_syncer = xfs_sync_worker;
1305 mp->m_sync_work.w_mount = mp;
1306 mp->m_sync_task = kthread_run(xfssyncd, mp, "xfssyncd");
1307 if (IS_ERR(mp->m_sync_task)) {
1308 error = -PTR_ERR(mp->m_sync_task);
1da177e4 1309 goto fail_vnrele;
74394496
CH
1310 }
1311
cf441eeb 1312 xfs_itrace_exit(XFS_I(sb->s_root->d_inode));
1da177e4
LT
1313
1314 kmem_free(args, sizeof(*args));
1315 return 0;
1316
1317fail_vnrele:
1318 if (sb->s_root) {
1319 dput(sb->s_root);
1320 sb->s_root = NULL;
1321 } else {
1322 VN_RELE(rootvp);
1323 }
1324
1325fail_unmount:
745f6919 1326 xfs_unmount(mp, 0, NULL);
1da177e4
LT
1327
1328fail_vfsop:
1da177e4
LT
1329 kmem_free(args, sizeof(*args));
1330 return -error;
1331}
1332
454e2398 1333STATIC int
a50cd269 1334xfs_fs_get_sb(
1da177e4
LT
1335 struct file_system_type *fs_type,
1336 int flags,
1337 const char *dev_name,
454e2398
DH
1338 void *data,
1339 struct vfsmount *mnt)
1da177e4 1340{
454e2398
DH
1341 return get_sb_bdev(fs_type, flags, dev_name, data, xfs_fs_fill_super,
1342 mnt);
a50cd269
NS
1343}
1344
7989cb8e 1345static struct super_operations xfs_super_operations = {
a50cd269
NS
1346 .alloc_inode = xfs_fs_alloc_inode,
1347 .destroy_inode = xfs_fs_destroy_inode,
1348 .write_inode = xfs_fs_write_inode,
1349 .clear_inode = xfs_fs_clear_inode,
1350 .put_super = xfs_fs_put_super,
1351 .write_super = xfs_fs_write_super,
1352 .sync_fs = xfs_fs_sync_super,
1353 .write_super_lockfs = xfs_fs_lockfs,
1354 .statfs = xfs_fs_statfs,
1355 .remount_fs = xfs_fs_remount,
1356 .show_options = xfs_fs_show_options,
1da177e4
LT
1357};
1358
7989cb8e 1359static struct quotactl_ops xfs_quotactl_operations = {
a50cd269
NS
1360 .quota_sync = xfs_fs_quotasync,
1361 .get_xstate = xfs_fs_getxstate,
1362 .set_xstate = xfs_fs_setxstate,
1363 .get_xquota = xfs_fs_getxquota,
1364 .set_xquota = xfs_fs_setxquota,
1da177e4
LT
1365};
1366
5085b607 1367static struct file_system_type xfs_fs_type = {
1da177e4
LT
1368 .owner = THIS_MODULE,
1369 .name = "xfs",
a50cd269 1370 .get_sb = xfs_fs_get_sb,
1da177e4
LT
1371 .kill_sb = kill_block_super,
1372 .fs_flags = FS_REQUIRES_DEV,
1373};
1374
1375
1376STATIC int __init
1377init_xfs_fs( void )
1378{
1379 int error;
1da177e4
LT
1380 static char message[] __initdata = KERN_INFO \
1381 XFS_VERSION_STRING " with " XFS_BUILD_OPTIONS " enabled\n";
1382
1383 printk(message);
1384
1da177e4
LT
1385 ktrace_init(64);
1386
8758280f 1387 error = xfs_init_zones();
1da177e4 1388 if (error < 0)
0829c360 1389 goto undo_zones;
1da177e4 1390
ce8e922c 1391 error = xfs_buf_init();
1da177e4 1392 if (error < 0)
ce8e922c 1393 goto undo_buffers;
1da177e4
LT
1394
1395 vn_init();
1396 xfs_init();
1397 uuid_init();
1398 vfs_initquota();
1399
1400 error = register_filesystem(&xfs_fs_type);
1401 if (error)
1402 goto undo_register;
1da177e4
LT
1403 return 0;
1404
1405undo_register:
ce8e922c 1406 xfs_buf_terminate();
1da177e4 1407
ce8e922c 1408undo_buffers:
8758280f 1409 xfs_destroy_zones();
1da177e4 1410
0829c360 1411undo_zones:
1da177e4
LT
1412 return error;
1413}
1414
1415STATIC void __exit
1416exit_xfs_fs( void )
1417{
1418 vfs_exitquota();
1da177e4
LT
1419 unregister_filesystem(&xfs_fs_type);
1420 xfs_cleanup();
ce8e922c 1421 xfs_buf_terminate();
8758280f 1422 xfs_destroy_zones();
1da177e4
LT
1423 ktrace_uninit();
1424}
1425
1426module_init(init_xfs_fs);
1427module_exit(exit_xfs_fs);
1428
1429MODULE_AUTHOR("Silicon Graphics, Inc.");
1430MODULE_DESCRIPTION(XFS_VERSION_STRING " with " XFS_BUILD_OPTIONS " enabled");
1431MODULE_LICENSE("GPL");