2007-04-26 16:49:28 -06:00
|
|
|
/* AFS superblock handling
|
|
|
|
*
|
2007-04-26 16:55:03 -06:00
|
|
|
* Copyright (c) 2002, 2007 Red Hat, Inc. All rights reserved.
|
2005-04-16 16:20:36 -06:00
|
|
|
*
|
|
|
|
* This software may be freely redistributed under the terms of the
|
|
|
|
* GNU General Public License.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU General Public License
|
|
|
|
* along with this program; if not, write to the Free Software
|
|
|
|
* Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
|
|
|
|
*
|
|
|
|
* Authors: David Howells <dhowells@redhat.com>
|
2008-06-05 23:46:18 -06:00
|
|
|
* David Woodhouse <dwmw2@infradead.org>
|
2005-04-16 16:20:36 -06:00
|
|
|
*
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include <linux/kernel.h>
|
|
|
|
#include <linux/module.h>
|
|
|
|
#include <linux/init.h>
|
|
|
|
#include <linux/slab.h>
|
|
|
|
#include <linux/fs.h>
|
|
|
|
#include <linux/pagemap.h>
|
2007-05-03 04:11:29 -06:00
|
|
|
#include <linux/parser.h>
|
2007-05-10 23:22:20 -06:00
|
|
|
#include <linux/statfs.h>
|
Detach sched.h from mm.h
First thing mm.h does is including sched.h solely for can_do_mlock() inline
function which has "current" dereference inside. By dealing with can_do_mlock()
mm.h can be detached from sched.h which is good. See below, why.
This patch
a) removes unconditional inclusion of sched.h from mm.h
b) makes can_do_mlock() normal function in mm/mlock.c
c) exports can_do_mlock() to not break compilation
d) adds sched.h inclusions back to files that were getting it indirectly.
e) adds less bloated headers to some files (asm/signal.h, jiffies.h) that were
getting them indirectly
Net result is:
a) mm.h users would get less code to open, read, preprocess, parse, ... if
they don't need sched.h
b) sched.h stops being dependency for significant number of files:
on x86_64 allmodconfig touching sched.h results in recompile of 4083 files,
after patch it's only 3744 (-8.3%).
Cross-compile tested on
all arm defconfigs, all mips defconfigs, all powerpc defconfigs,
alpha alpha-up
arm
i386 i386-up i386-defconfig i386-allnoconfig
ia64 ia64-up
m68k
mips
parisc parisc-up
powerpc powerpc-up
s390 s390-up
sparc sparc-up
sparc64 sparc64-up
um-x86_64
x86_64 x86_64-up x86_64-defconfig x86_64-allnoconfig
as well as my two usual configs.
Signed-off-by: Alexey Dobriyan <adobriyan@gmail.com>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2007-05-20 15:22:52 -06:00
|
|
|
#include <linux/sched.h>
|
2005-04-16 16:20:36 -06:00
|
|
|
#include "internal.h"
|
|
|
|
|
|
|
|
#define AFS_FS_MAGIC 0x6B414653 /* 'kAFS' */
|
|
|
|
|
2007-10-17 00:25:51 -06:00
|
|
|
static void afs_i_init_once(struct kmem_cache *cachep, void *foo);
|
[PATCH] VFS: Permit filesystem to override root dentry on mount
Extend the get_sb() filesystem operation to take an extra argument that
permits the VFS to pass in the target vfsmount that defines the mountpoint.
The filesystem is then required to manually set the superblock and root dentry
pointers. For most filesystems, this should be done with simple_set_mnt()
which will set the superblock pointer and then set the root dentry to the
superblock's s_root (as per the old default behaviour).
The get_sb() op now returns an integer as there's now no need to return the
superblock pointer.
This patch permits a superblock to be implicitly shared amongst several mount
points, such as can be done with NFS to avoid potential inode aliasing. In
such a case, simple_set_mnt() would not be called, and instead the mnt_root
and mnt_sb would be set directly.
The patch also makes the following changes:
(*) the get_sb_*() convenience functions in the core kernel now take a vfsmount
pointer argument and return an integer, so most filesystems have to change
very little.
(*) If one of the convenience function is not used, then get_sb() should
normally call simple_set_mnt() to instantiate the vfsmount. This will
always return 0, and so can be tail-called from get_sb().
(*) generic_shutdown_super() now calls shrink_dcache_sb() to clean up the
dcache upon superblock destruction rather than shrink_dcache_anon().
This is required because the superblock may now have multiple trees that
aren't actually bound to s_root, but that still need to be cleaned up. The
currently called functions assume that the whole tree is rooted at s_root,
and that anonymous dentries are not the roots of trees which results in
dentries being left unculled.
However, with the way NFS superblock sharing are currently set to be
implemented, these assumptions are violated: the root of the filesystem is
simply a dummy dentry and inode (the real inode for '/' may well be
inaccessible), and all the vfsmounts are rooted on anonymous[*] dentries
with child trees.
[*] Anonymous until discovered from another tree.
(*) The documentation has been adjusted, including the additional bit of
changing ext2_* into foo_* in the documentation.
[akpm@osdl.org: convert ipath_fs, do other stuff]
Signed-off-by: David Howells <dhowells@redhat.com>
Acked-by: Al Viro <viro@zeniv.linux.org.uk>
Cc: Nathan Scott <nathans@sgi.com>
Cc: Roland Dreier <rolandd@cisco.com>
Signed-off-by: Andrew Morton <akpm@osdl.org>
Signed-off-by: Linus Torvalds <torvalds@osdl.org>
2006-06-23 03:02:57 -06:00
|
|
|
static int afs_get_sb(struct file_system_type *fs_type,
|
|
|
|
int flags, const char *dev_name,
|
|
|
|
void *data, struct vfsmount *mnt);
|
2005-04-16 16:20:36 -06:00
|
|
|
static struct inode *afs_alloc_inode(struct super_block *sb);
|
|
|
|
static void afs_put_super(struct super_block *sb);
|
|
|
|
static void afs_destroy_inode(struct inode *inode);
|
2007-05-10 23:22:20 -06:00
|
|
|
static int afs_statfs(struct dentry *dentry, struct kstatfs *buf);
|
2005-04-16 16:20:36 -06:00
|
|
|
|
2006-06-09 07:34:16 -06:00
|
|
|
struct file_system_type afs_fs_type = {
|
2005-04-16 16:20:36 -06:00
|
|
|
.owner = THIS_MODULE,
|
|
|
|
.name = "afs",
|
|
|
|
.get_sb = afs_get_sb,
|
|
|
|
.kill_sb = kill_anon_super,
|
2007-05-03 04:11:29 -06:00
|
|
|
.fs_flags = 0,
|
2005-04-16 16:20:36 -06:00
|
|
|
};
|
|
|
|
|
2007-02-12 01:55:41 -07:00
|
|
|
static const struct super_operations afs_super_ops = {
|
2007-05-10 23:22:20 -06:00
|
|
|
.statfs = afs_statfs,
|
2005-04-16 16:20:36 -06:00
|
|
|
.alloc_inode = afs_alloc_inode,
|
AFS: implement basic file write support
Implement support for writing to regular AFS files, including:
(1) write
(2) truncate
(3) fsync, fdatasync
(4) chmod, chown, chgrp, utime.
AFS writeback attempts to batch writes into as chunks as large as it can manage
up to the point that it writes back 65535 pages in one chunk or it meets a
locked page.
Furthermore, if a page has been written to using a particular key, then should
another write to that page use some other key, the first write will be flushed
before the second is allowed to take place. If the first write fails due to a
security error, then the page will be scrapped and reread before the second
write takes place.
If a page is dirty and the callback on it is broken by the server, then the
dirty data is not discarded (same behaviour as NFS).
Shared-writable mappings are not supported by this patch.
[akpm@linux-foundation.org: fix a bunch of warnings]
Signed-off-by: David Howells <dhowells@redhat.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2007-05-09 03:33:46 -06:00
|
|
|
.write_inode = afs_write_inode,
|
2005-04-16 16:20:36 -06:00
|
|
|
.destroy_inode = afs_destroy_inode,
|
|
|
|
.clear_inode = afs_clear_inode,
|
|
|
|
.put_super = afs_put_super,
|
2008-02-08 05:21:37 -07:00
|
|
|
.show_options = generic_show_options,
|
2005-04-16 16:20:36 -06:00
|
|
|
};
|
|
|
|
|
2006-12-06 21:33:20 -07:00
|
|
|
static struct kmem_cache *afs_inode_cachep;
|
2005-04-16 16:20:36 -06:00
|
|
|
static atomic_t afs_count_active_inodes;
|
|
|
|
|
2007-05-03 04:11:29 -06:00
|
|
|
enum {
|
|
|
|
afs_no_opt,
|
|
|
|
afs_opt_cell,
|
|
|
|
afs_opt_rwpath,
|
|
|
|
afs_opt_vol,
|
|
|
|
};
|
|
|
|
|
AFS: implement basic file write support
Implement support for writing to regular AFS files, including:
(1) write
(2) truncate
(3) fsync, fdatasync
(4) chmod, chown, chgrp, utime.
AFS writeback attempts to batch writes into as chunks as large as it can manage
up to the point that it writes back 65535 pages in one chunk or it meets a
locked page.
Furthermore, if a page has been written to using a particular key, then should
another write to that page use some other key, the first write will be flushed
before the second is allowed to take place. If the first write fails due to a
security error, then the page will be scrapped and reread before the second
write takes place.
If a page is dirty and the callback on it is broken by the server, then the
dirty data is not discarded (same behaviour as NFS).
Shared-writable mappings are not supported by this patch.
[akpm@linux-foundation.org: fix a bunch of warnings]
Signed-off-by: David Howells <dhowells@redhat.com>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
2007-05-09 03:33:46 -06:00
|
|
|
static match_table_t afs_options_list = {
|
2007-05-03 04:11:29 -06:00
|
|
|
{ afs_opt_cell, "cell=%s" },
|
|
|
|
{ afs_opt_rwpath, "rwpath" },
|
|
|
|
{ afs_opt_vol, "vol=%s" },
|
|
|
|
{ afs_no_opt, NULL },
|
|
|
|
};
|
|
|
|
|
2005-04-16 16:20:36 -06:00
|
|
|
/*
|
|
|
|
* initialise the filesystem
|
|
|
|
*/
|
|
|
|
int __init afs_fs_init(void)
|
|
|
|
{
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
_enter("");
|
|
|
|
|
|
|
|
/* create ourselves an inode cache */
|
|
|
|
atomic_set(&afs_count_active_inodes, 0);
|
|
|
|
|
|
|
|
ret = -ENOMEM;
|
|
|
|
afs_inode_cachep = kmem_cache_create("afs_inode_cache",
|
|
|
|
sizeof(struct afs_vnode),
|
|
|
|
0,
|
|
|
|
SLAB_HWCACHE_ALIGN,
|
2007-07-19 19:11:58 -06:00
|
|
|
afs_i_init_once);
|
2005-04-16 16:20:36 -06:00
|
|
|
if (!afs_inode_cachep) {
|
|
|
|
printk(KERN_NOTICE "kAFS: Failed to allocate inode cache\n");
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* now export our filesystem to lesser mortals */
|
|
|
|
ret = register_filesystem(&afs_fs_type);
|
|
|
|
if (ret < 0) {
|
|
|
|
kmem_cache_destroy(afs_inode_cachep);
|
2007-04-26 16:55:03 -06:00
|
|
|
_leave(" = %d", ret);
|
2005-04-16 16:20:36 -06:00
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2007-04-26 16:55:03 -06:00
|
|
|
_leave(" = 0");
|
2005-04-16 16:20:36 -06:00
|
|
|
return 0;
|
2007-04-26 16:49:28 -06:00
|
|
|
}
|
2005-04-16 16:20:36 -06:00
|
|
|
|
|
|
|
/*
|
|
|
|
* clean up the filesystem
|
|
|
|
*/
|
|
|
|
void __exit afs_fs_exit(void)
|
|
|
|
{
|
2007-04-26 16:55:03 -06:00
|
|
|
_enter("");
|
|
|
|
|
|
|
|
afs_mntpt_kill_timer();
|
2005-04-16 16:20:36 -06:00
|
|
|
unregister_filesystem(&afs_fs_type);
|
|
|
|
|
|
|
|
if (atomic_read(&afs_count_active_inodes) != 0) {
|
|
|
|
printk("kAFS: %d active inode objects still present\n",
|
|
|
|
atomic_read(&afs_count_active_inodes));
|
|
|
|
BUG();
|
|
|
|
}
|
|
|
|
|
|
|
|
kmem_cache_destroy(afs_inode_cachep);
|
2007-04-26 16:55:03 -06:00
|
|
|
_leave("");
|
2007-04-26 16:49:28 -06:00
|
|
|
}
|
2005-04-16 16:20:36 -06:00
|
|
|
|
|
|
|
/*
|
|
|
|
* parse the mount options
|
|
|
|
* - this function has been shamelessly adapted from the ext3 fs which
|
|
|
|
* shamelessly adapted it from the msdos fs
|
|
|
|
*/
|
2007-04-26 16:57:07 -06:00
|
|
|
static int afs_parse_options(struct afs_mount_params *params,
|
|
|
|
char *options, const char **devname)
|
2005-04-16 16:20:36 -06:00
|
|
|
{
|
2007-04-26 16:55:03 -06:00
|
|
|
struct afs_cell *cell;
|
2007-05-03 04:11:29 -06:00
|
|
|
substring_t args[MAX_OPT_ARGS];
|
|
|
|
char *p;
|
|
|
|
int token;
|
2005-04-16 16:20:36 -06:00
|
|
|
|
|
|
|
_enter("%s", options);
|
|
|
|
|
|
|
|
options[PAGE_SIZE - 1] = 0;
|
|
|
|
|
2007-05-03 04:11:29 -06:00
|
|
|
while ((p = strsep(&options, ","))) {
|
|
|
|
if (!*p)
|
|
|
|
continue;
|
2005-04-16 16:20:36 -06:00
|
|
|
|
2007-05-03 04:11:29 -06:00
|
|
|
token = match_token(p, afs_options_list, args);
|
|
|
|
switch (token) {
|
|
|
|
case afs_opt_cell:
|
|
|
|
cell = afs_cell_lookup(args[0].from,
|
|
|
|
args[0].to - args[0].from);
|
2007-04-26 16:55:03 -06:00
|
|
|
if (IS_ERR(cell))
|
|
|
|
return PTR_ERR(cell);
|
2007-04-26 16:57:07 -06:00
|
|
|
afs_put_cell(params->cell);
|
|
|
|
params->cell = cell;
|
2007-05-03 04:11:29 -06:00
|
|
|
break;
|
|
|
|
|
|
|
|
case afs_opt_rwpath:
|
|
|
|
params->rwpath = 1;
|
|
|
|
break;
|
|
|
|
|
|
|
|
case afs_opt_vol:
|
|
|
|
*devname = args[0].from;
|
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
|
|
|
printk(KERN_ERR "kAFS:"
|
|
|
|
" Unknown or invalid mount option: '%s'\n", p);
|
|
|
|
return -EINVAL;
|
2005-04-16 16:20:36 -06:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2007-05-03 04:11:29 -06:00
|
|
|
_leave(" = 0");
|
|
|
|
return 0;
|
2007-04-26 16:49:28 -06:00
|
|
|
}
|
2005-04-16 16:20:36 -06:00
|
|
|
|
2007-04-26 16:57:07 -06:00
|
|
|
/*
|
|
|
|
* parse a device name to get cell name, volume name, volume type and R/W
|
|
|
|
* selector
|
|
|
|
* - this can be one of the following:
|
|
|
|
* "%[cell:]volume[.]" R/W volume
|
|
|
|
* "#[cell:]volume[.]" R/O or R/W volume (rwpath=0),
|
|
|
|
* or R/W (rwpath=1) volume
|
|
|
|
* "%[cell:]volume.readonly" R/O volume
|
|
|
|
* "#[cell:]volume.readonly" R/O volume
|
|
|
|
* "%[cell:]volume.backup" Backup volume
|
|
|
|
* "#[cell:]volume.backup" Backup volume
|
|
|
|
*/
|
|
|
|
static int afs_parse_device_name(struct afs_mount_params *params,
|
|
|
|
const char *name)
|
|
|
|
{
|
|
|
|
struct afs_cell *cell;
|
|
|
|
const char *cellname, *suffix;
|
|
|
|
int cellnamesz;
|
|
|
|
|
|
|
|
_enter(",%s", name);
|
|
|
|
|
|
|
|
if (!name) {
|
|
|
|
printk(KERN_ERR "kAFS: no volume name specified\n");
|
|
|
|
return -EINVAL;
|
|
|
|
}
|
|
|
|
|
|
|
|
if ((name[0] != '%' && name[0] != '#') || !name[1]) {
|
|
|
|
printk(KERN_ERR "kAFS: unparsable volume name\n");
|
|
|
|
return -EINVAL;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* determine the type of volume we're looking for */
|
|
|
|
params->type = AFSVL_ROVOL;
|
|
|
|
params->force = false;
|
|
|
|
if (params->rwpath || name[0] == '%') {
|
|
|
|
params->type = AFSVL_RWVOL;
|
|
|
|
params->force = true;
|
|
|
|
}
|
|
|
|
name++;
|
|
|
|
|
|
|
|
/* split the cell name out if there is one */
|
|
|
|
params->volname = strchr(name, ':');
|
|
|
|
if (params->volname) {
|
|
|
|
cellname = name;
|
|
|
|
cellnamesz = params->volname - name;
|
|
|
|
params->volname++;
|
|
|
|
} else {
|
|
|
|
params->volname = name;
|
|
|
|
cellname = NULL;
|
|
|
|
cellnamesz = 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* the volume type is further affected by a possible suffix */
|
|
|
|
suffix = strrchr(params->volname, '.');
|
|
|
|
if (suffix) {
|
|
|
|
if (strcmp(suffix, ".readonly") == 0) {
|
|
|
|
params->type = AFSVL_ROVOL;
|
|
|
|
params->force = true;
|
|
|
|
} else if (strcmp(suffix, ".backup") == 0) {
|
|
|
|
params->type = AFSVL_BACKVOL;
|
|
|
|
params->force = true;
|
|
|
|
} else if (suffix[1] == 0) {
|
|
|
|
} else {
|
|
|
|
suffix = NULL;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
params->volnamesz = suffix ?
|
|
|
|
suffix - params->volname : strlen(params->volname);
|
|
|
|
|
|
|
|
_debug("cell %*.*s [%p]",
|
|
|
|
cellnamesz, cellnamesz, cellname ?: "", params->cell);
|
|
|
|
|
|
|
|
/* lookup the cell record */
|
|
|
|
if (cellname || !params->cell) {
|
|
|
|
cell = afs_cell_lookup(cellname, cellnamesz);
|
|
|
|
if (IS_ERR(cell)) {
|
|
|
|
printk(KERN_ERR "kAFS: unable to lookup cell '%s'\n",
|
|
|
|
cellname ?: "");
|
|
|
|
return PTR_ERR(cell);
|
|
|
|
}
|
|
|
|
afs_put_cell(params->cell);
|
|
|
|
params->cell = cell;
|
|
|
|
}
|
|
|
|
|
|
|
|
_debug("CELL:%s [%p] VOLUME:%*.*s SUFFIX:%s TYPE:%d%s",
|
|
|
|
params->cell->name, params->cell,
|
|
|
|
params->volnamesz, params->volnamesz, params->volname,
|
|
|
|
suffix ?: "-", params->type, params->force ? " FORCE" : "");
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2005-04-16 16:20:36 -06:00
|
|
|
/*
|
|
|
|
* check a superblock to see if it's the one we're looking for
|
|
|
|
*/
|
|
|
|
static int afs_test_super(struct super_block *sb, void *data)
|
|
|
|
{
|
|
|
|
struct afs_mount_params *params = data;
|
|
|
|
struct afs_super_info *as = sb->s_fs_info;
|
|
|
|
|
|
|
|
return as->volume == params->volume;
|
2007-04-26 16:49:28 -06:00
|
|
|
}
|
2005-04-16 16:20:36 -06:00
|
|
|
|
|
|
|
/*
|
|
|
|
* fill in the superblock
|
|
|
|
*/
|
2007-04-26 16:56:24 -06:00
|
|
|
static int afs_fill_super(struct super_block *sb, void *data)
|
2005-04-16 16:20:36 -06:00
|
|
|
{
|
|
|
|
struct afs_mount_params *params = data;
|
|
|
|
struct afs_super_info *as = NULL;
|
|
|
|
struct afs_fid fid;
|
|
|
|
struct dentry *root = NULL;
|
|
|
|
struct inode *inode = NULL;
|
|
|
|
int ret;
|
|
|
|
|
2007-04-26 16:55:03 -06:00
|
|
|
_enter("");
|
2005-04-16 16:20:36 -06:00
|
|
|
|
|
|
|
/* allocate a superblock info record */
|
2006-12-06 21:40:32 -07:00
|
|
|
as = kzalloc(sizeof(struct afs_super_info), GFP_KERNEL);
|
2005-04-16 16:20:36 -06:00
|
|
|
if (!as) {
|
|
|
|
_leave(" = -ENOMEM");
|
|
|
|
return -ENOMEM;
|
|
|
|
}
|
|
|
|
|
|
|
|
afs_get_volume(params->volume);
|
|
|
|
as->volume = params->volume;
|
|
|
|
|
|
|
|
/* fill in the superblock */
|
|
|
|
sb->s_blocksize = PAGE_CACHE_SIZE;
|
|
|
|
sb->s_blocksize_bits = PAGE_CACHE_SHIFT;
|
|
|
|
sb->s_magic = AFS_FS_MAGIC;
|
|
|
|
sb->s_op = &afs_super_ops;
|
|
|
|
sb->s_fs_info = as;
|
|
|
|
|
|
|
|
/* allocate the root inode and dentry */
|
|
|
|
fid.vid = as->volume->vid;
|
|
|
|
fid.vnode = 1;
|
|
|
|
fid.unique = 1;
|
2007-04-26 16:59:35 -06:00
|
|
|
inode = afs_iget(sb, params->key, &fid, NULL, NULL);
|
2007-04-26 16:55:03 -06:00
|
|
|
if (IS_ERR(inode))
|
|
|
|
goto error_inode;
|
2005-04-16 16:20:36 -06:00
|
|
|
|
|
|
|
ret = -ENOMEM;
|
|
|
|
root = d_alloc_root(inode);
|
|
|
|
if (!root)
|
|
|
|
goto error;
|
|
|
|
|
|
|
|
sb->s_root = root;
|
|
|
|
|
2007-04-26 16:55:03 -06:00
|
|
|
_leave(" = 0");
|
2005-04-16 16:20:36 -06:00
|
|
|
return 0;
|
|
|
|
|
2007-04-26 16:55:03 -06:00
|
|
|
error_inode:
|
|
|
|
ret = PTR_ERR(inode);
|
|
|
|
inode = NULL;
|
2007-04-26 16:49:28 -06:00
|
|
|
error:
|
2005-04-16 16:20:36 -06:00
|
|
|
iput(inode);
|
|
|
|
afs_put_volume(as->volume);
|
|
|
|
kfree(as);
|
|
|
|
|
|
|
|
sb->s_fs_info = NULL;
|
|
|
|
|
2007-04-26 16:55:03 -06:00
|
|
|
_leave(" = %d", ret);
|
2005-04-16 16:20:36 -06:00
|
|
|
return ret;
|
2007-04-26 16:49:28 -06:00
|
|
|
}
|
2005-04-16 16:20:36 -06:00
|
|
|
|
|
|
|
/*
|
|
|
|
* get an AFS superblock
|
|
|
|
*/
|
[PATCH] VFS: Permit filesystem to override root dentry on mount
Extend the get_sb() filesystem operation to take an extra argument that
permits the VFS to pass in the target vfsmount that defines the mountpoint.
The filesystem is then required to manually set the superblock and root dentry
pointers. For most filesystems, this should be done with simple_set_mnt()
which will set the superblock pointer and then set the root dentry to the
superblock's s_root (as per the old default behaviour).
The get_sb() op now returns an integer as there's now no need to return the
superblock pointer.
This patch permits a superblock to be implicitly shared amongst several mount
points, such as can be done with NFS to avoid potential inode aliasing. In
such a case, simple_set_mnt() would not be called, and instead the mnt_root
and mnt_sb would be set directly.
The patch also makes the following changes:
(*) the get_sb_*() convenience functions in the core kernel now take a vfsmount
pointer argument and return an integer, so most filesystems have to change
very little.
(*) If one of the convenience function is not used, then get_sb() should
normally call simple_set_mnt() to instantiate the vfsmount. This will
always return 0, and so can be tail-called from get_sb().
(*) generic_shutdown_super() now calls shrink_dcache_sb() to clean up the
dcache upon superblock destruction rather than shrink_dcache_anon().
This is required because the superblock may now have multiple trees that
aren't actually bound to s_root, but that still need to be cleaned up. The
currently called functions assume that the whole tree is rooted at s_root,
and that anonymous dentries are not the roots of trees which results in
dentries being left unculled.
However, with the way NFS superblock sharing are currently set to be
implemented, these assumptions are violated: the root of the filesystem is
simply a dummy dentry and inode (the real inode for '/' may well be
inaccessible), and all the vfsmounts are rooted on anonymous[*] dentries
with child trees.
[*] Anonymous until discovered from another tree.
(*) The documentation has been adjusted, including the additional bit of
changing ext2_* into foo_* in the documentation.
[akpm@osdl.org: convert ipath_fs, do other stuff]
Signed-off-by: David Howells <dhowells@redhat.com>
Acked-by: Al Viro <viro@zeniv.linux.org.uk>
Cc: Nathan Scott <nathans@sgi.com>
Cc: Roland Dreier <rolandd@cisco.com>
Signed-off-by: Andrew Morton <akpm@osdl.org>
Signed-off-by: Linus Torvalds <torvalds@osdl.org>
2006-06-23 03:02:57 -06:00
|
|
|
static int afs_get_sb(struct file_system_type *fs_type,
|
|
|
|
int flags,
|
|
|
|
const char *dev_name,
|
|
|
|
void *options,
|
|
|
|
struct vfsmount *mnt)
|
2005-04-16 16:20:36 -06:00
|
|
|
{
|
|
|
|
struct afs_mount_params params;
|
|
|
|
struct super_block *sb;
|
2007-04-26 16:55:03 -06:00
|
|
|
struct afs_volume *vol;
|
2007-04-26 16:57:07 -06:00
|
|
|
struct key *key;
|
2008-02-08 05:21:37 -07:00
|
|
|
char *new_opts = kstrdup(options, GFP_KERNEL);
|
2005-04-16 16:20:36 -06:00
|
|
|
int ret;
|
|
|
|
|
|
|
|
_enter(",,%s,%p", dev_name, options);
|
|
|
|
|
|
|
|
memset(¶ms, 0, sizeof(params));
|
|
|
|
|
2007-04-26 16:57:07 -06:00
|
|
|
/* parse the options and device name */
|
2005-04-16 16:20:36 -06:00
|
|
|
if (options) {
|
2007-04-26 16:57:07 -06:00
|
|
|
ret = afs_parse_options(¶ms, options, &dev_name);
|
2005-04-16 16:20:36 -06:00
|
|
|
if (ret < 0)
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
|
2007-04-26 16:57:07 -06:00
|
|
|
ret = afs_parse_device_name(¶ms, dev_name);
|
|
|
|
if (ret < 0)
|
|
|
|
goto error;
|
|
|
|
|
|
|
|
/* try and do the mount securely */
|
|
|
|
key = afs_request_key(params.cell);
|
|
|
|
if (IS_ERR(key)) {
|
|
|
|
_leave(" = %ld [key]", PTR_ERR(key));
|
|
|
|
ret = PTR_ERR(key);
|
|
|
|
goto error;
|
|
|
|
}
|
|
|
|
params.key = key;
|
|
|
|
|
2005-04-16 16:20:36 -06:00
|
|
|
/* parse the device name */
|
2007-04-26 16:57:07 -06:00
|
|
|
vol = afs_volume_lookup(¶ms);
|
2007-04-26 16:55:03 -06:00
|
|
|
if (IS_ERR(vol)) {
|
|
|
|
ret = PTR_ERR(vol);
|
2005-04-16 16:20:36 -06:00
|
|
|
goto error;
|
2007-04-26 16:55:03 -06:00
|
|
|
}
|
|
|
|
params.volume = vol;
|
2005-04-16 16:20:36 -06:00
|
|
|
|
|
|
|
/* allocate a deviceless superblock */
|
|
|
|
sb = sget(fs_type, afs_test_super, set_anon_super, ¶ms);
|
2007-04-26 16:55:03 -06:00
|
|
|
if (IS_ERR(sb)) {
|
|
|
|
ret = PTR_ERR(sb);
|
2005-04-16 16:20:36 -06:00
|
|
|
goto error;
|
2007-04-26 16:55:03 -06:00
|
|
|
}
|
2005-04-16 16:20:36 -06:00
|
|
|
|
2007-04-26 16:56:24 -06:00
|
|
|
if (!sb->s_root) {
|
|
|
|
/* initial superblock/root creation */
|
|
|
|
_debug("create");
|
|
|
|
sb->s_flags = flags;
|
|
|
|
ret = afs_fill_super(sb, ¶ms);
|
|
|
|
if (ret < 0) {
|
|
|
|
up_write(&sb->s_umount);
|
|
|
|
deactivate_super(sb);
|
|
|
|
goto error;
|
|
|
|
}
|
2008-02-08 05:21:37 -07:00
|
|
|
sb->s_options = new_opts;
|
2007-04-26 16:56:24 -06:00
|
|
|
sb->s_flags |= MS_ACTIVE;
|
|
|
|
} else {
|
|
|
|
_debug("reuse");
|
2008-02-08 05:21:37 -07:00
|
|
|
kfree(new_opts);
|
2007-04-26 16:56:24 -06:00
|
|
|
ASSERTCMP(sb->s_flags, &, MS_ACTIVE);
|
2005-04-16 16:20:36 -06:00
|
|
|
}
|
|
|
|
|
2007-04-26 16:56:24 -06:00
|
|
|
simple_set_mnt(mnt, sb);
|
2005-04-16 16:20:36 -06:00
|
|
|
afs_put_volume(params.volume);
|
2007-04-26 16:57:07 -06:00
|
|
|
afs_put_cell(params.cell);
|
2007-04-26 16:55:03 -06:00
|
|
|
_leave(" = 0 [%p]", sb);
|
[PATCH] VFS: Permit filesystem to override root dentry on mount
Extend the get_sb() filesystem operation to take an extra argument that
permits the VFS to pass in the target vfsmount that defines the mountpoint.
The filesystem is then required to manually set the superblock and root dentry
pointers. For most filesystems, this should be done with simple_set_mnt()
which will set the superblock pointer and then set the root dentry to the
superblock's s_root (as per the old default behaviour).
The get_sb() op now returns an integer as there's now no need to return the
superblock pointer.
This patch permits a superblock to be implicitly shared amongst several mount
points, such as can be done with NFS to avoid potential inode aliasing. In
such a case, simple_set_mnt() would not be called, and instead the mnt_root
and mnt_sb would be set directly.
The patch also makes the following changes:
(*) the get_sb_*() convenience functions in the core kernel now take a vfsmount
pointer argument and return an integer, so most filesystems have to change
very little.
(*) If one of the convenience function is not used, then get_sb() should
normally call simple_set_mnt() to instantiate the vfsmount. This will
always return 0, and so can be tail-called from get_sb().
(*) generic_shutdown_super() now calls shrink_dcache_sb() to clean up the
dcache upon superblock destruction rather than shrink_dcache_anon().
This is required because the superblock may now have multiple trees that
aren't actually bound to s_root, but that still need to be cleaned up. The
currently called functions assume that the whole tree is rooted at s_root,
and that anonymous dentries are not the roots of trees which results in
dentries being left unculled.
However, with the way NFS superblock sharing are currently set to be
implemented, these assumptions are violated: the root of the filesystem is
simply a dummy dentry and inode (the real inode for '/' may well be
inaccessible), and all the vfsmounts are rooted on anonymous[*] dentries
with child trees.
[*] Anonymous until discovered from another tree.
(*) The documentation has been adjusted, including the additional bit of
changing ext2_* into foo_* in the documentation.
[akpm@osdl.org: convert ipath_fs, do other stuff]
Signed-off-by: David Howells <dhowells@redhat.com>
Acked-by: Al Viro <viro@zeniv.linux.org.uk>
Cc: Nathan Scott <nathans@sgi.com>
Cc: Roland Dreier <rolandd@cisco.com>
Signed-off-by: Andrew Morton <akpm@osdl.org>
Signed-off-by: Linus Torvalds <torvalds@osdl.org>
2006-06-23 03:02:57 -06:00
|
|
|
return 0;
|
2005-04-16 16:20:36 -06:00
|
|
|
|
2007-04-26 16:49:28 -06:00
|
|
|
error:
|
2005-04-16 16:20:36 -06:00
|
|
|
afs_put_volume(params.volume);
|
2007-04-26 16:57:07 -06:00
|
|
|
afs_put_cell(params.cell);
|
|
|
|
key_put(params.key);
|
2008-02-08 05:21:37 -07:00
|
|
|
kfree(new_opts);
|
2005-04-16 16:20:36 -06:00
|
|
|
_leave(" = %d", ret);
|
[PATCH] VFS: Permit filesystem to override root dentry on mount
Extend the get_sb() filesystem operation to take an extra argument that
permits the VFS to pass in the target vfsmount that defines the mountpoint.
The filesystem is then required to manually set the superblock and root dentry
pointers. For most filesystems, this should be done with simple_set_mnt()
which will set the superblock pointer and then set the root dentry to the
superblock's s_root (as per the old default behaviour).
The get_sb() op now returns an integer as there's now no need to return the
superblock pointer.
This patch permits a superblock to be implicitly shared amongst several mount
points, such as can be done with NFS to avoid potential inode aliasing. In
such a case, simple_set_mnt() would not be called, and instead the mnt_root
and mnt_sb would be set directly.
The patch also makes the following changes:
(*) the get_sb_*() convenience functions in the core kernel now take a vfsmount
pointer argument and return an integer, so most filesystems have to change
very little.
(*) If one of the convenience function is not used, then get_sb() should
normally call simple_set_mnt() to instantiate the vfsmount. This will
always return 0, and so can be tail-called from get_sb().
(*) generic_shutdown_super() now calls shrink_dcache_sb() to clean up the
dcache upon superblock destruction rather than shrink_dcache_anon().
This is required because the superblock may now have multiple trees that
aren't actually bound to s_root, but that still need to be cleaned up. The
currently called functions assume that the whole tree is rooted at s_root,
and that anonymous dentries are not the roots of trees which results in
dentries being left unculled.
However, with the way NFS superblock sharing are currently set to be
implemented, these assumptions are violated: the root of the filesystem is
simply a dummy dentry and inode (the real inode for '/' may well be
inaccessible), and all the vfsmounts are rooted on anonymous[*] dentries
with child trees.
[*] Anonymous until discovered from another tree.
(*) The documentation has been adjusted, including the additional bit of
changing ext2_* into foo_* in the documentation.
[akpm@osdl.org: convert ipath_fs, do other stuff]
Signed-off-by: David Howells <dhowells@redhat.com>
Acked-by: Al Viro <viro@zeniv.linux.org.uk>
Cc: Nathan Scott <nathans@sgi.com>
Cc: Roland Dreier <rolandd@cisco.com>
Signed-off-by: Andrew Morton <akpm@osdl.org>
Signed-off-by: Linus Torvalds <torvalds@osdl.org>
2006-06-23 03:02:57 -06:00
|
|
|
return ret;
|
2007-04-26 16:49:28 -06:00
|
|
|
}
|
2005-04-16 16:20:36 -06:00
|
|
|
|
|
|
|
/*
|
|
|
|
* finish the unmounting process on the superblock
|
|
|
|
*/
|
|
|
|
static void afs_put_super(struct super_block *sb)
|
|
|
|
{
|
|
|
|
struct afs_super_info *as = sb->s_fs_info;
|
|
|
|
|
|
|
|
_enter("");
|
|
|
|
|
|
|
|
afs_put_volume(as->volume);
|
|
|
|
|
|
|
|
_leave("");
|
2007-04-26 16:49:28 -06:00
|
|
|
}
|
2005-04-16 16:20:36 -06:00
|
|
|
|
|
|
|
/*
|
|
|
|
* initialise an inode cache slab element prior to any use
|
|
|
|
*/
|
2007-10-17 00:25:51 -06:00
|
|
|
static void afs_i_init_once(struct kmem_cache *cachep, void *_vnode)
|
2005-04-16 16:20:36 -06:00
|
|
|
{
|
2007-04-26 16:49:28 -06:00
|
|
|
struct afs_vnode *vnode = _vnode;
|
2005-04-16 16:20:36 -06:00
|
|
|
|
2007-05-16 23:10:57 -06:00
|
|
|
memset(vnode, 0, sizeof(*vnode));
|
|
|
|
inode_init_once(&vnode->vfs_inode);
|
|
|
|
init_waitqueue_head(&vnode->update_waitq);
|
|
|
|
mutex_init(&vnode->permits_lock);
|
|
|
|
mutex_init(&vnode->validate_lock);
|
|
|
|
spin_lock_init(&vnode->writeback_lock);
|
|
|
|
spin_lock_init(&vnode->lock);
|
|
|
|
INIT_LIST_HEAD(&vnode->writebacks);
|
2007-07-16 00:40:12 -06:00
|
|
|
INIT_LIST_HEAD(&vnode->pending_locks);
|
|
|
|
INIT_LIST_HEAD(&vnode->granted_locks);
|
|
|
|
INIT_DELAYED_WORK(&vnode->lock_work, afs_lock_work);
|
2007-05-16 23:10:57 -06:00
|
|
|
INIT_WORK(&vnode->cb_broken_work, afs_broken_callback_work);
|
2007-04-26 16:49:28 -06:00
|
|
|
}
|
2005-04-16 16:20:36 -06:00
|
|
|
|
|
|
|
/*
|
|
|
|
* allocate an AFS inode struct from our slab cache
|
|
|
|
*/
|
|
|
|
static struct inode *afs_alloc_inode(struct super_block *sb)
|
|
|
|
{
|
|
|
|
struct afs_vnode *vnode;
|
|
|
|
|
2007-04-26 16:49:28 -06:00
|
|
|
vnode = kmem_cache_alloc(afs_inode_cachep, GFP_KERNEL);
|
2005-04-16 16:20:36 -06:00
|
|
|
if (!vnode)
|
|
|
|
return NULL;
|
|
|
|
|
|
|
|
atomic_inc(&afs_count_active_inodes);
|
|
|
|
|
|
|
|
memset(&vnode->fid, 0, sizeof(vnode->fid));
|
|
|
|
memset(&vnode->status, 0, sizeof(vnode->status));
|
|
|
|
|
|
|
|
vnode->volume = NULL;
|
|
|
|
vnode->update_cnt = 0;
|
2007-04-26 16:59:35 -06:00
|
|
|
vnode->flags = 1 << AFS_VNODE_UNSET;
|
2007-04-26 16:55:03 -06:00
|
|
|
vnode->cb_promised = false;
|
2005-04-16 16:20:36 -06:00
|
|
|
|
2007-05-10 23:22:20 -06:00
|
|
|
_leave(" = %p", &vnode->vfs_inode);
|
2005-04-16 16:20:36 -06:00
|
|
|
return &vnode->vfs_inode;
|
2007-04-26 16:49:28 -06:00
|
|
|
}
|
2005-04-16 16:20:36 -06:00
|
|
|
|
|
|
|
/*
|
|
|
|
* destroy an AFS inode struct
|
|
|
|
*/
|
|
|
|
static void afs_destroy_inode(struct inode *inode)
|
|
|
|
{
|
2007-04-26 16:55:03 -06:00
|
|
|
struct afs_vnode *vnode = AFS_FS_I(inode);
|
|
|
|
|
2007-05-10 23:22:20 -06:00
|
|
|
_enter("%p{%x:%u}", inode, vnode->fid.vid, vnode->fid.vnode);
|
2005-04-16 16:20:36 -06:00
|
|
|
|
2007-04-26 16:55:03 -06:00
|
|
|
_debug("DESTROY INODE %p", inode);
|
|
|
|
|
|
|
|
ASSERTCMP(vnode->server, ==, NULL);
|
|
|
|
|
|
|
|
kmem_cache_free(afs_inode_cachep, vnode);
|
2005-04-16 16:20:36 -06:00
|
|
|
atomic_dec(&afs_count_active_inodes);
|
2007-04-26 16:49:28 -06:00
|
|
|
}
|
2007-05-10 23:22:20 -06:00
|
|
|
|
|
|
|
/*
|
|
|
|
* return information about an AFS volume
|
|
|
|
*/
|
|
|
|
static int afs_statfs(struct dentry *dentry, struct kstatfs *buf)
|
|
|
|
{
|
|
|
|
struct afs_volume_status vs;
|
|
|
|
struct afs_vnode *vnode = AFS_FS_I(dentry->d_inode);
|
|
|
|
struct key *key;
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
key = afs_request_key(vnode->volume->cell);
|
|
|
|
if (IS_ERR(key))
|
|
|
|
return PTR_ERR(key);
|
|
|
|
|
|
|
|
ret = afs_vnode_get_volume_status(vnode, key, &vs);
|
|
|
|
key_put(key);
|
|
|
|
if (ret < 0) {
|
|
|
|
_leave(" = %d", ret);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
buf->f_type = dentry->d_sb->s_magic;
|
|
|
|
buf->f_bsize = AFS_BLOCK_SIZE;
|
|
|
|
buf->f_namelen = AFSNAMEMAX - 1;
|
|
|
|
|
|
|
|
if (vs.max_quota == 0)
|
|
|
|
buf->f_blocks = vs.part_max_blocks;
|
|
|
|
else
|
|
|
|
buf->f_blocks = vs.max_quota;
|
|
|
|
buf->f_bavail = buf->f_bfree = buf->f_blocks - vs.blocks_in_use;
|
|
|
|
return 0;
|
|
|
|
}
|