| /* |
| * linux/fs/super.c |
| * |
| * Copyright (C) 1991, 1992 Linus Torvalds |
| * |
| * super.c contains code to handle: - mount structures |
| * - super-block tables |
| * - filesystem drivers list |
| * - mount system call |
| * - umount system call |
| * - ustat system call |
| * |
| * GK 2/5/95 - Changed to support mounting the root fs via NFS |
| * |
| * Added kerneld support: Jacques Gelinas and Bjorn Ekwall |
| * Added change_root: Werner Almesberger & Hans Lermen, Feb '96 |
| * Added options to /proc/mounts: |
| * Torbjörn Lindh (torbjorn.lindh@gopta.se), April 14, 1996. |
| * Added devfs support: Richard Gooch <rgooch@atnf.csiro.au>, 13-JAN-1998 |
| * Heavily rewritten for 'one fs - one tree' dcache architecture. AV, Mar 2000 |
| */ |
| |
| #include <linux/config.h> |
| #include <linux/slab.h> |
| #include <linux/smp_lock.h> |
| #include <linux/acct.h> |
| #include <linux/blkdev.h> |
| #include <linux/quotaops.h> |
| #include <linux/namei.h> |
| #include <linux/buffer_head.h> /* for fsync_super() */ |
| #include <linux/mount.h> |
| #include <linux/security.h> |
| #include <linux/vfs.h> |
| #include <asm/uaccess.h> |
| |
| |
| void get_filesystem(struct file_system_type *fs); |
| void put_filesystem(struct file_system_type *fs); |
| struct file_system_type *get_fs_type(const char *name); |
| |
| LIST_HEAD(super_blocks); |
| spinlock_t sb_lock = SPIN_LOCK_UNLOCKED; |
| |
/**
 *	alloc_super	-	create new superblock
 *
 *	Allocates and initializes a new &struct super_block.  alloc_super()
 *	returns a pointer to the new superblock, or %NULL if the allocation
 *	failed.
 */
| static struct super_block *alloc_super(void) |
| { |
| struct super_block *s = kmalloc(sizeof(struct super_block), GFP_USER); |
| static struct super_operations default_op; |
| |
| if (s) { |
| memset(s, 0, sizeof(struct super_block)); |
| if (security_sb_alloc(s)) { |
| kfree(s); |
| s = NULL; |
| goto out; |
| } |
| INIT_LIST_HEAD(&s->s_dirty); |
| INIT_LIST_HEAD(&s->s_io); |
| INIT_LIST_HEAD(&s->s_files); |
| INIT_LIST_HEAD(&s->s_instances); |
| INIT_LIST_HEAD(&s->s_anon); |
| init_rwsem(&s->s_umount); |
| sema_init(&s->s_lock, 1); |
| down_write(&s->s_umount); |
| s->s_count = S_BIAS; |
| atomic_set(&s->s_active, 1); |
| sema_init(&s->s_vfs_rename_sem,1); |
| sema_init(&s->s_dquot.dqio_sem, 1); |
| sema_init(&s->s_dquot.dqonoff_sem, 1); |
| init_rwsem(&s->s_dquot.dqptr_sem); |
| s->s_maxbytes = MAX_NON_LFS; |
| s->dq_op = sb_dquot_ops; |
| s->s_qcop = sb_quotactl_ops; |
| s->s_op = &default_op; |
| } |
| out: |
| return s; |
| } |
| |
| /** |
| * destroy_super - frees a superblock |
| * @s: superblock to free |
| * |
| * Frees a superblock. |
| */ |
static inline void destroy_super(struct super_block *s)
{
	/* Let the security hook clean up first, then release the memory. */
	security_sb_free(s);
	kfree(s);
}
| |
| /* Superblock refcounting */ |
| |
| /** |
| * put_super - drop a temporary reference to superblock |
| * @s: superblock in question |
| * |
| * Drops a temporary reference, frees superblock if there's no |
| * references left. |
| */ |
| static inline void put_super(struct super_block *s) |
| { |
| spin_lock(&sb_lock); |
| if (!--s->s_count) |
| destroy_super(s); |
| spin_unlock(&sb_lock); |
| } |
| |
/**
 *	deactivate_super	-	drop an active reference to superblock
 *	@s: superblock to deactivate
 *
 *	Drops an active reference to superblock, acquiring a temporary one if
 *	there are no active references left.  In that case we lock superblock,
 *	tell fs driver to shut it down and drop the temporary reference we
 *	had just acquired.
 */
| void deactivate_super(struct super_block *s) |
| { |
| struct file_system_type *fs = s->s_type; |
| if (atomic_dec_and_lock(&s->s_active, &sb_lock)) { |
| s->s_count -= S_BIAS-1; |
| spin_unlock(&sb_lock); |
| down_write(&s->s_umount); |
| fs->kill_sb(s); |
| put_filesystem(fs); |
| put_super(s); |
| } |
| } |
| |
/**
 *	grab_super	-	acquire an active reference
 *	@s: reference we are trying to make active
 *
 *	Tries to acquire an active reference.  grab_super() is used when we
 *	had just found a superblock in super_blocks or fs_type->fs_supers
 *	and want to turn it into a full-blown active reference.  grab_super()
 *	is called with sb_lock held and drops it.  Returns 1 in case of
 *	success, 0 if we had failed (superblock contents were already dead or
 *	dying when grab_super() had been called).
 */
| static int grab_super(struct super_block *s) |
| { |
| s->s_count++; |
| spin_unlock(&sb_lock); |
| down_write(&s->s_umount); |
| if (s->s_root) { |
| spin_lock(&sb_lock); |
| if (s->s_count > S_BIAS) { |
| atomic_inc(&s->s_active); |
| s->s_count--; |
| spin_unlock(&sb_lock); |
| return 1; |
| } |
| spin_unlock(&sb_lock); |
| } |
| up_write(&s->s_umount); |
| put_super(s); |
| yield(); |
| return 0; |
| } |
| |
| /** |
| * generic_shutdown_super - common helper for ->kill_sb() |
| * @sb: superblock to kill |
| * |
| * generic_shutdown_super() does all fs-independent work on superblock |
| * shutdown. Typical ->kill_sb() should pick all fs-specific objects |
| * that need destruction out of superblock, call generic_shutdown_super() |
| * and release aforementioned objects. Note: dentries and inodes _are_ |
| * taken care of and do not need specific handling. |
| */ |
| void generic_shutdown_super(struct super_block *sb) |
| { |
| struct dentry *root = sb->s_root; |
| struct super_operations *sop = sb->s_op; |
| |
| if (root) { |
| sb->s_root = NULL; |
| shrink_dcache_parent(root); |
| shrink_dcache_anon(&sb->s_anon); |
| dput(root); |
| fsync_super(sb); |
| lock_super(sb); |
| lock_kernel(); |
| sb->s_flags &= ~MS_ACTIVE; |
| /* bad name - it should be evict_inodes() */ |
| invalidate_inodes(sb); |
| |
| if (sop->write_super && sb->s_dirt) |
| sop->write_super(sb); |
| if (sop->put_super) |
| sop->put_super(sb); |
| |
| /* Forget any remaining inodes */ |
| if (invalidate_inodes(sb)) { |
| printk("VFS: Busy inodes after unmount. " |
| "Self-destruct in 5 seconds. Have a nice day...\n"); |
| } |
| |
| unlock_kernel(); |
| unlock_super(sb); |
| } |
| spin_lock(&sb_lock); |
| list_del(&sb->s_list); |
| list_del(&sb->s_instances); |
| spin_unlock(&sb_lock); |
| up_write(&sb->s_umount); |
| } |
| |
| /** |
| * sget - find or create a superblock |
| * @type: filesystem type superblock should belong to |
| * @test: comparison callback |
| * @set: setup callback |
| * @data: argument to each of them |
| */ |
| struct super_block *sget(struct file_system_type *type, |
| int (*test)(struct super_block *,void *), |
| int (*set)(struct super_block *,void *), |
| void *data) |
| { |
| struct super_block *s = alloc_super(); |
| struct list_head *p; |
| int err; |
| |
| if (!s) |
| return ERR_PTR(-ENOMEM); |
| |
| retry: |
| spin_lock(&sb_lock); |
| if (test) list_for_each(p, &type->fs_supers) { |
| struct super_block *old; |
| old = list_entry(p, struct super_block, s_instances); |
| if (!test(old, data)) |
| continue; |
| if (!grab_super(old)) |
| goto retry; |
| destroy_super(s); |
| return old; |
| } |
| err = set(s, data); |
| if (err) { |
| spin_unlock(&sb_lock); |
| destroy_super(s); |
| return ERR_PTR(err); |
| } |
| s->s_type = type; |
| list_add(&s->s_list, super_blocks.prev); |
| list_add(&s->s_instances, &type->fs_supers); |
| spin_unlock(&sb_lock); |
| get_filesystem(type); |
| return s; |
| } |
| |
/* Prototypes for the vfsmount allocator and its release counterpart. */
extern struct vfsmount *alloc_vfsmnt(char *name);
extern void free_vfsmnt(struct vfsmount *mnt);
| |
| void drop_super(struct super_block *sb) |
| { |
| up_read(&sb->s_umount); |
| put_super(sb); |
| } |
| |
| static inline void write_super(struct super_block *sb) |
| { |
| lock_super(sb); |
| if (sb->s_root && sb->s_dirt) |
| if (sb->s_op->write_super) |
| sb->s_op->write_super(sb); |
| unlock_super(sb); |
| } |
| |
| /* |
| * Note: check the dirty flag before waiting, so we don't |
| * hold up the sync while mounting a device. (The newly |
| * mounted device won't need syncing.) |
| */ |
| void sync_supers(void) |
| { |
| struct super_block * sb; |
| restart: |
| spin_lock(&sb_lock); |
| sb = sb_entry(super_blocks.next); |
| while (sb != sb_entry(&super_blocks)) |
| if (sb->s_dirt) { |
| sb->s_count++; |
| spin_unlock(&sb_lock); |
| down_read(&sb->s_umount); |
| write_super(sb); |
| drop_super(sb); |
| goto restart; |
| } else |
| sb = sb_entry(sb->s_list.next); |
| spin_unlock(&sb_lock); |
| } |
| |
/*
 * Call the ->sync_fs super_op against all filesystems which are r/w and
 * which implement it.
 */
| void sync_filesystems(int wait) |
| { |
| struct super_block * sb; |
| |
| spin_lock(&sb_lock); |
| for (sb = sb_entry(super_blocks.next); sb != sb_entry(&super_blocks); |
| sb = sb_entry(sb->s_list.next)) { |
| if (!sb->s_op->sync_fs) |
| continue; |
| if (sb->s_flags & MS_RDONLY) |
| continue; |
| sb->s_need_sync_fs = 1; |
| } |
| spin_unlock(&sb_lock); |
| |
| restart: |
| spin_lock(&sb_lock); |
| for (sb = sb_entry(super_blocks.next); sb != sb_entry(&super_blocks); |
| sb = sb_entry(sb->s_list.next)) { |
| if (!sb->s_need_sync_fs) |
| continue; |
| sb->s_need_sync_fs = 0; |
| if (sb->s_flags & MS_RDONLY) |
| continue; /* hm. Was remounted r/o meanwhile */ |
| sb->s_count++; |
| spin_unlock(&sb_lock); |
| down_read(&sb->s_umount); |
| if (sb->s_root) |
| sb->s_op->sync_fs(sb, wait); |
| drop_super(sb); |
| goto restart; |
| } |
| spin_unlock(&sb_lock); |
| } |
| |
/**
 *	get_super - get the superblock of a device
 *	@bdev: device to get the superblock for
 *
 *	Scans the superblock list and finds the superblock of the file system
 *	mounted on the device given.  %NULL is returned if no match is found.
 */
| |
| struct super_block * get_super(struct block_device *bdev) |
| { |
| struct list_head *p; |
| if (!bdev) |
| return NULL; |
| rescan: |
| spin_lock(&sb_lock); |
| list_for_each(p, &super_blocks) { |
| struct super_block *s = sb_entry(p); |
| if (s->s_bdev == bdev) { |
| s->s_count++; |
| spin_unlock(&sb_lock); |
| down_read(&s->s_umount); |
| if (s->s_root) |
| return s; |
| drop_super(s); |
| goto rescan; |
| } |
| } |
| spin_unlock(&sb_lock); |
| return NULL; |
| } |
| |
| struct super_block * user_get_super(dev_t dev) |
| { |
| struct list_head *p; |
| |
| rescan: |
| spin_lock(&sb_lock); |
| list_for_each(p, &super_blocks) { |
| struct super_block *s = sb_entry(p); |
| if (s->s_dev == dev) { |
| s->s_count++; |
| spin_unlock(&sb_lock); |
| down_read(&s->s_umount); |
| if (s->s_root) |
| return s; |
| drop_super(s); |
| goto rescan; |
| } |
| } |
| spin_unlock(&sb_lock); |
| return NULL; |
| } |
| |
| asmlinkage long sys_ustat(dev_t dev, struct ustat * ubuf) |
| { |
| struct super_block *s; |
| struct ustat tmp; |
| struct statfs sbuf; |
| int err = -EINVAL; |
| |
| s = user_get_super(dev); |
| if (s == NULL) |
| goto out; |
| err = vfs_statfs(s, &sbuf); |
| drop_super(s); |
| if (err) |
| goto out; |
| |
| memset(&tmp,0,sizeof(struct ustat)); |
| tmp.f_tfree = sbuf.f_bfree; |
| tmp.f_tinode = sbuf.f_ffree; |
| |
| err = copy_to_user(ubuf,&tmp,sizeof(struct ustat)) ? -EFAULT : 0; |
| out: |
| return err; |
| } |
| |
| /** |
| * do_remount_sb - asks filesystem to change mount options. |
| * @sb: superblock in question |
| * @flags: numeric part of options |
| * @data: the rest of options |
| * |
| * Alters the mount options of a mounted file system. |
| */ |
| int do_remount_sb(struct super_block *sb, int flags, void *data) |
| { |
| int retval; |
| |
| if (!(flags & MS_RDONLY) && bdev_read_only(sb->s_bdev)) |
| return -EACCES; |
| /*flags |= MS_RDONLY;*/ |
| if (flags & MS_RDONLY) |
| acct_auto_close(sb); |
| shrink_dcache_sb(sb); |
| fsync_super(sb); |
| /* If we are remounting RDONLY, make sure there are no rw files open */ |
| if ((flags & MS_RDONLY) && !(sb->s_flags & MS_RDONLY)) |
| if (!fs_may_remount_ro(sb)) |
| return -EBUSY; |
| if (sb->s_op->remount_fs) { |
| lock_super(sb); |
| retval = sb->s_op->remount_fs(sb, &flags, data); |
| unlock_super(sb); |
| if (retval) |
| return retval; |
| } |
| sb->s_flags = (sb->s_flags & ~MS_RMT_MASK) | (flags & MS_RMT_MASK); |
| return 0; |
| } |
| |
| /* |
| * Unnamed block devices are dummy devices used by virtual |
| * filesystems which don't use real block-devices. -- jrs |
| */ |
| |
| enum {Max_anon = 256}; |
| static unsigned long unnamed_dev_in_use[Max_anon/(8*sizeof(unsigned long))]; |
| static spinlock_t unnamed_dev_lock = SPIN_LOCK_UNLOCKED;/* protects the above */ |
| |
| int set_anon_super(struct super_block *s, void *data) |
| { |
| int dev; |
| spin_lock(&unnamed_dev_lock); |
| dev = find_first_zero_bit(unnamed_dev_in_use, Max_anon); |
| if (dev == Max_anon) { |
| spin_unlock(&unnamed_dev_lock); |
| return -EMFILE; |
| } |
| set_bit(dev, unnamed_dev_in_use); |
| spin_unlock(&unnamed_dev_lock); |
| s->s_dev = MKDEV(0, dev); |
| return 0; |
| } |
| |
| void kill_anon_super(struct super_block *sb) |
| { |
| int slot = MINOR(sb->s_dev); |
| generic_shutdown_super(sb); |
| spin_lock(&unnamed_dev_lock); |
| clear_bit(slot, unnamed_dev_in_use); |
| spin_unlock(&unnamed_dev_lock); |
| } |
| |
| void kill_litter_super(struct super_block *sb) |
| { |
| if (sb->s_root) |
| d_genocide(sb->s_root); |
| kill_anon_super(sb); |
| } |
| |
| static int set_bdev_super(struct super_block *s, void *data) |
| { |
| s->s_bdev = data; |
| s->s_dev = s->s_bdev->bd_dev; |
| return 0; |
| } |
| |
| static int test_bdev_super(struct super_block *s, void *data) |
| { |
| return (void *)s->s_bdev == data; |
| } |
| |
| struct super_block *get_sb_bdev(struct file_system_type *fs_type, |
| int flags, char *dev_name, void * data, |
| int (*fill_super)(struct super_block *, void *, int)) |
| { |
| struct block_device *bdev; |
| struct super_block *s; |
| int error = 0; |
| |
| bdev = open_bdev_excl(dev_name, flags, BDEV_FS, fs_type); |
| if (IS_ERR(bdev)) |
| return (struct super_block *)bdev; |
| |
| s = sget(fs_type, test_bdev_super, set_bdev_super, bdev); |
| if (IS_ERR(s)) |
| goto out; |
| |
| if (s->s_root) { |
| if ((flags ^ s->s_flags) & MS_RDONLY) { |
| up_write(&s->s_umount); |
| deactivate_super(s); |
| s = ERR_PTR(-EBUSY); |
| } |
| goto out; |
| } else { |
| s->s_flags = flags; |
| strncpy(s->s_id, bdevname(bdev), sizeof(s->s_id)); |
| s->s_old_blocksize = block_size(bdev); |
| sb_set_blocksize(s, s->s_old_blocksize); |
| error = fill_super(s, data, flags & MS_VERBOSE ? 1 : 0); |
| if (error) { |
| up_write(&s->s_umount); |
| deactivate_super(s); |
| s = ERR_PTR(error); |
| } else |
| s->s_flags |= MS_ACTIVE; |
| } |
| |
| return s; |
| |
| out: |
| close_bdev_excl(bdev, BDEV_FS); |
| return s; |
| } |
| |
| void kill_block_super(struct super_block *sb) |
| { |
| struct block_device *bdev = sb->s_bdev; |
| generic_shutdown_super(sb); |
| set_blocksize(bdev, sb->s_old_blocksize); |
| close_bdev_excl(bdev, BDEV_FS); |
| } |
| |
| struct super_block *get_sb_nodev(struct file_system_type *fs_type, |
| int flags, void *data, |
| int (*fill_super)(struct super_block *, void *, int)) |
| { |
| int error; |
| struct super_block *s = sget(fs_type, NULL, set_anon_super, NULL); |
| |
| if (IS_ERR(s)) |
| return s; |
| |
| s->s_flags = flags; |
| |
| error = fill_super(s, data, flags & MS_VERBOSE ? 1 : 0); |
| if (error) { |
| up_write(&s->s_umount); |
| deactivate_super(s); |
| return ERR_PTR(error); |
| } |
| s->s_flags |= MS_ACTIVE; |
| return s; |
| } |
| |
/*
 * Comparison callback that reports a match unconditionally; both
 * arguments are ignored.
 */
static int compare_single(struct super_block *s, void *p)
{
	(void)s;
	(void)p;
	return 1;
}
| |
| struct super_block *get_sb_single(struct file_system_type *fs_type, |
| int flags, void *data, |
| int (*fill_super)(struct super_block *, void *, int)) |
| { |
| struct super_block *s; |
| int error; |
| |
| s = sget(fs_type, compare_single, set_anon_super, NULL); |
| if (IS_ERR(s)) |
| return s; |
| if (!s->s_root) { |
| s->s_flags = flags; |
| error = fill_super(s, data, flags & MS_VERBOSE ? 1 : 0); |
| if (error) { |
| up_write(&s->s_umount); |
| deactivate_super(s); |
| return ERR_PTR(error); |
| } |
| s->s_flags |= MS_ACTIVE; |
| } |
| do_remount_sb(s, flags, data); |
| return s; |
| } |
| |
| struct vfsmount * |
| do_kern_mount(const char *fstype, int flags, char *name, void *data) |
| { |
| struct file_system_type *type = get_fs_type(fstype); |
| struct super_block *sb = ERR_PTR(-ENOMEM); |
| struct vfsmount *mnt; |
| |
| if (!type) |
| return ERR_PTR(-ENODEV); |
| |
| mnt = alloc_vfsmnt(name); |
| if (!mnt) |
| goto out; |
| sb = type->get_sb(type, flags, name, data); |
| if (IS_ERR(sb)) |
| goto out_mnt; |
| mnt->mnt_sb = sb; |
| mnt->mnt_root = dget(sb->s_root); |
| mnt->mnt_mountpoint = sb->s_root; |
| mnt->mnt_parent = mnt; |
| up_write(&sb->s_umount); |
| put_filesystem(type); |
| return mnt; |
| out_mnt: |
| free_vfsmnt(mnt); |
| out: |
| put_filesystem(type); |
| return (struct vfsmount *)sb; |
| } |
| |
| struct vfsmount *kern_mount(struct file_system_type *type) |
| { |
| return do_kern_mount(type->name, 0, (char *)type->name, NULL); |
| } |