freebsd-skq/sys/ufs/ffs/ffs_vnops.c
kato fe9b86cf0b Clustered read and write are switched at mount-option level.
1. Clustered I/O is switched by the MNT_NOCLUSTERR and MNT_NOCLUSTERW
   bits of the mnt_flag.  The sysctl variables, vfs.foo.doclusterread
   and vfs.foo.doclusterwrite are deleted.  Only mount option can
   control clustered I/O from userland.
2. When foofs_mount mounts a block device, it checks the D_NOCLUSTERR
   and D_NOCLUSTERW bits of the d_flags member in the block device switch
   table.  If D_NOCLUSTERR / D_NOCLUSTERW are set, the MNT_NOCLUSTERR /
   MNT_NOCLUSTERW bits will be set.  In this case, MNT_NOCLUSTERR and
   MNT_NOCLUSTERW cannot be cleared from userland.
3. Vnode driver disables both clustered read and write.
4. Union filesystem disables clustered write.

Reviewed by:	bde
1997-09-27 13:40:20 +00:00

344 lines
13 KiB
C

/*
* Copyright (c) 1982, 1986, 1989, 1993
* The Regents of the University of California. All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
* 3. All advertising materials mentioning features or use of this software
* must display the following acknowledgement:
* This product includes software developed by the University of
* California, Berkeley and its contributors.
* 4. Neither the name of the University nor the names of its contributors
* may be used to endorse or promote products derived from this software
* without specific prior written permission.
*
* THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*
* @(#)ffs_vnops.c 8.15 (Berkeley) 5/14/95
* $Id: ffs_vnops.c,v 1.29 1997/09/14 02:58:05 peter Exp $
*/
#include <sys/param.h>
#include <sys/systm.h>
#include <sys/resourcevar.h>
#include <sys/signalvar.h>
#include <sys/kernel.h>
#include <sys/stat.h>
#include <sys/buf.h>
#include <sys/proc.h>
#include <sys/mount.h>
#include <sys/sysctl.h>
#include <sys/vnode.h>
#include <sys/malloc.h>
#include <vm/vm.h>
#include <vm/vm_prot.h>
#include <vm/vm_page.h>
#include <vm/vm_object.h>
#include <vm/vm_extern.h>
#include <miscfs/specfs/specdev.h>
#include <miscfs/fifofs/fifo.h>
#include <ufs/ufs/quota.h>
#include <ufs/ufs/inode.h>
#include <ufs/ufs/ufsmount.h>
#include <ufs/ufs/ufs_extern.h>
#include <ufs/ffs/fs.h>
#include <ufs/ffs/ffs_extern.h>
/*
 * Prototypes for the file-local vnode operation handlers referenced by
 * the operation tables in this file.  ffs_fsync is defined further down.
 * NOTE(review): ffs_getpages, ffs_read and ffs_write have no definition
 * in the visible text of this file -- presumably they are supplied by the
 * #include of <ufs/ufs/ufs_readwrite.c> below; confirm.
 */
static int ffs_fsync __P((struct vop_fsync_args *));
static int ffs_getpages __P((struct vop_getpages_args *));
static int ffs_read __P((struct vop_read_args *));
static int ffs_write __P((struct vop_write_args *));
/* Global vfs data structures for ufs. */
/*
 * ffs_vnodeop_p is the operation-vector pointer named by
 * ffs_vnodeop_opv_desc at the end of this block.
 */
vop_t **ffs_vnodeop_p;
/*
 * Operation table tied to ffs_vnodeop_p: each entry pairs a vnode
 * operation descriptor with the routine that implements it.
 *
 *  - lookup is routed to vfs_cache_lookup, with ufs_lookup registered as
 *    the cachedlookup handler.
 *  - read, write, fsync, reclaim, blkatoff, valloc, reallocblks, vfree,
 *    truncate, update and getpages use ffs_* routines.
 *  - bwrite uses vn_bwrite; the remaining listed operations use ufs_*
 *    routines.
 *  - There is no vop_putpages entry (see the XXX marker).
 *
 * The first entry binds vop_default_desc to vn_default_error.
 * NOTE(review): presumably that is the handler used for any operation not
 * listed here -- confirm against the code that builds the vectors.
 * The { NULL, NULL } pair terminates the table.
 */
static struct vnodeopv_entry_desc ffs_vnodeop_entries[] = {
{ &vop_default_desc, (vop_t *)vn_default_error },
{ &vop_lookup_desc, (vop_t *)vfs_cache_lookup },/* lookup */
{ &vop_cachedlookup_desc, (vop_t *)ufs_lookup },/* cachedlookup */
{ &vop_create_desc, (vop_t *)ufs_create }, /* create */
{ &vop_whiteout_desc, (vop_t *)ufs_whiteout }, /* whiteout */
{ &vop_mknod_desc, (vop_t *)ufs_mknod }, /* mknod */
{ &vop_open_desc, (vop_t *)ufs_open }, /* open */
{ &vop_close_desc, (vop_t *)ufs_close }, /* close */
{ &vop_access_desc, (vop_t *)ufs_access }, /* access */
{ &vop_getattr_desc, (vop_t *)ufs_getattr }, /* getattr */
{ &vop_setattr_desc, (vop_t *)ufs_setattr }, /* setattr */
{ &vop_read_desc, (vop_t *)ffs_read }, /* read */
{ &vop_write_desc, (vop_t *)ffs_write }, /* write */
{ &vop_lease_desc, (vop_t *)ufs_lease_check }, /* lease */
{ &vop_ioctl_desc, (vop_t *)ufs_ioctl }, /* ioctl */
{ &vop_poll_desc, (vop_t *)ufs_poll }, /* poll */
{ &vop_revoke_desc, (vop_t *)ufs_revoke }, /* revoke */
{ &vop_mmap_desc, (vop_t *)ufs_mmap }, /* mmap */
{ &vop_fsync_desc, (vop_t *)ffs_fsync }, /* fsync */
{ &vop_seek_desc, (vop_t *)ufs_seek }, /* seek */
{ &vop_remove_desc, (vop_t *)ufs_remove }, /* remove */
{ &vop_link_desc, (vop_t *)ufs_link }, /* link */
{ &vop_rename_desc, (vop_t *)ufs_rename }, /* rename */
{ &vop_mkdir_desc, (vop_t *)ufs_mkdir }, /* mkdir */
{ &vop_rmdir_desc, (vop_t *)ufs_rmdir }, /* rmdir */
{ &vop_symlink_desc, (vop_t *)ufs_symlink }, /* symlink */
{ &vop_readdir_desc, (vop_t *)ufs_readdir }, /* readdir */
{ &vop_readlink_desc, (vop_t *)ufs_readlink }, /* readlink */
{ &vop_abortop_desc, (vop_t *)ufs_abortop }, /* abortop */
{ &vop_inactive_desc, (vop_t *)ufs_inactive }, /* inactive */
{ &vop_reclaim_desc, (vop_t *)ffs_reclaim }, /* reclaim */
{ &vop_lock_desc, (vop_t *)ufs_lock }, /* lock */
{ &vop_unlock_desc, (vop_t *)ufs_unlock }, /* unlock */
{ &vop_bmap_desc, (vop_t *)ufs_bmap }, /* bmap */
{ &vop_strategy_desc, (vop_t *)ufs_strategy }, /* strategy */
{ &vop_print_desc, (vop_t *)ufs_print }, /* print */
{ &vop_islocked_desc, (vop_t *)ufs_islocked }, /* islocked */
{ &vop_pathconf_desc, (vop_t *)ufs_pathconf }, /* pathconf */
{ &vop_advlock_desc, (vop_t *)ufs_advlock }, /* advlock */
{ &vop_blkatoff_desc, (vop_t *)ffs_blkatoff }, /* blkatoff */
{ &vop_valloc_desc, (vop_t *)ffs_valloc }, /* valloc */
{ &vop_reallocblks_desc, (vop_t *)ffs_reallocblks }, /* reallocblks */
{ &vop_vfree_desc, (vop_t *)ffs_vfree }, /* vfree */
{ &vop_truncate_desc, (vop_t *)ffs_truncate }, /* truncate */
{ &vop_update_desc, (vop_t *)ffs_update }, /* update */
{ &vop_getpages_desc, (vop_t *)ffs_getpages}, /* getpages */
/* XXX: vop_putpages */
{ &vop_bwrite_desc, (vop_t *)vn_bwrite }, /* bwrite */
{ NULL, NULL }
};
/* Ties the vector pointer ffs_vnodeop_p to the entry table above. */
static struct vnodeopv_desc ffs_vnodeop_opv_desc =
{ &ffs_vnodeop_p, ffs_vnodeop_entries };
/*
 * ffs_specop_p is the operation-vector pointer named by
 * ffs_specop_opv_desc at the end of this block.
 * NOTE(review): judging by the spec_* handlers this is the vector used
 * for special (device) files -- confirm at the point where it is
 * assigned to a vnode.
 */
vop_t **ffs_specop_p;
/*
 * Operation table tied to ffs_specop_p.
 *
 *  - Most operations are handled by spec_* routines.
 *  - close, read and write use the ufsspec_* routines.
 *  - access, getattr, setattr, inactive, lock, unlock, print and islocked
 *    use ufs_* routines.
 *  - fsync, reclaim, vfree and update use ffs_* routines.
 *  - bwrite uses vn_bwrite.
 *  - cachedlookup, whiteout and putpages have no entry (XXX markers).
 *
 * The first entry binds vop_default_desc to vn_default_error; the
 * { NULL, NULL } pair terminates the table.
 */
static struct vnodeopv_entry_desc ffs_specop_entries[] = {
{ &vop_default_desc, (vop_t *)vn_default_error },
{ &vop_lookup_desc, (vop_t *)spec_lookup }, /* lookup */
/* XXX: vop_cachedlookup */
{ &vop_create_desc, (vop_t *)spec_create }, /* create */
/* XXX: vop_whiteout */
{ &vop_mknod_desc, (vop_t *)spec_mknod }, /* mknod */
{ &vop_open_desc, (vop_t *)spec_open }, /* open */
{ &vop_close_desc, (vop_t *)ufsspec_close }, /* close */
{ &vop_access_desc, (vop_t *)ufs_access }, /* access */
{ &vop_getattr_desc, (vop_t *)ufs_getattr }, /* getattr */
{ &vop_setattr_desc, (vop_t *)ufs_setattr }, /* setattr */
{ &vop_read_desc, (vop_t *)ufsspec_read }, /* read */
{ &vop_write_desc, (vop_t *)ufsspec_write }, /* write */
{ &vop_lease_desc, (vop_t *)spec_lease_check }, /* lease */
{ &vop_ioctl_desc, (vop_t *)spec_ioctl }, /* ioctl */
{ &vop_poll_desc, (vop_t *)spec_poll }, /* poll */
{ &vop_revoke_desc, (vop_t *)spec_revoke }, /* revoke */
{ &vop_mmap_desc, (vop_t *)spec_mmap }, /* mmap */
{ &vop_fsync_desc, (vop_t *)ffs_fsync }, /* fsync */
{ &vop_seek_desc, (vop_t *)spec_seek }, /* seek */
{ &vop_remove_desc, (vop_t *)spec_remove }, /* remove */
{ &vop_link_desc, (vop_t *)spec_link }, /* link */
{ &vop_rename_desc, (vop_t *)spec_rename }, /* rename */
{ &vop_mkdir_desc, (vop_t *)spec_mkdir }, /* mkdir */
{ &vop_rmdir_desc, (vop_t *)spec_rmdir }, /* rmdir */
{ &vop_symlink_desc, (vop_t *)spec_symlink }, /* symlink */
{ &vop_readdir_desc, (vop_t *)spec_readdir }, /* readdir */
{ &vop_readlink_desc, (vop_t *)spec_readlink }, /* readlink */
{ &vop_abortop_desc, (vop_t *)spec_abortop }, /* abortop */
{ &vop_inactive_desc, (vop_t *)ufs_inactive }, /* inactive */
{ &vop_reclaim_desc, (vop_t *)ffs_reclaim }, /* reclaim */
{ &vop_lock_desc, (vop_t *)ufs_lock }, /* lock */
{ &vop_unlock_desc, (vop_t *)ufs_unlock }, /* unlock */
{ &vop_bmap_desc, (vop_t *)spec_bmap }, /* bmap */
{ &vop_strategy_desc, (vop_t *)spec_strategy }, /* strategy */
{ &vop_print_desc, (vop_t *)ufs_print }, /* print */
{ &vop_islocked_desc, (vop_t *)ufs_islocked }, /* islocked */
{ &vop_pathconf_desc, (vop_t *)spec_pathconf }, /* pathconf */
{ &vop_advlock_desc, (vop_t *)spec_advlock }, /* advlock */
{ &vop_blkatoff_desc, (vop_t *)spec_blkatoff }, /* blkatoff */
{ &vop_valloc_desc, (vop_t *)spec_valloc }, /* valloc */
{ &vop_reallocblks_desc, (vop_t *)spec_reallocblks }, /* reallocblks */
{ &vop_vfree_desc, (vop_t *)ffs_vfree }, /* vfree */
{ &vop_truncate_desc, (vop_t *)spec_truncate }, /* truncate */
{ &vop_update_desc, (vop_t *)ffs_update }, /* update */
{ &vop_getpages_desc, (vop_t *)spec_getpages}, /* getpages */
/* XXX: vop_putpages */
{ &vop_bwrite_desc, (vop_t *)vn_bwrite }, /* bwrite */
{ NULL, NULL }
};
/* Ties the vector pointer ffs_specop_p to the entry table above. */
static struct vnodeopv_desc ffs_specop_opv_desc =
{ &ffs_specop_p, ffs_specop_entries };
/*
 * ffs_fifoop_p is the operation-vector pointer named by
 * ffs_fifoop_opv_desc at the end of this block.
 * NOTE(review): judging by the fifo_* handlers this is the vector used
 * for FIFOs -- confirm at the point where it is assigned to a vnode.
 */
vop_t **ffs_fifoop_p;
/*
 * Operation table tied to ffs_fifoop_p.
 *
 *  - Most operations are handled by fifo_* routines.
 *  - close, read and write use the ufsfifo_* routines.
 *  - access, getattr, setattr, inactive, lock, unlock, print and islocked
 *    use ufs_* routines.
 *  - fsync, reclaim, vfree and update use ffs_* routines.
 *  - bwrite uses vn_bwrite.
 *  - cachedlookup, whiteout, getpages and putpages have no entry
 *    (XXX markers).
 *
 * The first entry binds vop_default_desc to vn_default_error; the
 * { NULL, NULL } pair terminates the table.
 */
static struct vnodeopv_entry_desc ffs_fifoop_entries[] = {
{ &vop_default_desc, (vop_t *)vn_default_error },
{ &vop_lookup_desc, (vop_t *)fifo_lookup }, /* lookup */
/* XXX: vop_cachedlookup */
{ &vop_create_desc, (vop_t *)fifo_create }, /* create */
/* XXX: vop_whiteout */
{ &vop_mknod_desc, (vop_t *)fifo_mknod }, /* mknod */
{ &vop_open_desc, (vop_t *)fifo_open }, /* open */
{ &vop_close_desc, (vop_t *)ufsfifo_close }, /* close */
{ &vop_access_desc, (vop_t *)ufs_access }, /* access */
{ &vop_getattr_desc, (vop_t *)ufs_getattr }, /* getattr */
{ &vop_setattr_desc, (vop_t *)ufs_setattr }, /* setattr */
{ &vop_read_desc, (vop_t *)ufsfifo_read }, /* read */
{ &vop_write_desc, (vop_t *)ufsfifo_write }, /* write */
{ &vop_lease_desc, (vop_t *)fifo_lease_check }, /* lease */
{ &vop_ioctl_desc, (vop_t *)fifo_ioctl }, /* ioctl */
{ &vop_poll_desc, (vop_t *)fifo_poll }, /* poll */
{ &vop_revoke_desc, (vop_t *)fifo_revoke }, /* revoke */
{ &vop_mmap_desc, (vop_t *)fifo_mmap }, /* mmap */
{ &vop_fsync_desc, (vop_t *)ffs_fsync }, /* fsync */
{ &vop_seek_desc, (vop_t *)fifo_seek }, /* seek */
{ &vop_remove_desc, (vop_t *)fifo_remove }, /* remove */
{ &vop_link_desc, (vop_t *)fifo_link }, /* link */
{ &vop_rename_desc, (vop_t *)fifo_rename }, /* rename */
{ &vop_mkdir_desc, (vop_t *)fifo_mkdir }, /* mkdir */
{ &vop_rmdir_desc, (vop_t *)fifo_rmdir }, /* rmdir */
{ &vop_symlink_desc, (vop_t *)fifo_symlink }, /* symlink */
{ &vop_readdir_desc, (vop_t *)fifo_readdir }, /* readdir */
{ &vop_readlink_desc, (vop_t *)fifo_readlink }, /* readlink */
{ &vop_abortop_desc, (vop_t *)fifo_abortop }, /* abortop */
{ &vop_inactive_desc, (vop_t *)ufs_inactive }, /* inactive */
{ &vop_reclaim_desc, (vop_t *)ffs_reclaim }, /* reclaim */
{ &vop_lock_desc, (vop_t *)ufs_lock }, /* lock */
{ &vop_unlock_desc, (vop_t *)ufs_unlock }, /* unlock */
{ &vop_bmap_desc, (vop_t *)fifo_bmap }, /* bmap */
{ &vop_strategy_desc, (vop_t *)fifo_strategy }, /* strategy */
{ &vop_print_desc, (vop_t *)ufs_print }, /* print */
{ &vop_islocked_desc, (vop_t *)ufs_islocked }, /* islocked */
{ &vop_pathconf_desc, (vop_t *)fifo_pathconf }, /* pathconf */
{ &vop_advlock_desc, (vop_t *)fifo_advlock }, /* advlock */
{ &vop_blkatoff_desc, (vop_t *)fifo_blkatoff }, /* blkatoff */
{ &vop_valloc_desc, (vop_t *)fifo_valloc }, /* valloc */
{ &vop_reallocblks_desc, (vop_t *)fifo_reallocblks }, /* reallocblks */
{ &vop_vfree_desc, (vop_t *)ffs_vfree }, /* vfree */
{ &vop_truncate_desc, (vop_t *)fifo_truncate }, /* truncate */
{ &vop_update_desc, (vop_t *)ffs_update }, /* update */
/* XXX: vop_getpages */
/* XXX: vop_putpages */
{ &vop_bwrite_desc, (vop_t *)vn_bwrite }, /* bwrite */
{ NULL, NULL }
};
/* Ties the vector pointer ffs_fifoop_p to the entry table above. */
static struct vnodeopv_desc ffs_fifoop_opv_desc =
{ &ffs_fifoop_p, ffs_fifoop_entries };
/*
 * Hand the three operation-vector descriptors defined in this file to
 * VNODEOP_SET.
 * NOTE(review): VNODEOP_SET is defined elsewhere; presumably it registers
 * each descriptor so its vector is built at initialization -- confirm.
 */
VNODEOP_SET(ffs_vnodeop_opv_desc);
VNODEOP_SET(ffs_specop_opv_desc);
VNODEOP_SET(ffs_fifoop_opv_desc);
/*
 * Declare the "ffs" sysctl node under _vfs, keyed by MOUNT_UFS, with the
 * description string "FFS filesystem".
 */
SYSCTL_NODE(_vfs, MOUNT_UFS, ffs, CTLFLAG_RW, 0, "FFS filesystem");
/*
 * A .c file is textually included here rather than compiled separately.
 * NOTE(review): presumably this is what provides the static ffs_read,
 * ffs_write and ffs_getpages handlers prototyped near the top of this
 * file -- confirm against ufs_readwrite.c.
 */
#include <ufs/ufs/ufs_readwrite.c>
/*
 * Synch an open file.
 *
 * Hands every eligible buffer on the vnode's dirty list
 * (vp->v_dirtyblkhd) to bawrite(), bwrite() or vfs_bio_awrite(), then
 * calls VOP_UPDATE on the vnode and returns VOP_UPDATE's result.
 *
 * The dirty list is swept in two passes: pass 0 skips buffers whose
 * b_blkno is negative, pass 1 applies no b_blkno filter.  Buffers marked
 * B_BUSY are skipped in both passes.  When a_waitfor is MNT_WAIT the
 * routine additionally sleeps until vp->v_numoutput reaches zero.
 * (a_waitfor == MNT_WAIT) is passed as the last argument of VOP_UPDATE.
 *
 * NOTE(review): a negative b_blkno presumably identifies indirect blocks
 * (cf. the comment inside the loop) -- confirm.
 */
/* ARGSUSED */
static int
ffs_fsync(ap)
struct vop_fsync_args /* {
struct vnode *a_vp;
struct ucred *a_cred;
int a_waitfor;
struct proc *a_p;
} */ *ap;
{
register struct vnode *vp = ap->a_vp;
register struct buf *bp;
struct timeval tv;
struct buf *nbp;
int pass;
int s;
pass = 0;
/*
* Flush all dirty buffers associated with a vnode.
*/
loop:
/*
 * The list walk runs between splbio() and the matching splx(s).
 * NOTE(review): presumably this keeps disk I/O completion from
 * modifying the list during the walk -- confirm.
 */
s = splbio();
for (bp = vp->v_dirtyblkhd.lh_first; bp; bp = nbp) {
/*
 * The saved successor is only used when bp is skipped via continue;
 * once a buffer has been written the scan restarts at "loop".
 */
nbp = bp->b_vnbufs.le_next;
if ((bp->b_flags & B_BUSY) || (pass == 0 && (bp->b_blkno < 0)))
continue;
/* A buffer on the dirty list without B_DELWRI is treated as fatal. */
if ((bp->b_flags & B_DELWRI) == 0)
panic("ffs_fsync: not dirty");
/*
 * This branch is taken whenever a_waitfor is not MNT_NOWAIT, or when
 * bp->b_vp differs from vp.  The buffer is removed with bremfree() and
 * marked B_BUSY before the saved spl is restored.
 */
if (bp->b_vp != vp || ap->a_waitfor != MNT_NOWAIT) {
bremfree(bp);
bp->b_flags |= B_BUSY;
splx(s);
/*
* Wait for I/O associated with indirect blocks to complete,
* since there is no way to quickly wait for them below.
*/
/*
 * bwrite() is used only when bp->b_vp != vp and a_waitfor is not
 * MNT_NOWAIT; every other combination reaching here uses bawrite().
 */
if (bp->b_vp == vp || ap->a_waitfor == MNT_NOWAIT)
(void) bawrite(bp);
else
(void) bwrite(bp);
} else {
/*
 * bp->b_vp == vp and a_waitfor == MNT_NOWAIT: vfs_bio_awrite() is
 * called before the saved spl is restored.
 */
vfs_bio_awrite(bp);
splx(s);
}
/*
 * Restart from the head of the dirty list after every write.
 * NOTE(review): presumably because the list may have changed while
 * the write was being issued -- confirm.
 */
goto loop;
}
splx(s);
/* First sweep finished: run once more without the b_blkno filter. */
if (pass == 0) {
pass = 1;
goto loop;
}
if (ap->a_waitfor == MNT_WAIT) {
/*
 * Sleep on &vp->v_numoutput, with VBWAIT set in v_flag, until the
 * count of outstanding writes drops to zero.
 */
s = splbio();
while (vp->v_numoutput) {
vp->v_flag |= VBWAIT;
(void) tsleep((caddr_t)&vp->v_numoutput, PRIBIO + 1, "ffsfsn", 0);
}
splx(s);
#ifdef DIAGNOSTIC
/*
 * If dirty buffers are still present after the wait, print the vnode
 * and sweep the list again (pass stays 1).
 */
if (vp->v_dirtyblkhd.lh_first) {
vprint("ffs_fsync: dirty", vp);
goto loop;
}
#endif
}
/* The same timestamp is passed as both time arguments of VOP_UPDATE. */
gettime(&tv);
return (VOP_UPDATE(ap->a_vp, &tv, &tv, ap->a_waitfor == MNT_WAIT));
}
/*
* Reclaim an inode so that it can be used for other purposes.
*/
int
ffs_reclaim(ap)
struct vop_reclaim_args /* {
struct vnode *a_vp;
struct proc *a_p;
} */ *ap;
{
register struct vnode *vp = ap->a_vp;
int error;
if (error = ufs_reclaim(vp, ap->a_p))
return (error);
FREE(vp->v_data, VFSTOUFS(vp->v_mount)->um_devvp->v_tag == VT_MFS ?
M_MFSNODE : M_FFSNODE);
vp->v_data = NULL;
return (0);
}