fe9b86cf0b
1. Clustered I/O is switched by the MNT_NOCLUSTERR and MNT_NOCLUSTERW bits of mnt_flag. The sysctl variables vfs.foo.doclusterread and vfs.foo.doclusterwrite are deleted. Only mount options can control clustered I/O from userland. 2. When foofs_mount mounts a block device, it checks the D_NOCLUSTERR and D_NOCLUSTERW bits of the d_flags member in the block device switch table. If D_NOCLUSTERR / D_NOCLUSTERW are set, the MNT_NOCLUSTERR / MNT_NOCLUSTERW bits will be set. In this case, MNT_NOCLUSTERR and MNT_NOCLUSTERW cannot be cleared from userland. 3. The vnode driver disables both clustered read and write. 4. The union filesystem disables clustered write. Reviewed by: bde
344 lines
13 KiB
C
344 lines
13 KiB
C
/*
|
|
* Copyright (c) 1982, 1986, 1989, 1993
|
|
* The Regents of the University of California. All rights reserved.
|
|
*
|
|
* Redistribution and use in source and binary forms, with or without
|
|
* modification, are permitted provided that the following conditions
|
|
* are met:
|
|
* 1. Redistributions of source code must retain the above copyright
|
|
* notice, this list of conditions and the following disclaimer.
|
|
* 2. Redistributions in binary form must reproduce the above copyright
|
|
* notice, this list of conditions and the following disclaimer in the
|
|
* documentation and/or other materials provided with the distribution.
|
|
* 3. All advertising materials mentioning features or use of this software
|
|
* must display the following acknowledgement:
|
|
* This product includes software developed by the University of
|
|
* California, Berkeley and its contributors.
|
|
* 4. Neither the name of the University nor the names of its contributors
|
|
* may be used to endorse or promote products derived from this software
|
|
* without specific prior written permission.
|
|
*
|
|
* THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
|
|
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
|
* ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
|
|
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
|
|
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
|
|
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
|
|
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
|
|
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
|
|
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
|
|
* SUCH DAMAGE.
|
|
*
|
|
* @(#)ffs_vnops.c 8.15 (Berkeley) 5/14/95
|
|
* $Id: ffs_vnops.c,v 1.29 1997/09/14 02:58:05 peter Exp $
|
|
*/
|
|
|
|
#include <sys/param.h>
|
|
#include <sys/systm.h>
|
|
#include <sys/resourcevar.h>
|
|
#include <sys/signalvar.h>
|
|
#include <sys/kernel.h>
|
|
#include <sys/stat.h>
|
|
#include <sys/buf.h>
|
|
#include <sys/proc.h>
|
|
#include <sys/mount.h>
|
|
#include <sys/sysctl.h>
|
|
#include <sys/vnode.h>
|
|
#include <sys/malloc.h>
|
|
|
|
#include <vm/vm.h>
|
|
#include <vm/vm_prot.h>
|
|
#include <vm/vm_page.h>
|
|
#include <vm/vm_object.h>
|
|
#include <vm/vm_extern.h>
|
|
|
|
#include <miscfs/specfs/specdev.h>
|
|
#include <miscfs/fifofs/fifo.h>
|
|
|
|
#include <ufs/ufs/quota.h>
|
|
#include <ufs/ufs/inode.h>
|
|
#include <ufs/ufs/ufsmount.h>
|
|
#include <ufs/ufs/ufs_extern.h>
|
|
|
|
#include <ufs/ffs/fs.h>
|
|
#include <ufs/ffs/ffs_extern.h>
|
|
|
|
/*
 * Prototypes for the file-local vnode operations that the operation
 * tables in this file refer to by name.
 */
static int	ffs_fsync __P((struct vop_fsync_args *));
static int	ffs_getpages __P((struct vop_getpages_args *));
static int	ffs_read __P((struct vop_read_args *));
static int	ffs_write __P((struct vop_write_args *));
|
|
|
|
/* Global vfs data structures for ufs. */
|
|
vop_t **ffs_vnodeop_p;
|
|
static struct vnodeopv_entry_desc ffs_vnodeop_entries[] = {
|
|
{ &vop_default_desc, (vop_t *)vn_default_error },
|
|
{ &vop_lookup_desc, (vop_t *)vfs_cache_lookup },/* lookup */
|
|
{ &vop_cachedlookup_desc, (vop_t *)ufs_lookup },/* cachedlookup */
|
|
{ &vop_create_desc, (vop_t *)ufs_create }, /* create */
|
|
{ &vop_whiteout_desc, (vop_t *)ufs_whiteout }, /* whiteout */
|
|
{ &vop_mknod_desc, (vop_t *)ufs_mknod }, /* mknod */
|
|
{ &vop_open_desc, (vop_t *)ufs_open }, /* open */
|
|
{ &vop_close_desc, (vop_t *)ufs_close }, /* close */
|
|
{ &vop_access_desc, (vop_t *)ufs_access }, /* access */
|
|
{ &vop_getattr_desc, (vop_t *)ufs_getattr }, /* getattr */
|
|
{ &vop_setattr_desc, (vop_t *)ufs_setattr }, /* setattr */
|
|
{ &vop_read_desc, (vop_t *)ffs_read }, /* read */
|
|
{ &vop_write_desc, (vop_t *)ffs_write }, /* write */
|
|
{ &vop_lease_desc, (vop_t *)ufs_lease_check }, /* lease */
|
|
{ &vop_ioctl_desc, (vop_t *)ufs_ioctl }, /* ioctl */
|
|
{ &vop_poll_desc, (vop_t *)ufs_poll }, /* poll */
|
|
{ &vop_revoke_desc, (vop_t *)ufs_revoke }, /* revoke */
|
|
{ &vop_mmap_desc, (vop_t *)ufs_mmap }, /* mmap */
|
|
{ &vop_fsync_desc, (vop_t *)ffs_fsync }, /* fsync */
|
|
{ &vop_seek_desc, (vop_t *)ufs_seek }, /* seek */
|
|
{ &vop_remove_desc, (vop_t *)ufs_remove }, /* remove */
|
|
{ &vop_link_desc, (vop_t *)ufs_link }, /* link */
|
|
{ &vop_rename_desc, (vop_t *)ufs_rename }, /* rename */
|
|
{ &vop_mkdir_desc, (vop_t *)ufs_mkdir }, /* mkdir */
|
|
{ &vop_rmdir_desc, (vop_t *)ufs_rmdir }, /* rmdir */
|
|
{ &vop_symlink_desc, (vop_t *)ufs_symlink }, /* symlink */
|
|
{ &vop_readdir_desc, (vop_t *)ufs_readdir }, /* readdir */
|
|
{ &vop_readlink_desc, (vop_t *)ufs_readlink }, /* readlink */
|
|
{ &vop_abortop_desc, (vop_t *)ufs_abortop }, /* abortop */
|
|
{ &vop_inactive_desc, (vop_t *)ufs_inactive }, /* inactive */
|
|
{ &vop_reclaim_desc, (vop_t *)ffs_reclaim }, /* reclaim */
|
|
{ &vop_lock_desc, (vop_t *)ufs_lock }, /* lock */
|
|
{ &vop_unlock_desc, (vop_t *)ufs_unlock }, /* unlock */
|
|
{ &vop_bmap_desc, (vop_t *)ufs_bmap }, /* bmap */
|
|
{ &vop_strategy_desc, (vop_t *)ufs_strategy }, /* strategy */
|
|
{ &vop_print_desc, (vop_t *)ufs_print }, /* print */
|
|
{ &vop_islocked_desc, (vop_t *)ufs_islocked }, /* islocked */
|
|
{ &vop_pathconf_desc, (vop_t *)ufs_pathconf }, /* pathconf */
|
|
{ &vop_advlock_desc, (vop_t *)ufs_advlock }, /* advlock */
|
|
{ &vop_blkatoff_desc, (vop_t *)ffs_blkatoff }, /* blkatoff */
|
|
{ &vop_valloc_desc, (vop_t *)ffs_valloc }, /* valloc */
|
|
{ &vop_reallocblks_desc, (vop_t *)ffs_reallocblks }, /* reallocblks */
|
|
{ &vop_vfree_desc, (vop_t *)ffs_vfree }, /* vfree */
|
|
{ &vop_truncate_desc, (vop_t *)ffs_truncate }, /* truncate */
|
|
{ &vop_update_desc, (vop_t *)ffs_update }, /* update */
|
|
{ &vop_getpages_desc, (vop_t *)ffs_getpages}, /* getpages */
|
|
/* XXX: vop_putpages */
|
|
{ &vop_bwrite_desc, (vop_t *)vn_bwrite }, /* bwrite */
|
|
{ NULL, NULL }
|
|
};
|
|
static struct vnodeopv_desc ffs_vnodeop_opv_desc =
|
|
{ &ffs_vnodeop_p, ffs_vnodeop_entries };
|
|
|
|
vop_t **ffs_specop_p;
|
|
static struct vnodeopv_entry_desc ffs_specop_entries[] = {
|
|
{ &vop_default_desc, (vop_t *)vn_default_error },
|
|
{ &vop_lookup_desc, (vop_t *)spec_lookup }, /* lookup */
|
|
/* XXX: vop_cachedlookup */
|
|
{ &vop_create_desc, (vop_t *)spec_create }, /* create */
|
|
/* XXX: vop_whiteout */
|
|
{ &vop_mknod_desc, (vop_t *)spec_mknod }, /* mknod */
|
|
{ &vop_open_desc, (vop_t *)spec_open }, /* open */
|
|
{ &vop_close_desc, (vop_t *)ufsspec_close }, /* close */
|
|
{ &vop_access_desc, (vop_t *)ufs_access }, /* access */
|
|
{ &vop_getattr_desc, (vop_t *)ufs_getattr }, /* getattr */
|
|
{ &vop_setattr_desc, (vop_t *)ufs_setattr }, /* setattr */
|
|
{ &vop_read_desc, (vop_t *)ufsspec_read }, /* read */
|
|
{ &vop_write_desc, (vop_t *)ufsspec_write }, /* write */
|
|
{ &vop_lease_desc, (vop_t *)spec_lease_check }, /* lease */
|
|
{ &vop_ioctl_desc, (vop_t *)spec_ioctl }, /* ioctl */
|
|
{ &vop_poll_desc, (vop_t *)spec_poll }, /* poll */
|
|
{ &vop_revoke_desc, (vop_t *)spec_revoke }, /* revoke */
|
|
{ &vop_mmap_desc, (vop_t *)spec_mmap }, /* mmap */
|
|
{ &vop_fsync_desc, (vop_t *)ffs_fsync }, /* fsync */
|
|
{ &vop_seek_desc, (vop_t *)spec_seek }, /* seek */
|
|
{ &vop_remove_desc, (vop_t *)spec_remove }, /* remove */
|
|
{ &vop_link_desc, (vop_t *)spec_link }, /* link */
|
|
{ &vop_rename_desc, (vop_t *)spec_rename }, /* rename */
|
|
{ &vop_mkdir_desc, (vop_t *)spec_mkdir }, /* mkdir */
|
|
{ &vop_rmdir_desc, (vop_t *)spec_rmdir }, /* rmdir */
|
|
{ &vop_symlink_desc, (vop_t *)spec_symlink }, /* symlink */
|
|
{ &vop_readdir_desc, (vop_t *)spec_readdir }, /* readdir */
|
|
{ &vop_readlink_desc, (vop_t *)spec_readlink }, /* readlink */
|
|
{ &vop_abortop_desc, (vop_t *)spec_abortop }, /* abortop */
|
|
{ &vop_inactive_desc, (vop_t *)ufs_inactive }, /* inactive */
|
|
{ &vop_reclaim_desc, (vop_t *)ffs_reclaim }, /* reclaim */
|
|
{ &vop_lock_desc, (vop_t *)ufs_lock }, /* lock */
|
|
{ &vop_unlock_desc, (vop_t *)ufs_unlock }, /* unlock */
|
|
{ &vop_bmap_desc, (vop_t *)spec_bmap }, /* bmap */
|
|
{ &vop_strategy_desc, (vop_t *)spec_strategy }, /* strategy */
|
|
{ &vop_print_desc, (vop_t *)ufs_print }, /* print */
|
|
{ &vop_islocked_desc, (vop_t *)ufs_islocked }, /* islocked */
|
|
{ &vop_pathconf_desc, (vop_t *)spec_pathconf }, /* pathconf */
|
|
{ &vop_advlock_desc, (vop_t *)spec_advlock }, /* advlock */
|
|
{ &vop_blkatoff_desc, (vop_t *)spec_blkatoff }, /* blkatoff */
|
|
{ &vop_valloc_desc, (vop_t *)spec_valloc }, /* valloc */
|
|
{ &vop_reallocblks_desc, (vop_t *)spec_reallocblks }, /* reallocblks */
|
|
{ &vop_vfree_desc, (vop_t *)ffs_vfree }, /* vfree */
|
|
{ &vop_truncate_desc, (vop_t *)spec_truncate }, /* truncate */
|
|
{ &vop_update_desc, (vop_t *)ffs_update }, /* update */
|
|
{ &vop_getpages_desc, (vop_t *)spec_getpages}, /* getpages */
|
|
/* XXX: vop_putpages */
|
|
{ &vop_bwrite_desc, (vop_t *)vn_bwrite }, /* bwrite */
|
|
{ NULL, NULL }
|
|
};
|
|
static struct vnodeopv_desc ffs_specop_opv_desc =
|
|
{ &ffs_specop_p, ffs_specop_entries };
|
|
|
|
vop_t **ffs_fifoop_p;
|
|
static struct vnodeopv_entry_desc ffs_fifoop_entries[] = {
|
|
{ &vop_default_desc, (vop_t *)vn_default_error },
|
|
{ &vop_lookup_desc, (vop_t *)fifo_lookup }, /* lookup */
|
|
/* XXX: vop_cachedlookup */
|
|
{ &vop_create_desc, (vop_t *)fifo_create }, /* create */
|
|
/* XXX: vop_whiteout */
|
|
{ &vop_mknod_desc, (vop_t *)fifo_mknod }, /* mknod */
|
|
{ &vop_open_desc, (vop_t *)fifo_open }, /* open */
|
|
{ &vop_close_desc, (vop_t *)ufsfifo_close }, /* close */
|
|
{ &vop_access_desc, (vop_t *)ufs_access }, /* access */
|
|
{ &vop_getattr_desc, (vop_t *)ufs_getattr }, /* getattr */
|
|
{ &vop_setattr_desc, (vop_t *)ufs_setattr }, /* setattr */
|
|
{ &vop_read_desc, (vop_t *)ufsfifo_read }, /* read */
|
|
{ &vop_write_desc, (vop_t *)ufsfifo_write }, /* write */
|
|
{ &vop_lease_desc, (vop_t *)fifo_lease_check }, /* lease */
|
|
{ &vop_ioctl_desc, (vop_t *)fifo_ioctl }, /* ioctl */
|
|
{ &vop_poll_desc, (vop_t *)fifo_poll }, /* poll */
|
|
{ &vop_revoke_desc, (vop_t *)fifo_revoke }, /* revoke */
|
|
{ &vop_mmap_desc, (vop_t *)fifo_mmap }, /* mmap */
|
|
{ &vop_fsync_desc, (vop_t *)ffs_fsync }, /* fsync */
|
|
{ &vop_seek_desc, (vop_t *)fifo_seek }, /* seek */
|
|
{ &vop_remove_desc, (vop_t *)fifo_remove }, /* remove */
|
|
{ &vop_link_desc, (vop_t *)fifo_link }, /* link */
|
|
{ &vop_rename_desc, (vop_t *)fifo_rename }, /* rename */
|
|
{ &vop_mkdir_desc, (vop_t *)fifo_mkdir }, /* mkdir */
|
|
{ &vop_rmdir_desc, (vop_t *)fifo_rmdir }, /* rmdir */
|
|
{ &vop_symlink_desc, (vop_t *)fifo_symlink }, /* symlink */
|
|
{ &vop_readdir_desc, (vop_t *)fifo_readdir }, /* readdir */
|
|
{ &vop_readlink_desc, (vop_t *)fifo_readlink }, /* readlink */
|
|
{ &vop_abortop_desc, (vop_t *)fifo_abortop }, /* abortop */
|
|
{ &vop_inactive_desc, (vop_t *)ufs_inactive }, /* inactive */
|
|
{ &vop_reclaim_desc, (vop_t *)ffs_reclaim }, /* reclaim */
|
|
{ &vop_lock_desc, (vop_t *)ufs_lock }, /* lock */
|
|
{ &vop_unlock_desc, (vop_t *)ufs_unlock }, /* unlock */
|
|
{ &vop_bmap_desc, (vop_t *)fifo_bmap }, /* bmap */
|
|
{ &vop_strategy_desc, (vop_t *)fifo_strategy }, /* strategy */
|
|
{ &vop_print_desc, (vop_t *)ufs_print }, /* print */
|
|
{ &vop_islocked_desc, (vop_t *)ufs_islocked }, /* islocked */
|
|
{ &vop_pathconf_desc, (vop_t *)fifo_pathconf }, /* pathconf */
|
|
{ &vop_advlock_desc, (vop_t *)fifo_advlock }, /* advlock */
|
|
{ &vop_blkatoff_desc, (vop_t *)fifo_blkatoff }, /* blkatoff */
|
|
{ &vop_valloc_desc, (vop_t *)fifo_valloc }, /* valloc */
|
|
{ &vop_reallocblks_desc, (vop_t *)fifo_reallocblks }, /* reallocblks */
|
|
{ &vop_vfree_desc, (vop_t *)ffs_vfree }, /* vfree */
|
|
{ &vop_truncate_desc, (vop_t *)fifo_truncate }, /* truncate */
|
|
{ &vop_update_desc, (vop_t *)ffs_update }, /* update */
|
|
/* XXX: vop_getpages */
|
|
/* XXX: vop_putpages */
|
|
{ &vop_bwrite_desc, (vop_t *)vn_bwrite }, /* bwrite */
|
|
{ NULL, NULL }
|
|
};
|
|
static struct vnodeopv_desc ffs_fifoop_opv_desc =
|
|
{ &ffs_fifoop_p, ffs_fifoop_entries };
|
|
|
|
VNODEOP_SET(ffs_vnodeop_opv_desc);
|
|
VNODEOP_SET(ffs_specop_opv_desc);
|
|
VNODEOP_SET(ffs_fifoop_opv_desc);
|
|
|
|
SYSCTL_NODE(_vfs, MOUNT_UFS, ffs, CTLFLAG_RW, 0, "FFS filesystem");
|
|
|
|
#include <ufs/ufs/ufs_readwrite.c>
|
|
|
|
/*
|
|
* Synch an open file.
|
|
*/
|
|
/* ARGSUSED */
|
|
static int
|
|
ffs_fsync(ap)
|
|
struct vop_fsync_args /* {
|
|
struct vnode *a_vp;
|
|
struct ucred *a_cred;
|
|
int a_waitfor;
|
|
struct proc *a_p;
|
|
} */ *ap;
|
|
{
|
|
register struct vnode *vp = ap->a_vp;
|
|
register struct buf *bp;
|
|
struct timeval tv;
|
|
struct buf *nbp;
|
|
int pass;
|
|
int s;
|
|
|
|
pass = 0;
|
|
/*
|
|
* Flush all dirty buffers associated with a vnode.
|
|
*/
|
|
loop:
|
|
s = splbio();
|
|
for (bp = vp->v_dirtyblkhd.lh_first; bp; bp = nbp) {
|
|
nbp = bp->b_vnbufs.le_next;
|
|
if ((bp->b_flags & B_BUSY) || (pass == 0 && (bp->b_blkno < 0)))
|
|
continue;
|
|
if ((bp->b_flags & B_DELWRI) == 0)
|
|
panic("ffs_fsync: not dirty");
|
|
|
|
if (bp->b_vp != vp || ap->a_waitfor != MNT_NOWAIT) {
|
|
|
|
bremfree(bp);
|
|
bp->b_flags |= B_BUSY;
|
|
splx(s);
|
|
/*
|
|
* Wait for I/O associated with indirect blocks to complete,
|
|
* since there is no way to quickly wait for them below.
|
|
*/
|
|
if (bp->b_vp == vp || ap->a_waitfor == MNT_NOWAIT)
|
|
(void) bawrite(bp);
|
|
else
|
|
(void) bwrite(bp);
|
|
} else {
|
|
vfs_bio_awrite(bp);
|
|
splx(s);
|
|
}
|
|
goto loop;
|
|
}
|
|
splx(s);
|
|
|
|
if (pass == 0) {
|
|
pass = 1;
|
|
goto loop;
|
|
}
|
|
|
|
if (ap->a_waitfor == MNT_WAIT) {
|
|
s = splbio();
|
|
while (vp->v_numoutput) {
|
|
vp->v_flag |= VBWAIT;
|
|
(void) tsleep((caddr_t)&vp->v_numoutput, PRIBIO + 1, "ffsfsn", 0);
|
|
}
|
|
splx(s);
|
|
#ifdef DIAGNOSTIC
|
|
if (vp->v_dirtyblkhd.lh_first) {
|
|
vprint("ffs_fsync: dirty", vp);
|
|
goto loop;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
gettime(&tv);
|
|
return (VOP_UPDATE(ap->a_vp, &tv, &tv, ap->a_waitfor == MNT_WAIT));
|
|
}
|
|
|
|
/*
|
|
* Reclaim an inode so that it can be used for other purposes.
|
|
*/
|
|
int
|
|
ffs_reclaim(ap)
|
|
struct vop_reclaim_args /* {
|
|
struct vnode *a_vp;
|
|
struct proc *a_p;
|
|
} */ *ap;
|
|
{
|
|
register struct vnode *vp = ap->a_vp;
|
|
int error;
|
|
|
|
if (error = ufs_reclaim(vp, ap->a_p))
|
|
return (error);
|
|
FREE(vp->v_data, VFSTOUFS(vp->v_mount)->um_devvp->v_tag == VT_MFS ?
|
|
M_MFSNODE : M_FFSNODE);
|
|
vp->v_data = NULL;
|
|
return (0);
|
|
}
|