4950 files sometimes can't be removed from a full filesystem
Reviewed by: Adam Leventhal <adam.leventhal@delphix.com>
Reviewed by: George Wilson <george.wilson@delphix.com>
Reviewed by: Sebastien Roy <sebastien.roy@delphix.com>
Reviewed by: Boris Protopopov <bprotopopov@hotmail.com>
Approved by: Dan McDonald <danmcd@omniti.com>
illumos/illumos-gate@4bb7380495
This commit is contained in:
parent
b209944943
commit
f82f5510a4
@ -666,6 +666,12 @@ dmu_free_long_range_impl(objset_t *os, dnode_t *dn, uint64_t offset,
|
||||
dmu_tx_t *tx = dmu_tx_create(os);
|
||||
dmu_tx_hold_free(tx, dn->dn_object,
|
||||
chunk_begin, chunk_end - chunk_begin);
|
||||
|
||||
/*
|
||||
* Mark this transaction as typically resulting in a net
|
||||
* reduction in space used.
|
||||
*/
|
||||
dmu_tx_mark_netfree(tx);
|
||||
err = dmu_tx_assign(tx, TXG_WAIT);
|
||||
if (err) {
|
||||
dmu_tx_abort(tx);
|
||||
@ -717,6 +723,7 @@ dmu_free_long_object(objset_t *os, uint64_t object)
|
||||
tx = dmu_tx_create(os);
|
||||
dmu_tx_hold_bonus(tx, object);
|
||||
dmu_tx_hold_free(tx, object, 0, DMU_OBJECT_END);
|
||||
dmu_tx_mark_netfree(tx);
|
||||
err = dmu_tx_assign(tx, TXG_WAIT);
|
||||
if (err == 0) {
|
||||
err = dmu_object_free(os, object, tx);
|
||||
|
@ -21,7 +21,7 @@
|
||||
/*
|
||||
* Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved.
|
||||
* Copyright 2011 Nexenta Systems, Inc. All rights reserved.
|
||||
* Copyright (c) 2013 by Delphix. All rights reserved.
|
||||
* Copyright (c) 2012, 2014 by Delphix. All rights reserved.
|
||||
*/
|
||||
|
||||
#include <sys/dmu.h>
|
||||
@ -583,6 +583,32 @@ dmu_tx_count_free(dmu_tx_hold_t *txh, uint64_t off, uint64_t len)
|
||||
txh->txh_space_tounref += unref;
|
||||
}
|
||||
|
||||
/*
|
||||
* This function marks the transaction as being a "net free". The end
|
||||
* result is that refquotas will be disabled for this transaction, and
|
||||
* this transaction will be able to use half of the pool space overhead
|
||||
* (see dsl_pool_adjustedsize()). Therefore this function should only
|
||||
* be called for transactions that we expect will not cause a net increase
|
||||
* in the amount of space used (but it's OK if that is occasionally not true).
|
||||
*/
|
||||
void
|
||||
dmu_tx_mark_netfree(dmu_tx_t *tx)
|
||||
{
|
||||
dmu_tx_hold_t *txh;
|
||||
|
||||
txh = dmu_tx_hold_object_impl(tx, tx->tx_objset,
|
||||
DMU_NEW_OBJECT, THT_FREE, 0, 0);
|
||||
|
||||
/*
|
||||
* Pretend that this operation will free 1GB of space. This
|
||||
* should be large enough to cancel out the largest write.
|
||||
* We don't want to use something like UINT64_MAX, because that would
|
||||
* cause overflows when doing math with these values (e.g. in
|
||||
* dmu_tx_try_assign()).
|
||||
*/
|
||||
txh->txh_space_tofree = txh->txh_space_tounref = 1024 * 1024 * 1024;
|
||||
}
|
||||
|
||||
void
|
||||
dmu_tx_hold_free(dmu_tx_t *tx, uint64_t object, uint64_t off, uint64_t len)
|
||||
{
|
||||
|
@ -567,6 +567,7 @@ void dmu_tx_abort(dmu_tx_t *tx);
|
||||
int dmu_tx_assign(dmu_tx_t *tx, enum txg_how txg_how);
|
||||
void dmu_tx_wait(dmu_tx_t *tx);
|
||||
void dmu_tx_commit(dmu_tx_t *tx);
|
||||
void dmu_tx_mark_netfree(dmu_tx_t *tx);
|
||||
|
||||
/*
|
||||
* To register a commit callback, dmu_tx_callback_register() must be called.
|
||||
|
@ -20,7 +20,7 @@
|
||||
*/
|
||||
/*
|
||||
* Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved.
|
||||
* Copyright (c) 2013 by Delphix. All rights reserved.
|
||||
* Copyright (c) 2013, 2014 by Delphix. All rights reserved.
|
||||
*/
|
||||
|
||||
#include <sys/types.h>
|
||||
@ -554,6 +554,7 @@ zfs_purgedir(znode_t *dzp)
|
||||
dmu_tx_hold_zap(tx, zfsvfs->z_unlinkedobj, FALSE, NULL);
|
||||
/* Is this really needed ? */
|
||||
zfs_sa_upgrade_txholds(tx, xzp);
|
||||
dmu_tx_mark_netfree(tx);
|
||||
error = dmu_tx_assign(tx, TXG_WAIT);
|
||||
if (error) {
|
||||
dmu_tx_abort(tx);
|
||||
|
@ -20,7 +20,7 @@
|
||||
*/
|
||||
/*
|
||||
* Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved.
|
||||
* Copyright (c) 2013 by Delphix. All rights reserved.
|
||||
* Copyright (c) 2013, 2014 by Delphix. All rights reserved.
|
||||
* Copyright 2014 Nexenta Systems, Inc. All rights reserved.
|
||||
*/
|
||||
|
||||
@ -1301,7 +1301,7 @@ zfs_lookup(vnode_t *dvp, char *nm, vnode_t **vpp, struct pathname *pnp,
|
||||
* cr - credentials of caller.
|
||||
* flag - large file flag [UNUSED].
|
||||
* ct - caller context
|
||||
* vsecp - ACL to be set
|
||||
* vsecp - ACL to be set
|
||||
*
|
||||
* OUT: vpp - vnode of created or trunc'd entry.
|
||||
*
|
||||
@ -1577,7 +1577,7 @@ zfs_remove(vnode_t *dvp, char *name, cred_t *cr, caller_context_t *ct,
|
||||
zfsvfs_t *zfsvfs = dzp->z_zfsvfs;
|
||||
zilog_t *zilog;
|
||||
uint64_t acl_obj, xattr_obj;
|
||||
uint64_t xattr_obj_unlinked = 0;
|
||||
uint64_t xattr_obj_unlinked = 0;
|
||||
uint64_t obj = 0;
|
||||
zfs_dirlock_t *dl;
|
||||
dmu_tx_t *tx;
|
||||
@ -1677,6 +1677,14 @@ zfs_remove(vnode_t *dvp, char *name, cred_t *cr, caller_context_t *ct,
|
||||
/* charge as an update -- would be nice not to charge at all */
|
||||
dmu_tx_hold_zap(tx, zfsvfs->z_unlinkedobj, FALSE, NULL);
|
||||
|
||||
/*
|
||||
* Mark this transaction as typically resulting in a net free of
|
||||
* space, unless object removal will be delayed indefinitely
|
||||
* (due to active holds on the vnode due to the file being open).
|
||||
*/
|
||||
if (may_delete_now)
|
||||
dmu_tx_mark_netfree(tx);
|
||||
|
||||
error = dmu_tx_assign(tx, waited ? TXG_WAITED : TXG_NOWAIT);
|
||||
if (error) {
|
||||
zfs_dirent_unlock(dl);
|
||||
@ -1707,7 +1715,6 @@ zfs_remove(vnode_t *dvp, char *name, cred_t *cr, caller_context_t *ct,
|
||||
}
|
||||
|
||||
if (unlinked) {
|
||||
|
||||
/*
|
||||
* Hold z_lock so that we can make sure that the ACL obj
|
||||
* hasn't changed. Could have been deleted due to
|
||||
@ -4692,13 +4699,13 @@ zfs_addmap(vnode_t *vp, offset_t off, struct as *as, caddr_t addr,
|
||||
* last page is pushed. The problem occurs when the msync() call is omitted,
|
||||
* which is by far the most common case:
|
||||
*
|
||||
* open()
|
||||
* mmap()
|
||||
* <modify memory>
|
||||
* munmap()
|
||||
* close()
|
||||
* <time lapse>
|
||||
* putpage() via fsflush
|
||||
* open()
|
||||
* mmap()
|
||||
* <modify memory>
|
||||
* munmap()
|
||||
* close()
|
||||
* <time lapse>
|
||||
* putpage() via fsflush
|
||||
*
|
||||
* If we wait until fsflush to come along, we can have a modification time that
|
||||
* is some arbitrary point in the future. In order to prevent this in the
|
||||
@ -5172,7 +5179,7 @@ const fs_operation_def_t zfs_dvnodeops_template[] = {
|
||||
VOPNAME_PATHCONF, { .vop_pathconf = zfs_pathconf },
|
||||
VOPNAME_GETSECATTR, { .vop_getsecattr = zfs_getsecattr },
|
||||
VOPNAME_SETSECATTR, { .vop_setsecattr = zfs_setsecattr },
|
||||
VOPNAME_VNEVENT, { .vop_vnevent = fs_vnevent_support },
|
||||
VOPNAME_VNEVENT, { .vop_vnevent = fs_vnevent_support },
|
||||
NULL, NULL
|
||||
};
|
||||
|
||||
@ -5206,8 +5213,8 @@ const fs_operation_def_t zfs_fvnodeops_template[] = {
|
||||
VOPNAME_GETSECATTR, { .vop_getsecattr = zfs_getsecattr },
|
||||
VOPNAME_SETSECATTR, { .vop_setsecattr = zfs_setsecattr },
|
||||
VOPNAME_VNEVENT, { .vop_vnevent = fs_vnevent_support },
|
||||
VOPNAME_REQZCBUF, { .vop_reqzcbuf = zfs_reqzcbuf },
|
||||
VOPNAME_RETZCBUF, { .vop_retzcbuf = zfs_retzcbuf },
|
||||
VOPNAME_REQZCBUF, { .vop_reqzcbuf = zfs_reqzcbuf },
|
||||
VOPNAME_RETZCBUF, { .vop_retzcbuf = zfs_retzcbuf },
|
||||
NULL, NULL
|
||||
};
|
||||
|
||||
|
@ -20,7 +20,7 @@
|
||||
*/
|
||||
/*
|
||||
* Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved.
|
||||
* Copyright (c) 2013 by Delphix. All rights reserved.
|
||||
* Copyright (c) 2012, 2014 by Delphix. All rights reserved.
|
||||
*/
|
||||
|
||||
/* Portions Copyright 2007 Jeremy Teo */
|
||||
@ -1442,7 +1442,7 @@ zfs_no_putpage(vnode_t *vp, page_t *pp, u_offset_t *offp, size_t *lenp,
|
||||
* IN: zp - znode of file to free data in.
|
||||
* end - new end-of-file
|
||||
*
|
||||
* RETURN: 0 on success, error code on failure
|
||||
* RETURN: 0 on success, error code on failure
|
||||
*/
|
||||
static int
|
||||
zfs_extend(znode_t *zp, uint64_t end)
|
||||
@ -1513,7 +1513,7 @@ zfs_extend(znode_t *zp, uint64_t end)
|
||||
* off - start of section to free.
|
||||
* len - length of section to free.
|
||||
*
|
||||
* RETURN: 0 on success, error code on failure
|
||||
* RETURN: 0 on success, error code on failure
|
||||
*/
|
||||
static int
|
||||
zfs_free_range(znode_t *zp, uint64_t off, uint64_t len)
|
||||
@ -1551,7 +1551,7 @@ zfs_free_range(znode_t *zp, uint64_t off, uint64_t len)
|
||||
* IN: zp - znode of file to free data in.
|
||||
* end - new end-of-file.
|
||||
*
|
||||
* RETURN: 0 on success, error code on failure
|
||||
* RETURN: 0 on success, error code on failure
|
||||
*/
|
||||
static int
|
||||
zfs_trunc(znode_t *zp, uint64_t end)
|
||||
@ -1585,6 +1585,7 @@ zfs_trunc(znode_t *zp, uint64_t end)
|
||||
tx = dmu_tx_create(zfsvfs->z_os);
|
||||
dmu_tx_hold_sa(tx, zp->z_sa_hdl, B_FALSE);
|
||||
zfs_sa_upgrade_txholds(tx, zp);
|
||||
dmu_tx_mark_netfree(tx);
|
||||
error = dmu_tx_assign(tx, TXG_WAIT);
|
||||
if (error) {
|
||||
dmu_tx_abort(tx);
|
||||
@ -1643,7 +1644,7 @@ zfs_trunc(znode_t *zp, uint64_t end)
|
||||
* flag - current file open mode flags.
|
||||
* log - TRUE if this action should be logged
|
||||
*
|
||||
* RETURN: 0 on success, error code on failure
|
||||
* RETURN: 0 on success, error code on failure
|
||||
*/
|
||||
int
|
||||
zfs_freesp(znode_t *zp, uint64_t off, uint64_t len, int flag, boolean_t log)
|
||||
|
@ -717,6 +717,7 @@ zvol_update_volsize(objset_t *os, uint64_t volsize)
|
||||
|
||||
tx = dmu_tx_create(os);
|
||||
dmu_tx_hold_zap(tx, ZVOL_ZAP_OBJ, TRUE, NULL);
|
||||
dmu_tx_mark_netfree(tx);
|
||||
error = dmu_tx_assign(tx, TXG_WAIT);
|
||||
if (error) {
|
||||
dmu_tx_abort(tx);
|
||||
@ -1786,6 +1787,7 @@ zvol_ioctl(dev_t dev, int cmd, intptr_t arg, int flag, cred_t *cr, int *rvalp)
|
||||
rl = zfs_range_lock(&zv->zv_znode, df.df_start, df.df_length,
|
||||
RL_WRITER);
|
||||
tx = dmu_tx_create(zv->zv_objset);
|
||||
dmu_tx_mark_netfree(tx);
|
||||
error = dmu_tx_assign(tx, TXG_WAIT);
|
||||
if (error != 0) {
|
||||
dmu_tx_abort(tx);
|
||||
|
Loading…
Reference in New Issue
Block a user