fs: remove inode_lock from iput_final and prune_icache
Now that inode state changes are protected by the inode->i_lock and the inode LRU manipulations by the inode_lru_lock, we can remove the inode_lock from prune_icache and the initial part of iput_final(). instead of using the inode_lock to protect the inode during iput_final, use the inode->i_lock instead. This protects the inode against new references being taken while we change the inode state to I_FREEING, as well as preventing prune_icache from grabbing the inode while we are manipulating it. Hence we no longer need the inode_lock in iput_final prior to setting I_FREEING on the inode. For prune_icache, we no longer need the inode_lock to protect the LRU list, and the inodes themselves are protected against freeing races by the inode->i_lock. Hence we can lift the inode_lock from prune_icache as well. Signed-off-by: Dave Chinner <dchinner@redhat.com> Signed-off-by: Al Viro <viro@zeniv.linux.org.uk>
This commit is contained in:
@@ -128,7 +128,7 @@ alloc_inode:
|
|||||||
destroy_inode:
|
destroy_inode:
|
||||||
dirty_inode: (must not sleep)
|
dirty_inode: (must not sleep)
|
||||||
write_inode:
|
write_inode:
|
||||||
drop_inode: !!!inode_lock!!!
|
drop_inode: !!!inode->i_lock!!!
|
||||||
evict_inode:
|
evict_inode:
|
||||||
put_super: write
|
put_super: write
|
||||||
write_super: read
|
write_super: read
|
||||||
|
|||||||
@@ -298,11 +298,14 @@ be used instead. It gets called whenever the inode is evicted, whether it has
|
|||||||
remaining links or not. Caller does *not* evict the pagecache or inode-associated
|
remaining links or not. Caller does *not* evict the pagecache or inode-associated
|
||||||
metadata buffers; getting rid of those is responsibility of method, as it had
|
metadata buffers; getting rid of those is responsibility of method, as it had
|
||||||
been for ->delete_inode().
|
been for ->delete_inode().
|
||||||
->drop_inode() returns int now; it's called on final iput() with inode_lock
|
|
||||||
held and it returns true if filesystems wants the inode to be dropped. As before,
|
->drop_inode() returns int now; it's called on final iput() with
|
||||||
generic_drop_inode() is still the default and it's been updated appropriately.
|
inode->i_lock held and it returns true if filesystems wants the inode to be
|
||||||
generic_delete_inode() is also alive and it consists simply of return 1. Note that
|
dropped. As before, generic_drop_inode() is still the default and it's been
|
||||||
all actual eviction work is done by caller after ->drop_inode() returns.
|
updated appropriately. generic_delete_inode() is also alive and it consists
|
||||||
|
simply of return 1. Note that all actual eviction work is done by caller after
|
||||||
|
->drop_inode() returns.
|
||||||
|
|
||||||
clear_inode() is gone; use end_writeback() instead. As before, it must
|
clear_inode() is gone; use end_writeback() instead. As before, it must
|
||||||
be called exactly once on each call of ->evict_inode() (as it used to be for
|
be called exactly once on each call of ->evict_inode() (as it used to be for
|
||||||
each call of ->delete_inode()). Unlike before, if you are using inode-associated
|
each call of ->delete_inode()). Unlike before, if you are using inode-associated
|
||||||
@@ -395,6 +398,9 @@ Currently you can only have FALLOC_FL_PUNCH_HOLE with FALLOC_FL_KEEP_SIZE set,
|
|||||||
so the i_size should not change when hole punching, even when puching the end of
|
so the i_size should not change when hole punching, even when puching the end of
|
||||||
a file off.
|
a file off.
|
||||||
|
|
||||||
|
--
|
||||||
|
[mandatory]
|
||||||
|
|
||||||
--
|
--
|
||||||
[mandatory]
|
[mandatory]
|
||||||
->get_sb() is gone. Switch to use of ->mount(). Typically it's just
|
->get_sb() is gone. Switch to use of ->mount(). Typically it's just
|
||||||
|
|||||||
@@ -254,7 +254,7 @@ or bottom half).
|
|||||||
should be synchronous or not, not all filesystems check this flag.
|
should be synchronous or not, not all filesystems check this flag.
|
||||||
|
|
||||||
drop_inode: called when the last access to the inode is dropped,
|
drop_inode: called when the last access to the inode is dropped,
|
||||||
with the inode_lock spinlock held.
|
with the inode->i_lock spinlock held.
|
||||||
|
|
||||||
This method should be either NULL (normal UNIX filesystem
|
This method should be either NULL (normal UNIX filesystem
|
||||||
semantics) or "generic_delete_inode" (for filesystems that do not
|
semantics) or "generic_delete_inode" (for filesystems that do not
|
||||||
|
|||||||
17
fs/inode.c
17
fs/inode.c
@@ -650,7 +650,6 @@ static void prune_icache(int nr_to_scan)
|
|||||||
unsigned long reap = 0;
|
unsigned long reap = 0;
|
||||||
|
|
||||||
down_read(&iprune_sem);
|
down_read(&iprune_sem);
|
||||||
spin_lock(&inode_lock);
|
|
||||||
spin_lock(&inode_lru_lock);
|
spin_lock(&inode_lru_lock);
|
||||||
for (nr_scanned = 0; nr_scanned < nr_to_scan; nr_scanned++) {
|
for (nr_scanned = 0; nr_scanned < nr_to_scan; nr_scanned++) {
|
||||||
struct inode *inode;
|
struct inode *inode;
|
||||||
@@ -676,8 +675,8 @@ static void prune_icache(int nr_to_scan)
|
|||||||
*/
|
*/
|
||||||
if (atomic_read(&inode->i_count) ||
|
if (atomic_read(&inode->i_count) ||
|
||||||
(inode->i_state & ~I_REFERENCED)) {
|
(inode->i_state & ~I_REFERENCED)) {
|
||||||
spin_unlock(&inode->i_lock);
|
|
||||||
list_del_init(&inode->i_lru);
|
list_del_init(&inode->i_lru);
|
||||||
|
spin_unlock(&inode->i_lock);
|
||||||
inodes_stat.nr_unused--;
|
inodes_stat.nr_unused--;
|
||||||
continue;
|
continue;
|
||||||
}
|
}
|
||||||
@@ -685,20 +684,18 @@ static void prune_icache(int nr_to_scan)
|
|||||||
/* recently referenced inodes get one more pass */
|
/* recently referenced inodes get one more pass */
|
||||||
if (inode->i_state & I_REFERENCED) {
|
if (inode->i_state & I_REFERENCED) {
|
||||||
inode->i_state &= ~I_REFERENCED;
|
inode->i_state &= ~I_REFERENCED;
|
||||||
spin_unlock(&inode->i_lock);
|
|
||||||
list_move(&inode->i_lru, &inode_lru);
|
list_move(&inode->i_lru, &inode_lru);
|
||||||
|
spin_unlock(&inode->i_lock);
|
||||||
continue;
|
continue;
|
||||||
}
|
}
|
||||||
if (inode_has_buffers(inode) || inode->i_data.nrpages) {
|
if (inode_has_buffers(inode) || inode->i_data.nrpages) {
|
||||||
__iget(inode);
|
__iget(inode);
|
||||||
spin_unlock(&inode->i_lock);
|
spin_unlock(&inode->i_lock);
|
||||||
spin_unlock(&inode_lru_lock);
|
spin_unlock(&inode_lru_lock);
|
||||||
spin_unlock(&inode_lock);
|
|
||||||
if (remove_inode_buffers(inode))
|
if (remove_inode_buffers(inode))
|
||||||
reap += invalidate_mapping_pages(&inode->i_data,
|
reap += invalidate_mapping_pages(&inode->i_data,
|
||||||
0, -1);
|
0, -1);
|
||||||
iput(inode);
|
iput(inode);
|
||||||
spin_lock(&inode_lock);
|
|
||||||
spin_lock(&inode_lru_lock);
|
spin_lock(&inode_lru_lock);
|
||||||
|
|
||||||
if (inode != list_entry(inode_lru.next,
|
if (inode != list_entry(inode_lru.next,
|
||||||
@@ -724,7 +721,6 @@ static void prune_icache(int nr_to_scan)
|
|||||||
else
|
else
|
||||||
__count_vm_events(PGINODESTEAL, reap);
|
__count_vm_events(PGINODESTEAL, reap);
|
||||||
spin_unlock(&inode_lru_lock);
|
spin_unlock(&inode_lru_lock);
|
||||||
spin_unlock(&inode_lock);
|
|
||||||
|
|
||||||
dispose_list(&freeable);
|
dispose_list(&freeable);
|
||||||
up_read(&iprune_sem);
|
up_read(&iprune_sem);
|
||||||
@@ -1082,7 +1078,6 @@ EXPORT_SYMBOL(iunique);
|
|||||||
|
|
||||||
struct inode *igrab(struct inode *inode)
|
struct inode *igrab(struct inode *inode)
|
||||||
{
|
{
|
||||||
spin_lock(&inode_lock);
|
|
||||||
spin_lock(&inode->i_lock);
|
spin_lock(&inode->i_lock);
|
||||||
if (!(inode->i_state & (I_FREEING|I_WILL_FREE))) {
|
if (!(inode->i_state & (I_FREEING|I_WILL_FREE))) {
|
||||||
__iget(inode);
|
__iget(inode);
|
||||||
@@ -1096,7 +1091,6 @@ struct inode *igrab(struct inode *inode)
|
|||||||
*/
|
*/
|
||||||
inode = NULL;
|
inode = NULL;
|
||||||
}
|
}
|
||||||
spin_unlock(&inode_lock);
|
|
||||||
return inode;
|
return inode;
|
||||||
}
|
}
|
||||||
EXPORT_SYMBOL(igrab);
|
EXPORT_SYMBOL(igrab);
|
||||||
@@ -1439,7 +1433,6 @@ static void iput_final(struct inode *inode)
|
|||||||
const struct super_operations *op = inode->i_sb->s_op;
|
const struct super_operations *op = inode->i_sb->s_op;
|
||||||
int drop;
|
int drop;
|
||||||
|
|
||||||
spin_lock(&inode->i_lock);
|
|
||||||
WARN_ON(inode->i_state & I_NEW);
|
WARN_ON(inode->i_state & I_NEW);
|
||||||
|
|
||||||
if (op && op->drop_inode)
|
if (op && op->drop_inode)
|
||||||
@@ -1452,16 +1445,13 @@ static void iput_final(struct inode *inode)
|
|||||||
if (!(inode->i_state & (I_DIRTY|I_SYNC)))
|
if (!(inode->i_state & (I_DIRTY|I_SYNC)))
|
||||||
inode_lru_list_add(inode);
|
inode_lru_list_add(inode);
|
||||||
spin_unlock(&inode->i_lock);
|
spin_unlock(&inode->i_lock);
|
||||||
spin_unlock(&inode_lock);
|
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
|
|
||||||
if (!drop) {
|
if (!drop) {
|
||||||
inode->i_state |= I_WILL_FREE;
|
inode->i_state |= I_WILL_FREE;
|
||||||
spin_unlock(&inode->i_lock);
|
spin_unlock(&inode->i_lock);
|
||||||
spin_unlock(&inode_lock);
|
|
||||||
write_inode_now(inode, 1);
|
write_inode_now(inode, 1);
|
||||||
spin_lock(&inode_lock);
|
|
||||||
spin_lock(&inode->i_lock);
|
spin_lock(&inode->i_lock);
|
||||||
WARN_ON(inode->i_state & I_NEW);
|
WARN_ON(inode->i_state & I_NEW);
|
||||||
inode->i_state &= ~I_WILL_FREE;
|
inode->i_state &= ~I_WILL_FREE;
|
||||||
@@ -1470,7 +1460,6 @@ static void iput_final(struct inode *inode)
|
|||||||
inode->i_state |= I_FREEING;
|
inode->i_state |= I_FREEING;
|
||||||
inode_lru_list_del(inode);
|
inode_lru_list_del(inode);
|
||||||
spin_unlock(&inode->i_lock);
|
spin_unlock(&inode->i_lock);
|
||||||
spin_unlock(&inode_lock);
|
|
||||||
|
|
||||||
evict(inode);
|
evict(inode);
|
||||||
}
|
}
|
||||||
@@ -1489,7 +1478,7 @@ void iput(struct inode *inode)
|
|||||||
if (inode) {
|
if (inode) {
|
||||||
BUG_ON(inode->i_state & I_CLEAR);
|
BUG_ON(inode->i_state & I_CLEAR);
|
||||||
|
|
||||||
if (atomic_dec_and_lock(&inode->i_count, &inode_lock))
|
if (atomic_dec_and_lock(&inode->i_count, &inode->i_lock))
|
||||||
iput_final(inode);
|
iput_final(inode);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -293,7 +293,7 @@ static int logfs_write_inode(struct inode *inode, struct writeback_control *wbc)
|
|||||||
return ret;
|
return ret;
|
||||||
}
|
}
|
||||||
|
|
||||||
/* called with inode_lock held */
|
/* called with inode->i_lock held */
|
||||||
static int logfs_drop_inode(struct inode *inode)
|
static int logfs_drop_inode(struct inode *inode)
|
||||||
{
|
{
|
||||||
struct logfs_super *super = logfs_super(inode->i_sb);
|
struct logfs_super *super = logfs_super(inode->i_sb);
|
||||||
|
|||||||
Reference in New Issue
Block a user