Commit f283c86a authored by Dave Chinner's avatar Dave Chinner Committed by Al Viro

fs: remove inode_lock from iput_final and prune_icache

Now that inode state changes are protected by the inode->i_lock and
the inode LRU manipulations by the inode_lru_lock, we can remove the
inode_lock from prune_icache and the initial part of iput_final().

instead of using the inode_lock to protect the inode during
iput_final, use the inode->i_lock instead. This protects the inode
against new references being taken while we change the inode state
to I_FREEING, as well as preventing prune_icache from grabbing the
inode while we are manipulating it. Hence we no longer need the
inode_lock in iput_final prior to setting I_FREEING on the inode.

For prune_icache, we no longer need the inode_lock to protect the
LRU list, and the inodes themselves are protected against freeing
races by the inode->i_lock. Hence we can lift the inode_lock from
prune_icache as well.
Signed-off-by: default avatarDave Chinner <dchinner@redhat.com>
Signed-off-by: default avatarAl Viro <viro@zeniv.linux.org.uk>
parent 02afc410
...@@ -128,7 +128,7 @@ alloc_inode: ...@@ -128,7 +128,7 @@ alloc_inode:
destroy_inode: destroy_inode:
dirty_inode: (must not sleep) dirty_inode: (must not sleep)
write_inode: write_inode:
drop_inode: !!!inode_lock!!! drop_inode: !!!inode->i_lock!!!
evict_inode: evict_inode:
put_super: write put_super: write
write_super: read write_super: read
......
...@@ -298,11 +298,14 @@ be used instead. It gets called whenever the inode is evicted, whether it has ...@@ -298,11 +298,14 @@ be used instead. It gets called whenever the inode is evicted, whether it has
remaining links or not. Caller does *not* evict the pagecache or inode-associated remaining links or not. Caller does *not* evict the pagecache or inode-associated
metadata buffers; getting rid of those is responsibility of method, as it had metadata buffers; getting rid of those is responsibility of method, as it had
been for ->delete_inode(). been for ->delete_inode().
->drop_inode() returns int now; it's called on final iput() with inode_lock
held and it returns true if filesystems wants the inode to be dropped. As before, ->drop_inode() returns int now; it's called on final iput() with
generic_drop_inode() is still the default and it's been updated appropriately. inode->i_lock held and it returns true if filesystems wants the inode to be
generic_delete_inode() is also alive and it consists simply of return 1. Note that dropped. As before, generic_drop_inode() is still the default and it's been
all actual eviction work is done by caller after ->drop_inode() returns. updated appropriately. generic_delete_inode() is also alive and it consists
simply of return 1. Note that all actual eviction work is done by caller after
->drop_inode() returns.
clear_inode() is gone; use end_writeback() instead. As before, it must clear_inode() is gone; use end_writeback() instead. As before, it must
be called exactly once on each call of ->evict_inode() (as it used to be for be called exactly once on each call of ->evict_inode() (as it used to be for
each call of ->delete_inode()). Unlike before, if you are using inode-associated each call of ->delete_inode()). Unlike before, if you are using inode-associated
...@@ -395,6 +398,9 @@ Currently you can only have FALLOC_FL_PUNCH_HOLE with FALLOC_FL_KEEP_SIZE set, ...@@ -395,6 +398,9 @@ Currently you can only have FALLOC_FL_PUNCH_HOLE with FALLOC_FL_KEEP_SIZE set,
so the i_size should not change when hole punching, even when puching the end of so the i_size should not change when hole punching, even when puching the end of
a file off. a file off.
--
[mandatory]
-- --
[mandatory] [mandatory]
->get_sb() is gone. Switch to use of ->mount(). Typically it's just ->get_sb() is gone. Switch to use of ->mount(). Typically it's just
......
...@@ -254,7 +254,7 @@ or bottom half). ...@@ -254,7 +254,7 @@ or bottom half).
should be synchronous or not, not all filesystems check this flag. should be synchronous or not, not all filesystems check this flag.
drop_inode: called when the last access to the inode is dropped, drop_inode: called when the last access to the inode is dropped,
with the inode_lock spinlock held. with the inode->i_lock spinlock held.
This method should be either NULL (normal UNIX filesystem This method should be either NULL (normal UNIX filesystem
semantics) or "generic_delete_inode" (for filesystems that do not semantics) or "generic_delete_inode" (for filesystems that do not
......
...@@ -650,7 +650,6 @@ static void prune_icache(int nr_to_scan) ...@@ -650,7 +650,6 @@ static void prune_icache(int nr_to_scan)
unsigned long reap = 0; unsigned long reap = 0;
down_read(&iprune_sem); down_read(&iprune_sem);
spin_lock(&inode_lock);
spin_lock(&inode_lru_lock); spin_lock(&inode_lru_lock);
for (nr_scanned = 0; nr_scanned < nr_to_scan; nr_scanned++) { for (nr_scanned = 0; nr_scanned < nr_to_scan; nr_scanned++) {
struct inode *inode; struct inode *inode;
...@@ -676,8 +675,8 @@ static void prune_icache(int nr_to_scan) ...@@ -676,8 +675,8 @@ static void prune_icache(int nr_to_scan)
*/ */
if (atomic_read(&inode->i_count) || if (atomic_read(&inode->i_count) ||
(inode->i_state & ~I_REFERENCED)) { (inode->i_state & ~I_REFERENCED)) {
spin_unlock(&inode->i_lock);
list_del_init(&inode->i_lru); list_del_init(&inode->i_lru);
spin_unlock(&inode->i_lock);
inodes_stat.nr_unused--; inodes_stat.nr_unused--;
continue; continue;
} }
...@@ -685,20 +684,18 @@ static void prune_icache(int nr_to_scan) ...@@ -685,20 +684,18 @@ static void prune_icache(int nr_to_scan)
/* recently referenced inodes get one more pass */ /* recently referenced inodes get one more pass */
if (inode->i_state & I_REFERENCED) { if (inode->i_state & I_REFERENCED) {
inode->i_state &= ~I_REFERENCED; inode->i_state &= ~I_REFERENCED;
spin_unlock(&inode->i_lock);
list_move(&inode->i_lru, &inode_lru); list_move(&inode->i_lru, &inode_lru);
spin_unlock(&inode->i_lock);
continue; continue;
} }
if (inode_has_buffers(inode) || inode->i_data.nrpages) { if (inode_has_buffers(inode) || inode->i_data.nrpages) {
__iget(inode); __iget(inode);
spin_unlock(&inode->i_lock); spin_unlock(&inode->i_lock);
spin_unlock(&inode_lru_lock); spin_unlock(&inode_lru_lock);
spin_unlock(&inode_lock);
if (remove_inode_buffers(inode)) if (remove_inode_buffers(inode))
reap += invalidate_mapping_pages(&inode->i_data, reap += invalidate_mapping_pages(&inode->i_data,
0, -1); 0, -1);
iput(inode); iput(inode);
spin_lock(&inode_lock);
spin_lock(&inode_lru_lock); spin_lock(&inode_lru_lock);
if (inode != list_entry(inode_lru.next, if (inode != list_entry(inode_lru.next,
...@@ -724,7 +721,6 @@ static void prune_icache(int nr_to_scan) ...@@ -724,7 +721,6 @@ static void prune_icache(int nr_to_scan)
else else
__count_vm_events(PGINODESTEAL, reap); __count_vm_events(PGINODESTEAL, reap);
spin_unlock(&inode_lru_lock); spin_unlock(&inode_lru_lock);
spin_unlock(&inode_lock);
dispose_list(&freeable); dispose_list(&freeable);
up_read(&iprune_sem); up_read(&iprune_sem);
...@@ -1082,7 +1078,6 @@ EXPORT_SYMBOL(iunique); ...@@ -1082,7 +1078,6 @@ EXPORT_SYMBOL(iunique);
struct inode *igrab(struct inode *inode) struct inode *igrab(struct inode *inode)
{ {
spin_lock(&inode_lock);
spin_lock(&inode->i_lock); spin_lock(&inode->i_lock);
if (!(inode->i_state & (I_FREEING|I_WILL_FREE))) { if (!(inode->i_state & (I_FREEING|I_WILL_FREE))) {
__iget(inode); __iget(inode);
...@@ -1096,7 +1091,6 @@ struct inode *igrab(struct inode *inode) ...@@ -1096,7 +1091,6 @@ struct inode *igrab(struct inode *inode)
*/ */
inode = NULL; inode = NULL;
} }
spin_unlock(&inode_lock);
return inode; return inode;
} }
EXPORT_SYMBOL(igrab); EXPORT_SYMBOL(igrab);
...@@ -1439,7 +1433,6 @@ static void iput_final(struct inode *inode) ...@@ -1439,7 +1433,6 @@ static void iput_final(struct inode *inode)
const struct super_operations *op = inode->i_sb->s_op; const struct super_operations *op = inode->i_sb->s_op;
int drop; int drop;
spin_lock(&inode->i_lock);
WARN_ON(inode->i_state & I_NEW); WARN_ON(inode->i_state & I_NEW);
if (op && op->drop_inode) if (op && op->drop_inode)
...@@ -1452,16 +1445,13 @@ static void iput_final(struct inode *inode) ...@@ -1452,16 +1445,13 @@ static void iput_final(struct inode *inode)
if (!(inode->i_state & (I_DIRTY|I_SYNC))) if (!(inode->i_state & (I_DIRTY|I_SYNC)))
inode_lru_list_add(inode); inode_lru_list_add(inode);
spin_unlock(&inode->i_lock); spin_unlock(&inode->i_lock);
spin_unlock(&inode_lock);
return; return;
} }
if (!drop) { if (!drop) {
inode->i_state |= I_WILL_FREE; inode->i_state |= I_WILL_FREE;
spin_unlock(&inode->i_lock); spin_unlock(&inode->i_lock);
spin_unlock(&inode_lock);
write_inode_now(inode, 1); write_inode_now(inode, 1);
spin_lock(&inode_lock);
spin_lock(&inode->i_lock); spin_lock(&inode->i_lock);
WARN_ON(inode->i_state & I_NEW); WARN_ON(inode->i_state & I_NEW);
inode->i_state &= ~I_WILL_FREE; inode->i_state &= ~I_WILL_FREE;
...@@ -1470,7 +1460,6 @@ static void iput_final(struct inode *inode) ...@@ -1470,7 +1460,6 @@ static void iput_final(struct inode *inode)
inode->i_state |= I_FREEING; inode->i_state |= I_FREEING;
inode_lru_list_del(inode); inode_lru_list_del(inode);
spin_unlock(&inode->i_lock); spin_unlock(&inode->i_lock);
spin_unlock(&inode_lock);
evict(inode); evict(inode);
} }
...@@ -1489,7 +1478,7 @@ void iput(struct inode *inode) ...@@ -1489,7 +1478,7 @@ void iput(struct inode *inode)
if (inode) { if (inode) {
BUG_ON(inode->i_state & I_CLEAR); BUG_ON(inode->i_state & I_CLEAR);
if (atomic_dec_and_lock(&inode->i_count, &inode_lock)) if (atomic_dec_and_lock(&inode->i_count, &inode->i_lock))
iput_final(inode); iput_final(inode);
} }
} }
......
...@@ -293,7 +293,7 @@ static int logfs_write_inode(struct inode *inode, struct writeback_control *wbc) ...@@ -293,7 +293,7 @@ static int logfs_write_inode(struct inode *inode, struct writeback_control *wbc)
return ret; return ret;
} }
/* called with inode_lock held */ /* called with inode->i_lock held */
static int logfs_drop_inode(struct inode *inode) static int logfs_drop_inode(struct inode *inode)
{ {
struct logfs_super *super = logfs_super(inode->i_sb); struct logfs_super *super = logfs_super(inode->i_sb);
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment