ceph: use I_COMPLETE inode flag instead of D_COMPLETE flag
commit c6ffe10015
moved the flag that tracks whether the dcache contents
for a directory are complete to the dentry. The problem is that there are
lots of places that use ceph_dir_{set,clear,test}_complete() while
holding i_ceph_lock, but ceph_dir_{set,clear,test}_complete() may
sleep because they call dput().
This patch basically reverts that commit. ceph_d_prune() is
called with both the dentry to prune and its parent dentry
locked, so it is safe to access the parent dentry's d_inode and
clear the I_COMPLETE flag.
Signed-off-by: Yan, Zheng <zheng.z.yan@intel.com>
Reviewed-by: Greg Farnum <greg@inktank.com>
Reviewed-by: Sage Weil <sage@inktank.com>
This commit is contained in:
@@ -107,7 +107,7 @@ static unsigned fpos_off(loff_t p)
|
||||
* falling back to a "normal" sync readdir if any dentries in the dir
|
||||
* are dropped.
|
||||
*
|
||||
* D_COMPLETE tells indicates we have all dentries in the dir. It is
|
||||
* I_COMPLETE tells indicates we have all dentries in the dir. It is
|
||||
* defined IFF we hold CEPH_CAP_FILE_SHARED (which will be revoked by
|
||||
* the MDS if/when the directory is modified).
|
||||
*/
|
||||
@@ -198,8 +198,8 @@ more:
|
||||
filp->f_pos++;
|
||||
|
||||
/* make sure a dentry wasn't dropped while we didn't have parent lock */
|
||||
if (!ceph_dir_test_complete(dir)) {
|
||||
dout(" lost D_COMPLETE on %p; falling back to mds\n", dir);
|
||||
if (!ceph_i_test(dir, CEPH_I_COMPLETE)) {
|
||||
dout(" lost I_COMPLETE on %p; falling back to mds\n", dir);
|
||||
err = -EAGAIN;
|
||||
goto out;
|
||||
}
|
||||
@@ -284,7 +284,7 @@ static int ceph_readdir(struct file *filp, void *dirent, filldir_t filldir)
|
||||
if ((filp->f_pos == 2 || fi->dentry) &&
|
||||
!ceph_test_mount_opt(fsc, NOASYNCREADDIR) &&
|
||||
ceph_snap(inode) != CEPH_SNAPDIR &&
|
||||
ceph_dir_test_complete(inode) &&
|
||||
(ci->i_ceph_flags & CEPH_I_COMPLETE) &&
|
||||
__ceph_caps_issued_mask(ci, CEPH_CAP_FILE_SHARED, 1)) {
|
||||
spin_unlock(&ci->i_ceph_lock);
|
||||
err = __dcache_readdir(filp, dirent, filldir);
|
||||
@@ -350,7 +350,7 @@ more:
|
||||
|
||||
if (!req->r_did_prepopulate) {
|
||||
dout("readdir !did_prepopulate");
|
||||
fi->dir_release_count--; /* preclude D_COMPLETE */
|
||||
fi->dir_release_count--; /* preclude I_COMPLETE */
|
||||
}
|
||||
|
||||
/* note next offset and last dentry name */
|
||||
@@ -429,7 +429,8 @@ more:
|
||||
*/
|
||||
spin_lock(&ci->i_ceph_lock);
|
||||
if (ci->i_release_count == fi->dir_release_count) {
|
||||
ceph_dir_set_complete(inode);
|
||||
dout(" marking %p complete\n", inode);
|
||||
ci->i_ceph_flags |= CEPH_I_COMPLETE;
|
||||
ci->i_max_offset = filp->f_pos;
|
||||
}
|
||||
spin_unlock(&ci->i_ceph_lock);
|
||||
@@ -604,7 +605,7 @@ static struct dentry *ceph_lookup(struct inode *dir, struct dentry *dentry,
|
||||
fsc->mount_options->snapdir_name,
|
||||
dentry->d_name.len) &&
|
||||
!is_root_ceph_dentry(dir, dentry) &&
|
||||
ceph_dir_test_complete(dir) &&
|
||||
(ci->i_ceph_flags & CEPH_I_COMPLETE) &&
|
||||
(__ceph_caps_issued_mask(ci, CEPH_CAP_FILE_SHARED, 1))) {
|
||||
spin_unlock(&ci->i_ceph_lock);
|
||||
dout(" dir %p complete, -ENOENT\n", dir);
|
||||
@@ -908,7 +909,7 @@ static int ceph_rename(struct inode *old_dir, struct dentry *old_dentry,
|
||||
*/
|
||||
|
||||
/* d_move screws up d_subdirs order */
|
||||
ceph_dir_clear_complete(new_dir);
|
||||
ceph_i_clear(new_dir, CEPH_I_COMPLETE);
|
||||
|
||||
d_move(old_dentry, new_dentry);
|
||||
|
||||
@@ -1064,44 +1065,6 @@ static int ceph_snapdir_d_revalidate(struct dentry *dentry,
|
||||
return 1;
|
||||
}
|
||||
|
||||
/*
|
||||
* Set/clear/test dir complete flag on the dir's dentry.
|
||||
*/
|
||||
void ceph_dir_set_complete(struct inode *inode)
|
||||
{
|
||||
struct dentry *dentry = d_find_any_alias(inode);
|
||||
|
||||
if (dentry && ceph_dentry(dentry) &&
|
||||
ceph_test_mount_opt(ceph_sb_to_client(dentry->d_sb), DCACHE)) {
|
||||
dout(" marking %p (%p) complete\n", inode, dentry);
|
||||
set_bit(CEPH_D_COMPLETE, &ceph_dentry(dentry)->flags);
|
||||
}
|
||||
dput(dentry);
|
||||
}
|
||||
|
||||
void ceph_dir_clear_complete(struct inode *inode)
|
||||
{
|
||||
struct dentry *dentry = d_find_any_alias(inode);
|
||||
|
||||
if (dentry && ceph_dentry(dentry)) {
|
||||
dout(" marking %p (%p) complete\n", inode, dentry);
|
||||
set_bit(CEPH_D_COMPLETE, &ceph_dentry(dentry)->flags);
|
||||
}
|
||||
dput(dentry);
|
||||
}
|
||||
|
||||
bool ceph_dir_test_complete(struct inode *inode)
|
||||
{
|
||||
struct dentry *dentry = d_find_any_alias(inode);
|
||||
|
||||
if (dentry && ceph_dentry(dentry)) {
|
||||
dout(" marking %p (%p) NOT complete\n", inode, dentry);
|
||||
clear_bit(CEPH_D_COMPLETE, &ceph_dentry(dentry)->flags);
|
||||
}
|
||||
dput(dentry);
|
||||
return false;
|
||||
}
|
||||
|
||||
/*
|
||||
* When the VFS prunes a dentry from the cache, we need to clear the
|
||||
* complete flag on the parent directory.
|
||||
@@ -1110,15 +1073,13 @@ bool ceph_dir_test_complete(struct inode *inode)
|
||||
*/
|
||||
static void ceph_d_prune(struct dentry *dentry)
|
||||
{
|
||||
struct ceph_dentry_info *di;
|
||||
|
||||
dout("ceph_d_prune %p\n", dentry);
|
||||
|
||||
/* do we have a valid parent? */
|
||||
if (IS_ROOT(dentry))
|
||||
return;
|
||||
|
||||
/* if we are not hashed, we don't affect D_COMPLETE */
|
||||
/* if we are not hashed, we don't affect I_COMPLETE */
|
||||
if (d_unhashed(dentry))
|
||||
return;
|
||||
|
||||
@@ -1126,8 +1087,7 @@ static void ceph_d_prune(struct dentry *dentry)
|
||||
* we hold d_lock, so d_parent is stable, and d_fsdata is never
|
||||
* cleared until d_release
|
||||
*/
|
||||
di = ceph_dentry(dentry->d_parent);
|
||||
clear_bit(CEPH_D_COMPLETE, &di->flags);
|
||||
ceph_i_clear(dentry->d_parent->d_inode, CEPH_I_COMPLETE);
|
||||
}
|
||||
|
||||
/*
|
||||
|
Reference in New Issue
Block a user