Re: [PATCH 1/2] f2fs: support RENAME_WHITEOUT

From: Jaegeuk Kim
Date: Tue May 19 2015 - 01:51:25 EST


Hi Chao,

On Mon, May 18, 2015 at 01:54:22PM +0800, Chao Yu wrote:
> As the description of rename in manual, RENAME_WHITEOUT is a special operation
> that only makes sense for overlay/union type filesystem.
>
> When performing rename with RENAME_WHITEOUT, dst will be replace with src, and
> meanwhile, a 'whiteout' will be create with name of src.
>
> A "whiteout" is designed to be a char device with 0,0 device number, it has
> specially meaning for stackable filesystem. In these filesystems, there are
> multiple layers exist, and only top of these can be modified. So a whiteout
> in top layer is used to hide a corresponding file in lower layer, as well
> removal of whiteout will make the file appear.
>
> Now in overlayfs, when we rename a file which is exist in lower layer, it
> will be copied up to upper if it is not on upper layer yet, and then rename
> it on upper layer, source file will be whiteouted to hide corresponding file
> in lower layer at the same time.
>
> So in upper layer filesystem, implementation of RENAME_WHITEOUT provide a
> atomic operation for stackable filesystem to support rename operation.
>
> There are multiple ways to implement RENAME_WHITEOUT in log of this commit:
> 7dcf5c3e4527 ("xfs: add RENAME_WHITEOUT support") which pointed out by
> Dave Chinner.
>
> For now, we just try to follow the way that xfs/ext4 use.

Could you merge the two patches into one?
And, after finishing xfstests, kernel reports missing inode objects.
Could you check it out?
I didn't take a closer look at it.

>
> Signed-off-by: Chao Yu <chao2.yu@xxxxxxxxxxx>
> ---
> fs/f2fs/namei.c | 140 ++++++++++++++++++++++++++++++++++++--------------------
> 1 file changed, 90 insertions(+), 50 deletions(-)
>
> diff --git a/fs/f2fs/namei.c b/fs/f2fs/namei.c
> index 16b74da..bed0cb0 100644
> --- a/fs/f2fs/namei.c
> +++ b/fs/f2fs/namei.c
> @@ -510,14 +510,80 @@ out:
> return err;
> }
>
> +static int __f2fs_tmpfile(struct inode *dir, struct dentry *dentry,
> + umode_t mode, struct inode **whiteout)
> +{
> + struct f2fs_sb_info *sbi = F2FS_I_SB(dir);
> + struct inode *inode;
> + int err;
> +
> + inode = f2fs_new_inode(dir, mode);
> + if (IS_ERR(inode))
> + return PTR_ERR(inode);
> +
> + if (whiteout) {
> + init_special_inode(inode, inode->i_mode, WHITEOUT_DEV);
> + inode->i_op = &f2fs_special_inode_operations;
> + } else {
> + inode->i_op = &f2fs_file_inode_operations;
> + inode->i_fop = &f2fs_file_operations;
> + inode->i_mapping->a_ops = &f2fs_dblock_aops;
> + }
> +
> + f2fs_lock_op(sbi);
> + err = acquire_orphan_inode(sbi);
> + if (err)
> + goto out;
> +
> + err = f2fs_do_tmpfile(inode, dir);
> + if (err)
> + goto release_out;
> +
> + /*
> + * add this non-linked tmpfile to orphan list, in this way we could
> + * remove all unused data of tmpfile after abnormal power-off.
> + */
> + add_orphan_inode(sbi, inode->i_ino);
> + f2fs_unlock_op(sbi);
> +
> + alloc_nid_done(sbi, inode->i_ino);
> +
> + if (whiteout) {
> + inode_dec_link_count(inode);

Maybe due to this?
We don't need to decrease its link count?

Thanks,

> + *whiteout = inode;
> + } else {
> + d_tmpfile(dentry, inode);
> + }
> + unlock_new_inode(inode);
> + return 0;
> +
> +release_out:
> + release_orphan_inode(sbi);
> +out:
> + handle_failed_inode(inode);
> + return err;
> +}
> +
> +static int f2fs_tmpfile(struct inode *dir, struct dentry *dentry, umode_t mode)
> +{
> + return __f2fs_tmpfile(dir, dentry, mode, NULL);
> +}
> +
> +static int f2fs_create_whiteout(struct inode *dir, struct inode **whiteout)
> +{
> + return __f2fs_tmpfile(dir, NULL, S_IFCHR | WHITEOUT_MODE, whiteout);
> +}
> +
> static int f2fs_rename(struct inode *old_dir, struct dentry *old_dentry,
> - struct inode *new_dir, struct dentry *new_dentry)
> + struct inode *new_dir, struct dentry *new_dentry,
> + unsigned int flags)
> {
> struct f2fs_sb_info *sbi = F2FS_I_SB(old_dir);
> struct inode *old_inode = d_inode(old_dentry);
> struct inode *new_inode = d_inode(new_dentry);
> + struct inode *whiteout = NULL;
> struct page *old_dir_page;
> - struct page *old_page, *new_page;
> + struct page *old_page, *new_page = NULL;
> struct f2fs_dir_entry *old_dir_entry = NULL;
> struct f2fs_dir_entry *old_entry;
> struct f2fs_dir_entry *new_entry;
> @@ -543,6 +609,12 @@ static int f2fs_rename(struct inode *old_dir, struct dentry *old_dentry,
> goto out_old;
> }
>
> + if (flags & RENAME_WHITEOUT) {
> + err = f2fs_create_whiteout(old_dir, &whiteout);
> + if (err)
> + goto out_dir;
> + }
> +
> if (new_inode) {
>
> err = -ENOTEMPTY;
> @@ -611,8 +683,17 @@ static int f2fs_rename(struct inode *old_dir, struct dentry *old_dentry,
>
> f2fs_delete_entry(old_entry, old_page, old_dir, NULL);
>
> + if (whiteout) {
> + whiteout->i_state |= I_LINKABLE;
> + set_inode_flag(F2FS_I(whiteout), FI_INC_LINK);
> + err = f2fs_add_link(old_dentry, whiteout);
> + if (err)
> + goto put_out_dir;
> + whiteout->i_state &= ~I_LINKABLE;
> + }
> +
> if (old_dir_entry) {
> - if (old_dir != new_dir) {
> + if (old_dir != new_dir && !whiteout) {
> f2fs_set_link(old_inode, old_dir_entry,
> old_dir_page, new_dir);
> update_inode_page(old_inode);
> @@ -633,8 +714,10 @@ static int f2fs_rename(struct inode *old_dir, struct dentry *old_dentry,
>
> put_out_dir:
> f2fs_unlock_op(sbi);
> - f2fs_dentry_kunmap(new_dir, new_page);
> - f2fs_put_page(new_page, 0);
> + if (new_page) {
> + f2fs_dentry_kunmap(new_dir, new_page);
> + f2fs_put_page(new_page, 0);
> + }
> out_dir:
> if (old_dir_entry) {
> f2fs_dentry_kunmap(old_inode, old_dir_page);
> @@ -805,7 +888,7 @@ static int f2fs_rename2(struct inode *old_dir, struct dentry *old_dentry,
> struct inode *new_dir, struct dentry *new_dentry,
> unsigned int flags)
> {
> - if (flags & ~(RENAME_NOREPLACE | RENAME_EXCHANGE))
> + if (flags & ~(RENAME_NOREPLACE | RENAME_EXCHANGE | RENAME_WHITEOUT))
> return -EINVAL;
>
> if (flags & RENAME_EXCHANGE) {
> @@ -816,50 +899,7 @@ static int f2fs_rename2(struct inode *old_dir, struct dentry *old_dentry,
> * VFS has already handled the new dentry existence case,
> * here, we just deal with "RENAME_NOREPLACE" as regular rename.
> */
> - return f2fs_rename(old_dir, old_dentry, new_dir, new_dentry);
> -}
> -
> -static int f2fs_tmpfile(struct inode *dir, struct dentry *dentry, umode_t mode)
> -{
> - struct f2fs_sb_info *sbi = F2FS_I_SB(dir);
> - struct inode *inode;
> - int err;
> -
> - inode = f2fs_new_inode(dir, mode);
> - if (IS_ERR(inode))
> - return PTR_ERR(inode);
> -
> - inode->i_op = &f2fs_file_inode_operations;
> - inode->i_fop = &f2fs_file_operations;
> - inode->i_mapping->a_ops = &f2fs_dblock_aops;
> -
> - f2fs_lock_op(sbi);
> - err = acquire_orphan_inode(sbi);
> - if (err)
> - goto out;
> -
> - err = f2fs_do_tmpfile(inode, dir);
> - if (err)
> - goto release_out;
> -
> - /*
> - * add this non-linked tmpfile to orphan list, in this way we could
> - * remove all unused data of tmpfile after abnormal power-off.
> - */
> - add_orphan_inode(sbi, inode->i_ino);
> - f2fs_unlock_op(sbi);
> -
> - alloc_nid_done(sbi, inode->i_ino);
> -
> - d_tmpfile(dentry, inode);
> - unlock_new_inode(inode);
> - return 0;
> -
> -release_out:
> - release_orphan_inode(sbi);
> -out:
> - handle_failed_inode(inode);
> - return err;
> + return f2fs_rename(old_dir, old_dentry, new_dir, new_dentry, flags);
> }
>
> #ifdef CONFIG_F2FS_FS_ENCRYPTION
> --
> 2.3.3
--
To unsubscribe from this list: send the line "unsubscribe linux-kernel" in
the body of a message to majordomo@xxxxxxxxxxxxxxx
More majordomo info at http://vger.kernel.org/majordomo-info.html
Please read the FAQ at http://www.tux.org/lkml/