On 2018-10-1 9:27, Jaegeuk Kim wrote: > On 10/01, Chao Yu wrote: >> On 2018-10-1 7:58, Jaegeuk Kim wrote: >>> On 09/29, Chao Yu wrote: >>>> On 2018/9/29 7:40, Jaegeuk Kim wrote: >>>>> Testing other fix. >>>>> >>>>> --- >>>>> fs/f2fs/checkpoint.c | 7 +++++++ >>>>> fs/f2fs/f2fs.h | 1 + >>>>> fs/f2fs/gc.c | 10 +++++++++- >>>>> fs/f2fs/super.c | 22 +++++++++++++++++++++- >>>>> 4 files changed, 38 insertions(+), 2 deletions(-) >>>>> >>>>> diff --git a/fs/f2fs/checkpoint.c b/fs/f2fs/checkpoint.c >>>>> index 524b87667cf4..3fde91f41a91 100644 >>>>> --- a/fs/f2fs/checkpoint.c >>>>> +++ b/fs/f2fs/checkpoint.c >>>>> @@ -1494,6 +1494,7 @@ int f2fs_write_checkpoint(struct f2fs_sb_info *sbi, >>>>> struct cp_control *cpc) >>>>> { >>>>> struct f2fs_checkpoint *ckpt = F2FS_CKPT(sbi); >>>>> unsigned long long ckpt_ver; >>>>> + bool need_up = false; >>>>> int err = 0; >>>>> >>>>> if (unlikely(is_sbi_flag_set(sbi, SBI_CP_DISABLED))) { >>>>> @@ -1506,6 +1507,10 @@ int f2fs_write_checkpoint(struct f2fs_sb_info >>>>> *sbi, struct cp_control *cpc) >>>>> f2fs_msg(sbi->sb, KERN_WARNING, >>>>> "Start checkpoint disabled!"); >>>>> } >>>>> + if (!is_sbi_flag_set(sbi, SBI_QUOTA_INIT)) { >>>>> + need_up = true; >>>>> + down_read(&sbi->sb->s_umount); >>>> >>>> This is to avoid show warning when calling dquot_writeback_dquots() in >>>> f2fs_quota_sync(), right? >>> >>> Yup. Unfortunately, this can't fix all the issues, so I'm testing trylock >>> simply in this case. >> >> Oh, that's just warning, it could not be harmful, I think we can simply >> remove >> WARN_ON_ONCE in dquot_writeback_dquots to fix this? > > Well, I think it'd be better to keep it.
Should we ask the maintainer of the quota subsystem for a suggestion? Thanks, > >> >>> >>>> >>>>> + } >>>>> mutex_lock(&sbi->cp_mutex); >>>>> >>>>> if (!is_sbi_flag_set(sbi, SBI_IS_DIRTY) && >>>>> @@ -1582,6 +1587,8 @@ int f2fs_write_checkpoint(struct f2fs_sb_info *sbi, >>>>> struct cp_control *cpc) >>>>> trace_f2fs_write_checkpoint(sbi->sb, cpc->reason, "finish checkpoint"); >>>>> out: >>>>> mutex_unlock(&sbi->cp_mutex); >>>>> + if (need_up) >>>>> + up_read(&sbi->sb->s_umount); >>>>> return err; >>>>> } >>>>> >>>>> diff --git a/fs/f2fs/f2fs.h b/fs/f2fs/f2fs.h >>>>> index 57c829dd107e..30194f2f108e 100644 >>>>> --- a/fs/f2fs/f2fs.h >>>>> +++ b/fs/f2fs/f2fs.h >>>>> @@ -1096,6 +1096,7 @@ enum { >>>>> SBI_IS_SHUTDOWN, /* shutdown by ioctl */ >>>>> SBI_IS_RECOVERED, /* recovered orphan/data */ >>>>> SBI_CP_DISABLED, /* CP was disabled last mount */ >>>>> + SBI_QUOTA_INIT, /* avoid sb->s_umount lock */ >>>>> SBI_QUOTA_NEED_FLUSH, /* need to flush quota info in >>>>> CP */ >>>>> SBI_QUOTA_SKIP_FLUSH, /* skip flushing quota in >>>>> current CP */ >>>>> SBI_QUOTA_NEED_REPAIR, /* quota file may be corrupted >>>>> */ >>>>> diff --git a/fs/f2fs/gc.c b/fs/f2fs/gc.c >>>>> index adaf5a695b12..deece448cb3b 100644 >>>>> --- a/fs/f2fs/gc.c >>>>> +++ b/fs/f2fs/gc.c >>>>> @@ -55,9 +55,14 @@ static int gc_thread_func(void *data) >>>>> f2fs_stop_checkpoint(sbi, false); >>>>> } >>>>> >>>>> - if (!sb_start_write_trylock(sbi->sb)) >>>>> + if (!down_read_trylock(&sbi->sb->s_umount)) >>>>> continue; >>>>> >>>>> + set_sbi_flag(sbi, SBI_QUOTA_INIT); >>>>> + >>>>> + if (!sb_start_write_trylock(sbi->sb)) >>>>> + goto next_umount; >>>>> + >>>>> /* >>>>> * [GC triggering condition] >>>>> * 0. GC is not conducted currently. 
>>>>> @@ -104,6 +109,9 @@ static int gc_thread_func(void *data) >>>>> f2fs_balance_fs_bg(sbi); >>>>> next: >>>>> sb_end_write(sbi->sb); >>>>> +next_umount: >>>>> + clear_sbi_flag(sbi, SBI_QUOTA_INIT); >>>>> + up_read(&sbi->sb->s_umount); >>>>> >>>>> } while (!kthread_should_stop()); >>>>> return 0; >>>>> diff --git a/fs/f2fs/super.c b/fs/f2fs/super.c >>>>> index a28c245b1288..40a77a4eb465 100644 >>>>> --- a/fs/f2fs/super.c >>>>> +++ b/fs/f2fs/super.c >>>>> @@ -1029,6 +1029,8 @@ static void f2fs_put_super(struct super_block *sb) >>>>> int i; >>>>> bool dropped; >>>>> >>>>> + set_sbi_flag(sbi, SBI_QUOTA_INIT); >>>>> + >>>>> f2fs_quota_off_umount(sb); >>>>> >>>>> /* prevent remaining shrinker jobs */ >>>>> @@ -1122,11 +1124,17 @@ int f2fs_sync_fs(struct super_block *sb, int sync) >>>>> >>>>> if (sync) { >>>>> struct cp_control cpc; >>>>> + bool keep = is_sbi_flag_set(sbi, SBI_QUOTA_INIT); >>>>> >>>>> cpc.reason = __get_cp_reason(sbi); >>>>> >>>>> mutex_lock(&sbi->gc_mutex); >>>>> + if (sbi->sb->s_writers.frozen >= SB_FREEZE_WRITE) >>>>> + set_sbi_flag(sbi, SBI_QUOTA_INIT); >>>>> + >>>>> err = f2fs_write_checkpoint(sbi, &cpc); >>>>> + if (!keep) >>>>> + clear_sbi_flag(sbi, SBI_QUOTA_INIT); >>>>> mutex_unlock(&sbi->gc_mutex); >>>>> } >>>>> f2fs_trace_ios(NULL, 1); >>>>> @@ -1534,6 +1542,7 @@ static int f2fs_remount(struct super_block *sb, int >>>>> *flags, char *data) >>>>> } >>>>> } >>>>> #endif >>>>> + set_sbi_flag(sbi, SBI_QUOTA_INIT); >>>>> >>>>> /* recover superblocks we couldn't write due to previous RO mount */ >>>>> if (!(*flags & SB_RDONLY) && is_sbi_flag_set(sbi, SBI_NEED_SB_WRITE)) { >>>>> @@ -1653,6 +1662,7 @@ static int f2fs_remount(struct super_block *sb, int >>>>> *flags, char *data) >>>>> (test_opt(sbi, POSIX_ACL) ? 
SB_POSIXACL : 0); >>>>> >>>>> limit_reserve_root(sbi); >>>>> + clear_sbi_flag(sbi, SBI_QUOTA_INIT); >>>>> *flags = (*flags & ~SB_LAZYTIME) | (sb->s_flags & SB_LAZYTIME); >>>>> return 0; >>>>> restore_gc: >>>>> @@ -1673,6 +1683,7 @@ static int f2fs_remount(struct super_block *sb, int >>>>> *flags, char *data) >>>>> #endif >>>>> sbi->mount_opt = org_mount_opt; >>>>> sb->s_flags = old_sb_flags; >>>>> + clear_sbi_flag(sbi, SBI_QUOTA_INIT); >>>>> return err; >>>>> } >>>>> >>>>> @@ -1706,6 +1717,7 @@ static ssize_t f2fs_quota_read(struct super_block >>>>> *sb, int type, char *data, >>>>> congestion_wait(BLK_RW_ASYNC, HZ/50); >>>>> goto repeat; >>>>> } >>>>> + set_sbi_flag(F2FS_SB(sb), SBI_QUOTA_NEED_REPAIR); >>>>> return PTR_ERR(page); >>>>> } >>>>> >>>>> @@ -1717,6 +1729,7 @@ static ssize_t f2fs_quota_read(struct super_block >>>>> *sb, int type, char *data, >>>>> } >>>>> if (unlikely(!PageUptodate(page))) { >>>>> f2fs_put_page(page, 1); >>>>> + set_sbi_flag(F2FS_SB(sb), SBI_QUOTA_NEED_REPAIR); >>>>> return -EIO; >>>>> } >>>>> >>>>> @@ -1758,6 +1771,7 @@ static ssize_t f2fs_quota_write(struct super_block >>>>> *sb, int type, >>>>> congestion_wait(BLK_RW_ASYNC, HZ/50); >>>>> goto retry; >>>>> } >>>>> + set_sbi_flag(F2FS_SB(sb), SBI_QUOTA_NEED_REPAIR); >>>>> break; >>>> >>>> I added these before, but later I didn't encounter quota corruption w/o >>>> them, so I removed them. >>>> >>>> Do you still hit corruption after this change? >>> >>> I found one issue where we must avoid roll-forward recovery, if fsck >>> overwrote some >>> blocks to fix quota which will be used for recovery. >> >> That's correct, IMO, the right way is that fsck needs to be aware of whole >> dnode >> chain and block address in dnode block, when doing allocation, it needs to >> bypass those block address of dnode and block which can be recovered later by >> kernel, so that fsynced data can not be lost. 
>> >> But, in order to trouble shoot current problem more quickly, we can just >> disable >> kernel recovery once fsck recovers quota file for now. >> >> Thanks, >> >>> >>>> >>>> Thanks, >>>> >>>>> } >>>>> >>>>> @@ -1794,7 +1808,6 @@ static qsize_t *f2fs_get_reserved_space(struct >>>>> inode *inode) >>>>> >>>>> static int f2fs_quota_on_mount(struct f2fs_sb_info *sbi, int type) >>>>> { >>>>> - >>>>> if (is_set_ckpt_flags(sbi, CP_QUOTA_NEED_FSCK_FLAG)) { >>>>> f2fs_msg(sbi->sb, KERN_ERR, >>>>> "quota sysfile may be corrupted, skip loading it"); >>>>> @@ -1958,7 +1971,9 @@ static int f2fs_quota_on(struct super_block *sb, >>>>> int type, int format_id, >>>>> if (err) >>>>> return err; >>>>> >>>>> + set_sbi_flag(F2FS_SB(sb), SBI_QUOTA_INIT); >>>>> err = dquot_quota_on(sb, type, format_id, path); >>>>> + clear_sbi_flag(F2FS_SB(sb), SBI_QUOTA_INIT); >>>>> if (err) >>>>> return err; >>>>> >>>>> @@ -3179,6 +3194,7 @@ static int f2fs_fill_super(struct super_block *sb, >>>>> void *data, int silent) >>>>> goto free_meta_inode; >>>>> } >>>>> >>>>> + set_sbi_flag(sbi, SBI_QUOTA_INIT); >>>>> if (__is_set_ckpt_flags(F2FS_CKPT(sbi), CP_QUOTA_NEED_FSCK_FLAG)) >>>>> set_sbi_flag(sbi, SBI_QUOTA_NEED_REPAIR); >>>>> >>>>> @@ -3370,6 +3386,8 @@ static int f2fs_fill_super(struct super_block *sb, >>>>> void *data, int silent) >>>>> cur_cp_version(F2FS_CKPT(sbi))); >>>>> f2fs_update_time(sbi, CP_TIME); >>>>> f2fs_update_time(sbi, REQ_TIME); >>>>> + >>>>> + clear_sbi_flag(sbi, SBI_QUOTA_INIT); >>>>> return 0; >>>>> >>>>> free_meta: >>>>> @@ -3434,6 +3452,7 @@ static int f2fs_fill_super(struct super_block *sb, >>>>> void *data, int silent) >>>>> shrink_dcache_sb(sb); >>>>> goto try_onemore; >>>>> } >>>>> + clear_sbi_flag(sbi, SBI_QUOTA_INIT); >>>>> return err; >>>>> } >>>>> >>>>> @@ -3449,6 +3468,7 @@ static void kill_f2fs_super(struct super_block *sb) >>>>> struct f2fs_sb_info *sbi = F2FS_SB(sb); >>>>> >>>>> set_sbi_flag(sbi, SBI_IS_CLOSE); >>>>> + set_sbi_flag(sbi, SBI_QUOTA_INIT); >>>>> 
f2fs_stop_gc_thread(sbi); >>>>> f2fs_stop_discard_thread(sbi); >>>>> >>>>> >>> >>> >>> _______________________________________________ >>> Linux-f2fs-devel mailing list >>> linux-f2fs-de...@lists.sourceforge.net >>> https://lists.sourceforge.net/lists/listinfo/linux-f2fs-devel >>>