On 06/18, Chao Yu wrote:
> On 2019/6/14 10:46, Jaegeuk Kim wrote:
> > On 06/11, Chao Yu wrote:
> >> On 2019/6/5 2:36, Jaegeuk Kim wrote:
> >>> Two paths to update quota and f2fs_lock_op:
> >>>
> >>> 1.
> >>>  - lock_op
> >>>  |  - quota_update
> >>>  `- unlock_op
> >>>
> >>> 2.
> >>>  - quota_update
> >>>  - lock_op
> >>>  `- unlock_op
> >>>
> >>> However, in case #2 quota_update + lock_op must be done as one transaction.
> >>> So, this patch introduces:
> >>> 1. lock_op
> >>> 2. down_write
> >>> 3. check __need_flush
> >>> 4. up_write
> >>> 5. if there are dirty quota entries, flush them
> >>> 6. otherwise, good to go
> >>>
> >>> Signed-off-by: Jaegeuk Kim <[email protected]>
> >>> ---
> >>>
> >>> v3 from v2:
> >>>  - refactor to fix quota corruption issue
> >>>   : it seems that the previous scenario is not real and no deadlock case
> >>>     was encountered.
> >>
> >> - f2fs_dquot_commit
> >>  - down_read(&sbi->quota_sem)
> >>                                    - block_operation
> >>                                     - f2fs_lock_all
> >>                                      - need_flush_quota
> >>                                       - down_write(&sbi->quota_sem)
> >>   - f2fs_quota_write
> >>    - f2fs_lock_op
> >>
> >> Why can't this happen?
> >>
> >> One more question: should we hold quota_sem during checkpoint to avoid
> >> further quota updates? Can f2fs_lock_op do this job as well?
> > 
> > > I couldn't find a write_dquot() call to make this happen, and f2fs_lock_op
> > > was not
> 
> - f2fs_dquot_commit
>  - dquot_commit
>   ->commit_dqblk (v2_write_dquot)
>    - qtree_write_dquot
>     ->quota_write (f2fs_quota_write)
>      - f2fs_lock_op
> 
> Do you mean there is no path that calls f2fs_lock_op() from
> f2fs_quota_write(), so the deadlock condition does not exist?

I mean that write_dquot->f2fs_dquot_commit and block_operation do not seem to
race with each other.

> 
> Thanks,
> 
> > > enough to cover quota updates. Current stress & power-cut tests have been
> > > running for several days without problems with this patch.
> > 
> >>
> >> Thanks,
> >>
> >>>
> >>>  fs/f2fs/checkpoint.c | 41 +++++++++++++++++++----------------------
> >>>  fs/f2fs/f2fs.h       |  1 +
> >>>  fs/f2fs/super.c      | 26 +++++++++++++++++++++-----
> >>>  3 files changed, 41 insertions(+), 27 deletions(-)
> >>>
> >>> diff --git a/fs/f2fs/checkpoint.c b/fs/f2fs/checkpoint.c
> >>> index 89825261d474..43f65f0962e5 100644
> >>> --- a/fs/f2fs/checkpoint.c
> >>> +++ b/fs/f2fs/checkpoint.c
> >>> @@ -1131,17 +1131,24 @@ static void __prepare_cp_block(struct 
> >>> f2fs_sb_info *sbi)
> >>>  
> >>>  static bool __need_flush_quota(struct f2fs_sb_info *sbi)
> >>>  {
> >>> + bool ret = false;
> >>> +
> >>>   if (!is_journalled_quota(sbi))
> >>>           return false;
> >>> - if (is_sbi_flag_set(sbi, SBI_QUOTA_SKIP_FLUSH))
> >>> -         return false;
> >>> - if (is_sbi_flag_set(sbi, SBI_QUOTA_NEED_REPAIR))
> >>> -         return false;
> >>> - if (is_sbi_flag_set(sbi, SBI_QUOTA_NEED_FLUSH))
> >>> -         return true;
> >>> - if (get_pages(sbi, F2FS_DIRTY_QDATA))
> >>> -         return true;
> >>> - return false;
> >>> +
> >>> + down_write(&sbi->quota_sem);
> >>> + if (is_sbi_flag_set(sbi, SBI_QUOTA_SKIP_FLUSH)) {
> >>> +         ret = false;
> >>> + } else if (is_sbi_flag_set(sbi, SBI_QUOTA_NEED_REPAIR)) {
> >>> +         ret = false;
> >>> + } else if (is_sbi_flag_set(sbi, SBI_QUOTA_NEED_FLUSH)) {
> >>> +         clear_sbi_flag(sbi, SBI_QUOTA_NEED_FLUSH);
> >>> +         ret = true;
> >>> + } else if (get_pages(sbi, F2FS_DIRTY_QDATA)) {
> >>> +         ret = true;
> >>> + }
> >>> + up_write(&sbi->quota_sem);
> >>> + return ret;
> >>>  }
> >>>  
> >>>  /*
> >>> @@ -1160,26 +1167,22 @@ static int block_operations(struct f2fs_sb_info 
> >>> *sbi)
> >>>   blk_start_plug(&plug);
> >>>  
> >>>  retry_flush_quotas:
> >>> + f2fs_lock_all(sbi);
> >>>   if (__need_flush_quota(sbi)) {
> >>>           int locked;
> >>>  
> >>>           if (++cnt > DEFAULT_RETRY_QUOTA_FLUSH_COUNT) {
> >>>                   set_sbi_flag(sbi, SBI_QUOTA_SKIP_FLUSH);
> >>> -                 f2fs_lock_all(sbi);
> >>> +                 set_sbi_flag(sbi, SBI_QUOTA_NEED_FLUSH);
> >>>                   goto retry_flush_dents;
> >>>           }
> >>> -         clear_sbi_flag(sbi, SBI_QUOTA_NEED_FLUSH);
> >>> +         f2fs_unlock_all(sbi);
> >>>  
> >>>           /* only failed during mount/umount/freeze/quotactl */
> >>>           locked = down_read_trylock(&sbi->sb->s_umount);
> >>>           f2fs_quota_sync(sbi->sb, -1);
> >>>           if (locked)
> >>>                   up_read(&sbi->sb->s_umount);
> >>> - }
> >>> -
> >>> - f2fs_lock_all(sbi);
> >>> - if (__need_flush_quota(sbi)) {
> >>> -         f2fs_unlock_all(sbi);
> >>>           cond_resched();
> >>>           goto retry_flush_quotas;
> >>>   }
> >>> @@ -1201,12 +1204,6 @@ static int block_operations(struct f2fs_sb_info 
> >>> *sbi)
> >>>    */
> >>>   down_write(&sbi->node_change);
> >>>  
> >>> - if (__need_flush_quota(sbi)) {
> >>> -         up_write(&sbi->node_change);
> >>> -         f2fs_unlock_all(sbi);
> >>> -         goto retry_flush_quotas;
> >>> - }
> >>> -
> >>>   if (get_pages(sbi, F2FS_DIRTY_IMETA)) {
> >>>           up_write(&sbi->node_change);
> >>>           f2fs_unlock_all(sbi);
> >>> diff --git a/fs/f2fs/f2fs.h b/fs/f2fs/f2fs.h
> >>> index 9674a85154b2..9bd2bf0f559b 100644
> >>> --- a/fs/f2fs/f2fs.h
> >>> +++ b/fs/f2fs/f2fs.h
> >>> @@ -1253,6 +1253,7 @@ struct f2fs_sb_info {
> >>>   block_t unusable_block_count;           /* # of blocks saved by last cp 
> >>> */
> >>>  
> >>>   unsigned int nquota_files;              /* # of quota sysfile */
> >>> + struct rw_semaphore quota_sem;          /* blocking cp for flags */
> >>>  
> >>>   /* # of pages, see count_type */
> >>>   atomic_t nr_pages[NR_COUNT_TYPE];
> >>> diff --git a/fs/f2fs/super.c b/fs/f2fs/super.c
> >>> index 15d7e30bfc72..5a318399a2fa 100644
> >>> --- a/fs/f2fs/super.c
> >>> +++ b/fs/f2fs/super.c
> >>> @@ -1964,6 +1964,7 @@ int f2fs_quota_sync(struct super_block *sb, int 
> >>> type)
> >>>   int cnt;
> >>>   int ret;
> >>>  
> >>> + down_read(&sbi->quota_sem);
> >>>   ret = dquot_writeback_dquots(sb, type);
> >>>   if (ret)
> >>>           goto out;
> >>> @@ -2001,6 +2002,7 @@ int f2fs_quota_sync(struct super_block *sb, int 
> >>> type)
> >>>  out:
> >>>   if (ret)
> >>>           set_sbi_flag(F2FS_SB(sb), SBI_QUOTA_NEED_REPAIR);
> >>> + up_read(&sbi->quota_sem);
> >>>   return ret;
> >>>  }
> >>>  
> >>> @@ -2094,32 +2096,40 @@ static void 
> >>> f2fs_truncate_quota_inode_pages(struct super_block *sb)
> >>>  
> >>>  static int f2fs_dquot_commit(struct dquot *dquot)
> >>>  {
> >>> + struct f2fs_sb_info *sbi = F2FS_SB(dquot->dq_sb);
> >>>   int ret;
> >>>  
> >>> + down_read(&sbi->quota_sem);
> >>>   ret = dquot_commit(dquot);
> >>>   if (ret < 0)
> >>> -         set_sbi_flag(F2FS_SB(dquot->dq_sb), SBI_QUOTA_NEED_REPAIR);
> >>> +         set_sbi_flag(sbi, SBI_QUOTA_NEED_REPAIR);
> >>> + up_read(&sbi->quota_sem);
> >>>   return ret;
> >>>  }
> >>>  
> >>>  static int f2fs_dquot_acquire(struct dquot *dquot)
> >>>  {
> >>> + struct f2fs_sb_info *sbi = F2FS_SB(dquot->dq_sb);
> >>>   int ret;
> >>>  
> >>> + down_read(&sbi->quota_sem);
> >>>   ret = dquot_acquire(dquot);
> >>>   if (ret < 0)
> >>> -         set_sbi_flag(F2FS_SB(dquot->dq_sb), SBI_QUOTA_NEED_REPAIR);
> >>> -
> >>> +         set_sbi_flag(sbi, SBI_QUOTA_NEED_REPAIR);
> >>> + up_read(&sbi->quota_sem);
> >>>   return ret;
> >>>  }
> >>>  
> >>>  static int f2fs_dquot_release(struct dquot *dquot)
> >>>  {
> >>> + struct f2fs_sb_info *sbi = F2FS_SB(dquot->dq_sb);
> >>>   int ret;
> >>>  
> >>> + down_read(&sbi->quota_sem);
> >>>   ret = dquot_release(dquot);
> >>>   if (ret < 0)
> >>> -         set_sbi_flag(F2FS_SB(dquot->dq_sb), SBI_QUOTA_NEED_REPAIR);
> >>> +         set_sbi_flag(sbi, SBI_QUOTA_NEED_REPAIR);
> >>> + up_read(&sbi->quota_sem);
> >>>   return ret;
> >>>  }
> >>>  
> >>> @@ -2129,22 +2139,27 @@ static int f2fs_dquot_mark_dquot_dirty(struct 
> >>> dquot *dquot)
> >>>   struct f2fs_sb_info *sbi = F2FS_SB(sb);
> >>>   int ret;
> >>>  
> >>> + down_read(&sbi->quota_sem);
> >>>   ret = dquot_mark_dquot_dirty(dquot);
> >>>  
> >>>   /* if we are using journalled quota */
> >>>   if (is_journalled_quota(sbi))
> >>>           set_sbi_flag(sbi, SBI_QUOTA_NEED_FLUSH);
> >>>  
> >>> + up_read(&sbi->quota_sem);
> >>>   return ret;
> >>>  }
> >>>  
> >>>  static int f2fs_dquot_commit_info(struct super_block *sb, int type)
> >>>  {
> >>> + struct f2fs_sb_info *sbi = F2FS_SB(sb);
> >>>   int ret;
> >>>  
> >>> + down_read(&sbi->quota_sem);
> >>>   ret = dquot_commit_info(sb, type);
> >>>   if (ret < 0)
> >>> -         set_sbi_flag(F2FS_SB(sb), SBI_QUOTA_NEED_REPAIR);
> >>> +         set_sbi_flag(sbi, SBI_QUOTA_NEED_REPAIR);
> >>> + up_read(&sbi->quota_sem);
> >>>   return ret;
> >>>  }
> >>>  
> >>> @@ -3253,6 +3268,7 @@ static int f2fs_fill_super(struct super_block *sb, 
> >>> void *data, int silent)
> >>>   }
> >>>  
> >>>   init_rwsem(&sbi->cp_rwsem);
> >>> + init_rwsem(&sbi->quota_sem);
> >>>   init_waitqueue_head(&sbi->cp_wait);
> >>>   init_sb_info(sbi);
> >>>  
> >>>
> > .
> > 

Reply via email to