Skip to content

Commit d11cef1

Browse files
yonggilsong authored and Jaegeuk Kim committed
f2fs: Fix system crash due to lack of free space in LFS
When f2fs tries to checkpoint during foreground gc in LFS mode, system
crash occurs due to lack of free space if the amount of dirty node and
dentry pages generated by data migration exceeds free space.
The reproduction sequence is as follows.

 - 20GiB capacity block device (null_blk)
 - format and mount with LFS mode
 - create a file and write 20,000MiB
 - 4k random write on full range of the file

 RIP: 0010:new_curseg+0x48a/0x510 [f2fs]
 Code: 55 e7 f5 89 c0 48 0f af c3 48 8b 5d c0 48 c1 e8 20 83 c0 01 89 43 6c 48 83 c4 28 5b 41 5c 41 5d 41 5e 41 5f 5d c3 cc cc cc cc <0f> 0b f0 41 80 4f 48 04 45 85 f6 0f 84 ba fd ff ff e9 ef fe ff ff
 RSP: 0018:ffff977bc397b218 EFLAGS: 00010246
 RAX: 00000000000027b9 RBX: 0000000000000000 RCX: 00000000000027c0
 RDX: 0000000000000000 RSI: 00000000000027b9 RDI: ffff8c25ab4e74f8
 RBP: ffff977bc397b268 R08: 00000000000027b9 R09: ffff8c29e4a34b40
 R10: 0000000000000001 R11: ffff977bc397b0d8 R12: 0000000000000000
 R13: ffff8c25b4dd81a0 R14: 0000000000000000 R15: ffff8c2f667f9000
 FS: 0000000000000000(0000) GS:ffff8c344ec80000(0000) knlGS:0000000000000000
 CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033
 CR2: 000000c00055d000 CR3: 0000000e30810003 CR4: 00000000003706e0
 DR0: 0000000000000000 DR1: 0000000000000000 DR2: 0000000000000000
 DR3: 0000000000000000 DR6: 00000000fffe0ff0 DR7: 0000000000000400
 Call Trace:
 <TASK>
 allocate_segment_by_default+0x9c/0x110 [f2fs]
 f2fs_allocate_data_block+0x243/0xa30 [f2fs]
 ? __mod_lruvec_page_state+0xa0/0x150
 do_write_page+0x80/0x160 [f2fs]
 f2fs_do_write_node_page+0x32/0x50 [f2fs]
 __write_node_page+0x339/0x730 [f2fs]
 f2fs_sync_node_pages+0x5a6/0x780 [f2fs]
 block_operations+0x257/0x340 [f2fs]
 f2fs_write_checkpoint+0x102/0x1050 [f2fs]
 f2fs_gc+0x27c/0x630 [f2fs]
 ? folio_mark_dirty+0x36/0x70
 f2fs_balance_fs+0x16f/0x180 [f2fs]

This patch adds checking whether free sections are enough before checkpoint
during gc.
Signed-off-by: Yonggil Song <yonggil.song@samsung.com>
[Jaegeuk Kim: code clean-up]
Reviewed-by: Chao Yu <chao@kernel.org>
Signed-off-by: Jaegeuk Kim <jaegeuk@kernel.org>
1 parent 19e0e21 commit d11cef1

3 files changed

Lines changed: 40 additions & 11 deletions

File tree

fs/f2fs/gc.c

Lines changed: 8 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1805,6 +1805,7 @@ int f2fs_gc(struct f2fs_sb_info *sbi, struct f2fs_gc_control *gc_control)
18051805
.iroot = RADIX_TREE_INIT(gc_list.iroot, GFP_NOFS),
18061806
};
18071807
unsigned int skipped_round = 0, round = 0;
1808+
unsigned int upper_secs;
18081809

18091810
trace_f2fs_gc_begin(sbi->sb, gc_type, gc_control->no_bg_gc,
18101811
gc_control->nr_free_secs,
@@ -1890,8 +1891,13 @@ int f2fs_gc(struct f2fs_sb_info *sbi, struct f2fs_gc_control *gc_control)
18901891
}
18911892
}
18921893

1893-
/* Write checkpoint to reclaim prefree segments */
1894-
if (free_sections(sbi) < NR_CURSEG_PERSIST_TYPE &&
1894+
__get_secs_required(sbi, NULL, &upper_secs, NULL);
1895+
1896+
/*
1897+
* Write checkpoint to reclaim prefree segments.
1898+
* We need more three extra sections for writer's data/node/dentry.
1899+
*/
1900+
if (free_sections(sbi) <= upper_secs + NR_GC_CHECKPOINT_SECS &&
18951901
prefree_segments(sbi)) {
18961902
ret = f2fs_write_checkpoint(sbi, &cpc);
18971903
if (ret)

fs/f2fs/gc.h

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -30,6 +30,8 @@
3030
/* Search max. number of dirty segments to select a victim segment */
3131
#define DEF_MAX_VICTIM_SEARCH 4096 /* covers 8GB */
3232

33+
#define NR_GC_CHECKPOINT_SECS (3) /* data/node/dentry sections */
34+
3335
struct f2fs_gc_kthread {
3436
struct task_struct *f2fs_gc_task;
3537
wait_queue_head_t gc_wait_queue_head;

fs/f2fs/segment.h

Lines changed: 30 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -595,8 +595,12 @@ static inline bool has_curseg_enough_space(struct f2fs_sb_info *sbi,
595595
return true;
596596
}
597597

598-
static inline bool has_not_enough_free_secs(struct f2fs_sb_info *sbi,
599-
int freed, int needed)
598+
/*
599+
* calculate needed sections for dirty node/dentry
600+
* and call has_curseg_enough_space
601+
*/
602+
static inline void __get_secs_required(struct f2fs_sb_info *sbi,
603+
unsigned int *lower_p, unsigned int *upper_p, bool *curseg_p)
600604
{
601605
unsigned int total_node_blocks = get_pages(sbi, F2FS_DIRTY_NODES) +
602606
get_pages(sbi, F2FS_DIRTY_DENTS) +
@@ -606,20 +610,37 @@ static inline bool has_not_enough_free_secs(struct f2fs_sb_info *sbi,
606610
unsigned int dent_secs = total_dent_blocks / CAP_BLKS_PER_SEC(sbi);
607611
unsigned int node_blocks = total_node_blocks % CAP_BLKS_PER_SEC(sbi);
608612
unsigned int dent_blocks = total_dent_blocks % CAP_BLKS_PER_SEC(sbi);
609-
unsigned int free, need_lower, need_upper;
613+
614+
if (lower_p)
615+
*lower_p = node_secs + dent_secs;
616+
if (upper_p)
617+
*upper_p = node_secs + dent_secs +
618+
(node_blocks ? 1 : 0) + (dent_blocks ? 1 : 0);
619+
if (curseg_p)
620+
*curseg_p = has_curseg_enough_space(sbi,
621+
node_blocks, dent_blocks);
622+
}
623+
624+
static inline bool has_not_enough_free_secs(struct f2fs_sb_info *sbi,
625+
int freed, int needed)
626+
{
627+
unsigned int free_secs, lower_secs, upper_secs;
628+
bool curseg_space;
610629

611630
if (unlikely(is_sbi_flag_set(sbi, SBI_POR_DOING)))
612631
return false;
613632

614-
free = free_sections(sbi) + freed;
615-
need_lower = node_secs + dent_secs + reserved_sections(sbi) + needed;
616-
need_upper = need_lower + (node_blocks ? 1 : 0) + (dent_blocks ? 1 : 0);
633+
__get_secs_required(sbi, &lower_secs, &upper_secs, &curseg_space);
634+
635+
free_secs = free_sections(sbi) + freed;
636+
lower_secs += needed + reserved_sections(sbi);
637+
upper_secs += needed + reserved_sections(sbi);
617638

618-
if (free > need_upper)
639+
if (free_secs > upper_secs)
619640
return false;
620-
else if (free <= need_lower)
641+
else if (free_secs <= lower_secs)
621642
return true;
622-
return !has_curseg_enough_space(sbi, node_blocks, dent_blocks);
643+
return !curseg_space;
623644
}
624645

625646
static inline bool f2fs_is_checkpoint_ready(struct f2fs_sb_info *sbi)

0 commit comments

Comments
 (0)