blob: 12559a4b6c244470364f739dcda97585d2a99cd1 [file] [log] [blame]
Jaegeuk Kim0a8165d2012-11-29 13:28:09 +09001/*
Jaegeuk Kim127e6702012-11-02 17:08:18 +09002 * fs/f2fs/checkpoint.c
3 *
4 * Copyright (c) 2012 Samsung Electronics Co., Ltd.
5 * http://www.samsung.com/
6 *
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License version 2 as
9 * published by the Free Software Foundation.
10 */
11#include <linux/fs.h>
12#include <linux/bio.h>
13#include <linux/mpage.h>
14#include <linux/writeback.h>
15#include <linux/blkdev.h>
16#include <linux/f2fs_fs.h>
17#include <linux/pagevec.h>
18#include <linux/swap.h>
19
20#include "f2fs.h"
21#include "node.h"
22#include "segment.h"
Jaegeuk Kim9e4ded32014-12-17 19:58:58 -080023#include "trace.h"
Namjae Jeon2af4bd62013-04-23 18:26:54 +090024#include <trace/events/f2fs.h>
Jaegeuk Kim127e6702012-11-02 17:08:18 +090025
/* slab cache backing the struct ino_entry objects allocated in this file */
static struct kmem_cache *ino_entry_slab;
/* non-static slab cache; NOTE(review): users are outside this chunk */
struct kmem_cache *inode_entry_slab;
Jaegeuk Kim127e6702012-11-02 17:08:18 +090028
Jaegeuk Kim38f91ca2016-05-18 14:07:56 -070029void f2fs_stop_checkpoint(struct f2fs_sb_info *sbi, bool end_io)
30{
Chao Yuaaec2b12016-09-20 11:04:18 +080031 set_ckpt_flags(sbi, CP_ERROR_FLAG);
Jaegeuk Kim38f91ca2016-05-18 14:07:56 -070032 sbi->sb->s_flags |= MS_RDONLY;
33 if (!end_io)
Jaegeuk Kimb9109b02017-05-10 11:28:38 -070034 f2fs_flush_merged_writes(sbi);
Jaegeuk Kim38f91ca2016-05-18 14:07:56 -070035}
36
Jaegeuk Kim0a8165d2012-11-29 13:28:09 +090037/*
Jaegeuk Kim127e6702012-11-02 17:08:18 +090038 * We guarantee no failure on the returned page.
39 */
40struct page *grab_meta_page(struct f2fs_sb_info *sbi, pgoff_t index)
41{
Gu Zheng9df27d92014-01-20 18:37:04 +080042 struct address_space *mapping = META_MAPPING(sbi);
Jaegeuk Kim127e6702012-11-02 17:08:18 +090043 struct page *page = NULL;
44repeat:
Jaegeuk Kim300e1292016-04-29 16:11:53 -070045 page = f2fs_grab_cache_page(mapping, index, false);
Jaegeuk Kim127e6702012-11-02 17:08:18 +090046 if (!page) {
47 cond_resched();
48 goto repeat;
49 }
Jaegeuk Kimfec1d652016-01-20 23:43:51 +080050 f2fs_wait_on_page_writeback(page, META, true);
Jaegeuk Kim237c0792016-06-30 18:49:15 -070051 if (!PageUptodate(page))
52 SetPageUptodate(page);
Jaegeuk Kim127e6702012-11-02 17:08:18 +090053 return page;
54}
55
Jaegeuk Kim0a8165d2012-11-29 13:28:09 +090056/*
Jaegeuk Kim127e6702012-11-02 17:08:18 +090057 * We guarantee no failure on the returned page.
58 */
Chao Yu2b947002015-10-12 17:04:21 +080059static struct page *__get_meta_page(struct f2fs_sb_info *sbi, pgoff_t index,
60 bool is_meta)
Jaegeuk Kim127e6702012-11-02 17:08:18 +090061{
Gu Zheng9df27d92014-01-20 18:37:04 +080062 struct address_space *mapping = META_MAPPING(sbi);
Jaegeuk Kim127e6702012-11-02 17:08:18 +090063 struct page *page;
Jaegeuk Kimcf04e8e2014-12-17 19:33:13 -080064 struct f2fs_io_info fio = {
Jaegeuk Kim05ca3632015-04-23 14:38:15 -070065 .sbi = sbi,
Jaegeuk Kimcf04e8e2014-12-17 19:33:13 -080066 .type = META,
Mike Christie04d328d2016-06-05 14:31:55 -050067 .op = REQ_OP_READ,
Christoph Hellwig70fd7612016-11-01 07:40:10 -060068 .op_flags = REQ_META | REQ_PRIO,
Chao Yu7a9d7542016-02-22 18:36:38 +080069 .old_blkaddr = index,
70 .new_blkaddr = index,
Jaegeuk Kim4375a332015-04-23 12:04:33 -070071 .encrypted_page = NULL,
Jaegeuk Kimcf04e8e2014-12-17 19:33:13 -080072 };
Chao Yu2b947002015-10-12 17:04:21 +080073
74 if (unlikely(!is_meta))
Mike Christie04d328d2016-06-05 14:31:55 -050075 fio.op_flags &= ~REQ_META;
Jaegeuk Kim127e6702012-11-02 17:08:18 +090076repeat:
Jaegeuk Kim300e1292016-04-29 16:11:53 -070077 page = f2fs_grab_cache_page(mapping, index, false);
Jaegeuk Kim127e6702012-11-02 17:08:18 +090078 if (!page) {
79 cond_resched();
80 goto repeat;
81 }
Jaegeuk Kim393ff912013-03-08 21:29:23 +090082 if (PageUptodate(page))
83 goto out;
Jaegeuk Kim127e6702012-11-02 17:08:18 +090084
Jaegeuk Kim05ca3632015-04-23 14:38:15 -070085 fio.page = page;
86
Jaegeuk Kim86531d62015-07-15 13:08:21 -070087 if (f2fs_submit_page_bio(&fio)) {
88 f2fs_put_page(page, 1);
Jaegeuk Kim393ff912013-03-08 21:29:23 +090089 goto repeat;
Jaegeuk Kim86531d62015-07-15 13:08:21 -070090 }
Jaegeuk Kim393ff912013-03-08 21:29:23 +090091
92 lock_page(page);
Jaegeuk Kim6bacf522013-12-06 15:00:58 +090093 if (unlikely(page->mapping != mapping)) {
Jaegeuk Kimafcb7ca02013-04-26 11:55:17 +090094 f2fs_put_page(page, 1);
95 goto repeat;
96 }
Chao Yuf3f338c2015-07-29 17:33:13 +080097
98 /*
99 * if there is any IO error when accessing device, make our filesystem
100 * readonly and make sure do not write checkpoint with non-uptodate
101 * meta page.
102 */
103 if (unlikely(!PageUptodate(page)))
Jaegeuk Kim38f91ca2016-05-18 14:07:56 -0700104 f2fs_stop_checkpoint(sbi, false);
Jaegeuk Kim393ff912013-03-08 21:29:23 +0900105out:
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900106 return page;
107}
108
Chao Yu2b947002015-10-12 17:04:21 +0800109struct page *get_meta_page(struct f2fs_sb_info *sbi, pgoff_t index)
110{
111 return __get_meta_page(sbi, index, true);
112}
113
114/* for POR only */
115struct page *get_tmp_page(struct f2fs_sb_info *sbi, pgoff_t index)
116{
117 return __get_meta_page(sbi, index, false);
118}
119
Chao Yuf0c9cad2015-04-18 18:05:36 +0800120bool is_valid_blkaddr(struct f2fs_sb_info *sbi, block_t blkaddr, int type)
Chao Yu662befd2014-02-07 16:11:53 +0800121{
122 switch (type) {
123 case META_NAT:
Chao Yu66b00c12014-12-08 14:59:17 +0800124 break;
Chao Yu662befd2014-02-07 16:11:53 +0800125 case META_SIT:
Chao Yu66b00c12014-12-08 14:59:17 +0800126 if (unlikely(blkaddr >= SIT_BLK_CNT(sbi)))
127 return false;
128 break;
Chao Yu81c1a0f12014-02-27 19:12:24 +0800129 case META_SSA:
Chao Yu66b00c12014-12-08 14:59:17 +0800130 if (unlikely(blkaddr >= MAIN_BLKADDR(sbi) ||
131 blkaddr < SM_I(sbi)->ssa_blkaddr))
132 return false;
133 break;
Chao Yu662befd2014-02-07 16:11:53 +0800134 case META_CP:
Chao Yu66b00c12014-12-08 14:59:17 +0800135 if (unlikely(blkaddr >= SIT_I(sbi)->sit_base_addr ||
136 blkaddr < __start_cp_addr(sbi)))
137 return false;
138 break;
Jaegeuk Kim4c521f492014-09-11 13:49:55 -0700139 case META_POR:
Chao Yu66b00c12014-12-08 14:59:17 +0800140 if (unlikely(blkaddr >= MAX_BLKADDR(sbi) ||
141 blkaddr < MAIN_BLKADDR(sbi)))
142 return false;
143 break;
Chao Yu662befd2014-02-07 16:11:53 +0800144 default:
145 BUG();
146 }
Chao Yu66b00c12014-12-08 14:59:17 +0800147
148 return true;
Chao Yu662befd2014-02-07 16:11:53 +0800149}
150
151/*
Chao Yu81c1a0f12014-02-27 19:12:24 +0800152 * Readahead CP/NAT/SIT/SSA pages
Chao Yu662befd2014-02-07 16:11:53 +0800153 */
Chao Yu26879fb2015-10-12 17:05:59 +0800154int ra_meta_pages(struct f2fs_sb_info *sbi, block_t start, int nrpages,
155 int type, bool sync)
Chao Yu662befd2014-02-07 16:11:53 +0800156{
Chao Yu662befd2014-02-07 16:11:53 +0800157 struct page *page;
Jaegeuk Kim4c521f492014-09-11 13:49:55 -0700158 block_t blkno = start;
Chao Yu662befd2014-02-07 16:11:53 +0800159 struct f2fs_io_info fio = {
Jaegeuk Kim05ca3632015-04-23 14:38:15 -0700160 .sbi = sbi,
Chao Yu662befd2014-02-07 16:11:53 +0800161 .type = META,
Mike Christie04d328d2016-06-05 14:31:55 -0500162 .op = REQ_OP_READ,
Christoph Hellwig70fd7612016-11-01 07:40:10 -0600163 .op_flags = sync ? (REQ_META | REQ_PRIO) : REQ_RAHEAD,
Jaegeuk Kim4375a332015-04-23 12:04:33 -0700164 .encrypted_page = NULL,
Chao Yufb830fc2017-05-19 23:37:01 +0800165 .in_list = false,
Chao Yu662befd2014-02-07 16:11:53 +0800166 };
Chao Yue9f5b8b2016-02-14 18:54:33 +0800167 struct blk_plug plug;
Chao Yu662befd2014-02-07 16:11:53 +0800168
Chao Yu2b947002015-10-12 17:04:21 +0800169 if (unlikely(type == META_POR))
Mike Christie04d328d2016-06-05 14:31:55 -0500170 fio.op_flags &= ~REQ_META;
Chao Yu2b947002015-10-12 17:04:21 +0800171
Chao Yue9f5b8b2016-02-14 18:54:33 +0800172 blk_start_plug(&plug);
Chao Yu662befd2014-02-07 16:11:53 +0800173 for (; nrpages-- > 0; blkno++) {
Chao Yu662befd2014-02-07 16:11:53 +0800174
Chao Yu66b00c12014-12-08 14:59:17 +0800175 if (!is_valid_blkaddr(sbi, blkno, type))
176 goto out;
177
Chao Yu662befd2014-02-07 16:11:53 +0800178 switch (type) {
179 case META_NAT:
Chao Yu66b00c12014-12-08 14:59:17 +0800180 if (unlikely(blkno >=
181 NAT_BLOCK_OFFSET(NM_I(sbi)->max_nid)))
Chao Yu662befd2014-02-07 16:11:53 +0800182 blkno = 0;
Chao Yu66b00c12014-12-08 14:59:17 +0800183 /* get nat block addr */
Chao Yu7a9d7542016-02-22 18:36:38 +0800184 fio.new_blkaddr = current_nat_addr(sbi,
Chao Yu662befd2014-02-07 16:11:53 +0800185 blkno * NAT_ENTRY_PER_BLOCK);
186 break;
187 case META_SIT:
188 /* get sit block addr */
Chao Yu7a9d7542016-02-22 18:36:38 +0800189 fio.new_blkaddr = current_sit_addr(sbi,
Chao Yu662befd2014-02-07 16:11:53 +0800190 blkno * SIT_ENTRY_PER_BLOCK);
Chao Yu662befd2014-02-07 16:11:53 +0800191 break;
Chao Yu81c1a0f12014-02-27 19:12:24 +0800192 case META_SSA:
Chao Yu662befd2014-02-07 16:11:53 +0800193 case META_CP:
Jaegeuk Kim4c521f492014-09-11 13:49:55 -0700194 case META_POR:
Chao Yu7a9d7542016-02-22 18:36:38 +0800195 fio.new_blkaddr = blkno;
Chao Yu662befd2014-02-07 16:11:53 +0800196 break;
197 default:
198 BUG();
199 }
200
Jaegeuk Kim300e1292016-04-29 16:11:53 -0700201 page = f2fs_grab_cache_page(META_MAPPING(sbi),
202 fio.new_blkaddr, false);
Chao Yu662befd2014-02-07 16:11:53 +0800203 if (!page)
204 continue;
205 if (PageUptodate(page)) {
Chao Yu662befd2014-02-07 16:11:53 +0800206 f2fs_put_page(page, 1);
207 continue;
208 }
209
Jaegeuk Kim05ca3632015-04-23 14:38:15 -0700210 fio.page = page;
Jaegeuk Kim1919ffc2017-05-10 11:23:36 -0700211 f2fs_submit_page_bio(&fio);
Chao Yu662befd2014-02-07 16:11:53 +0800212 f2fs_put_page(page, 0);
213 }
214out:
Chao Yue9f5b8b2016-02-14 18:54:33 +0800215 blk_finish_plug(&plug);
Chao Yu662befd2014-02-07 16:11:53 +0800216 return blkno - start;
217}
218
Chao Yu635aee12014-12-08 15:02:52 +0800219void ra_meta_pages_cond(struct f2fs_sb_info *sbi, pgoff_t index)
220{
221 struct page *page;
222 bool readahead = false;
223
224 page = find_get_page(META_MAPPING(sbi), index);
Jaegeuk Kim4da7bf52016-04-06 11:27:03 -0700225 if (!page || !PageUptodate(page))
Chao Yu635aee12014-12-08 15:02:52 +0800226 readahead = true;
227 f2fs_put_page(page, 0);
228
229 if (readahead)
Jaegeuk Kim664ba972016-10-18 11:07:45 -0700230 ra_meta_pages(sbi, index, BIO_MAX_PAGES, META_POR, true);
Chao Yu635aee12014-12-08 15:02:52 +0800231}
232
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900233static int f2fs_write_meta_page(struct page *page,
234 struct writeback_control *wbc)
235{
Jaegeuk Kim40813632014-09-02 15:31:18 -0700236 struct f2fs_sb_info *sbi = F2FS_P_SB(page);
Jaegeuk Kim577e3492013-01-24 19:56:11 +0900237
Chao Yuecda0de2014-05-06 16:48:26 +0800238 trace_f2fs_writepage(page, META);
239
Chao Yucaf00472015-01-28 17:48:42 +0800240 if (unlikely(is_sbi_flag_set(sbi, SBI_POR_DOING)))
Chao Yucfb271d2013-12-05 17:15:22 +0800241 goto redirty_out;
Jaegeuk Kim857dc4e2014-11-19 11:03:34 -0800242 if (wbc->for_reclaim && page->index < GET_SUM_BLOCK(sbi, 0))
Chao Yucfb271d2013-12-05 17:15:22 +0800243 goto redirty_out;
Jaegeuk Kim1e968fd2014-08-11 16:49:25 -0700244 if (unlikely(f2fs_cp_error(sbi)))
Jaegeuk Kimcf779ca2014-08-11 18:37:46 -0700245 goto redirty_out;
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900246
Jaegeuk Kim577e3492013-01-24 19:56:11 +0900247 write_meta_page(sbi, page);
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900248 dec_page_count(sbi, F2FS_DIRTY_META);
Chao Yu0c3a5792016-01-18 18:28:11 +0800249
250 if (wbc->for_reclaim)
Jaegeuk Kimb9109b02017-05-10 11:28:38 -0700251 f2fs_submit_merged_write_cond(sbi, page->mapping->host,
252 0, page->index, META);
Chao Yu0c3a5792016-01-18 18:28:11 +0800253
Jaegeuk Kim577e3492013-01-24 19:56:11 +0900254 unlock_page(page);
Jaegeuk Kim857dc4e2014-11-19 11:03:34 -0800255
Chao Yu0c3a5792016-01-18 18:28:11 +0800256 if (unlikely(f2fs_cp_error(sbi)))
Jaegeuk Kimb9109b02017-05-10 11:28:38 -0700257 f2fs_submit_merged_write(sbi, META);
Chao Yu0c3a5792016-01-18 18:28:11 +0800258
Jaegeuk Kim577e3492013-01-24 19:56:11 +0900259 return 0;
Chao Yucfb271d2013-12-05 17:15:22 +0800260
261redirty_out:
Jaegeuk Kim76f60262014-04-15 16:04:15 +0900262 redirty_page_for_writepage(wbc, page);
Chao Yucfb271d2013-12-05 17:15:22 +0800263 return AOP_WRITEPAGE_ACTIVATE;
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900264}
265
266static int f2fs_write_meta_pages(struct address_space *mapping,
267 struct writeback_control *wbc)
268{
Jaegeuk Kim40813632014-09-02 15:31:18 -0700269 struct f2fs_sb_info *sbi = F2FS_M_SB(mapping);
Jaegeuk Kim50c8cdb2014-03-18 13:47:11 +0900270 long diff, written;
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900271
Jaegeuk Kim5459aa92013-12-17 17:28:41 +0900272 /* collect a number of dirty meta pages and write together */
Jaegeuk Kim50c8cdb2014-03-18 13:47:11 +0900273 if (wbc->for_kupdate ||
274 get_pages(sbi, F2FS_DIRTY_META) < nr_pages_to_skip(sbi, META))
Jaegeuk Kimd3baf952014-03-18 13:43:05 +0900275 goto skip_write;
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900276
Yunlei Hea29d0e02017-03-01 18:07:10 +0800277 /* if locked failed, cp will flush dirty pages instead */
278 if (!mutex_trylock(&sbi->cp_mutex))
279 goto skip_write;
Yunlei Hed31c7c32016-02-04 16:14:00 +0800280
Yunlei Hea29d0e02017-03-01 18:07:10 +0800281 trace_f2fs_writepages(mapping->host, wbc, META);
Jaegeuk Kim50c8cdb2014-03-18 13:47:11 +0900282 diff = nr_pages_to_write(sbi, META, wbc);
283 written = sync_meta_pages(sbi, META, wbc->nr_to_write);
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900284 mutex_unlock(&sbi->cp_mutex);
Jaegeuk Kim50c8cdb2014-03-18 13:47:11 +0900285 wbc->nr_to_write = max((long)0, wbc->nr_to_write - written - diff);
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900286 return 0;
Jaegeuk Kimd3baf952014-03-18 13:43:05 +0900287
288skip_write:
289 wbc->pages_skipped += get_pages(sbi, F2FS_DIRTY_META);
Yunlei Hed31c7c32016-02-04 16:14:00 +0800290 trace_f2fs_writepages(mapping->host, wbc, META);
Jaegeuk Kimd3baf952014-03-18 13:43:05 +0900291 return 0;
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900292}
293
294long sync_meta_pages(struct f2fs_sb_info *sbi, enum page_type type,
295 long nr_to_write)
296{
Gu Zheng9df27d92014-01-20 18:37:04 +0800297 struct address_space *mapping = META_MAPPING(sbi);
Chao Yu80dd9c02016-02-24 17:20:44 +0800298 pgoff_t index = 0, end = ULONG_MAX, prev = ULONG_MAX;
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900299 struct pagevec pvec;
300 long nwritten = 0;
301 struct writeback_control wbc = {
302 .for_reclaim = 0,
303 };
Chao Yue9f5b8b2016-02-14 18:54:33 +0800304 struct blk_plug plug;
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900305
306 pagevec_init(&pvec, 0);
307
Chao Yue9f5b8b2016-02-14 18:54:33 +0800308 blk_start_plug(&plug);
309
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900310 while (index <= end) {
311 int i, nr_pages;
312 nr_pages = pagevec_lookup_tag(&pvec, mapping, &index,
313 PAGECACHE_TAG_DIRTY,
314 min(end - index, (pgoff_t)PAGEVEC_SIZE-1) + 1);
Chao Yucfb271d2013-12-05 17:15:22 +0800315 if (unlikely(nr_pages == 0))
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900316 break;
317
318 for (i = 0; i < nr_pages; i++) {
319 struct page *page = pvec.pages[i];
Jaegeuk Kim203681f2014-02-05 13:03:57 +0900320
Chao Yu80dd9c02016-02-24 17:20:44 +0800321 if (prev == ULONG_MAX)
Jaegeuk Kim6066d8c2015-10-01 16:42:55 -0700322 prev = page->index - 1;
323 if (nr_to_write != LONG_MAX && page->index != prev + 1) {
324 pagevec_release(&pvec);
325 goto stop;
326 }
327
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900328 lock_page(page);
Jaegeuk Kim203681f2014-02-05 13:03:57 +0900329
330 if (unlikely(page->mapping != mapping)) {
331continue_unlock:
332 unlock_page(page);
333 continue;
334 }
335 if (!PageDirty(page)) {
336 /* someone wrote it for us */
337 goto continue_unlock;
338 }
339
Jaegeuk Kimfa3d2bd2016-01-28 11:48:52 -0800340 f2fs_wait_on_page_writeback(page, META, true);
341
342 BUG_ON(PageWriteback(page));
Jaegeuk Kim203681f2014-02-05 13:03:57 +0900343 if (!clear_page_dirty_for_io(page))
344 goto continue_unlock;
345
Chao Yu97dc3fd2015-02-16 16:19:22 +0800346 if (mapping->a_ops->writepage(page, &wbc)) {
Jaegeuk Kim577e3492013-01-24 19:56:11 +0900347 unlock_page(page);
348 break;
349 }
Chao Yucfb271d2013-12-05 17:15:22 +0800350 nwritten++;
Jaegeuk Kim6066d8c2015-10-01 16:42:55 -0700351 prev = page->index;
Chao Yucfb271d2013-12-05 17:15:22 +0800352 if (unlikely(nwritten >= nr_to_write))
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900353 break;
354 }
355 pagevec_release(&pvec);
356 cond_resched();
357 }
Jaegeuk Kim6066d8c2015-10-01 16:42:55 -0700358stop:
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900359 if (nwritten)
Jaegeuk Kimb9109b02017-05-10 11:28:38 -0700360 f2fs_submit_merged_write(sbi, type);
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900361
Chao Yue9f5b8b2016-02-14 18:54:33 +0800362 blk_finish_plug(&plug);
363
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900364 return nwritten;
365}
366
367static int f2fs_set_meta_page_dirty(struct page *page)
368{
Jaegeuk Kim26c6b882013-10-24 17:53:29 +0900369 trace_f2fs_set_page_dirty(page, META);
370
Jaegeuk Kim237c0792016-06-30 18:49:15 -0700371 if (!PageUptodate(page))
372 SetPageUptodate(page);
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900373 if (!PageDirty(page)) {
Jaegeuk Kimfe76b792016-06-30 18:40:10 -0700374 f2fs_set_page_dirty_nobuffers(page);
Jaegeuk Kim40813632014-09-02 15:31:18 -0700375 inc_page_count(F2FS_P_SB(page), F2FS_DIRTY_META);
Chao Yu16018392015-01-19 20:24:37 +0800376 SetPagePrivate(page);
Jaegeuk Kim9e4ded32014-12-17 19:58:58 -0800377 f2fs_trace_pid(page);
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900378 return 1;
379 }
380 return 0;
381}
382
383const struct address_space_operations f2fs_meta_aops = {
384 .writepage = f2fs_write_meta_page,
385 .writepages = f2fs_write_meta_pages,
386 .set_page_dirty = f2fs_set_meta_page_dirty,
Chao Yu487261f2015-02-05 17:44:29 +0800387 .invalidatepage = f2fs_invalidate_page,
388 .releasepage = f2fs_release_page,
Weichao Guo5b7a4872016-09-20 05:03:27 +0800389#ifdef CONFIG_MIGRATION
390 .migratepage = f2fs_migrate_page,
391#endif
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900392};
393
Jaegeuk Kim6451e042014-07-25 15:47:17 -0700394static void __add_ino_entry(struct f2fs_sb_info *sbi, nid_t ino, int type)
Jaegeuk Kim953e6cc2014-07-25 15:47:16 -0700395{
Chao Yu67298802014-11-18 11:18:36 +0800396 struct inode_management *im = &sbi->im[type];
Jaegeuk Kim80c54502015-08-20 08:51:56 -0700397 struct ino_entry *e, *tmp;
398
399 tmp = f2fs_kmem_cache_alloc(ino_entry_slab, GFP_NOFS);
Jaegeuk Kim39efac42014-07-24 18:15:17 -0700400retry:
Jaegeuk Kim80c54502015-08-20 08:51:56 -0700401 radix_tree_preload(GFP_NOFS | __GFP_NOFAIL);
Jaegeuk Kim769ec6e2014-12-03 20:47:26 -0800402
Chao Yu67298802014-11-18 11:18:36 +0800403 spin_lock(&im->ino_lock);
Chao Yu67298802014-11-18 11:18:36 +0800404 e = radix_tree_lookup(&im->ino_root, ino);
Jaegeuk Kim39efac42014-07-24 18:15:17 -0700405 if (!e) {
Jaegeuk Kim80c54502015-08-20 08:51:56 -0700406 e = tmp;
Chao Yu67298802014-11-18 11:18:36 +0800407 if (radix_tree_insert(&im->ino_root, ino, e)) {
408 spin_unlock(&im->ino_lock);
Jaegeuk Kim769ec6e2014-12-03 20:47:26 -0800409 radix_tree_preload_end();
Jaegeuk Kim39efac42014-07-24 18:15:17 -0700410 goto retry;
411 }
412 memset(e, 0, sizeof(struct ino_entry));
413 e->ino = ino;
414
Chao Yu67298802014-11-18 11:18:36 +0800415 list_add_tail(&e->list, &im->ino_list);
Jaegeuk Kim8c402942014-11-06 15:16:04 -0800416 if (type != ORPHAN_INO)
Chao Yu67298802014-11-18 11:18:36 +0800417 im->ino_num++;
Jaegeuk Kim39efac42014-07-24 18:15:17 -0700418 }
Chao Yu67298802014-11-18 11:18:36 +0800419 spin_unlock(&im->ino_lock);
Jaegeuk Kim769ec6e2014-12-03 20:47:26 -0800420 radix_tree_preload_end();
Jaegeuk Kim80c54502015-08-20 08:51:56 -0700421
422 if (e != tmp)
423 kmem_cache_free(ino_entry_slab, tmp);
Jaegeuk Kim953e6cc2014-07-25 15:47:16 -0700424}
425
Jaegeuk Kim6451e042014-07-25 15:47:17 -0700426static void __remove_ino_entry(struct f2fs_sb_info *sbi, nid_t ino, int type)
Jaegeuk Kim953e6cc2014-07-25 15:47:16 -0700427{
Chao Yu67298802014-11-18 11:18:36 +0800428 struct inode_management *im = &sbi->im[type];
Jaegeuk Kim6451e042014-07-25 15:47:17 -0700429 struct ino_entry *e;
Jaegeuk Kim953e6cc2014-07-25 15:47:16 -0700430
Chao Yu67298802014-11-18 11:18:36 +0800431 spin_lock(&im->ino_lock);
432 e = radix_tree_lookup(&im->ino_root, ino);
Jaegeuk Kim39efac42014-07-24 18:15:17 -0700433 if (e) {
434 list_del(&e->list);
Chao Yu67298802014-11-18 11:18:36 +0800435 radix_tree_delete(&im->ino_root, ino);
436 im->ino_num--;
437 spin_unlock(&im->ino_lock);
Jaegeuk Kim39efac42014-07-24 18:15:17 -0700438 kmem_cache_free(ino_entry_slab, e);
439 return;
Jaegeuk Kim953e6cc2014-07-25 15:47:16 -0700440 }
Chao Yu67298802014-11-18 11:18:36 +0800441 spin_unlock(&im->ino_lock);
Jaegeuk Kim953e6cc2014-07-25 15:47:16 -0700442}
443
Chao Yua49324f2015-12-15 13:29:47 +0800444void add_ino_entry(struct f2fs_sb_info *sbi, nid_t ino, int type)
Jaegeuk Kimfff04f92014-07-25 07:40:59 -0700445{
446 /* add new dirty ino entry into list */
447 __add_ino_entry(sbi, ino, type);
448}
449
Chao Yua49324f2015-12-15 13:29:47 +0800450void remove_ino_entry(struct f2fs_sb_info *sbi, nid_t ino, int type)
Jaegeuk Kimfff04f92014-07-25 07:40:59 -0700451{
452 /* remove dirty ino entry from list */
453 __remove_ino_entry(sbi, ino, type);
454}
455
456/* mode should be APPEND_INO or UPDATE_INO */
457bool exist_written_data(struct f2fs_sb_info *sbi, nid_t ino, int mode)
458{
Chao Yu67298802014-11-18 11:18:36 +0800459 struct inode_management *im = &sbi->im[mode];
Jaegeuk Kimfff04f92014-07-25 07:40:59 -0700460 struct ino_entry *e;
Chao Yu67298802014-11-18 11:18:36 +0800461
462 spin_lock(&im->ino_lock);
463 e = radix_tree_lookup(&im->ino_root, ino);
464 spin_unlock(&im->ino_lock);
Jaegeuk Kimfff04f92014-07-25 07:40:59 -0700465 return e ? true : false;
466}
467
Jaegeuk Kim74ef9242016-05-02 22:09:56 -0700468void release_ino_entry(struct f2fs_sb_info *sbi, bool all)
Jaegeuk Kimfff04f92014-07-25 07:40:59 -0700469{
470 struct ino_entry *e, *tmp;
471 int i;
472
Jaegeuk Kim74ef9242016-05-02 22:09:56 -0700473 for (i = all ? ORPHAN_INO: APPEND_INO; i <= UPDATE_INO; i++) {
Chao Yu67298802014-11-18 11:18:36 +0800474 struct inode_management *im = &sbi->im[i];
475
476 spin_lock(&im->ino_lock);
477 list_for_each_entry_safe(e, tmp, &im->ino_list, list) {
Jaegeuk Kimfff04f92014-07-25 07:40:59 -0700478 list_del(&e->list);
Chao Yu67298802014-11-18 11:18:36 +0800479 radix_tree_delete(&im->ino_root, e->ino);
Jaegeuk Kimfff04f92014-07-25 07:40:59 -0700480 kmem_cache_free(ino_entry_slab, e);
Chao Yu67298802014-11-18 11:18:36 +0800481 im->ino_num--;
Jaegeuk Kimfff04f92014-07-25 07:40:59 -0700482 }
Chao Yu67298802014-11-18 11:18:36 +0800483 spin_unlock(&im->ino_lock);
Jaegeuk Kimfff04f92014-07-25 07:40:59 -0700484 }
485}
486
Jaegeuk Kimcbd56e72013-07-30 11:36:53 +0900487int acquire_orphan_inode(struct f2fs_sb_info *sbi)
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900488{
Chao Yu67298802014-11-18 11:18:36 +0800489 struct inode_management *im = &sbi->im[ORPHAN_INO];
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900490 int err = 0;
491
Chao Yu67298802014-11-18 11:18:36 +0800492 spin_lock(&im->ino_lock);
Jaegeuk Kimcb789422016-04-29 16:29:22 -0700493
494#ifdef CONFIG_F2FS_FAULT_INJECTION
Chao Yu1ecc0c52016-09-23 21:30:09 +0800495 if (time_to_inject(sbi, FAULT_ORPHAN)) {
Jaegeuk Kimcb789422016-04-29 16:29:22 -0700496 spin_unlock(&im->ino_lock);
Chao Yu55523512017-02-25 11:08:28 +0800497 f2fs_show_injection_info(FAULT_ORPHAN);
Jaegeuk Kimcb789422016-04-29 16:29:22 -0700498 return -ENOSPC;
499 }
500#endif
Chao Yu67298802014-11-18 11:18:36 +0800501 if (unlikely(im->ino_num >= sbi->max_orphans))
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900502 err = -ENOSPC;
Jaegeuk Kimcbd56e72013-07-30 11:36:53 +0900503 else
Chao Yu67298802014-11-18 11:18:36 +0800504 im->ino_num++;
505 spin_unlock(&im->ino_lock);
Gu Zheng0d47c1a2013-12-26 18:24:19 +0800506
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900507 return err;
508}
509
Jaegeuk Kimcbd56e72013-07-30 11:36:53 +0900510void release_orphan_inode(struct f2fs_sb_info *sbi)
511{
Chao Yu67298802014-11-18 11:18:36 +0800512 struct inode_management *im = &sbi->im[ORPHAN_INO];
513
514 spin_lock(&im->ino_lock);
515 f2fs_bug_on(sbi, im->ino_num == 0);
516 im->ino_num--;
517 spin_unlock(&im->ino_lock);
Jaegeuk Kimcbd56e72013-07-30 11:36:53 +0900518}
519
Jaegeuk Kim67c37582016-06-13 18:27:02 -0700520void add_orphan_inode(struct inode *inode)
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900521{
Jaegeuk Kim39efac42014-07-24 18:15:17 -0700522 /* add new orphan ino entry into list */
Jaegeuk Kim67c37582016-06-13 18:27:02 -0700523 __add_ino_entry(F2FS_I_SB(inode), inode->i_ino, ORPHAN_INO);
524 update_inode_page(inode);
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900525}
526
527void remove_orphan_inode(struct f2fs_sb_info *sbi, nid_t ino)
528{
Jaegeuk Kim953e6cc2014-07-25 15:47:16 -0700529 /* remove orphan entry from orphan list */
Jaegeuk Kim6451e042014-07-25 15:47:17 -0700530 __remove_ino_entry(sbi, ino, ORPHAN_INO);
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900531}
532
Chao Yu8c14bfa2015-08-07 17:58:43 +0800533static int recover_orphan_inode(struct f2fs_sb_info *sbi, nid_t ino)
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900534{
Chao Yu8c14bfa2015-08-07 17:58:43 +0800535 struct inode *inode;
Jaegeuk Kim5905f9a2016-09-12 15:08:37 -0700536 struct node_info ni;
Jaegeuk Kimd41065e2016-09-21 11:39:42 -0700537 int err = acquire_orphan_inode(sbi);
538
539 if (err) {
540 set_sbi_flag(sbi, SBI_NEED_FSCK);
541 f2fs_msg(sbi->sb, KERN_WARNING,
542 "%s: orphan failed (ino=%x), run fsck to fix.",
543 __func__, ino);
544 return err;
545 }
546
547 __add_ino_entry(sbi, ino, ORPHAN_INO);
Chao Yu8c14bfa2015-08-07 17:58:43 +0800548
Jaegeuk Kim5905f9a2016-09-12 15:08:37 -0700549 inode = f2fs_iget_retry(sbi->sb, ino);
Chao Yu8c14bfa2015-08-07 17:58:43 +0800550 if (IS_ERR(inode)) {
551 /*
552 * there should be a bug that we can't find the entry
553 * to orphan inode.
554 */
555 f2fs_bug_on(sbi, PTR_ERR(inode) == -ENOENT);
556 return PTR_ERR(inode);
557 }
558
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900559 clear_nlink(inode);
560
561 /* truncate all the data during iput */
562 iput(inode);
Jaegeuk Kim5905f9a2016-09-12 15:08:37 -0700563
564 get_node_info(sbi, ino, &ni);
565
566 /* ENOMEM was fully retried in f2fs_evict_inode. */
567 if (ni.blk_addr != NULL_ADDR) {
Jaegeuk Kimd41065e2016-09-21 11:39:42 -0700568 set_sbi_flag(sbi, SBI_NEED_FSCK);
569 f2fs_msg(sbi->sb, KERN_WARNING,
Jaegeuk Kim5ce47382017-03-07 13:54:56 -0800570 "%s: orphan failed (ino=%x) by kernel, retry mount.",
Jaegeuk Kimd41065e2016-09-21 11:39:42 -0700571 __func__, ino);
572 return -EIO;
Jaegeuk Kim5905f9a2016-09-12 15:08:37 -0700573 }
Jaegeuk Kimd41065e2016-09-21 11:39:42 -0700574 __remove_ino_entry(sbi, ino, ORPHAN_INO);
Chao Yu8c14bfa2015-08-07 17:58:43 +0800575 return 0;
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900576}
577
Chao Yu8c14bfa2015-08-07 17:58:43 +0800578int recover_orphan_inodes(struct f2fs_sb_info *sbi)
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900579{
Wanpeng Li3c642982015-02-26 07:57:21 +0800580 block_t start_blk, orphan_blocks, i, j;
Chao Yu8c14bfa2015-08-07 17:58:43 +0800581 int err;
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900582
Chao Yuaaec2b12016-09-20 11:04:18 +0800583 if (!is_set_ckpt_flags(sbi, CP_ORPHAN_PRESENT_FLAG))
Chao Yu8c14bfa2015-08-07 17:58:43 +0800584 return 0;
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900585
Wanpeng Li55141482015-02-26 07:57:20 +0800586 start_blk = __start_cp_addr(sbi) + 1 + __cp_payload(sbi);
Wanpeng Li3c642982015-02-26 07:57:21 +0800587 orphan_blocks = __start_sum_addr(sbi) - 1 - __cp_payload(sbi);
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900588
Chao Yu26879fb2015-10-12 17:05:59 +0800589 ra_meta_pages(sbi, start_blk, orphan_blocks, META_CP, true);
Chao Yu662befd2014-02-07 16:11:53 +0800590
Wanpeng Li3c642982015-02-26 07:57:21 +0800591 for (i = 0; i < orphan_blocks; i++) {
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900592 struct page *page = get_meta_page(sbi, start_blk + i);
593 struct f2fs_orphan_block *orphan_blk;
594
595 orphan_blk = (struct f2fs_orphan_block *)page_address(page);
596 for (j = 0; j < le32_to_cpu(orphan_blk->entry_count); j++) {
597 nid_t ino = le32_to_cpu(orphan_blk->ino[j]);
Chao Yu8c14bfa2015-08-07 17:58:43 +0800598 err = recover_orphan_inode(sbi, ino);
599 if (err) {
600 f2fs_put_page(page, 1);
Chao Yu8c14bfa2015-08-07 17:58:43 +0800601 return err;
602 }
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900603 }
604 f2fs_put_page(page, 1);
605 }
606 /* clear Orphan Flag */
Chao Yuaaec2b12016-09-20 11:04:18 +0800607 clear_ckpt_flags(sbi, CP_ORPHAN_PRESENT_FLAG);
Chao Yu8c14bfa2015-08-07 17:58:43 +0800608 return 0;
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900609}
610
611static void write_orphan_inodes(struct f2fs_sb_info *sbi, block_t start_blk)
612{
Gu Zheng502c6e02013-11-19 18:03:58 +0800613 struct list_head *head;
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900614 struct f2fs_orphan_block *orphan_blk = NULL;
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900615 unsigned int nentries = 0;
Chao Yubd936f82015-07-13 17:44:25 +0800616 unsigned short index = 1;
Jaegeuk Kim8c402942014-11-06 15:16:04 -0800617 unsigned short orphan_blocks;
Gu Zheng45319292014-01-10 18:09:02 +0800618 struct page *page = NULL;
Jaegeuk Kim6451e042014-07-25 15:47:17 -0700619 struct ino_entry *orphan = NULL;
Chao Yu67298802014-11-18 11:18:36 +0800620 struct inode_management *im = &sbi->im[ORPHAN_INO];
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900621
Chao Yu67298802014-11-18 11:18:36 +0800622 orphan_blocks = GET_ORPHAN_BLOCKS(im->ino_num);
Jaegeuk Kim8c402942014-11-06 15:16:04 -0800623
Jaegeuk Kimd6c67a42015-05-01 11:08:59 -0700624 /*
625 * we don't need to do spin_lock(&im->ino_lock) here, since all the
626 * orphan inode operations are covered under f2fs_lock_op().
627 * And, spin_lock should be avoided due to page operations below.
628 */
Chao Yu67298802014-11-18 11:18:36 +0800629 head = &im->ino_list;
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900630
631 /* loop for each orphan inode entry and write them in Jornal block */
Gu Zheng502c6e02013-11-19 18:03:58 +0800632 list_for_each_entry(orphan, head, list) {
633 if (!page) {
Chao Yubd936f82015-07-13 17:44:25 +0800634 page = grab_meta_page(sbi, start_blk++);
Gu Zheng502c6e02013-11-19 18:03:58 +0800635 orphan_blk =
636 (struct f2fs_orphan_block *)page_address(page);
637 memset(orphan_blk, 0, sizeof(*orphan_blk));
638 }
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900639
Gu Zheng36795562013-11-26 16:44:16 +0800640 orphan_blk->ino[nentries++] = cpu_to_le32(orphan->ino);
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900641
Gu Zheng36795562013-11-26 16:44:16 +0800642 if (nentries == F2FS_ORPHANS_PER_BLOCK) {
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900643 /*
644 * an orphan block is full of 1020 entries,
645 * then we need to flush current orphan blocks
646 * and bring another one in memory
647 */
648 orphan_blk->blk_addr = cpu_to_le16(index);
649 orphan_blk->blk_count = cpu_to_le16(orphan_blocks);
650 orphan_blk->entry_count = cpu_to_le32(nentries);
651 set_page_dirty(page);
652 f2fs_put_page(page, 1);
653 index++;
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900654 nentries = 0;
655 page = NULL;
656 }
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900657 }
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900658
Gu Zheng502c6e02013-11-19 18:03:58 +0800659 if (page) {
660 orphan_blk->blk_addr = cpu_to_le16(index);
661 orphan_blk->blk_count = cpu_to_le16(orphan_blocks);
662 orphan_blk->entry_count = cpu_to_le32(nentries);
663 set_page_dirty(page);
664 f2fs_put_page(page, 1);
665 }
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900666}
667
Tiezhu Yangfc0065a2016-09-30 08:24:53 +0800668static int get_checkpoint_version(struct f2fs_sb_info *sbi, block_t cp_addr,
669 struct f2fs_checkpoint **cp_block, struct page **cp_page,
670 unsigned long long *version)
671{
672 unsigned long blk_size = sbi->blocksize;
673 size_t crc_offset = 0;
674 __u32 crc = 0;
675
676 *cp_page = get_meta_page(sbi, cp_addr);
677 *cp_block = (struct f2fs_checkpoint *)page_address(*cp_page);
678
679 crc_offset = le32_to_cpu((*cp_block)->checksum_offset);
Kinglong Meec6f89df2017-03-15 21:12:50 +0800680 if (crc_offset > (blk_size - sizeof(__le32))) {
Tiezhu Yangfc0065a2016-09-30 08:24:53 +0800681 f2fs_msg(sbi->sb, KERN_WARNING,
682 "invalid crc_offset: %zu", crc_offset);
683 return -EINVAL;
684 }
685
Kinglong Meeced2c7e2017-02-25 19:53:39 +0800686 crc = cur_cp_crc(*cp_block);
Tiezhu Yangfc0065a2016-09-30 08:24:53 +0800687 if (!f2fs_crc_valid(sbi, crc, *cp_block, crc_offset)) {
688 f2fs_msg(sbi->sb, KERN_WARNING, "invalid crc value");
689 return -EINVAL;
690 }
691
692 *version = cur_cp_version(*cp_block);
693 return 0;
694}
695
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900696static struct page *validate_checkpoint(struct f2fs_sb_info *sbi,
697 block_t cp_addr, unsigned long long *version)
698{
Tiezhu Yangfc0065a2016-09-30 08:24:53 +0800699 struct page *cp_page_1 = NULL, *cp_page_2 = NULL;
700 struct f2fs_checkpoint *cp_block = NULL;
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900701 unsigned long long cur_version = 0, pre_version = 0;
Tiezhu Yangfc0065a2016-09-30 08:24:53 +0800702 int err;
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900703
Tiezhu Yangfc0065a2016-09-30 08:24:53 +0800704 err = get_checkpoint_version(sbi, cp_addr, &cp_block,
705 &cp_page_1, version);
706 if (err)
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900707 goto invalid_cp1;
Tiezhu Yangfc0065a2016-09-30 08:24:53 +0800708 pre_version = *version;
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900709
Jaegeuk Kim25ca9232012-11-28 16:12:41 +0900710 cp_addr += le32_to_cpu(cp_block->cp_pack_total_block_count) - 1;
Tiezhu Yangfc0065a2016-09-30 08:24:53 +0800711 err = get_checkpoint_version(sbi, cp_addr, &cp_block,
712 &cp_page_2, version);
713 if (err)
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900714 goto invalid_cp2;
Tiezhu Yangfc0065a2016-09-30 08:24:53 +0800715 cur_version = *version;
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900716
717 if (cur_version == pre_version) {
718 *version = cur_version;
719 f2fs_put_page(cp_page_2, 1);
720 return cp_page_1;
721 }
722invalid_cp2:
723 f2fs_put_page(cp_page_2, 1);
724invalid_cp1:
725 f2fs_put_page(cp_page_1, 1);
726 return NULL;
727}
728
729int get_valid_checkpoint(struct f2fs_sb_info *sbi)
730{
731 struct f2fs_checkpoint *cp_block;
732 struct f2fs_super_block *fsb = sbi->raw_super;
733 struct page *cp1, *cp2, *cur_page;
734 unsigned long blk_size = sbi->blocksize;
735 unsigned long long cp1_version = 0, cp2_version = 0;
736 unsigned long long cp_start_blk_no;
Wanpeng Li55141482015-02-26 07:57:20 +0800737 unsigned int cp_blks = 1 + __cp_payload(sbi);
Changman Lee1dbe4152014-05-12 12:27:43 +0900738 block_t cp_blk_no;
739 int i;
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900740
Changman Lee1dbe4152014-05-12 12:27:43 +0900741 sbi->ckpt = kzalloc(cp_blks * blk_size, GFP_KERNEL);
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900742 if (!sbi->ckpt)
743 return -ENOMEM;
744 /*
745 * Finding out valid cp block involves read both
746 * sets( cp pack1 and cp pack 2)
747 */
748 cp_start_blk_no = le32_to_cpu(fsb->cp_blkaddr);
749 cp1 = validate_checkpoint(sbi, cp_start_blk_no, &cp1_version);
750
751 /* The second checkpoint pack should start at the next segment */
Jaegeuk Kimf9a4e6d2013-11-28 12:44:05 +0900752 cp_start_blk_no += ((unsigned long long)1) <<
753 le32_to_cpu(fsb->log_blocks_per_seg);
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900754 cp2 = validate_checkpoint(sbi, cp_start_blk_no, &cp2_version);
755
756 if (cp1 && cp2) {
757 if (ver_after(cp2_version, cp1_version))
758 cur_page = cp2;
759 else
760 cur_page = cp1;
761 } else if (cp1) {
762 cur_page = cp1;
763 } else if (cp2) {
764 cur_page = cp2;
765 } else {
766 goto fail_no_cp;
767 }
768
769 cp_block = (struct f2fs_checkpoint *)page_address(cur_page);
770 memcpy(sbi->ckpt, cp_block, blk_size);
771
Shawn Lin984ec632016-02-17 11:26:32 +0800772 /* Sanity checking of checkpoint */
773 if (sanity_check_ckpt(sbi))
Jaegeuk Kima2125ff2016-12-05 17:25:32 -0800774 goto free_fail_no_cp;
Shawn Lin984ec632016-02-17 11:26:32 +0800775
Jaegeuk Kim8508e442016-11-24 12:45:15 -0800776 if (cur_page == cp1)
777 sbi->cur_cp_pack = 1;
778 else
779 sbi->cur_cp_pack = 2;
Changman Lee1dbe4152014-05-12 12:27:43 +0900780
781 if (cp_blks <= 1)
782 goto done;
783
784 cp_blk_no = le32_to_cpu(fsb->cp_blkaddr);
785 if (cur_page == cp2)
786 cp_blk_no += 1 << le32_to_cpu(fsb->log_blocks_per_seg);
787
788 for (i = 1; i < cp_blks; i++) {
789 void *sit_bitmap_ptr;
790 unsigned char *ckpt = (unsigned char *)sbi->ckpt;
791
792 cur_page = get_meta_page(sbi, cp_blk_no + i);
793 sit_bitmap_ptr = page_address(cur_page);
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900794 memcpy(ckpt + i * blk_size, sit_bitmap_ptr, blk_size);
795 f2fs_put_page(cur_page, 1);
796 }
797done:
798 f2fs_put_page(cp1, 1);
799 f2fs_put_page(cp2, 1);
800 return 0;
801
Jaegeuk Kima2125ff2016-12-05 17:25:32 -0800802free_fail_no_cp:
803 f2fs_put_page(cp1, 1);
804 f2fs_put_page(cp2, 1);
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900805fail_no_cp:
806 kfree(sbi->ckpt);
807 return -EINVAL;
808}
809
Chao Yuc227f912015-12-16 13:09:20 +0800810static void __add_dirty_inode(struct inode *inode, enum inode_type type)
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900811{
Jaegeuk Kim40813632014-09-02 15:31:18 -0700812 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
Chao Yuc227f912015-12-16 13:09:20 +0800813 int flag = (type == DIR_INODE) ? FI_DIRTY_DIR : FI_DIRTY_FILE;
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900814
Jaegeuk Kim91942322016-05-20 10:13:22 -0700815 if (is_inode_flag_set(inode, flag))
Chao Yu2710fd72015-12-15 13:30:45 +0800816 return;
Chao Yu2d7b8222014-03-29 11:33:17 +0800817
Jaegeuk Kim91942322016-05-20 10:13:22 -0700818 set_inode_flag(inode, flag);
Chao Yu99f4b912017-03-22 17:23:46 +0800819 if (!f2fs_is_volatile_file(inode))
820 list_add_tail(&F2FS_I(inode)->dirty_list,
821 &sbi->inode_list[type]);
Chao Yu33fbd512015-12-17 17:14:44 +0800822 stat_inc_dirty_inode(sbi, type);
Jaegeuk Kim5deb8262013-06-05 17:42:45 +0900823}
824
Chao Yuc227f912015-12-16 13:09:20 +0800825static void __remove_dirty_inode(struct inode *inode, enum inode_type type)
Chao Yu6ad76092015-12-15 13:31:40 +0800826{
Chao Yuc227f912015-12-16 13:09:20 +0800827 int flag = (type == DIR_INODE) ? FI_DIRTY_DIR : FI_DIRTY_FILE;
Chao Yu6ad76092015-12-15 13:31:40 +0800828
Jaegeuk Kim91942322016-05-20 10:13:22 -0700829 if (get_dirty_pages(inode) || !is_inode_flag_set(inode, flag))
Chao Yu6ad76092015-12-15 13:31:40 +0800830 return;
831
Jaegeuk Kim91942322016-05-20 10:13:22 -0700832 list_del_init(&F2FS_I(inode)->dirty_list);
833 clear_inode_flag(inode, flag);
Chao Yu33fbd512015-12-17 17:14:44 +0800834 stat_dec_dirty_inode(F2FS_I_SB(inode), type);
Chao Yu6ad76092015-12-15 13:31:40 +0800835}
836
Jaegeuk Kima7ffdbe2014-09-12 15:53:45 -0700837void update_dirty_page(struct inode *inode, struct page *page)
Jaegeuk Kim5deb8262013-06-05 17:42:45 +0900838{
Jaegeuk Kim40813632014-09-02 15:31:18 -0700839 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
Chao Yuc227f912015-12-16 13:09:20 +0800840 enum inode_type type = S_ISDIR(inode->i_mode) ? DIR_INODE : FILE_INODE;
Jaegeuk Kim5deb8262013-06-05 17:42:45 +0900841
Chao Yu5ac9f362015-06-29 18:14:10 +0800842 if (!S_ISDIR(inode->i_mode) && !S_ISREG(inode->i_mode) &&
843 !S_ISLNK(inode->i_mode))
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900844 return;
Gu Zheng7bd59382013-10-22 14:52:26 +0800845
Jaegeuk Kim1c4bf762016-06-01 20:55:51 -0700846 spin_lock(&sbi->inode_lock[type]);
847 if (type != FILE_INODE || test_opt(sbi, DATA_FLUSH))
Jaegeuk Kim10aa97c2016-05-16 10:33:40 -0700848 __add_dirty_inode(inode, type);
Yunlei Heb951a4e2016-05-13 14:57:43 +0800849 inode_inc_dirty_pages(inode);
Jaegeuk Kim1c4bf762016-06-01 20:55:51 -0700850 spin_unlock(&sbi->inode_lock[type]);
851
Jaegeuk Kima7ffdbe2014-09-12 15:53:45 -0700852 SetPagePrivate(page);
Jaegeuk Kim9e4ded32014-12-17 19:58:58 -0800853 f2fs_trace_pid(page);
Jaegeuk Kim5deb8262013-06-05 17:42:45 +0900854}
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900855
Chao Yuc227f912015-12-16 13:09:20 +0800856void remove_dirty_inode(struct inode *inode)
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900857{
Jaegeuk Kim40813632014-09-02 15:31:18 -0700858 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
Chao Yuc227f912015-12-16 13:09:20 +0800859 enum inode_type type = S_ISDIR(inode->i_mode) ? DIR_INODE : FILE_INODE;
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900860
Chao Yuc227f912015-12-16 13:09:20 +0800861 if (!S_ISDIR(inode->i_mode) && !S_ISREG(inode->i_mode) &&
862 !S_ISLNK(inode->i_mode))
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900863 return;
864
Jaegeuk Kim10aa97c2016-05-16 10:33:40 -0700865 if (type == FILE_INODE && !test_opt(sbi, DATA_FLUSH))
866 return;
867
Chao Yuc227f912015-12-16 13:09:20 +0800868 spin_lock(&sbi->inode_lock[type]);
869 __remove_dirty_inode(inode, type);
870 spin_unlock(&sbi->inode_lock[type]);
Jaegeuk Kim74d0b912013-05-15 16:40:02 +0900871}
872
Chao Yu6d5a1492015-12-24 18:04:56 +0800873int sync_dirty_inodes(struct f2fs_sb_info *sbi, enum inode_type type)
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900874{
Gu Zhengce3b7d82013-11-19 18:03:47 +0800875 struct list_head *head;
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900876 struct inode *inode;
Chao Yu2710fd72015-12-15 13:30:45 +0800877 struct f2fs_inode_info *fi;
Chao Yu4cf18532015-12-17 17:17:16 +0800878 bool is_dir = (type == DIR_INODE);
879
880 trace_f2fs_sync_dirty_inodes_enter(sbi->sb, is_dir,
881 get_pages(sbi, is_dir ?
882 F2FS_DIRTY_DENTS : F2FS_DIRTY_DATA));
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900883retry:
Jaegeuk Kimaf41d3e2014-10-17 14:14:16 -0700884 if (unlikely(f2fs_cp_error(sbi)))
Chao Yu6d5a1492015-12-24 18:04:56 +0800885 return -EIO;
Jaegeuk Kimaf41d3e2014-10-17 14:14:16 -0700886
Chao Yuc227f912015-12-16 13:09:20 +0800887 spin_lock(&sbi->inode_lock[type]);
Gu Zhengce3b7d82013-11-19 18:03:47 +0800888
Chao Yuc227f912015-12-16 13:09:20 +0800889 head = &sbi->inode_list[type];
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900890 if (list_empty(head)) {
Chao Yuc227f912015-12-16 13:09:20 +0800891 spin_unlock(&sbi->inode_lock[type]);
Chao Yu4cf18532015-12-17 17:17:16 +0800892 trace_f2fs_sync_dirty_inodes_exit(sbi->sb, is_dir,
893 get_pages(sbi, is_dir ?
894 F2FS_DIRTY_DENTS : F2FS_DIRTY_DATA));
Chao Yu6d5a1492015-12-24 18:04:56 +0800895 return 0;
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900896 }
Chao Yu939afa92017-01-07 18:49:42 +0800897 fi = list_first_entry(head, struct f2fs_inode_info, dirty_list);
Chao Yu2710fd72015-12-15 13:30:45 +0800898 inode = igrab(&fi->vfs_inode);
Chao Yuc227f912015-12-16 13:09:20 +0800899 spin_unlock(&sbi->inode_lock[type]);
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900900 if (inode) {
Jaegeuk Kim87d6f892014-03-18 12:40:49 +0900901 filemap_fdatawrite(inode->i_mapping);
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900902 iput(inode);
903 } else {
904 /*
905 * We should submit bio, since it exists several
906 * wribacking dentry pages in the freeing inode.
907 */
Jaegeuk Kimb9109b02017-05-10 11:28:38 -0700908 f2fs_submit_merged_write(sbi, DATA);
Sebastian Andrzej Siewior7ecebe52015-02-27 13:13:14 +0100909 cond_resched();
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900910 }
911 goto retry;
912}
913
Jaegeuk Kim0f18b462016-05-20 11:10:10 -0700914int f2fs_sync_inode_meta(struct f2fs_sb_info *sbi)
915{
916 struct list_head *head = &sbi->inode_list[DIRTY_META];
917 struct inode *inode;
918 struct f2fs_inode_info *fi;
919 s64 total = get_pages(sbi, F2FS_DIRTY_IMETA);
920
921 while (total--) {
922 if (unlikely(f2fs_cp_error(sbi)))
923 return -EIO;
924
925 spin_lock(&sbi->inode_lock[DIRTY_META]);
926 if (list_empty(head)) {
927 spin_unlock(&sbi->inode_lock[DIRTY_META]);
928 return 0;
929 }
Chao Yu939afa92017-01-07 18:49:42 +0800930 fi = list_first_entry(head, struct f2fs_inode_info,
Jaegeuk Kim0f18b462016-05-20 11:10:10 -0700931 gdirty_list);
932 inode = igrab(&fi->vfs_inode);
933 spin_unlock(&sbi->inode_lock[DIRTY_META]);
934 if (inode) {
Jaegeuk Kim18340ed2016-10-19 18:27:56 -0700935 sync_inode_metadata(inode, 0);
936
937 /* it's on eviction */
938 if (is_inode_flag_set(inode, FI_DIRTY_INODE))
939 update_inode_page(inode);
Jaegeuk Kim0f18b462016-05-20 11:10:10 -0700940 iput(inode);
941 }
942 };
943 return 0;
944}
945
Yunlei He59c90812017-03-13 20:22:18 +0800946static void __prepare_cp_block(struct f2fs_sb_info *sbi)
947{
948 struct f2fs_checkpoint *ckpt = F2FS_CKPT(sbi);
949 struct f2fs_nm_info *nm_i = NM_I(sbi);
950 nid_t last_nid = nm_i->next_scan_nid;
951
952 next_free_nid(sbi, &last_nid);
953 ckpt->valid_block_count = cpu_to_le64(valid_user_blocks(sbi));
954 ckpt->valid_node_count = cpu_to_le32(valid_node_count(sbi));
955 ckpt->valid_inode_count = cpu_to_le32(valid_inode_count(sbi));
956 ckpt->next_free_nid = cpu_to_le32(last_nid);
957}
958
Jaegeuk Kim0a8165d2012-11-29 13:28:09 +0900959/*
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900960 * Freeze all the FS-operations for checkpoint.
961 */
Jaegeuk Kimcf779ca2014-08-11 18:37:46 -0700962static int block_operations(struct f2fs_sb_info *sbi)
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900963{
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900964 struct writeback_control wbc = {
965 .sync_mode = WB_SYNC_ALL,
966 .nr_to_write = LONG_MAX,
967 .for_reclaim = 0,
968 };
Jaegeuk Kimc718379b2013-04-24 13:19:56 +0900969 struct blk_plug plug;
Jaegeuk Kimcf779ca2014-08-11 18:37:46 -0700970 int err = 0;
Jaegeuk Kimc718379b2013-04-24 13:19:56 +0900971
972 blk_start_plug(&plug);
973
Jaegeuk Kim39936832012-11-22 16:21:29 +0900974retry_flush_dents:
Gu Zhenge4795562013-09-27 18:08:30 +0800975 f2fs_lock_all(sbi);
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900976 /* write all the dirty dentry pages */
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900977 if (get_pages(sbi, F2FS_DIRTY_DENTS)) {
Gu Zhenge4795562013-09-27 18:08:30 +0800978 f2fs_unlock_all(sbi);
Chao Yu6d5a1492015-12-24 18:04:56 +0800979 err = sync_dirty_inodes(sbi, DIR_INODE);
980 if (err)
Jaegeuk Kimcf779ca2014-08-11 18:37:46 -0700981 goto out;
Jaegeuk Kim30973882017-04-11 19:15:33 -0700982 cond_resched();
Jaegeuk Kim39936832012-11-22 16:21:29 +0900983 goto retry_flush_dents;
Jaegeuk Kim127e6702012-11-02 17:08:18 +0900984 }
985
Yunlei He59c90812017-03-13 20:22:18 +0800986 /*
987 * POR: we should ensure that there are no dirty node pages
988 * until finishing nat/sit flush. inode->i_blocks can be updated.
989 */
990 down_write(&sbi->node_change);
991
Jaegeuk Kim0f18b462016-05-20 11:10:10 -0700992 if (get_pages(sbi, F2FS_DIRTY_IMETA)) {
Yunlei He59c90812017-03-13 20:22:18 +0800993 up_write(&sbi->node_change);
Jaegeuk Kim0f18b462016-05-20 11:10:10 -0700994 f2fs_unlock_all(sbi);
995 err = f2fs_sync_inode_meta(sbi);
996 if (err)
997 goto out;
Jaegeuk Kim30973882017-04-11 19:15:33 -0700998 cond_resched();
Jaegeuk Kim0f18b462016-05-20 11:10:10 -0700999 goto retry_flush_dents;
1000 }
1001
Jaegeuk Kim39936832012-11-22 16:21:29 +09001002retry_flush_nodes:
Chao Yub3582c62014-07-03 18:58:39 +08001003 down_write(&sbi->node_write);
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001004
1005 if (get_pages(sbi, F2FS_DIRTY_NODES)) {
Chao Yub3582c62014-07-03 18:58:39 +08001006 up_write(&sbi->node_write);
Jaegeuk Kim52681372016-04-13 16:24:44 -07001007 err = sync_node_pages(sbi, &wbc);
Chao Yu6d5a1492015-12-24 18:04:56 +08001008 if (err) {
Yunlei He59c90812017-03-13 20:22:18 +08001009 up_write(&sbi->node_change);
Jaegeuk Kimcf779ca2014-08-11 18:37:46 -07001010 f2fs_unlock_all(sbi);
Jaegeuk Kimcf779ca2014-08-11 18:37:46 -07001011 goto out;
1012 }
Jaegeuk Kim30973882017-04-11 19:15:33 -07001013 cond_resched();
Jaegeuk Kim39936832012-11-22 16:21:29 +09001014 goto retry_flush_nodes;
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001015 }
Yunlei He59c90812017-03-13 20:22:18 +08001016
1017 /*
1018 * sbi->node_change is used only for AIO write_begin path which produces
1019 * dirty node blocks and some checkpoint values by block allocation.
1020 */
1021 __prepare_cp_block(sbi);
1022 up_write(&sbi->node_change);
Jaegeuk Kimcf779ca2014-08-11 18:37:46 -07001023out:
Jaegeuk Kimc718379b2013-04-24 13:19:56 +09001024 blk_finish_plug(&plug);
Jaegeuk Kimcf779ca2014-08-11 18:37:46 -07001025 return err;
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001026}
1027
1028static void unblock_operations(struct f2fs_sb_info *sbi)
1029{
Chao Yub3582c62014-07-03 18:58:39 +08001030 up_write(&sbi->node_write);
Gu Zhenge4795562013-09-27 18:08:30 +08001031 f2fs_unlock_all(sbi);
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001032}
1033
Changman Leefb51b5e2013-11-07 12:48:25 +09001034static void wait_on_all_pages_writeback(struct f2fs_sb_info *sbi)
1035{
1036 DEFINE_WAIT(wait);
1037
1038 for (;;) {
1039 prepare_to_wait(&sbi->cp_wait, &wait, TASK_UNINTERRUPTIBLE);
1040
Chao Yu36951b32016-11-16 10:41:20 +08001041 if (!get_pages(sbi, F2FS_WB_CP_DATA))
Changman Leefb51b5e2013-11-07 12:48:25 +09001042 break;
1043
Yunlei He0ff21642016-02-23 12:07:56 +08001044 io_schedule_timeout(5*HZ);
Changman Leefb51b5e2013-11-07 12:48:25 +09001045 }
1046 finish_wait(&sbi->cp_wait, &wait);
1047}
1048
Jaegeuk Kime4c5d842016-09-30 17:37:43 -07001049static void update_ckpt_flags(struct f2fs_sb_info *sbi, struct cp_control *cpc)
1050{
1051 unsigned long orphan_num = sbi->im[ORPHAN_INO].ino_num;
1052 struct f2fs_checkpoint *ckpt = F2FS_CKPT(sbi);
1053
1054 spin_lock(&sbi->cp_lock);
1055
Chao Yuc473f1a2017-04-27 20:40:39 +08001056 if ((cpc->reason & CP_UMOUNT) &&
Kinglong Mee10047f52017-03-11 21:18:01 +08001057 le32_to_cpu(ckpt->cp_pack_total_block_count) >
Jaegeuk Kim22ad0b62017-02-09 10:38:09 -08001058 sbi->blocks_per_seg - NM_I(sbi)->nat_bits_blocks)
1059 disable_nat_bits(sbi, false);
1060
Chao Yu1f43e2a2017-04-28 13:56:08 +08001061 if (cpc->reason & CP_TRIMMED)
1062 __set_ckpt_flags(ckpt, CP_TRIMMED_FLAG);
1063
Chao Yuc473f1a2017-04-27 20:40:39 +08001064 if (cpc->reason & CP_UMOUNT)
Jaegeuk Kime4c5d842016-09-30 17:37:43 -07001065 __set_ckpt_flags(ckpt, CP_UMOUNT_FLAG);
1066 else
1067 __clear_ckpt_flags(ckpt, CP_UMOUNT_FLAG);
1068
Chao Yuc473f1a2017-04-27 20:40:39 +08001069 if (cpc->reason & CP_FASTBOOT)
Jaegeuk Kime4c5d842016-09-30 17:37:43 -07001070 __set_ckpt_flags(ckpt, CP_FASTBOOT_FLAG);
1071 else
1072 __clear_ckpt_flags(ckpt, CP_FASTBOOT_FLAG);
1073
1074 if (orphan_num)
1075 __set_ckpt_flags(ckpt, CP_ORPHAN_PRESENT_FLAG);
1076 else
1077 __clear_ckpt_flags(ckpt, CP_ORPHAN_PRESENT_FLAG);
1078
1079 if (is_sbi_flag_set(sbi, SBI_NEED_FSCK))
1080 __set_ckpt_flags(ckpt, CP_FSCK_FLAG);
1081
1082 /* set this flag to activate crc|cp_ver for recovery */
1083 __set_ckpt_flags(ckpt, CP_CRC_RECOVERY_FLAG);
1084
1085 spin_unlock(&sbi->cp_lock);
1086}
1087
Chao Yuc34f42e2015-12-23 17:50:30 +08001088static int do_checkpoint(struct f2fs_sb_info *sbi, struct cp_control *cpc)
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001089{
1090 struct f2fs_checkpoint *ckpt = F2FS_CKPT(sbi);
Huang Ying77041822014-09-12 20:19:48 +08001091 struct f2fs_nm_info *nm_i = NM_I(sbi);
Chao Yu67298802014-11-18 11:18:36 +08001092 unsigned long orphan_num = sbi->im[ORPHAN_INO].ino_num;
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001093 block_t start_blk;
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001094 unsigned int data_sum_blocks, orphan_blocks;
Jaegeuk Kim7e586fa2013-06-19 20:47:19 +09001095 __u32 crc32 = 0;
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001096 int i;
Wanpeng Li55141482015-02-26 07:57:20 +08001097 int cp_payload_blks = __cp_payload(sbi);
Shuoran Liu8f1dbbb2016-01-27 09:57:30 +08001098 struct super_block *sb = sbi->sb;
1099 struct curseg_info *seg_i = CURSEG_I(sbi, CURSEG_HOT_NODE);
1100 u64 kbytes_written;
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001101
1102 /* Flush all the NAT/SIT pages */
Jaegeuk Kimcf779ca2014-08-11 18:37:46 -07001103 while (get_pages(sbi, F2FS_DIRTY_META)) {
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001104 sync_meta_pages(sbi, META, LONG_MAX);
Jaegeuk Kimcf779ca2014-08-11 18:37:46 -07001105 if (unlikely(f2fs_cp_error(sbi)))
Chao Yuc34f42e2015-12-23 17:50:30 +08001106 return -EIO;
Jaegeuk Kimcf779ca2014-08-11 18:37:46 -07001107 }
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001108
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001109 /*
1110 * modify checkpoint
1111 * version number is already updated
1112 */
1113 ckpt->elapsed_time = cpu_to_le64(get_mtime(sbi));
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001114 ckpt->free_segment_count = cpu_to_le32(free_segments(sbi));
Chao Yub5b82202014-08-22 16:17:38 +08001115 for (i = 0; i < NR_CURSEG_NODE_TYPE; i++) {
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001116 ckpt->cur_node_segno[i] =
1117 cpu_to_le32(curseg_segno(sbi, i + CURSEG_HOT_NODE));
1118 ckpt->cur_node_blkoff[i] =
1119 cpu_to_le16(curseg_blkoff(sbi, i + CURSEG_HOT_NODE));
1120 ckpt->alloc_type[i + CURSEG_HOT_NODE] =
1121 curseg_alloc_type(sbi, i + CURSEG_HOT_NODE);
1122 }
Chao Yub5b82202014-08-22 16:17:38 +08001123 for (i = 0; i < NR_CURSEG_DATA_TYPE; i++) {
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001124 ckpt->cur_data_segno[i] =
1125 cpu_to_le32(curseg_segno(sbi, i + CURSEG_HOT_DATA));
1126 ckpt->cur_data_blkoff[i] =
1127 cpu_to_le16(curseg_blkoff(sbi, i + CURSEG_HOT_DATA));
1128 ckpt->alloc_type[i + CURSEG_HOT_DATA] =
1129 curseg_alloc_type(sbi, i + CURSEG_HOT_DATA);
1130 }
1131
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001132 /* 2 cp + n data seg summary + orphan inode blocks */
Chao Yu3fa06d72014-12-09 14:21:46 +08001133 data_sum_blocks = npages_for_summary_flush(sbi, false);
Chao Yuaaec2b12016-09-20 11:04:18 +08001134 spin_lock(&sbi->cp_lock);
Chao Yub5b82202014-08-22 16:17:38 +08001135 if (data_sum_blocks < NR_CURSEG_DATA_TYPE)
Chao Yuaaec2b12016-09-20 11:04:18 +08001136 __set_ckpt_flags(ckpt, CP_COMPACT_SUM_FLAG);
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001137 else
Chao Yuaaec2b12016-09-20 11:04:18 +08001138 __clear_ckpt_flags(ckpt, CP_COMPACT_SUM_FLAG);
1139 spin_unlock(&sbi->cp_lock);
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001140
Chao Yu67298802014-11-18 11:18:36 +08001141 orphan_blocks = GET_ORPHAN_BLOCKS(orphan_num);
Changman Lee1dbe4152014-05-12 12:27:43 +09001142 ckpt->cp_pack_start_sum = cpu_to_le32(1 + cp_payload_blks +
1143 orphan_blocks);
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001144
Jaegeuk Kim119ee912015-01-29 11:45:33 -08001145 if (__remain_node_summaries(cpc->reason))
Chao Yub5b82202014-08-22 16:17:38 +08001146 ckpt->cp_pack_total_block_count = cpu_to_le32(F2FS_CP_PACKS+
Changman Lee1dbe4152014-05-12 12:27:43 +09001147 cp_payload_blks + data_sum_blocks +
1148 orphan_blocks + NR_CURSEG_NODE_TYPE);
Jaegeuk Kim119ee912015-01-29 11:45:33 -08001149 else
Chao Yub5b82202014-08-22 16:17:38 +08001150 ckpt->cp_pack_total_block_count = cpu_to_le32(F2FS_CP_PACKS +
Changman Lee1dbe4152014-05-12 12:27:43 +09001151 cp_payload_blks + data_sum_blocks +
1152 orphan_blocks);
Jaegeuk Kim119ee912015-01-29 11:45:33 -08001153
Jaegeuk Kime4c5d842016-09-30 17:37:43 -07001154 /* update ckpt flag for checkpoint */
1155 update_ckpt_flags(sbi, cpc);
Jaegeuk Kima468f0e2016-09-19 17:55:10 -07001156
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001157 /* update SIT/NAT bitmap */
1158 get_sit_bitmap(sbi, __bitmap_ptr(sbi, SIT_BITMAP));
1159 get_nat_bitmap(sbi, __bitmap_ptr(sbi, NAT_BITMAP));
1160
Keith Mok43b65732016-03-02 12:04:24 -08001161 crc32 = f2fs_crc32(sbi, ckpt, le32_to_cpu(ckpt->checksum_offset));
Jaegeuk Kim7e586fa2013-06-19 20:47:19 +09001162 *((__le32 *)((unsigned char *)ckpt +
1163 le32_to_cpu(ckpt->checksum_offset)))
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001164 = cpu_to_le32(crc32);
1165
Jaegeuk Kim8508e442016-11-24 12:45:15 -08001166 start_blk = __start_cp_next_addr(sbi);
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001167
Jaegeuk Kim22ad0b62017-02-09 10:38:09 -08001168 /* write nat bits */
1169 if (enabled_nat_bits(sbi, cpc)) {
1170 __u64 cp_ver = cur_cp_version(ckpt);
Jaegeuk Kim22ad0b62017-02-09 10:38:09 -08001171 block_t blk;
1172
1173 cp_ver |= ((__u64)crc32 << 32);
1174 *(__le64 *)nm_i->nat_bits = cpu_to_le64(cp_ver);
1175
1176 blk = start_blk + sbi->blocks_per_seg - nm_i->nat_bits_blocks;
1177 for (i = 0; i < nm_i->nat_bits_blocks; i++)
1178 update_meta_page(sbi, nm_i->nat_bits +
1179 (i << F2FS_BLKSIZE_BITS), blk + i);
1180
1181 /* Flush all the NAT BITS pages */
1182 while (get_pages(sbi, F2FS_DIRTY_META)) {
1183 sync_meta_pages(sbi, META, LONG_MAX);
1184 if (unlikely(f2fs_cp_error(sbi)))
1185 return -EIO;
1186 }
1187 }
1188
Jaegeuk Kima7230d12015-09-16 14:06:54 -07001189 /* need to wait for end_io results */
1190 wait_on_all_pages_writeback(sbi);
1191 if (unlikely(f2fs_cp_error(sbi)))
Chao Yuc34f42e2015-12-23 17:50:30 +08001192 return -EIO;
Jaegeuk Kima7230d12015-09-16 14:06:54 -07001193
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001194 /* write out checkpoint buffer at block 0 */
Chao Yu381722d2015-05-19 17:40:04 +08001195 update_meta_page(sbi, ckpt, start_blk++);
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001196
Chao Yu381722d2015-05-19 17:40:04 +08001197 for (i = 1; i < 1 + cp_payload_blks; i++)
1198 update_meta_page(sbi, (char *)ckpt + i * F2FS_BLKSIZE,
1199 start_blk++);
Changman Lee1dbe4152014-05-12 12:27:43 +09001200
Chao Yu67298802014-11-18 11:18:36 +08001201 if (orphan_num) {
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001202 write_orphan_inodes(sbi, start_blk);
1203 start_blk += orphan_blocks;
1204 }
1205
1206 write_data_summaries(sbi, start_blk);
1207 start_blk += data_sum_blocks;
Shuoran Liu8f1dbbb2016-01-27 09:57:30 +08001208
1209 /* Record write statistics in the hot node summary */
1210 kbytes_written = sbi->kbytes_written;
1211 if (sb->s_bdev->bd_part)
1212 kbytes_written += BD_PART_WRITTEN(sbi);
1213
Chao Yub7ad7512016-02-19 18:08:46 +08001214 seg_i->journal->info.kbytes_written = cpu_to_le64(kbytes_written);
Shuoran Liu8f1dbbb2016-01-27 09:57:30 +08001215
Jaegeuk Kim119ee912015-01-29 11:45:33 -08001216 if (__remain_node_summaries(cpc->reason)) {
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001217 write_node_summaries(sbi, start_blk);
1218 start_blk += NR_CURSEG_NODE_TYPE;
1219 }
1220
1221 /* writeout checkpoint block */
Chao Yu381722d2015-05-19 17:40:04 +08001222 update_meta_page(sbi, ckpt, start_blk);
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001223
1224 /* wait for previous submitted node/meta pages writeback */
Changman Leefb51b5e2013-11-07 12:48:25 +09001225 wait_on_all_pages_writeback(sbi);
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001226
Jaegeuk Kimcf779ca2014-08-11 18:37:46 -07001227 if (unlikely(f2fs_cp_error(sbi)))
Chao Yuc34f42e2015-12-23 17:50:30 +08001228 return -EIO;
Jaegeuk Kimcf779ca2014-08-11 18:37:46 -07001229
Chao Yu80dd9c02016-02-24 17:20:44 +08001230 filemap_fdatawait_range(NODE_MAPPING(sbi), 0, LLONG_MAX);
1231 filemap_fdatawait_range(META_MAPPING(sbi), 0, LLONG_MAX);
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001232
1233 /* update user_block_counts */
1234 sbi->last_valid_block_count = sbi->total_valid_block_count;
Jaegeuk Kim41382ec2016-05-16 11:06:50 -07001235 percpu_counter_set(&sbi->alloc_valid_block_count, 0);
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001236
1237 /* Here, we only have one bio having CP pack */
Jaegeuk Kim577e3492013-01-24 19:56:11 +09001238 sync_meta_pages(sbi, META_FLUSH, LONG_MAX);
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001239
Jaegeuk Kim6a8f8ca2014-10-29 14:37:22 -07001240 /* wait for previous submitted meta pages writeback */
1241 wait_on_all_pages_writeback(sbi);
1242
Jaegeuk Kim74ef9242016-05-02 22:09:56 -07001243 release_ino_entry(sbi, false);
Jaegeuk Kimcf779ca2014-08-11 18:37:46 -07001244
1245 if (unlikely(f2fs_cp_error(sbi)))
Chao Yuc34f42e2015-12-23 17:50:30 +08001246 return -EIO;
Jaegeuk Kimcf779ca2014-08-11 18:37:46 -07001247
Chao Yucaf00472015-01-28 17:48:42 +08001248 clear_sbi_flag(sbi, SBI_IS_DIRTY);
Jaegeuk Kimbbf156f2016-08-29 18:23:45 -07001249 clear_sbi_flag(sbi, SBI_NEED_CP);
Jaegeuk Kim8508e442016-11-24 12:45:15 -08001250 __set_cp_next_pack(sbi);
Chao Yuc34f42e2015-12-23 17:50:30 +08001251
Chao Yuc2a080a2016-08-31 10:43:19 +08001252 /*
1253 * redirty superblock if metadata like node page or inode cache is
1254 * updated during writing checkpoint.
1255 */
1256 if (get_pages(sbi, F2FS_DIRTY_NODES) ||
1257 get_pages(sbi, F2FS_DIRTY_IMETA))
1258 set_sbi_flag(sbi, SBI_IS_DIRTY);
1259
1260 f2fs_bug_on(sbi, get_pages(sbi, F2FS_DIRTY_DENTS));
1261
Chao Yuc34f42e2015-12-23 17:50:30 +08001262 return 0;
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001263}
1264
Jaegeuk Kim0a8165d2012-11-29 13:28:09 +09001265/*
arter97e1c42042014-08-06 23:22:50 +09001266 * We guarantee that this checkpoint procedure will not fail.
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001267 */
Chao Yuc34f42e2015-12-23 17:50:30 +08001268int write_checkpoint(struct f2fs_sb_info *sbi, struct cp_control *cpc)
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001269{
1270 struct f2fs_checkpoint *ckpt = F2FS_CKPT(sbi);
1271 unsigned long long ckpt_ver;
Chao Yuc34f42e2015-12-23 17:50:30 +08001272 int err = 0;
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001273
Jaegeuk Kim43727522013-02-04 15:11:17 +09001274 mutex_lock(&sbi->cp_mutex);
Jaegeuk Kim85010172014-08-11 18:37:46 -07001275
Chao Yucaf00472015-01-28 17:48:42 +08001276 if (!is_sbi_flag_set(sbi, SBI_IS_DIRTY) &&
Chao Yuc473f1a2017-04-27 20:40:39 +08001277 ((cpc->reason & CP_FASTBOOT) || (cpc->reason & CP_SYNC) ||
1278 ((cpc->reason & CP_DISCARD) && !sbi->discard_blks)))
Jaegeuk Kim85010172014-08-11 18:37:46 -07001279 goto out;
Chao Yuc34f42e2015-12-23 17:50:30 +08001280 if (unlikely(f2fs_cp_error(sbi))) {
1281 err = -EIO;
Jaegeuk Kimcf779ca2014-08-11 18:37:46 -07001282 goto out;
Chao Yuc34f42e2015-12-23 17:50:30 +08001283 }
1284 if (f2fs_readonly(sbi->sb)) {
1285 err = -EROFS;
Jaegeuk Kim11504a82015-01-23 18:43:45 -08001286 goto out;
Chao Yuc34f42e2015-12-23 17:50:30 +08001287 }
Wanpeng Li2bda5422015-02-27 15:56:16 +08001288
1289 trace_f2fs_write_checkpoint(sbi->sb, cpc->reason, "start block_ops");
1290
Chao Yuc34f42e2015-12-23 17:50:30 +08001291 err = block_operations(sbi);
1292 if (err)
Jaegeuk Kimcf779ca2014-08-11 18:37:46 -07001293 goto out;
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001294
Jaegeuk Kim75ab4cb2014-09-20 21:57:51 -07001295 trace_f2fs_write_checkpoint(sbi->sb, cpc->reason, "finish block_ops");
Namjae Jeon2af4bd62013-04-23 18:26:54 +09001296
Jaegeuk Kimb9109b02017-05-10 11:28:38 -07001297 f2fs_flush_merged_writes(sbi);
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001298
Yunlei He58cce382016-08-18 21:01:19 +08001299 /* this is the case of multiple fstrims without any changes */
Chao Yuc473f1a2017-04-27 20:40:39 +08001300 if (cpc->reason & CP_DISCARD) {
Jaegeuk Kim25290fa2016-12-29 22:06:15 -08001301 if (!exist_trim_candidates(sbi, cpc)) {
1302 unblock_operations(sbi);
1303 goto out;
1304 }
1305
Jaegeuk Kim0333ad42016-12-29 16:58:54 -08001306 if (NM_I(sbi)->dirty_nat_cnt == 0 &&
1307 SIT_I(sbi)->dirty_sentries == 0 &&
1308 prefree_segments(sbi) == 0) {
1309 flush_sit_entries(sbi, cpc);
1310 clear_prefree_segments(sbi, cpc);
1311 unblock_operations(sbi);
1312 goto out;
1313 }
Yunlei He58cce382016-08-18 21:01:19 +08001314 }
1315
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001316 /*
1317 * update checkpoint pack index
1318 * Increase the version number so that
1319 * SIT entries and seg summaries are written at correct place
1320 */
Jaegeuk Kimd71b5562013-08-09 15:03:21 +09001321 ckpt_ver = cur_cp_version(ckpt);
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001322 ckpt->checkpoint_ver = cpu_to_le64(++ckpt_ver);
1323
1324 /* write cached NAT/SIT entries to NAT/SIT area */
Jaegeuk Kim22ad0b62017-02-09 10:38:09 -08001325 flush_nat_entries(sbi, cpc);
Jaegeuk Kim4b2fecc2014-09-20 22:06:39 -07001326 flush_sit_entries(sbi, cpc);
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001327
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001328 /* unlock all the fs_lock[] in do_checkpoint() */
Chao Yuc34f42e2015-12-23 17:50:30 +08001329 err = do_checkpoint(sbi, cpc);
Jaegeuk Kim4e6a8d92016-12-29 14:07:53 -08001330 if (err)
Chao Yu2dd15652016-10-11 22:57:00 +08001331 release_discard_addrs(sbi);
Jaegeuk Kim4e6a8d92016-12-29 14:07:53 -08001332 else
Chao Yu2dd15652016-10-11 22:57:00 +08001333 clear_prefree_segments(sbi, cpc);
Chao Yu275b66b2016-08-29 23:58:34 +08001334
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001335 unblock_operations(sbi);
Changman Lee942e0be2014-02-13 15:12:29 +09001336 stat_inc_cp_count(sbi->stat_info);
Jaegeuk Kim10027552015-04-09 17:03:53 -07001337
Chao Yuc473f1a2017-04-27 20:40:39 +08001338 if (cpc->reason & CP_RECOVERY)
Jaegeuk Kim10027552015-04-09 17:03:53 -07001339 f2fs_msg(sbi->sb, KERN_NOTICE,
1340 "checkpoint: version = %llx", ckpt_ver);
Jaegeuk Kim60b99b42015-10-05 14:49:57 -07001341
1342 /* do checkpoint periodically */
Jaegeuk Kim6beceb52016-01-08 15:51:50 -08001343 f2fs_update_time(sbi, CP_TIME);
Jaegeuk Kim55d1cdb2015-12-15 16:07:14 -08001344 trace_f2fs_write_checkpoint(sbi->sb, cpc->reason, "finish checkpoint");
Jaegeuk Kim85010172014-08-11 18:37:46 -07001345out:
1346 mutex_unlock(&sbi->cp_mutex);
Chao Yuc34f42e2015-12-23 17:50:30 +08001347 return err;
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001348}
1349
Jaegeuk Kim6451e042014-07-25 15:47:17 -07001350void init_ino_entry_info(struct f2fs_sb_info *sbi)
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001351{
Jaegeuk Kim6451e042014-07-25 15:47:17 -07001352 int i;
1353
1354 for (i = 0; i < MAX_INO_ENTRY; i++) {
Chao Yu67298802014-11-18 11:18:36 +08001355 struct inode_management *im = &sbi->im[i];
1356
1357 INIT_RADIX_TREE(&im->ino_root, GFP_ATOMIC);
1358 spin_lock_init(&im->ino_lock);
1359 INIT_LIST_HEAD(&im->ino_list);
1360 im->ino_num = 0;
Jaegeuk Kim6451e042014-07-25 15:47:17 -07001361 }
1362
Chao Yub5b82202014-08-22 16:17:38 +08001363 sbi->max_orphans = (sbi->blocks_per_seg - F2FS_CP_PACKS -
Wanpeng Li14b42812015-02-27 17:38:13 +08001364 NR_CURSEG_TYPE - __cp_payload(sbi)) *
1365 F2FS_ORPHANS_PER_BLOCK;
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001366}
1367
Namjae Jeon6e6093a2013-01-17 00:08:30 +09001368int __init create_checkpoint_caches(void)
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001369{
Jaegeuk Kim6451e042014-07-25 15:47:17 -07001370 ino_entry_slab = f2fs_kmem_cache_create("f2fs_ino_entry",
1371 sizeof(struct ino_entry));
1372 if (!ino_entry_slab)
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001373 return -ENOMEM;
Chao Yu06292072014-12-29 15:56:18 +08001374 inode_entry_slab = f2fs_kmem_cache_create("f2fs_inode_entry",
1375 sizeof(struct inode_entry));
Jaegeuk Kim6bacf522013-12-06 15:00:58 +09001376 if (!inode_entry_slab) {
Jaegeuk Kim6451e042014-07-25 15:47:17 -07001377 kmem_cache_destroy(ino_entry_slab);
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001378 return -ENOMEM;
1379 }
1380 return 0;
1381}
1382
1383void destroy_checkpoint_caches(void)
1384{
Jaegeuk Kim6451e042014-07-25 15:47:17 -07001385 kmem_cache_destroy(ino_entry_slab);
Jaegeuk Kim127e6702012-11-02 17:08:18 +09001386 kmem_cache_destroy(inode_entry_slab);
1387}