Merge branch 'i2c/for-5.3' of git://git.kernel.org/pub/scm/linux/kernel/git/wsa/linux
[linux-2.6-block.git] / fs / f2fs / recovery.c
CommitLineData
// SPDX-License-Identifier: GPL-2.0
/*
 * fs/f2fs/recovery.c
 *
 * Copyright (c) 2012 Samsung Electronics Co., Ltd.
 *             http://www.samsung.com/
 */
8#include <linux/fs.h>
9#include <linux/f2fs_fs.h>
10#include "f2fs.h"
11#include "node.h"
12#include "segment.h"
13
441ac5cb
JK
/*
 * Roll forward recovery scenarios.
 *
 * [Term] F: fsync_mark, D: dentry_mark
 *
 * 1. inode(x) | CP | inode(x) | dnode(F)
 * -> Update the latest inode(x).
 *
 * 2. inode(x) | CP | inode(F) | dnode(F)
 * -> No problem.
 *
 * 3. inode(x) | CP | dnode(F) | inode(x)
 * -> Recover to the latest dnode(F), and drop the last inode(x)
 *
 * 4. inode(x) | CP | dnode(F) | inode(F)
 * -> No problem.
 *
 * 5. CP | inode(x) | dnode(F)
 * -> The inode(DF) was missing. Should drop this dnode(F).
 *
 * 6. CP | inode(DF) | dnode(F)
 * -> No problem.
 *
 * 7. CP | dnode(F) | inode(DF)
 * -> If f2fs_iget fails, then goto next to find inode(DF).
 *
 * 8. CP | dnode(F) | inode(x)
 * -> If f2fs_iget fails, then goto next to find inode(DF).
 *    But it will fail due to no inode(DF).
 */
44
d624c96f
JK
/*
 * Slab cache backing struct fsync_inode_entry objects. It is created and
 * destroyed inside f2fs_recover_fsync_data(); entries are allocated in
 * add_fsync_inode() and freed in del_fsync_inode().
 */
static struct kmem_cache *fsync_entry_slab;
46
4d57b86d 47bool f2fs_space_for_roll_forward(struct f2fs_sb_info *sbi)
d624c96f 48{
41382ec4
JK
49 s64 nalloc = percpu_counter_sum_positive(&sbi->alloc_valid_block_count);
50
51 if (sbi->last_valid_block_count + nalloc > sbi->user_block_count)
d624c96f
JK
52 return false;
53 return true;
54}
55
56static struct fsync_inode_entry *get_fsync_inode(struct list_head *head,
57 nid_t ino)
58{
d624c96f
JK
59 struct fsync_inode_entry *entry;
60
2d7b822a 61 list_for_each_entry(entry, head, list)
d624c96f
JK
62 if (entry->inode->i_ino == ino)
63 return entry;
2d7b822a 64
d624c96f
JK
65 return NULL;
66}
67
f4702d61 68static struct fsync_inode_entry *add_fsync_inode(struct f2fs_sb_info *sbi,
4b2414d0 69 struct list_head *head, nid_t ino, bool quota_inode)
3f8ab270 70{
e8ea9b3d 71 struct inode *inode;
3f8ab270 72 struct fsync_inode_entry *entry;
4b2414d0 73 int err;
3f8ab270 74
e8ea9b3d 75 inode = f2fs_iget_retry(sbi->sb, ino);
f4702d61
JK
76 if (IS_ERR(inode))
77 return ERR_CAST(inode);
78
4b2414d0
CY
79 err = dquot_initialize(inode);
80 if (err)
81 goto err_out;
82
83 if (quota_inode) {
84 err = dquot_alloc_inode(inode);
85 if (err)
86 goto err_out;
87 }
88
e8ea9b3d 89 entry = f2fs_kmem_cache_alloc(fsync_entry_slab, GFP_F2FS_ZERO);
3f8ab270
CY
90 entry->inode = inode;
91 list_add_tail(&entry->list, head);
92
93 return entry;
4b2414d0
CY
94err_out:
95 iput(inode);
96 return ERR_PTR(err);
3f8ab270
CY
97}
98
26b5a079 99static void del_fsync_inode(struct fsync_inode_entry *entry, int drop)
3f8ab270 100{
26b5a079
SY
101 if (drop) {
102 /* inode should not be recovered, drop it */
103 f2fs_inode_synced(entry->inode);
104 }
3f8ab270
CY
105 iput(entry->inode);
106 list_del(&entry->list);
107 kmem_cache_free(fsync_entry_slab, entry);
108}
109
f61cce5b
CY
110static int recover_dentry(struct inode *inode, struct page *ipage,
111 struct list_head *dir_list)
d624c96f 112{
58bfaf44 113 struct f2fs_inode *raw_inode = F2FS_INODE(ipage);
74d0b917 114 nid_t pino = le32_to_cpu(raw_inode->i_pino);
6b8213d9 115 struct f2fs_dir_entry *de;
e7ba108a 116 struct fscrypt_name fname;
d624c96f 117 struct page *page;
6b8213d9 118 struct inode *dir, *einode;
f61cce5b 119 struct fsync_inode_entry *entry;
d624c96f 120 int err = 0;
e7ba108a 121 char *name;
d624c96f 122
f61cce5b
CY
123 entry = get_fsync_inode(dir_list, pino);
124 if (!entry) {
4b2414d0
CY
125 entry = add_fsync_inode(F2FS_I_SB(inode), dir_list,
126 pino, false);
f4702d61
JK
127 if (IS_ERR(entry)) {
128 dir = ERR_CAST(entry);
129 err = PTR_ERR(entry);
f61cce5b
CY
130 goto out;
131 }
ed57c27f
JK
132 }
133
f61cce5b
CY
134 dir = entry->inode;
135
e7ba108a
SL
136 memset(&fname, 0, sizeof(struct fscrypt_name));
137 fname.disk_name.len = le32_to_cpu(raw_inode->i_namelen);
138 fname.disk_name.name = raw_inode->i_name;
d96b1431 139
e7ba108a 140 if (unlikely(fname.disk_name.len > F2FS_NAME_LEN)) {
d96b1431
CY
141 WARN_ON(1);
142 err = -ENAMETOOLONG;
f61cce5b 143 goto out;
d96b1431 144 }
6b8213d9 145retry:
e7ba108a 146 de = __f2fs_find_entry(dir, &fname, &page);
418f6c27 147 if (de && inode->i_ino == le32_to_cpu(de->ino))
bdbc90fa 148 goto out_put;
418f6c27 149
6b8213d9 150 if (de) {
e8ea9b3d 151 einode = f2fs_iget_retry(inode->i_sb, le32_to_cpu(de->ino));
6b8213d9
JK
152 if (IS_ERR(einode)) {
153 WARN_ON(1);
5c1f9927
CY
154 err = PTR_ERR(einode);
155 if (err == -ENOENT)
6b8213d9 156 err = -EEXIST;
bdbc90fa 157 goto out_put;
2e5558f4 158 }
4b2414d0
CY
159
160 err = dquot_initialize(einode);
161 if (err) {
162 iput(einode);
bdbc90fa 163 goto out_put;
4b2414d0
CY
164 }
165
4d57b86d 166 err = f2fs_acquire_orphan_inode(F2FS_I_SB(inode));
2e5558f4
RK
167 if (err) {
168 iput(einode);
bdbc90fa 169 goto out_put;
6b8213d9 170 }
dbeacf02 171 f2fs_delete_entry(de, page, dir, einode);
6b8213d9
JK
172 iput(einode);
173 goto retry;
91246c21
CY
174 } else if (IS_ERR(page)) {
175 err = PTR_ERR(page);
176 } else {
4d57b86d 177 err = f2fs_add_dentry(dir, &fname, inode,
91246c21 178 inode->i_ino, inode->i_mode);
d624c96f 179 }
e8ea9b3d
JK
180 if (err == -ENOMEM)
181 goto retry;
2e5558f4
RK
182 goto out;
183
bdbc90fa 184out_put:
2e5558f4 185 f2fs_put_page(page, 0);
d624c96f 186out:
e7ba108a
SL
187 if (file_enc_name(inode))
188 name = "<encrypted>";
189 else
190 name = raw_inode->i_name;
dcbb4c10
JP
191 f2fs_notice(F2FS_I_SB(inode), "%s: ino = %x, name = %s, dir = %lx, err = %d",
192 __func__, ino_of_node(ipage), name,
193 IS_ERR(dir) ? 0 : dir->i_ino, err);
d624c96f
JK
194 return err;
195}
196
af033b2a
CY
197static int recover_quota_data(struct inode *inode, struct page *page)
198{
199 struct f2fs_inode *raw = F2FS_INODE(page);
200 struct iattr attr;
201 uid_t i_uid = le32_to_cpu(raw->i_uid);
202 gid_t i_gid = le32_to_cpu(raw->i_gid);
203 int err;
204
205 memset(&attr, 0, sizeof(attr));
206
207 attr.ia_uid = make_kuid(inode->i_sb->s_user_ns, i_uid);
208 attr.ia_gid = make_kgid(inode->i_sb->s_user_ns, i_gid);
209
210 if (!uid_eq(attr.ia_uid, inode->i_uid))
211 attr.ia_valid |= ATTR_UID;
212 if (!gid_eq(attr.ia_gid, inode->i_gid))
213 attr.ia_valid |= ATTR_GID;
214
215 if (!attr.ia_valid)
216 return 0;
217
218 err = dquot_transfer(inode, &attr);
219 if (err)
220 set_sbi_flag(F2FS_I_SB(inode), SBI_QUOTA_NEED_REPAIR);
221 return err;
222}
223
37a086f0
JK
224static void recover_inline_flags(struct inode *inode, struct f2fs_inode *ri)
225{
226 if (ri->i_inline & F2FS_PIN_FILE)
227 set_inode_flag(inode, FI_PIN_FILE);
228 else
229 clear_inode_flag(inode, FI_PIN_FILE);
230 if (ri->i_inline & F2FS_DATA_EXIST)
231 set_inode_flag(inode, FI_DATA_EXIST);
232 else
233 clear_inode_flag(inode, FI_DATA_EXIST);
37a086f0
JK
234}
235
af033b2a 236static int recover_inode(struct inode *inode, struct page *page)
d624c96f 237{
441ac5cb 238 struct f2fs_inode *raw = F2FS_INODE(page);
e7d55452 239 char *name;
af033b2a 240 int err;
441ac5cb
JK
241
242 inode->i_mode = le16_to_cpu(raw->i_mode);
af033b2a
CY
243
244 err = recover_quota_data(inode, page);
245 if (err)
246 return err;
247
dc4cd125
CY
248 i_uid_write(inode, le32_to_cpu(raw->i_uid));
249 i_gid_write(inode, le32_to_cpu(raw->i_gid));
f4474aa6
CY
250
251 if (raw->i_inline & F2FS_EXTRA_ATTR) {
7beb01f7 252 if (f2fs_sb_has_project_quota(F2FS_I_SB(inode)) &&
f4474aa6
CY
253 F2FS_FITS_IN_INODE(raw, le16_to_cpu(raw->i_extra_isize),
254 i_projid)) {
255 projid_t i_projid;
78130819 256 kprojid_t kprojid;
f4474aa6
CY
257
258 i_projid = (projid_t)le32_to_cpu(raw->i_projid);
78130819
CY
259 kprojid = make_kprojid(&init_user_ns, i_projid);
260
261 if (!projid_eq(kprojid, F2FS_I(inode)->i_projid)) {
262 err = f2fs_transfer_project_quota(inode,
263 kprojid);
264 if (err)
265 return err;
266 F2FS_I(inode)->i_projid = kprojid;
267 }
f4474aa6
CY
268 }
269 }
270
fc9581c8 271 f2fs_i_size_write(inode, le64_to_cpu(raw->i_size));
9f0552e0 272 inode->i_atime.tv_sec = le64_to_cpu(raw->i_atime);
441ac5cb
JK
273 inode->i_ctime.tv_sec = le64_to_cpu(raw->i_ctime);
274 inode->i_mtime.tv_sec = le64_to_cpu(raw->i_mtime);
9f0552e0 275 inode->i_atime.tv_nsec = le32_to_cpu(raw->i_atime_nsec);
441ac5cb
JK
276 inode->i_ctime.tv_nsec = le32_to_cpu(raw->i_ctime_nsec);
277 inode->i_mtime.tv_nsec = le32_to_cpu(raw->i_mtime_nsec);
f356fe0c 278
26787236 279 F2FS_I(inode)->i_advise = raw->i_advise;
19c73a69 280 F2FS_I(inode)->i_flags = le32_to_cpu(raw->i_flags);
0c093b59 281 f2fs_set_inode_flags(inode);
7de36cf3
CY
282 F2FS_I(inode)->i_gc_failures[GC_FAILURE_PIN] =
283 le16_to_cpu(raw->i_gc_failures);
26787236 284
37a086f0
JK
285 recover_inline_flags(inode, raw);
286
4a1728ca
CY
287 f2fs_mark_inode_dirty_sync(inode, true);
288
e7d55452
JK
289 if (file_enc_name(inode))
290 name = "<encrypted>";
291 else
292 name = F2FS_INODE(page)->i_name;
293
dcbb4c10
JP
294 f2fs_notice(F2FS_I_SB(inode), "recover_inode: ino = %x, name = %s, inline = %x",
295 ino_of_node(page), name, raw->i_inline);
af033b2a 296 return 0;
d624c96f
JK
297}
298
d40d30c5
JK
299static int find_fsync_dnodes(struct f2fs_sb_info *sbi, struct list_head *head,
300 bool check_only)
d624c96f 301{
d624c96f 302 struct curseg_info *curseg;
4c521f49 303 struct page *page = NULL;
d624c96f 304 block_t blkaddr;
fb0e72c8 305 unsigned int loop_cnt = 0;
82902c06
CY
306 unsigned int free_blocks = MAIN_SEGS(sbi) * sbi->blocks_per_seg -
307 valid_user_blocks(sbi);
d624c96f
JK
308 int err = 0;
309
310 /* get node pages in the current segment */
311 curseg = CURSEG_I(sbi, CURSEG_WARM_NODE);
695fd1ed 312 blkaddr = NEXT_FREE_BLKADDR(sbi, curseg);
d624c96f 313
d624c96f
JK
314 while (1) {
315 struct fsync_inode_entry *entry;
316
e1da7872 317 if (!f2fs_is_valid_blkaddr(sbi, blkaddr, META_POR))
4c521f49 318 return 0;
d624c96f 319
4d57b86d 320 page = f2fs_get_tmp_page(sbi, blkaddr);
7735730d
CY
321 if (IS_ERR(page)) {
322 err = PTR_ERR(page);
323 break;
324 }
393ff91f 325
98838579
CY
326 if (!is_recoverable_dnode(page)) {
327 f2fs_put_page(page, 1);
f356fe0c 328 break;
98838579 329 }
d624c96f
JK
330
331 if (!is_fsync_dnode(page))
332 goto next;
333
334 entry = get_fsync_inode(head, ino_of_node(page));
d47b8715 335 if (!entry) {
4b2414d0
CY
336 bool quota_inode = false;
337
d40d30c5
JK
338 if (!check_only &&
339 IS_INODE(page) && is_dent_dnode(page)) {
4d57b86d 340 err = f2fs_recover_inode_page(sbi, page);
98838579
CY
341 if (err) {
342 f2fs_put_page(page, 1);
f356fe0c 343 break;
98838579 344 }
4b2414d0 345 quota_inode = true;
d624c96f
JK
346 }
347
441ac5cb
JK
348 /*
349 * CP | dnode(F) | inode(DF)
350 * For this case, we should not give up now.
351 */
4b2414d0
CY
352 entry = add_fsync_inode(sbi, head, ino_of_node(page),
353 quota_inode);
f4702d61
JK
354 if (IS_ERR(entry)) {
355 err = PTR_ERR(entry);
8fbc418f
JK
356 if (err == -ENOENT) {
357 err = 0;
441ac5cb 358 goto next;
8fbc418f 359 }
98838579 360 f2fs_put_page(page, 1);
f356fe0c 361 break;
d624c96f 362 }
d624c96f 363 }
addbe45b
JK
364 entry->blkaddr = blkaddr;
365
608514de
JK
366 if (IS_INODE(page) && is_dent_dnode(page))
367 entry->last_dentry = blkaddr;
d624c96f 368next:
fb0e72c8
CY
369 /* sanity check in order to detect looped node chain */
370 if (++loop_cnt >= free_blocks ||
371 blkaddr == next_blkaddr_of_node(page)) {
dcbb4c10
JP
372 f2fs_notice(sbi, "%s: detect looped node chain, blkaddr:%u, next:%u",
373 __func__, blkaddr,
374 next_blkaddr_of_node(page));
98838579 375 f2fs_put_page(page, 1);
fb0e72c8
CY
376 err = -EINVAL;
377 break;
378 }
379
d624c96f
JK
380 /* check next segment */
381 blkaddr = next_blkaddr_of_node(page);
4c521f49 382 f2fs_put_page(page, 1);
635aee1f 383
4d57b86d 384 f2fs_ra_meta_pages_cond(sbi, blkaddr);
d624c96f 385 }
d624c96f
JK
386 return err;
387}
388
26b5a079 389static void destroy_fsync_dnodes(struct list_head *head, int drop)
d624c96f 390{
d8b79b2f
DC
391 struct fsync_inode_entry *entry, *tmp;
392
3f8ab270 393 list_for_each_entry_safe(entry, tmp, head, list)
26b5a079 394 del_fsync_inode(entry, drop);
d624c96f
JK
395}
396
39cf72cf 397static int check_index_in_prev_nodes(struct f2fs_sb_info *sbi,
b292dcab 398 block_t blkaddr, struct dnode_of_data *dn)
d624c96f
JK
399{
400 struct seg_entry *sentry;
401 unsigned int segno = GET_SEGNO(sbi, blkaddr);
491c0854 402 unsigned short blkoff = GET_BLKOFF_FROM_SEG0(sbi, blkaddr);
f6517cfc 403 struct f2fs_summary_block *sum_node;
d624c96f 404 struct f2fs_summary sum;
f6517cfc 405 struct page *sum_page, *node_page;
c9ef4810 406 struct dnode_of_data tdn = *dn;
b292dcab 407 nid_t ino, nid;
d624c96f 408 struct inode *inode;
de93653f 409 unsigned int offset;
d624c96f
JK
410 block_t bidx;
411 int i;
412
413 sentry = get_seg_entry(sbi, segno);
414 if (!f2fs_test_bit(blkoff, sentry->cur_valid_map))
39cf72cf 415 return 0;
d624c96f
JK
416
417 /* Get the previous summary */
125c9fb1 418 for (i = CURSEG_HOT_DATA; i <= CURSEG_COLD_DATA; i++) {
d624c96f
JK
419 struct curseg_info *curseg = CURSEG_I(sbi, i);
420 if (curseg->segno == segno) {
421 sum = curseg->sum_blk->entries[blkoff];
f6517cfc 422 goto got_it;
d624c96f
JK
423 }
424 }
d624c96f 425
4d57b86d 426 sum_page = f2fs_get_sum_page(sbi, segno);
edc55aaf
JK
427 if (IS_ERR(sum_page))
428 return PTR_ERR(sum_page);
f6517cfc
JK
429 sum_node = (struct f2fs_summary_block *)page_address(sum_page);
430 sum = sum_node->entries[blkoff];
431 f2fs_put_page(sum_page, 1);
432got_it:
b292dcab
JK
433 /* Use the locked dnode page and inode */
434 nid = le32_to_cpu(sum.nid);
435 if (dn->inode->i_ino == nid) {
b292dcab 436 tdn.nid = nid;
c9ef4810
JK
437 if (!dn->inode_page_locked)
438 lock_page(dn->inode_page);
b292dcab 439 tdn.node_page = dn->inode_page;
060dd67b 440 tdn.ofs_in_node = le16_to_cpu(sum.ofs_in_node);
c9ef4810 441 goto truncate_out;
b292dcab 442 } else if (dn->nid == nid) {
060dd67b 443 tdn.ofs_in_node = le16_to_cpu(sum.ofs_in_node);
c9ef4810 444 goto truncate_out;
b292dcab
JK
445 }
446
d624c96f 447 /* Get the node page */
4d57b86d 448 node_page = f2fs_get_node_page(sbi, nid);
39cf72cf
JK
449 if (IS_ERR(node_page))
450 return PTR_ERR(node_page);
de93653f
JK
451
452 offset = ofs_of_node(node_page);
d624c96f
JK
453 ino = ino_of_node(node_page);
454 f2fs_put_page(node_page, 1);
455
60979115 456 if (ino != dn->inode->i_ino) {
4b2414d0
CY
457 int ret;
458
60979115 459 /* Deallocate previous index in the node page */
e8ea9b3d 460 inode = f2fs_iget_retry(sbi->sb, ino);
60979115
JK
461 if (IS_ERR(inode))
462 return PTR_ERR(inode);
4b2414d0
CY
463
464 ret = dquot_initialize(inode);
465 if (ret) {
466 iput(inode);
467 return ret;
468 }
60979115
JK
469 } else {
470 inode = dn->inode;
471 }
06025f4d 472
4d57b86d
CY
473 bidx = f2fs_start_bidx_of_node(offset, inode) +
474 le16_to_cpu(sum.ofs_in_node);
de93653f 475
c9ef4810
JK
476 /*
477 * if inode page is locked, unlock temporarily, but its reference
478 * count keeps alive.
479 */
480 if (ino == dn->inode->i_ino && dn->inode_page_locked)
481 unlock_page(dn->inode_page);
482
483 set_new_dnode(&tdn, inode, NULL, NULL, 0);
4d57b86d 484 if (f2fs_get_dnode_of_data(&tdn, bidx, LOOKUP_NODE))
c9ef4810
JK
485 goto out;
486
487 if (tdn.data_blkaddr == blkaddr)
4d57b86d 488 f2fs_truncate_data_blocks_range(&tdn, 1);
c9ef4810
JK
489
490 f2fs_put_dnode(&tdn);
491out:
492 if (ino != dn->inode->i_ino)
60979115 493 iput(inode);
c9ef4810
JK
494 else if (dn->inode_page_locked)
495 lock_page(dn->inode_page);
496 return 0;
497
498truncate_out:
7a2af766
CY
499 if (datablock_addr(tdn.inode, tdn.node_page,
500 tdn.ofs_in_node) == blkaddr)
4d57b86d 501 f2fs_truncate_data_blocks_range(&tdn, 1);
c9ef4810
JK
502 if (dn->inode->i_ino == nid && !dn->inode_page_locked)
503 unlock_page(dn->inode_page);
39cf72cf 504 return 0;
d624c96f
JK
505}
506
6ead1142 507static int do_recover_data(struct f2fs_sb_info *sbi, struct inode *inode,
e17d488b 508 struct page *page)
d624c96f 509{
d624c96f 510 struct dnode_of_data dn;
d624c96f 511 struct node_info ni;
81ca7350 512 unsigned int start, end;
f356fe0c 513 int err = 0, recovered = 0;
d624c96f 514
1c35a90e
JK
515 /* step 1: recover xattr */
516 if (IS_INODE(page)) {
4d57b86d 517 f2fs_recover_inline_xattr(inode, page);
1c35a90e 518 } else if (f2fs_has_xattr_block(ofs_of_node(page))) {
4d57b86d 519 err = f2fs_recover_xattr_data(inode, page);
d260081c
CY
520 if (!err)
521 recovered++;
1e1bb4ba 522 goto out;
1c35a90e 523 }
1e1bb4ba 524
1c35a90e 525 /* step 2: recover inline data */
4d57b86d 526 if (f2fs_recover_inline_data(inode, page))
abb2366c
JK
527 goto out;
528
1c35a90e 529 /* step 3: recover data indices */
4d57b86d 530 start = f2fs_start_bidx_of_node(ofs_of_node(page), inode);
81ca7350 531 end = start + ADDRS_PER_PAGE(page, inode);
d624c96f
JK
532
533 set_new_dnode(&dn, inode, NULL, NULL, 0);
e8ea9b3d 534retry_dn:
4d57b86d 535 err = f2fs_get_dnode_of_data(&dn, start, ALLOC_NODE);
e8ea9b3d
JK
536 if (err) {
537 if (err == -ENOMEM) {
538 congestion_wait(BLK_RW_ASYNC, HZ/50);
539 goto retry_dn;
540 }
1e1bb4ba 541 goto out;
e8ea9b3d 542 }
d624c96f 543
bae0ee7a 544 f2fs_wait_on_page_writeback(dn.node_page, NODE, true, true);
d624c96f 545
7735730d
CY
546 err = f2fs_get_node_info(sbi, dn.nid, &ni);
547 if (err)
548 goto err;
549
9850cf4a 550 f2fs_bug_on(sbi, ni.ino != ino_of_node(page));
22d61e28
CY
551
552 if (ofs_of_node(dn.node_page) != ofs_of_node(page)) {
dcbb4c10
JP
553 f2fs_warn(sbi, "Inconsistent ofs_of_node, ino:%lu, ofs:%u, %u",
554 inode->i_ino, ofs_of_node(dn.node_page),
555 ofs_of_node(page));
10f966bb 556 err = -EFSCORRUPTED;
22d61e28
CY
557 goto err;
558 }
d624c96f 559
12a8343e 560 for (; start < end; start++, dn.ofs_in_node++) {
d624c96f
JK
561 block_t src, dest;
562
7a2af766
CY
563 src = datablock_addr(dn.inode, dn.node_page, dn.ofs_in_node);
564 dest = datablock_addr(dn.inode, page, dn.ofs_in_node);
d624c96f 565
93770ab7
CY
566 if (__is_valid_data_blkaddr(src) &&
567 !f2fs_is_valid_blkaddr(sbi, src, META_POR)) {
10f966bb 568 err = -EFSCORRUPTED;
93770ab7
CY
569 goto err;
570 }
571
572 if (__is_valid_data_blkaddr(dest) &&
573 !f2fs_is_valid_blkaddr(sbi, dest, META_POR)) {
10f966bb 574 err = -EFSCORRUPTED;
93770ab7
CY
575 goto err;
576 }
577
12a8343e
CY
578 /* skip recovering if dest is the same as src */
579 if (src == dest)
580 continue;
581
582 /* dest is invalid, just invalidate src block */
583 if (dest == NULL_ADDR) {
4d57b86d 584 f2fs_truncate_data_blocks_range(&dn, 1);
12a8343e
CY
585 continue;
586 }
587
26787236 588 if (!file_keep_isize(inode) &&
dba79f38
CY
589 (i_size_read(inode) <= ((loff_t)start << PAGE_SHIFT)))
590 f2fs_i_size_write(inode,
591 (loff_t)(start + 1) << PAGE_SHIFT);
26de9b11 592
12a8343e
CY
593 /*
594 * dest is reserved block, invalidate src block
595 * and then reserve one new block in dnode page.
596 */
597 if (dest == NEW_ADDR) {
4d57b86d
CY
598 f2fs_truncate_data_blocks_range(&dn, 1);
599 f2fs_reserve_new_block(&dn);
12a8343e
CY
600 continue;
601 }
602
603 /* dest is valid block, try to recover from src to dest */
e1da7872 604 if (f2fs_is_valid_blkaddr(sbi, dest, META_POR)) {
e03b07d9 605
d624c96f 606 if (src == NULL_ADDR) {
4d57b86d 607 err = f2fs_reserve_new_block(&dn);
7fa750a1
AB
608 while (err &&
609 IS_ENABLED(CONFIG_F2FS_FAULT_INJECTION))
4d57b86d 610 err = f2fs_reserve_new_block(&dn);
d624c96f 611 /* We should not get -ENOSPC */
9850cf4a 612 f2fs_bug_on(sbi, err);
6f3ec995
JK
613 if (err)
614 goto err;
d624c96f 615 }
e8ea9b3d 616retry_prev:
d624c96f 617 /* Check the previous node page having this index */
39cf72cf 618 err = check_index_in_prev_nodes(sbi, dest, &dn);
e8ea9b3d
JK
619 if (err) {
620 if (err == -ENOMEM) {
621 congestion_wait(BLK_RW_ASYNC, HZ/50);
622 goto retry_prev;
623 }
39cf72cf 624 goto err;
e8ea9b3d 625 }
d624c96f 626
d624c96f 627 /* write dummy data page */
528e3459 628 f2fs_replace_block(sbi, &dn, src, dest,
28bc106b 629 ni.version, false, false);
f356fe0c 630 recovered++;
d624c96f 631 }
d624c96f
JK
632 }
633
d624c96f
JK
634 copy_node_footer(dn.node_page, page);
635 fill_node_footer(dn.node_page, dn.nid, ni.ino,
636 ofs_of_node(page), false);
637 set_page_dirty(dn.node_page);
39cf72cf 638err:
d624c96f 639 f2fs_put_dnode(&dn);
1e1bb4ba 640out:
dcbb4c10
JP
641 f2fs_notice(sbi, "recover_data: ino = %lx (i_size: %s) recovered = %d, err = %d",
642 inode->i_ino, file_keep_isize(inode) ? "keep" : "recover",
643 recovered, err);
39cf72cf 644 return err;
d624c96f
JK
645}
646
f61cce5b 647static int recover_data(struct f2fs_sb_info *sbi, struct list_head *inode_list,
26b5a079 648 struct list_head *tmp_inode_list, struct list_head *dir_list)
d624c96f 649{
d624c96f 650 struct curseg_info *curseg;
4c521f49 651 struct page *page = NULL;
6ead1142 652 int err = 0;
d624c96f
JK
653 block_t blkaddr;
654
655 /* get node pages in the current segment */
b7973f23 656 curseg = CURSEG_I(sbi, CURSEG_WARM_NODE);
d624c96f
JK
657 blkaddr = NEXT_FREE_BLKADDR(sbi, curseg);
658
d624c96f
JK
659 while (1) {
660 struct fsync_inode_entry *entry;
661
e1da7872 662 if (!f2fs_is_valid_blkaddr(sbi, blkaddr, META_POR))
4c521f49 663 break;
d624c96f 664
4d57b86d 665 f2fs_ra_meta_pages_cond(sbi, blkaddr);
635aee1f 666
4d57b86d 667 page = f2fs_get_tmp_page(sbi, blkaddr);
7735730d
CY
668 if (IS_ERR(page)) {
669 err = PTR_ERR(page);
670 break;
671 }
393ff91f 672
a468f0ef 673 if (!is_recoverable_dnode(page)) {
4c521f49 674 f2fs_put_page(page, 1);
45856aff 675 break;
4c521f49 676 }
d624c96f 677
f61cce5b 678 entry = get_fsync_inode(inode_list, ino_of_node(page));
d624c96f
JK
679 if (!entry)
680 goto next;
441ac5cb
JK
681 /*
682 * inode(x) | CP | inode(x) | dnode(F)
683 * In this case, we can lose the latest inode(x).
c52e1b10 684 * So, call recover_inode for the inode update.
441ac5cb 685 */
af033b2a
CY
686 if (IS_INODE(page)) {
687 err = recover_inode(entry->inode, page);
98838579
CY
688 if (err) {
689 f2fs_put_page(page, 1);
af033b2a 690 break;
98838579 691 }
af033b2a 692 }
c52e1b10 693 if (entry->last_dentry == blkaddr) {
f61cce5b 694 err = recover_dentry(entry->inode, page, dir_list);
c52e1b10
JK
695 if (err) {
696 f2fs_put_page(page, 1);
697 break;
698 }
699 }
e17d488b 700 err = do_recover_data(sbi, entry->inode, page);
4c521f49
JK
701 if (err) {
702 f2fs_put_page(page, 1);
45856aff 703 break;
4c521f49 704 }
d624c96f 705
3f8ab270 706 if (entry->blkaddr == blkaddr)
26b5a079 707 list_move_tail(&entry->list, tmp_inode_list);
d624c96f
JK
708next:
709 /* check next segment */
710 blkaddr = next_blkaddr_of_node(page);
4c521f49 711 f2fs_put_page(page, 1);
d624c96f 712 }
6ead1142 713 if (!err)
4d57b86d 714 f2fs_allocate_new_segments(sbi);
6ead1142 715 return err;
d624c96f
JK
716}
717
4d57b86d 718int f2fs_recover_fsync_data(struct f2fs_sb_info *sbi, bool check_only)
d624c96f 719{
26b5a079 720 struct list_head inode_list, tmp_inode_list;
f61cce5b 721 struct list_head dir_list;
6ead1142 722 int err;
6781eabb 723 int ret = 0;
4b2414d0 724 unsigned long s_flags = sbi->sb->s_flags;
aabe5136 725 bool need_writecp = false;
ea676733
JK
726#ifdef CONFIG_QUOTA
727 int quota_enabled;
728#endif
d624c96f 729
1751e8a6 730 if (s_flags & SB_RDONLY) {
dcbb4c10 731 f2fs_info(sbi, "recover fsync data on readonly fs");
1751e8a6 732 sbi->sb->s_flags &= ~SB_RDONLY;
4b2414d0
CY
733 }
734
735#ifdef CONFIG_QUOTA
736 /* Needed for iput() to work correctly and not trash data */
1751e8a6 737 sbi->sb->s_flags |= SB_ACTIVE;
4b2414d0 738 /* Turn on quotas so that they are updated correctly */
1751e8a6 739 quota_enabled = f2fs_enable_quota_files(sbi, s_flags & SB_RDONLY);
4b2414d0
CY
740#endif
741
d624c96f 742 fsync_entry_slab = f2fs_kmem_cache_create("f2fs_fsync_inode_entry",
e8512d2e 743 sizeof(struct fsync_inode_entry));
4b2414d0
CY
744 if (!fsync_entry_slab) {
745 err = -ENOMEM;
746 goto out;
747 }
d624c96f
JK
748
749 INIT_LIST_HEAD(&inode_list);
26b5a079 750 INIT_LIST_HEAD(&tmp_inode_list);
f61cce5b 751 INIT_LIST_HEAD(&dir_list);
d624c96f 752
14f4e690
JK
753 /* prevent checkpoint */
754 mutex_lock(&sbi->cp_mutex);
755
315df839 756 /* step #1: find fsynced inode numbers */
d40d30c5 757 err = find_fsync_dnodes(sbi, &inode_list, check_only);
6781eabb 758 if (err || list_empty(&inode_list))
4b2414d0 759 goto skip;
d624c96f 760
6781eabb
JK
761 if (check_only) {
762 ret = 1;
4b2414d0 763 goto skip;
6781eabb 764 }
d624c96f 765
aabe5136 766 need_writecp = true;
691c6fd2 767
d624c96f 768 /* step #2: recover data */
26b5a079 769 err = recover_data(sbi, &inode_list, &tmp_inode_list, &dir_list);
b307384e 770 if (!err)
9850cf4a 771 f2fs_bug_on(sbi, !list_empty(&inode_list));
26b5a079
SY
772 else {
773 /* restore s_flags to let iput() trash data */
774 sbi->sb->s_flags = s_flags;
775 }
4b2414d0 776skip:
26b5a079
SY
777 destroy_fsync_dnodes(&inode_list, err);
778 destroy_fsync_dnodes(&tmp_inode_list, err);
cf2271e7 779
4c521f49
JK
780 /* truncate meta pages to be used by the recovery */
781 truncate_inode_pages_range(META_MAPPING(sbi),
09cbfeaf 782 (loff_t)MAIN_BLKADDR(sbi) << PAGE_SHIFT, -1);
4c521f49 783
cf2271e7
JK
784 if (err) {
785 truncate_inode_pages_final(NODE_MAPPING(sbi));
786 truncate_inode_pages_final(META_MAPPING(sbi));
26b5a079
SY
787 } else {
788 clear_sbi_flag(sbi, SBI_POR_DOING);
cf2271e7 789 }
a468f0ef
JK
790 mutex_unlock(&sbi->cp_mutex);
791
9e1e6df4 792 /* let's drop all the directory inodes for clean checkpoint */
26b5a079 793 destroy_fsync_dnodes(&dir_list, err);
9e1e6df4 794
1378752b
CY
795 if (need_writecp) {
796 set_sbi_flag(sbi, SBI_IS_RECOVERED);
797
798 if (!err) {
799 struct cp_control cpc = {
800 .reason = CP_RECOVERY,
801 };
802 err = f2fs_write_checkpoint(sbi, &cpc);
803 }
cf2271e7 804 }
f61cce5b 805
f61cce5b 806 kmem_cache_destroy(fsync_entry_slab);
4b2414d0
CY
807out:
808#ifdef CONFIG_QUOTA
809 /* Turn quotas off */
ea676733
JK
810 if (quota_enabled)
811 f2fs_quota_off_umount(sbi->sb);
4b2414d0 812#endif
1751e8a6 813 sbi->sb->s_flags = s_flags; /* Restore SB_RDONLY status */
4b2414d0 814
6781eabb 815 return ret ? ret: err;
d624c96f 816}