]>
Commit | Line | Data |
---|---|---|
0a8165d7 | 1 | /* |
d624c96f JK |
2 | * fs/f2fs/recovery.c |
3 | * | |
4 | * Copyright (c) 2012 Samsung Electronics Co., Ltd. | |
5 | * http://www.samsung.com/ | |
6 | * | |
7 | * This program is free software; you can redistribute it and/or modify | |
8 | * it under the terms of the GNU General Public License version 2 as | |
9 | * published by the Free Software Foundation. | |
10 | */ | |
11 | #include <linux/fs.h> | |
12 | #include <linux/f2fs_fs.h> | |
13 | #include "f2fs.h" | |
14 | #include "node.h" | |
15 | #include "segment.h" | |
16 | ||
441ac5cb JK |
17 | /* |
18 | * Roll forward recovery scenarios. | |
19 | * | |
20 | * [Term] F: fsync_mark, D: dentry_mark | |
21 | * | |
22 | * 1. inode(x) | CP | inode(x) | dnode(F) | |
23 | * -> Update the latest inode(x). | |
24 | * | |
25 | * 2. inode(x) | CP | inode(F) | dnode(F) | |
26 | * -> No problem. | |
27 | * | |
28 | * 3. inode(x) | CP | dnode(F) | inode(x) | |
29 | * -> Recover to the latest dnode(F), and drop the last inode(x) | |
30 | * | |
31 | * 4. inode(x) | CP | dnode(F) | inode(F) | |
32 | * -> No problem. | |
33 | * | |
34 | * 5. CP | inode(x) | dnode(F) | |
35 | * -> The inode(DF) was missing. Should drop this dnode(F). | |
36 | * | |
37 | * 6. CP | inode(DF) | dnode(F) | |
38 | * -> No problem. | |
39 | * | |
40 | * 7. CP | dnode(F) | inode(DF) | |
41 | * -> If f2fs_iget fails, then goto next to find inode(DF). | |
42 | * | |
43 | * 8. CP | dnode(F) | inode(x) | |
44 | * -> If f2fs_iget fails, then goto next to find inode(DF). | |
45 | * But it will fail due to no inode(DF). | |
46 | */ | |
47 | ||
d624c96f JK |
48 | static struct kmem_cache *fsync_entry_slab; |
49 | ||
50 | bool space_for_roll_forward(struct f2fs_sb_info *sbi) | |
51 | { | |
41382ec4 JK |
52 | s64 nalloc = percpu_counter_sum_positive(&sbi->alloc_valid_block_count); |
53 | ||
54 | if (sbi->last_valid_block_count + nalloc > sbi->user_block_count) | |
d624c96f JK |
55 | return false; |
56 | return true; | |
57 | } | |
58 | ||
59 | static struct fsync_inode_entry *get_fsync_inode(struct list_head *head, | |
60 | nid_t ino) | |
61 | { | |
d624c96f JK |
62 | struct fsync_inode_entry *entry; |
63 | ||
2d7b822a | 64 | list_for_each_entry(entry, head, list) |
d624c96f JK |
65 | if (entry->inode->i_ino == ino) |
66 | return entry; | |
2d7b822a | 67 | |
d624c96f JK |
68 | return NULL; |
69 | } | |
70 | ||
f4702d61 JK |
71 | static struct fsync_inode_entry *add_fsync_inode(struct f2fs_sb_info *sbi, |
72 | struct list_head *head, nid_t ino) | |
3f8ab270 | 73 | { |
e8ea9b3d | 74 | struct inode *inode; |
3f8ab270 CY |
75 | struct fsync_inode_entry *entry; |
76 | ||
e8ea9b3d | 77 | inode = f2fs_iget_retry(sbi->sb, ino); |
f4702d61 JK |
78 | if (IS_ERR(inode)) |
79 | return ERR_CAST(inode); | |
80 | ||
e8ea9b3d | 81 | entry = f2fs_kmem_cache_alloc(fsync_entry_slab, GFP_F2FS_ZERO); |
3f8ab270 CY |
82 | entry->inode = inode; |
83 | list_add_tail(&entry->list, head); | |
84 | ||
85 | return entry; | |
86 | } | |
87 | ||
88 | static void del_fsync_inode(struct fsync_inode_entry *entry) | |
89 | { | |
90 | iput(entry->inode); | |
91 | list_del(&entry->list); | |
92 | kmem_cache_free(fsync_entry_slab, entry); | |
93 | } | |
94 | ||
f61cce5b CY |
95 | static int recover_dentry(struct inode *inode, struct page *ipage, |
96 | struct list_head *dir_list) | |
d624c96f | 97 | { |
58bfaf44 | 98 | struct f2fs_inode *raw_inode = F2FS_INODE(ipage); |
74d0b917 | 99 | nid_t pino = le32_to_cpu(raw_inode->i_pino); |
6b8213d9 | 100 | struct f2fs_dir_entry *de; |
e7ba108a | 101 | struct fscrypt_name fname; |
d624c96f | 102 | struct page *page; |
6b8213d9 | 103 | struct inode *dir, *einode; |
f61cce5b | 104 | struct fsync_inode_entry *entry; |
d624c96f | 105 | int err = 0; |
e7ba108a | 106 | char *name; |
d624c96f | 107 | |
f61cce5b CY |
108 | entry = get_fsync_inode(dir_list, pino); |
109 | if (!entry) { | |
f4702d61 JK |
110 | entry = add_fsync_inode(F2FS_I_SB(inode), dir_list, pino); |
111 | if (IS_ERR(entry)) { | |
112 | dir = ERR_CAST(entry); | |
113 | err = PTR_ERR(entry); | |
f61cce5b CY |
114 | goto out; |
115 | } | |
ed57c27f JK |
116 | } |
117 | ||
f61cce5b CY |
118 | dir = entry->inode; |
119 | ||
e7ba108a SL |
120 | memset(&fname, 0, sizeof(struct fscrypt_name)); |
121 | fname.disk_name.len = le32_to_cpu(raw_inode->i_namelen); | |
122 | fname.disk_name.name = raw_inode->i_name; | |
d96b1431 | 123 | |
e7ba108a | 124 | if (unlikely(fname.disk_name.len > F2FS_NAME_LEN)) { |
d96b1431 CY |
125 | WARN_ON(1); |
126 | err = -ENAMETOOLONG; | |
f61cce5b | 127 | goto out; |
d96b1431 | 128 | } |
6b8213d9 | 129 | retry: |
e7ba108a | 130 | de = __f2fs_find_entry(dir, &fname, &page); |
418f6c27 | 131 | if (de && inode->i_ino == le32_to_cpu(de->ino)) |
2e5558f4 | 132 | goto out_unmap_put; |
418f6c27 | 133 | |
6b8213d9 | 134 | if (de) { |
e8ea9b3d | 135 | einode = f2fs_iget_retry(inode->i_sb, le32_to_cpu(de->ino)); |
6b8213d9 JK |
136 | if (IS_ERR(einode)) { |
137 | WARN_ON(1); | |
5c1f9927 CY |
138 | err = PTR_ERR(einode); |
139 | if (err == -ENOENT) | |
6b8213d9 | 140 | err = -EEXIST; |
2e5558f4 RK |
141 | goto out_unmap_put; |
142 | } | |
4081363f | 143 | err = acquire_orphan_inode(F2FS_I_SB(inode)); |
2e5558f4 RK |
144 | if (err) { |
145 | iput(einode); | |
146 | goto out_unmap_put; | |
6b8213d9 | 147 | } |
dbeacf02 | 148 | f2fs_delete_entry(de, page, dir, einode); |
6b8213d9 JK |
149 | iput(einode); |
150 | goto retry; | |
91246c21 CY |
151 | } else if (IS_ERR(page)) { |
152 | err = PTR_ERR(page); | |
153 | } else { | |
e7ba108a | 154 | err = __f2fs_do_add_link(dir, &fname, inode, |
91246c21 | 155 | inode->i_ino, inode->i_mode); |
d624c96f | 156 | } |
e8ea9b3d JK |
157 | if (err == -ENOMEM) |
158 | goto retry; | |
2e5558f4 RK |
159 | goto out; |
160 | ||
161 | out_unmap_put: | |
9486ba44 | 162 | f2fs_dentry_kunmap(dir, page); |
2e5558f4 | 163 | f2fs_put_page(page, 0); |
d624c96f | 164 | out: |
e7ba108a SL |
165 | if (file_enc_name(inode)) |
166 | name = "<encrypted>"; | |
167 | else | |
168 | name = raw_inode->i_name; | |
6c311ec6 CF |
169 | f2fs_msg(inode->i_sb, KERN_NOTICE, |
170 | "%s: ino = %x, name = %s, dir = %lx, err = %d", | |
e7ba108a | 171 | __func__, ino_of_node(ipage), name, |
f28c06fa | 172 | IS_ERR(dir) ? 0 : dir->i_ino, err); |
d624c96f JK |
173 | return err; |
174 | } | |
175 | ||
c52e1b10 | 176 | static void recover_inode(struct inode *inode, struct page *page) |
d624c96f | 177 | { |
441ac5cb | 178 | struct f2fs_inode *raw = F2FS_INODE(page); |
e7d55452 | 179 | char *name; |
441ac5cb JK |
180 | |
181 | inode->i_mode = le16_to_cpu(raw->i_mode); | |
fc9581c8 | 182 | f2fs_i_size_write(inode, le64_to_cpu(raw->i_size)); |
441ac5cb JK |
183 | inode->i_atime.tv_sec = le64_to_cpu(raw->i_mtime); |
184 | inode->i_ctime.tv_sec = le64_to_cpu(raw->i_ctime); | |
185 | inode->i_mtime.tv_sec = le64_to_cpu(raw->i_mtime); | |
186 | inode->i_atime.tv_nsec = le32_to_cpu(raw->i_mtime_nsec); | |
187 | inode->i_ctime.tv_nsec = le32_to_cpu(raw->i_ctime_nsec); | |
188 | inode->i_mtime.tv_nsec = le32_to_cpu(raw->i_mtime_nsec); | |
f356fe0c | 189 | |
e7d55452 JK |
190 | if (file_enc_name(inode)) |
191 | name = "<encrypted>"; | |
192 | else | |
193 | name = F2FS_INODE(page)->i_name; | |
194 | ||
f356fe0c | 195 | f2fs_msg(inode->i_sb, KERN_NOTICE, "recover_inode: ino = %x, name = %s", |
e7d55452 | 196 | ino_of_node(page), name); |
d624c96f JK |
197 | } |
198 | ||
807b1e1c JK |
199 | static bool is_same_inode(struct inode *inode, struct page *ipage) |
200 | { | |
201 | struct f2fs_inode *ri = F2FS_INODE(ipage); | |
202 | struct timespec disk; | |
203 | ||
204 | if (!IS_INODE(ipage)) | |
205 | return true; | |
206 | ||
207 | disk.tv_sec = le64_to_cpu(ri->i_ctime); | |
208 | disk.tv_nsec = le32_to_cpu(ri->i_ctime_nsec); | |
209 | if (timespec_compare(&inode->i_ctime, &disk) > 0) | |
210 | return false; | |
211 | ||
212 | disk.tv_sec = le64_to_cpu(ri->i_atime); | |
213 | disk.tv_nsec = le32_to_cpu(ri->i_atime_nsec); | |
214 | if (timespec_compare(&inode->i_atime, &disk) > 0) | |
215 | return false; | |
216 | ||
217 | disk.tv_sec = le64_to_cpu(ri->i_mtime); | |
218 | disk.tv_nsec = le32_to_cpu(ri->i_mtime_nsec); | |
219 | if (timespec_compare(&inode->i_mtime, &disk) > 0) | |
220 | return false; | |
221 | ||
222 | return true; | |
223 | } | |
224 | ||
d624c96f JK |
225 | static int find_fsync_dnodes(struct f2fs_sb_info *sbi, struct list_head *head) |
226 | { | |
d71b5564 | 227 | unsigned long long cp_ver = cur_cp_version(F2FS_CKPT(sbi)); |
d624c96f | 228 | struct curseg_info *curseg; |
4c521f49 | 229 | struct page *page = NULL; |
d624c96f JK |
230 | block_t blkaddr; |
231 | int err = 0; | |
232 | ||
233 | /* get node pages in the current segment */ | |
234 | curseg = CURSEG_I(sbi, CURSEG_WARM_NODE); | |
695fd1ed | 235 | blkaddr = NEXT_FREE_BLKADDR(sbi, curseg); |
d624c96f | 236 | |
d624c96f JK |
237 | while (1) { |
238 | struct fsync_inode_entry *entry; | |
239 | ||
f0c9cada | 240 | if (!is_valid_blkaddr(sbi, blkaddr, META_POR)) |
4c521f49 | 241 | return 0; |
d624c96f | 242 | |
2b947003 | 243 | page = get_tmp_page(sbi, blkaddr); |
393ff91f | 244 | |
6ead1142 | 245 | if (cp_ver != cpver_of_node(page)) |
f356fe0c | 246 | break; |
d624c96f JK |
247 | |
248 | if (!is_fsync_dnode(page)) | |
249 | goto next; | |
250 | ||
251 | entry = get_fsync_inode(head, ino_of_node(page)); | |
807b1e1c JK |
252 | if (entry) { |
253 | if (!is_same_inode(entry->inode, page)) | |
254 | goto next; | |
255 | } else { | |
d624c96f | 256 | if (IS_INODE(page) && is_dent_dnode(page)) { |
6ead1142 JK |
257 | err = recover_inode_page(sbi, page); |
258 | if (err) | |
f356fe0c | 259 | break; |
d624c96f JK |
260 | } |
261 | ||
441ac5cb JK |
262 | /* |
263 | * CP | dnode(F) | inode(DF) | |
264 | * For this case, we should not give up now. | |
265 | */ | |
f4702d61 JK |
266 | entry = add_fsync_inode(sbi, head, ino_of_node(page)); |
267 | if (IS_ERR(entry)) { | |
268 | err = PTR_ERR(entry); | |
8fbc418f JK |
269 | if (err == -ENOENT) { |
270 | err = 0; | |
441ac5cb | 271 | goto next; |
8fbc418f | 272 | } |
f356fe0c | 273 | break; |
d624c96f | 274 | } |
d624c96f | 275 | } |
addbe45b JK |
276 | entry->blkaddr = blkaddr; |
277 | ||
608514de JK |
278 | if (IS_INODE(page) && is_dent_dnode(page)) |
279 | entry->last_dentry = blkaddr; | |
d624c96f JK |
280 | next: |
281 | /* check next segment */ | |
282 | blkaddr = next_blkaddr_of_node(page); | |
4c521f49 | 283 | f2fs_put_page(page, 1); |
635aee1f CY |
284 | |
285 | ra_meta_pages_cond(sbi, blkaddr); | |
d624c96f | 286 | } |
4c521f49 | 287 | f2fs_put_page(page, 1); |
d624c96f JK |
288 | return err; |
289 | } | |
290 | ||
5ebefc5b | 291 | static void destroy_fsync_dnodes(struct list_head *head) |
d624c96f | 292 | { |
d8b79b2f DC |
293 | struct fsync_inode_entry *entry, *tmp; |
294 | ||
3f8ab270 CY |
295 | list_for_each_entry_safe(entry, tmp, head, list) |
296 | del_fsync_inode(entry); | |
d624c96f JK |
297 | } |
298 | ||
39cf72cf | 299 | static int check_index_in_prev_nodes(struct f2fs_sb_info *sbi, |
b292dcab | 300 | block_t blkaddr, struct dnode_of_data *dn) |
d624c96f JK |
301 | { |
302 | struct seg_entry *sentry; | |
303 | unsigned int segno = GET_SEGNO(sbi, blkaddr); | |
491c0854 | 304 | unsigned short blkoff = GET_BLKOFF_FROM_SEG0(sbi, blkaddr); |
f6517cfc | 305 | struct f2fs_summary_block *sum_node; |
d624c96f | 306 | struct f2fs_summary sum; |
f6517cfc | 307 | struct page *sum_page, *node_page; |
c9ef4810 | 308 | struct dnode_of_data tdn = *dn; |
b292dcab | 309 | nid_t ino, nid; |
d624c96f | 310 | struct inode *inode; |
de93653f | 311 | unsigned int offset; |
d624c96f JK |
312 | block_t bidx; |
313 | int i; | |
314 | ||
315 | sentry = get_seg_entry(sbi, segno); | |
316 | if (!f2fs_test_bit(blkoff, sentry->cur_valid_map)) | |
39cf72cf | 317 | return 0; |
d624c96f JK |
318 | |
319 | /* Get the previous summary */ | |
320 | for (i = CURSEG_WARM_DATA; i <= CURSEG_COLD_DATA; i++) { | |
321 | struct curseg_info *curseg = CURSEG_I(sbi, i); | |
322 | if (curseg->segno == segno) { | |
323 | sum = curseg->sum_blk->entries[blkoff]; | |
f6517cfc | 324 | goto got_it; |
d624c96f JK |
325 | } |
326 | } | |
d624c96f | 327 | |
f6517cfc JK |
328 | sum_page = get_sum_page(sbi, segno); |
329 | sum_node = (struct f2fs_summary_block *)page_address(sum_page); | |
330 | sum = sum_node->entries[blkoff]; | |
331 | f2fs_put_page(sum_page, 1); | |
332 | got_it: | |
b292dcab JK |
333 | /* Use the locked dnode page and inode */ |
334 | nid = le32_to_cpu(sum.nid); | |
335 | if (dn->inode->i_ino == nid) { | |
b292dcab | 336 | tdn.nid = nid; |
c9ef4810 JK |
337 | if (!dn->inode_page_locked) |
338 | lock_page(dn->inode_page); | |
b292dcab | 339 | tdn.node_page = dn->inode_page; |
060dd67b | 340 | tdn.ofs_in_node = le16_to_cpu(sum.ofs_in_node); |
c9ef4810 | 341 | goto truncate_out; |
b292dcab | 342 | } else if (dn->nid == nid) { |
060dd67b | 343 | tdn.ofs_in_node = le16_to_cpu(sum.ofs_in_node); |
c9ef4810 | 344 | goto truncate_out; |
b292dcab JK |
345 | } |
346 | ||
d624c96f | 347 | /* Get the node page */ |
b292dcab | 348 | node_page = get_node_page(sbi, nid); |
39cf72cf JK |
349 | if (IS_ERR(node_page)) |
350 | return PTR_ERR(node_page); | |
de93653f JK |
351 | |
352 | offset = ofs_of_node(node_page); | |
d624c96f JK |
353 | ino = ino_of_node(node_page); |
354 | f2fs_put_page(node_page, 1); | |
355 | ||
60979115 JK |
356 | if (ino != dn->inode->i_ino) { |
357 | /* Deallocate previous index in the node page */ | |
e8ea9b3d | 358 | inode = f2fs_iget_retry(sbi->sb, ino); |
60979115 JK |
359 | if (IS_ERR(inode)) |
360 | return PTR_ERR(inode); | |
361 | } else { | |
362 | inode = dn->inode; | |
363 | } | |
06025f4d | 364 | |
81ca7350 | 365 | bidx = start_bidx_of_node(offset, inode) + le16_to_cpu(sum.ofs_in_node); |
de93653f | 366 | |
c9ef4810 JK |
367 | /* |
368 | * if inode page is locked, unlock temporarily, but its reference | |
369 | * count keeps alive. | |
370 | */ | |
371 | if (ino == dn->inode->i_ino && dn->inode_page_locked) | |
372 | unlock_page(dn->inode_page); | |
373 | ||
374 | set_new_dnode(&tdn, inode, NULL, NULL, 0); | |
375 | if (get_dnode_of_data(&tdn, bidx, LOOKUP_NODE)) | |
376 | goto out; | |
377 | ||
378 | if (tdn.data_blkaddr == blkaddr) | |
379 | truncate_data_blocks_range(&tdn, 1); | |
380 | ||
381 | f2fs_put_dnode(&tdn); | |
382 | out: | |
383 | if (ino != dn->inode->i_ino) | |
60979115 | 384 | iput(inode); |
c9ef4810 JK |
385 | else if (dn->inode_page_locked) |
386 | lock_page(dn->inode_page); | |
387 | return 0; | |
388 | ||
389 | truncate_out: | |
390 | if (datablock_addr(tdn.node_page, tdn.ofs_in_node) == blkaddr) | |
391 | truncate_data_blocks_range(&tdn, 1); | |
392 | if (dn->inode->i_ino == nid && !dn->inode_page_locked) | |
393 | unlock_page(dn->inode_page); | |
39cf72cf | 394 | return 0; |
d624c96f JK |
395 | } |
396 | ||
6ead1142 | 397 | static int do_recover_data(struct f2fs_sb_info *sbi, struct inode *inode, |
d624c96f JK |
398 | struct page *page, block_t blkaddr) |
399 | { | |
d624c96f | 400 | struct dnode_of_data dn; |
d624c96f | 401 | struct node_info ni; |
81ca7350 | 402 | unsigned int start, end; |
f356fe0c | 403 | int err = 0, recovered = 0; |
d624c96f | 404 | |
1c35a90e JK |
405 | /* step 1: recover xattr */ |
406 | if (IS_INODE(page)) { | |
407 | recover_inline_xattr(inode, page); | |
408 | } else if (f2fs_has_xattr_block(ofs_of_node(page))) { | |
bc4a1f87 JK |
409 | /* |
410 | * Deprecated; xattr blocks should be found from cold log. | |
411 | * But, we should remain this for backward compatibility. | |
412 | */ | |
1c35a90e | 413 | recover_xattr_data(inode, page, blkaddr); |
1e1bb4ba | 414 | goto out; |
1c35a90e | 415 | } |
1e1bb4ba | 416 | |
1c35a90e JK |
417 | /* step 2: recover inline data */ |
418 | if (recover_inline_data(inode, page)) | |
abb2366c JK |
419 | goto out; |
420 | ||
1c35a90e | 421 | /* step 3: recover data indices */ |
81ca7350 CY |
422 | start = start_bidx_of_node(ofs_of_node(page), inode); |
423 | end = start + ADDRS_PER_PAGE(page, inode); | |
d624c96f JK |
424 | |
425 | set_new_dnode(&dn, inode, NULL, NULL, 0); | |
e8ea9b3d | 426 | retry_dn: |
6ead1142 | 427 | err = get_dnode_of_data(&dn, start, ALLOC_NODE); |
e8ea9b3d JK |
428 | if (err) { |
429 | if (err == -ENOMEM) { | |
430 | congestion_wait(BLK_RW_ASYNC, HZ/50); | |
431 | goto retry_dn; | |
432 | } | |
1e1bb4ba | 433 | goto out; |
e8ea9b3d | 434 | } |
d624c96f | 435 | |
fec1d657 | 436 | f2fs_wait_on_page_writeback(dn.node_page, NODE, true); |
d624c96f JK |
437 | |
438 | get_node_info(sbi, dn.nid, &ni); | |
9850cf4a JK |
439 | f2fs_bug_on(sbi, ni.ino != ino_of_node(page)); |
440 | f2fs_bug_on(sbi, ofs_of_node(dn.node_page) != ofs_of_node(page)); | |
d624c96f | 441 | |
12a8343e | 442 | for (; start < end; start++, dn.ofs_in_node++) { |
d624c96f JK |
443 | block_t src, dest; |
444 | ||
445 | src = datablock_addr(dn.node_page, dn.ofs_in_node); | |
446 | dest = datablock_addr(page, dn.ofs_in_node); | |
447 | ||
12a8343e CY |
448 | /* skip recovering if dest is the same as src */ |
449 | if (src == dest) | |
450 | continue; | |
451 | ||
452 | /* dest is invalid, just invalidate src block */ | |
453 | if (dest == NULL_ADDR) { | |
454 | truncate_data_blocks_range(&dn, 1); | |
455 | continue; | |
456 | } | |
457 | ||
26de9b11 JK |
458 | if ((start + 1) << PAGE_SHIFT > i_size_read(inode)) |
459 | f2fs_i_size_write(inode, (start + 1) << PAGE_SHIFT); | |
460 | ||
12a8343e CY |
461 | /* |
462 | * dest is reserved block, invalidate src block | |
463 | * and then reserve one new block in dnode page. | |
464 | */ | |
465 | if (dest == NEW_ADDR) { | |
466 | truncate_data_blocks_range(&dn, 1); | |
3b9b10f9 | 467 | reserve_new_block(&dn); |
12a8343e CY |
468 | continue; |
469 | } | |
470 | ||
471 | /* dest is valid block, try to recover from src to dest */ | |
472 | if (is_valid_blkaddr(sbi, dest, META_POR)) { | |
e03b07d9 | 473 | |
d624c96f | 474 | if (src == NULL_ADDR) { |
5d56b671 | 475 | err = reserve_new_block(&dn); |
975756c4 JK |
476 | #ifdef CONFIG_F2FS_FAULT_INJECTION |
477 | while (err) | |
478 | err = reserve_new_block(&dn); | |
479 | #endif | |
d624c96f | 480 | /* We should not get -ENOSPC */ |
9850cf4a | 481 | f2fs_bug_on(sbi, err); |
6f3ec995 JK |
482 | if (err) |
483 | goto err; | |
d624c96f | 484 | } |
e8ea9b3d | 485 | retry_prev: |
d624c96f | 486 | /* Check the previous node page having this index */ |
39cf72cf | 487 | err = check_index_in_prev_nodes(sbi, dest, &dn); |
e8ea9b3d JK |
488 | if (err) { |
489 | if (err == -ENOMEM) { | |
490 | congestion_wait(BLK_RW_ASYNC, HZ/50); | |
491 | goto retry_prev; | |
492 | } | |
39cf72cf | 493 | goto err; |
e8ea9b3d | 494 | } |
d624c96f | 495 | |
d624c96f | 496 | /* write dummy data page */ |
528e3459 | 497 | f2fs_replace_block(sbi, &dn, src, dest, |
28bc106b | 498 | ni.version, false, false); |
f356fe0c | 499 | recovered++; |
d624c96f | 500 | } |
d624c96f JK |
501 | } |
502 | ||
d624c96f JK |
503 | copy_node_footer(dn.node_page, page); |
504 | fill_node_footer(dn.node_page, dn.nid, ni.ino, | |
505 | ofs_of_node(page), false); | |
506 | set_page_dirty(dn.node_page); | |
39cf72cf | 507 | err: |
d624c96f | 508 | f2fs_put_dnode(&dn); |
1e1bb4ba | 509 | out: |
6c311ec6 CF |
510 | f2fs_msg(sbi->sb, KERN_NOTICE, |
511 | "recover_data: ino = %lx, recovered = %d blocks, err = %d", | |
512 | inode->i_ino, recovered, err); | |
39cf72cf | 513 | return err; |
d624c96f JK |
514 | } |
515 | ||
f61cce5b CY |
516 | static int recover_data(struct f2fs_sb_info *sbi, struct list_head *inode_list, |
517 | struct list_head *dir_list) | |
d624c96f | 518 | { |
d71b5564 | 519 | unsigned long long cp_ver = cur_cp_version(F2FS_CKPT(sbi)); |
d624c96f | 520 | struct curseg_info *curseg; |
4c521f49 | 521 | struct page *page = NULL; |
6ead1142 | 522 | int err = 0; |
d624c96f JK |
523 | block_t blkaddr; |
524 | ||
525 | /* get node pages in the current segment */ | |
b7973f23 | 526 | curseg = CURSEG_I(sbi, CURSEG_WARM_NODE); |
d624c96f JK |
527 | blkaddr = NEXT_FREE_BLKADDR(sbi, curseg); |
528 | ||
d624c96f JK |
529 | while (1) { |
530 | struct fsync_inode_entry *entry; | |
531 | ||
f0c9cada | 532 | if (!is_valid_blkaddr(sbi, blkaddr, META_POR)) |
4c521f49 | 533 | break; |
d624c96f | 534 | |
635aee1f CY |
535 | ra_meta_pages_cond(sbi, blkaddr); |
536 | ||
2b947003 | 537 | page = get_tmp_page(sbi, blkaddr); |
393ff91f | 538 | |
4c521f49 JK |
539 | if (cp_ver != cpver_of_node(page)) { |
540 | f2fs_put_page(page, 1); | |
45856aff | 541 | break; |
4c521f49 | 542 | } |
d624c96f | 543 | |
f61cce5b | 544 | entry = get_fsync_inode(inode_list, ino_of_node(page)); |
d624c96f JK |
545 | if (!entry) |
546 | goto next; | |
441ac5cb JK |
547 | /* |
548 | * inode(x) | CP | inode(x) | dnode(F) | |
549 | * In this case, we can lose the latest inode(x). | |
c52e1b10 | 550 | * So, call recover_inode for the inode update. |
441ac5cb | 551 | */ |
608514de | 552 | if (IS_INODE(page)) |
c52e1b10 JK |
553 | recover_inode(entry->inode, page); |
554 | if (entry->last_dentry == blkaddr) { | |
f61cce5b | 555 | err = recover_dentry(entry->inode, page, dir_list); |
c52e1b10 JK |
556 | if (err) { |
557 | f2fs_put_page(page, 1); | |
558 | break; | |
559 | } | |
560 | } | |
6ead1142 | 561 | err = do_recover_data(sbi, entry->inode, page, blkaddr); |
4c521f49 JK |
562 | if (err) { |
563 | f2fs_put_page(page, 1); | |
45856aff | 564 | break; |
4c521f49 | 565 | } |
d624c96f | 566 | |
3f8ab270 CY |
567 | if (entry->blkaddr == blkaddr) |
568 | del_fsync_inode(entry); | |
d624c96f JK |
569 | next: |
570 | /* check next segment */ | |
571 | blkaddr = next_blkaddr_of_node(page); | |
4c521f49 | 572 | f2fs_put_page(page, 1); |
d624c96f | 573 | } |
6ead1142 JK |
574 | if (!err) |
575 | allocate_new_segments(sbi); | |
576 | return err; | |
d624c96f JK |
577 | } |
578 | ||
6781eabb | 579 | int recover_fsync_data(struct f2fs_sb_info *sbi, bool check_only) |
d624c96f | 580 | { |
cf2271e7 | 581 | struct curseg_info *curseg = CURSEG_I(sbi, CURSEG_WARM_NODE); |
d624c96f | 582 | struct list_head inode_list; |
f61cce5b | 583 | struct list_head dir_list; |
cf2271e7 | 584 | block_t blkaddr; |
6ead1142 | 585 | int err; |
6781eabb | 586 | int ret = 0; |
aabe5136 | 587 | bool need_writecp = false; |
d624c96f JK |
588 | |
589 | fsync_entry_slab = f2fs_kmem_cache_create("f2fs_fsync_inode_entry", | |
e8512d2e | 590 | sizeof(struct fsync_inode_entry)); |
6bacf52f | 591 | if (!fsync_entry_slab) |
6ead1142 | 592 | return -ENOMEM; |
d624c96f JK |
593 | |
594 | INIT_LIST_HEAD(&inode_list); | |
f61cce5b | 595 | INIT_LIST_HEAD(&dir_list); |
d624c96f | 596 | |
14f4e690 JK |
597 | /* prevent checkpoint */ |
598 | mutex_lock(&sbi->cp_mutex); | |
599 | ||
cf2271e7 JK |
600 | blkaddr = NEXT_FREE_BLKADDR(sbi, curseg); |
601 | ||
315df839 | 602 | /* step #1: find fsynced inode numbers */ |
6ead1142 | 603 | err = find_fsync_dnodes(sbi, &inode_list); |
6781eabb | 604 | if (err || list_empty(&inode_list)) |
d624c96f JK |
605 | goto out; |
606 | ||
6781eabb JK |
607 | if (check_only) { |
608 | ret = 1; | |
d624c96f | 609 | goto out; |
6781eabb | 610 | } |
d624c96f | 611 | |
aabe5136 | 612 | need_writecp = true; |
691c6fd2 | 613 | |
d624c96f | 614 | /* step #2: recover data */ |
f61cce5b | 615 | err = recover_data(sbi, &inode_list, &dir_list); |
b307384e | 616 | if (!err) |
9850cf4a | 617 | f2fs_bug_on(sbi, !list_empty(&inode_list)); |
d624c96f | 618 | out: |
5ebefc5b | 619 | destroy_fsync_dnodes(&inode_list); |
cf2271e7 | 620 | |
4c521f49 JK |
621 | /* truncate meta pages to be used by the recovery */ |
622 | truncate_inode_pages_range(META_MAPPING(sbi), | |
09cbfeaf | 623 | (loff_t)MAIN_BLKADDR(sbi) << PAGE_SHIFT, -1); |
4c521f49 | 624 | |
cf2271e7 JK |
625 | if (err) { |
626 | truncate_inode_pages_final(NODE_MAPPING(sbi)); | |
627 | truncate_inode_pages_final(META_MAPPING(sbi)); | |
628 | } | |
629 | ||
caf0047e | 630 | clear_sbi_flag(sbi, SBI_POR_DOING); |
cf2271e7 | 631 | if (err) { |
e90c2d28 CY |
632 | bool invalidate = false; |
633 | ||
36abef4e JK |
634 | if (test_opt(sbi, LFS)) { |
635 | update_meta_page(sbi, NULL, blkaddr); | |
e90c2d28 | 636 | invalidate = true; |
36abef4e JK |
637 | } else if (discard_next_dnode(sbi, blkaddr)) { |
638 | invalidate = true; | |
639 | } | |
cf2271e7 | 640 | |
275b66b0 CY |
641 | f2fs_wait_all_discard_bio(sbi); |
642 | ||
cf2271e7 JK |
643 | /* Flush all the NAT/SIT pages */ |
644 | while (get_pages(sbi, F2FS_DIRTY_META)) | |
645 | sync_meta_pages(sbi, META, LONG_MAX); | |
e90c2d28 CY |
646 | |
647 | /* invalidate temporary meta page */ | |
648 | if (invalidate) | |
649 | invalidate_mapping_pages(META_MAPPING(sbi), | |
650 | blkaddr, blkaddr); | |
651 | ||
14f4e690 JK |
652 | set_ckpt_flags(sbi->ckpt, CP_ERROR_FLAG); |
653 | mutex_unlock(&sbi->cp_mutex); | |
cf2271e7 | 654 | } else if (need_writecp) { |
75ab4cb8 | 655 | struct cp_control cpc = { |
10027551 | 656 | .reason = CP_RECOVERY, |
75ab4cb8 | 657 | }; |
14f4e690 | 658 | mutex_unlock(&sbi->cp_mutex); |
c34f42e2 | 659 | err = write_checkpoint(sbi, &cpc); |
14f4e690 JK |
660 | } else { |
661 | mutex_unlock(&sbi->cp_mutex); | |
cf2271e7 | 662 | } |
f61cce5b CY |
663 | |
664 | destroy_fsync_dnodes(&dir_list); | |
665 | kmem_cache_destroy(fsync_entry_slab); | |
6781eabb | 666 | return ret ? ret: err; |
d624c96f | 667 | } |