4 * Copyright (c) 2012 Samsung Electronics Co., Ltd.
5 * http://www.samsung.com/
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License version 2 as
9 * published by the Free Software Foundation.
12 #include <linux/f2fs_fs.h>
18 static unsigned long dir_blocks(struct inode
*inode
)
20 return ((unsigned long long) (i_size_read(inode
) + PAGE_CACHE_SIZE
- 1))
24 static unsigned int dir_buckets(unsigned int level
, int dir_level
)
26 if (level
+ dir_level
< MAX_DIR_HASH_DEPTH
/ 2)
27 return 1 << (level
+ dir_level
);
29 return MAX_DIR_BUCKETS
;
32 static unsigned int bucket_blocks(unsigned int level
)
34 if (level
< MAX_DIR_HASH_DEPTH
/ 2)
40 static unsigned char f2fs_filetype_table
[F2FS_FT_MAX
] = {
41 [F2FS_FT_UNKNOWN
] = DT_UNKNOWN
,
42 [F2FS_FT_REG_FILE
] = DT_REG
,
43 [F2FS_FT_DIR
] = DT_DIR
,
44 [F2FS_FT_CHRDEV
] = DT_CHR
,
45 [F2FS_FT_BLKDEV
] = DT_BLK
,
46 [F2FS_FT_FIFO
] = DT_FIFO
,
47 [F2FS_FT_SOCK
] = DT_SOCK
,
48 [F2FS_FT_SYMLINK
] = DT_LNK
,
52 static unsigned char f2fs_type_by_mode
[S_IFMT
>> S_SHIFT
] = {
53 [S_IFREG
>> S_SHIFT
] = F2FS_FT_REG_FILE
,
54 [S_IFDIR
>> S_SHIFT
] = F2FS_FT_DIR
,
55 [S_IFCHR
>> S_SHIFT
] = F2FS_FT_CHRDEV
,
56 [S_IFBLK
>> S_SHIFT
] = F2FS_FT_BLKDEV
,
57 [S_IFIFO
>> S_SHIFT
] = F2FS_FT_FIFO
,
58 [S_IFSOCK
>> S_SHIFT
] = F2FS_FT_SOCK
,
59 [S_IFLNK
>> S_SHIFT
] = F2FS_FT_SYMLINK
,
62 static void set_de_type(struct f2fs_dir_entry
*de
, struct inode
*inode
)
64 umode_t mode
= inode
->i_mode
;
65 de
->file_type
= f2fs_type_by_mode
[(mode
& S_IFMT
) >> S_SHIFT
];
68 static unsigned long dir_block_index(unsigned int level
,
69 int dir_level
, unsigned int idx
)
72 unsigned long bidx
= 0;
74 for (i
= 0; i
< level
; i
++)
75 bidx
+= dir_buckets(i
, dir_level
) * bucket_blocks(i
);
76 bidx
+= idx
* bucket_blocks(level
);
80 static bool early_match_name(size_t namelen
, f2fs_hash_t namehash
,
81 struct f2fs_dir_entry
*de
)
83 if (le16_to_cpu(de
->name_len
) != namelen
)
86 if (de
->hash_code
!= namehash
)
92 static struct f2fs_dir_entry
*find_in_block(struct page
*dentry_page
,
93 struct qstr
*name
, int *max_slots
,
94 f2fs_hash_t namehash
, struct page
**res_page
)
96 struct f2fs_dir_entry
*de
;
97 unsigned long bit_pos
= 0;
98 struct f2fs_dentry_block
*dentry_blk
= kmap(dentry_page
);
99 const void *dentry_bits
= &dentry_blk
->dentry_bitmap
;
102 while (bit_pos
< NR_DENTRY_IN_BLOCK
) {
103 if (!test_bit_le(bit_pos
, dentry_bits
)) {
106 else if (!test_bit_le(bit_pos
- 1, dentry_bits
))
111 de
= &dentry_blk
->dentry
[bit_pos
];
112 if (early_match_name(name
->len
, namehash
, de
)) {
113 if (!memcmp(dentry_blk
->filename
[bit_pos
],
116 *res_page
= dentry_page
;
120 if (max_len
> *max_slots
) {
121 *max_slots
= max_len
;
124 bit_pos
+= GET_DENTRY_SLOTS(le16_to_cpu(de
->name_len
));
130 if (max_len
> *max_slots
)
131 *max_slots
= max_len
;
135 static struct f2fs_dir_entry
*find_in_level(struct inode
*dir
,
136 unsigned int level
, struct qstr
*name
,
137 f2fs_hash_t namehash
, struct page
**res_page
)
139 int s
= GET_DENTRY_SLOTS(name
->len
);
140 unsigned int nbucket
, nblock
;
141 unsigned int bidx
, end_block
;
142 struct page
*dentry_page
;
143 struct f2fs_dir_entry
*de
= NULL
;
147 f2fs_bug_on(level
> MAX_DIR_HASH_DEPTH
);
149 nbucket
= dir_buckets(level
, F2FS_I(dir
)->i_dir_level
);
150 nblock
= bucket_blocks(level
);
152 bidx
= dir_block_index(level
, F2FS_I(dir
)->i_dir_level
,
153 le32_to_cpu(namehash
) % nbucket
);
154 end_block
= bidx
+ nblock
;
156 for (; bidx
< end_block
; bidx
++) {
157 /* no need to allocate new dentry pages to all the indices */
158 dentry_page
= find_data_page(dir
, bidx
, true);
159 if (IS_ERR(dentry_page
)) {
164 de
= find_in_block(dentry_page
, name
, &max_slots
,
171 f2fs_put_page(dentry_page
, 0);
174 if (!de
&& room
&& F2FS_I(dir
)->chash
!= namehash
) {
175 F2FS_I(dir
)->chash
= namehash
;
176 F2FS_I(dir
)->clevel
= level
;
183 * Find an entry in the specified directory with the wanted name.
184 * It returns the page where the entry was found (as a parameter - res_page),
185 * and the entry itself. Page is returned mapped and unlocked.
186 * Entry is guaranteed to be valid.
188 struct f2fs_dir_entry
*f2fs_find_entry(struct inode
*dir
,
189 struct qstr
*child
, struct page
**res_page
)
191 unsigned long npages
= dir_blocks(dir
);
192 struct f2fs_dir_entry
*de
= NULL
;
193 f2fs_hash_t name_hash
;
194 unsigned int max_depth
;
202 name_hash
= f2fs_dentry_hash(child
);
203 max_depth
= F2FS_I(dir
)->i_current_depth
;
205 for (level
= 0; level
< max_depth
; level
++) {
206 de
= find_in_level(dir
, level
, child
, name_hash
, res_page
);
210 if (!de
&& F2FS_I(dir
)->chash
!= name_hash
) {
211 F2FS_I(dir
)->chash
= name_hash
;
212 F2FS_I(dir
)->clevel
= level
- 1;
217 struct f2fs_dir_entry
*f2fs_parent_dir(struct inode
*dir
, struct page
**p
)
220 struct f2fs_dir_entry
*de
;
221 struct f2fs_dentry_block
*dentry_blk
;
223 page
= get_lock_data_page(dir
, 0);
227 dentry_blk
= kmap(page
);
228 de
= &dentry_blk
->dentry
[1];
234 ino_t
f2fs_inode_by_name(struct inode
*dir
, struct qstr
*qstr
)
237 struct f2fs_dir_entry
*de
;
240 de
= f2fs_find_entry(dir
, qstr
, &page
);
242 res
= le32_to_cpu(de
->ino
);
244 f2fs_put_page(page
, 0);
250 void f2fs_set_link(struct inode
*dir
, struct f2fs_dir_entry
*de
,
251 struct page
*page
, struct inode
*inode
)
254 f2fs_wait_on_page_writeback(page
, DATA
);
255 de
->ino
= cpu_to_le32(inode
->i_ino
);
256 set_de_type(de
, inode
);
258 set_page_dirty(page
);
259 dir
->i_mtime
= dir
->i_ctime
= CURRENT_TIME
;
260 mark_inode_dirty(dir
);
262 f2fs_put_page(page
, 1);
265 static void init_dent_inode(const struct qstr
*name
, struct page
*ipage
)
267 struct f2fs_inode
*ri
;
269 f2fs_wait_on_page_writeback(ipage
, NODE
);
271 /* copy name info. to this inode page */
272 ri
= F2FS_INODE(ipage
);
273 ri
->i_namelen
= cpu_to_le32(name
->len
);
274 memcpy(ri
->i_name
, name
->name
, name
->len
);
275 set_page_dirty(ipage
);
278 int update_dent_inode(struct inode
*inode
, const struct qstr
*name
)
280 struct f2fs_sb_info
*sbi
= F2FS_SB(inode
->i_sb
);
283 page
= get_node_page(sbi
, inode
->i_ino
);
285 return PTR_ERR(page
);
287 init_dent_inode(name
, page
);
288 f2fs_put_page(page
, 1);
293 static int make_empty_dir(struct inode
*inode
,
294 struct inode
*parent
, struct page
*page
)
296 struct page
*dentry_page
;
297 struct f2fs_dentry_block
*dentry_blk
;
298 struct f2fs_dir_entry
*de
;
300 dentry_page
= get_new_data_page(inode
, page
, 0, true);
301 if (IS_ERR(dentry_page
))
302 return PTR_ERR(dentry_page
);
305 dentry_blk
= kmap_atomic(dentry_page
);
307 de
= &dentry_blk
->dentry
[0];
308 de
->name_len
= cpu_to_le16(1);
310 de
->ino
= cpu_to_le32(inode
->i_ino
);
311 memcpy(dentry_blk
->filename
[0], ".", 1);
312 set_de_type(de
, inode
);
314 de
= &dentry_blk
->dentry
[1];
316 de
->name_len
= cpu_to_le16(2);
317 de
->ino
= cpu_to_le32(parent
->i_ino
);
318 memcpy(dentry_blk
->filename
[1], "..", 2);
319 set_de_type(de
, inode
);
321 test_and_set_bit_le(0, &dentry_blk
->dentry_bitmap
);
322 test_and_set_bit_le(1, &dentry_blk
->dentry_bitmap
);
323 kunmap_atomic(dentry_blk
);
325 set_page_dirty(dentry_page
);
326 f2fs_put_page(dentry_page
, 1);
330 static struct page
*init_inode_metadata(struct inode
*inode
,
331 struct inode
*dir
, const struct qstr
*name
)
333 struct f2fs_sb_info
*sbi
= F2FS_SB(dir
->i_sb
);
337 if (is_inode_flag_set(F2FS_I(inode
), FI_NEW_INODE
)) {
338 page
= new_inode_page(inode
);
342 if (S_ISDIR(inode
->i_mode
)) {
343 err
= make_empty_dir(inode
, dir
, page
);
348 err
= f2fs_init_acl(inode
, dir
, page
);
352 err
= f2fs_init_security(inode
, dir
, name
, page
);
356 page
= get_node_page(F2FS_SB(dir
->i_sb
), inode
->i_ino
);
360 set_cold_node(inode
, page
);
364 init_dent_inode(name
, page
);
367 * This file should be checkpointed during fsync.
368 * We lost i_pino from now on.
370 if (is_inode_flag_set(F2FS_I(inode
), FI_INC_LINK
)) {
371 file_lost_pino(inode
);
373 * If the tmpfile is being linked to an alias through the linkat path,
374 * we should remove this inode from the orphan list.
376 if (inode
->i_nlink
== 0)
377 remove_orphan_inode(sbi
, inode
->i_ino
);
383 f2fs_put_page(page
, 1);
385 /* once the failed inode becomes a bad inode, i_mode is S_IFREG */
386 truncate_inode_pages(&inode
->i_data
, 0);
387 truncate_blocks(inode
, 0);
388 remove_dirty_dir_inode(inode
);
389 remove_inode_page(inode
);
393 static void update_parent_metadata(struct inode
*dir
, struct inode
*inode
,
394 unsigned int current_depth
)
396 if (is_inode_flag_set(F2FS_I(inode
), FI_NEW_INODE
)) {
397 if (S_ISDIR(inode
->i_mode
)) {
399 set_inode_flag(F2FS_I(dir
), FI_UPDATE_DIR
);
401 clear_inode_flag(F2FS_I(inode
), FI_NEW_INODE
);
403 dir
->i_mtime
= dir
->i_ctime
= CURRENT_TIME
;
404 mark_inode_dirty(dir
);
406 if (F2FS_I(dir
)->i_current_depth
!= current_depth
) {
407 F2FS_I(dir
)->i_current_depth
= current_depth
;
408 set_inode_flag(F2FS_I(dir
), FI_UPDATE_DIR
);
411 if (is_inode_flag_set(F2FS_I(inode
), FI_INC_LINK
))
412 clear_inode_flag(F2FS_I(inode
), FI_INC_LINK
);
415 static int room_for_filename(struct f2fs_dentry_block
*dentry_blk
, int slots
)
418 int zero_start
, zero_end
;
420 zero_start
= find_next_zero_bit_le(&dentry_blk
->dentry_bitmap
,
423 if (zero_start
>= NR_DENTRY_IN_BLOCK
)
424 return NR_DENTRY_IN_BLOCK
;
426 zero_end
= find_next_bit_le(&dentry_blk
->dentry_bitmap
,
429 if (zero_end
- zero_start
>= slots
)
432 bit_start
= zero_end
+ 1;
434 if (zero_end
+ 1 >= NR_DENTRY_IN_BLOCK
)
435 return NR_DENTRY_IN_BLOCK
;
440 * Caller should grab and release a rwsem by calling f2fs_lock_op() and
443 int __f2fs_add_link(struct inode
*dir
, const struct qstr
*name
,
446 unsigned int bit_pos
;
448 unsigned int current_depth
;
449 unsigned long bidx
, block
;
450 f2fs_hash_t dentry_hash
;
451 struct f2fs_dir_entry
*de
;
452 unsigned int nbucket
, nblock
;
453 size_t namelen
= name
->len
;
454 struct page
*dentry_page
= NULL
;
455 struct f2fs_dentry_block
*dentry_blk
= NULL
;
456 int slots
= GET_DENTRY_SLOTS(namelen
);
461 dentry_hash
= f2fs_dentry_hash(name
);
463 current_depth
= F2FS_I(dir
)->i_current_depth
;
464 if (F2FS_I(dir
)->chash
== dentry_hash
) {
465 level
= F2FS_I(dir
)->clevel
;
466 F2FS_I(dir
)->chash
= 0;
470 if (unlikely(current_depth
== MAX_DIR_HASH_DEPTH
))
473 /* Increase the depth, if required */
474 if (level
== current_depth
)
477 nbucket
= dir_buckets(level
, F2FS_I(dir
)->i_dir_level
);
478 nblock
= bucket_blocks(level
);
480 bidx
= dir_block_index(level
, F2FS_I(dir
)->i_dir_level
,
481 (le32_to_cpu(dentry_hash
) % nbucket
));
483 for (block
= bidx
; block
<= (bidx
+ nblock
- 1); block
++) {
484 dentry_page
= get_new_data_page(dir
, NULL
, block
, true);
485 if (IS_ERR(dentry_page
))
486 return PTR_ERR(dentry_page
);
488 dentry_blk
= kmap(dentry_page
);
489 bit_pos
= room_for_filename(dentry_blk
, slots
);
490 if (bit_pos
< NR_DENTRY_IN_BLOCK
)
494 f2fs_put_page(dentry_page
, 1);
497 /* Move to next level to find the empty slot for new dentry */
501 f2fs_wait_on_page_writeback(dentry_page
, DATA
);
503 down_write(&F2FS_I(inode
)->i_sem
);
504 page
= init_inode_metadata(inode
, dir
, name
);
509 de
= &dentry_blk
->dentry
[bit_pos
];
510 de
->hash_code
= dentry_hash
;
511 de
->name_len
= cpu_to_le16(namelen
);
512 memcpy(dentry_blk
->filename
[bit_pos
], name
->name
, name
->len
);
513 de
->ino
= cpu_to_le32(inode
->i_ino
);
514 set_de_type(de
, inode
);
515 for (i
= 0; i
< slots
; i
++)
516 test_and_set_bit_le(bit_pos
+ i
, &dentry_blk
->dentry_bitmap
);
517 set_page_dirty(dentry_page
);
519 /* we don't need to mark_inode_dirty now */
520 F2FS_I(inode
)->i_pino
= dir
->i_ino
;
521 update_inode(inode
, page
);
522 f2fs_put_page(page
, 1);
524 update_parent_metadata(dir
, inode
, current_depth
);
526 up_write(&F2FS_I(inode
)->i_sem
);
528 if (is_inode_flag_set(F2FS_I(dir
), FI_UPDATE_DIR
)) {
529 update_inode_page(dir
);
530 clear_inode_flag(F2FS_I(dir
), FI_UPDATE_DIR
);
533 f2fs_put_page(dentry_page
, 1);
537 int f2fs_do_tmpfile(struct inode
*inode
, struct inode
*dir
)
542 down_write(&F2FS_I(inode
)->i_sem
);
543 page
= init_inode_metadata(inode
, dir
, NULL
);
548 /* we don't need to mark_inode_dirty now */
549 update_inode(inode
, page
);
550 f2fs_put_page(page
, 1);
552 clear_inode_flag(F2FS_I(inode
), FI_NEW_INODE
);
554 up_write(&F2FS_I(inode
)->i_sem
);
559 * It only removes the dentry from the dentry page; the corresponding name
560 * entry in the name page does not need to be touched during deletion.
562 void f2fs_delete_entry(struct f2fs_dir_entry
*dentry
, struct page
*page
,
565 struct f2fs_dentry_block
*dentry_blk
;
566 unsigned int bit_pos
;
567 struct address_space
*mapping
= page
->mapping
;
568 struct inode
*dir
= mapping
->host
;
569 int slots
= GET_DENTRY_SLOTS(le16_to_cpu(dentry
->name_len
));
573 f2fs_wait_on_page_writeback(page
, DATA
);
575 dentry_blk
= page_address(page
);
576 bit_pos
= dentry
- dentry_blk
->dentry
;
577 for (i
= 0; i
< slots
; i
++)
578 test_and_clear_bit_le(bit_pos
+ i
, &dentry_blk
->dentry_bitmap
);
580 /* Let's check and deallocate this dentry page */
581 bit_pos
= find_next_bit_le(&dentry_blk
->dentry_bitmap
,
584 kunmap(page
); /* kunmap - pair of f2fs_find_entry */
585 set_page_dirty(page
);
587 dir
->i_ctime
= dir
->i_mtime
= CURRENT_TIME
;
590 struct f2fs_sb_info
*sbi
= F2FS_SB(dir
->i_sb
);
592 down_write(&F2FS_I(inode
)->i_sem
);
594 if (S_ISDIR(inode
->i_mode
)) {
596 update_inode_page(dir
);
598 inode
->i_ctime
= CURRENT_TIME
;
600 if (S_ISDIR(inode
->i_mode
)) {
602 i_size_write(inode
, 0);
604 up_write(&F2FS_I(inode
)->i_sem
);
605 update_inode_page(inode
);
607 if (inode
->i_nlink
== 0)
608 add_orphan_inode(sbi
, inode
->i_ino
);
610 release_orphan_inode(sbi
);
613 if (bit_pos
== NR_DENTRY_IN_BLOCK
) {
614 truncate_hole(dir
, page
->index
, page
->index
+ 1);
615 clear_page_dirty_for_io(page
);
616 ClearPageUptodate(page
);
617 inode_dec_dirty_dents(dir
);
619 f2fs_put_page(page
, 1);
622 bool f2fs_empty_dir(struct inode
*dir
)
625 struct page
*dentry_page
;
626 unsigned int bit_pos
;
627 struct f2fs_dentry_block
*dentry_blk
;
628 unsigned long nblock
= dir_blocks(dir
);
630 for (bidx
= 0; bidx
< nblock
; bidx
++) {
631 dentry_page
= get_lock_data_page(dir
, bidx
);
632 if (IS_ERR(dentry_page
)) {
633 if (PTR_ERR(dentry_page
) == -ENOENT
)
640 dentry_blk
= kmap_atomic(dentry_page
);
645 bit_pos
= find_next_bit_le(&dentry_blk
->dentry_bitmap
,
648 kunmap_atomic(dentry_blk
);
650 f2fs_put_page(dentry_page
, 1);
652 if (bit_pos
< NR_DENTRY_IN_BLOCK
)
658 static int f2fs_readdir(struct file
*file
, struct dir_context
*ctx
)
660 struct inode
*inode
= file_inode(file
);
661 unsigned long npages
= dir_blocks(inode
);
662 unsigned int bit_pos
= 0;
663 struct f2fs_dentry_block
*dentry_blk
= NULL
;
664 struct f2fs_dir_entry
*de
= NULL
;
665 struct page
*dentry_page
= NULL
;
666 struct file_ra_state
*ra
= &file
->f_ra
;
667 unsigned int n
= ((unsigned long)ctx
->pos
/ NR_DENTRY_IN_BLOCK
);
668 unsigned char d_type
= DT_UNKNOWN
;
670 bit_pos
= ((unsigned long)ctx
->pos
% NR_DENTRY_IN_BLOCK
);
672 /* readahead for multi pages of dir */
673 if (npages
- n
> 1 && !ra_has_index(ra
, n
))
674 page_cache_sync_readahead(inode
->i_mapping
, ra
, file
, n
,
675 min(npages
- n
, (pgoff_t
)MAX_DIR_RA_PAGES
));
677 for (; n
< npages
; n
++) {
678 dentry_page
= get_lock_data_page(inode
, n
);
679 if (IS_ERR(dentry_page
))
682 dentry_blk
= kmap(dentry_page
);
683 while (bit_pos
< NR_DENTRY_IN_BLOCK
) {
684 bit_pos
= find_next_bit_le(&dentry_blk
->dentry_bitmap
,
687 if (bit_pos
>= NR_DENTRY_IN_BLOCK
)
690 de
= &dentry_blk
->dentry
[bit_pos
];
691 if (de
->file_type
< F2FS_FT_MAX
)
692 d_type
= f2fs_filetype_table
[de
->file_type
];
696 dentry_blk
->filename
[bit_pos
],
697 le16_to_cpu(de
->name_len
),
698 le32_to_cpu(de
->ino
), d_type
))
701 bit_pos
+= GET_DENTRY_SLOTS(le16_to_cpu(de
->name_len
));
702 ctx
->pos
= n
* NR_DENTRY_IN_BLOCK
+ bit_pos
;
705 ctx
->pos
= (n
+ 1) * NR_DENTRY_IN_BLOCK
;
707 f2fs_put_page(dentry_page
, 1);
711 if (dentry_page
&& !IS_ERR(dentry_page
)) {
713 f2fs_put_page(dentry_page
, 1);
719 const struct file_operations f2fs_dir_operations
= {
720 .llseek
= generic_file_llseek
,
721 .read
= generic_read_dir
,
722 .iterate
= f2fs_readdir
,
723 .fsync
= f2fs_sync_file
,
724 .unlocked_ioctl
= f2fs_ioctl
,