4 * Copyright (c) 2012 Samsung Electronics Co., Ltd.
5 * http://www.samsung.com/
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License version 2 as
9 * published by the Free Software Foundation.
14 #include <linux/types.h>
15 #include <linux/page-flags.h>
16 #include <linux/buffer_head.h>
17 #include <linux/slab.h>
18 #include <linux/crc32.h>
19 #include <linux/magic.h>
20 #include <linux/kobject.h>
21 #include <linux/sched.h>
23 #ifdef CONFIG_F2FS_CHECK_FS
24 #define f2fs_bug_on(condition) BUG_ON(condition)
25 #define f2fs_down_write(x, y) down_write_nest_lock(x, y)
27 #define f2fs_bug_on(condition)
28 #define f2fs_down_write(x, y) down_write(x)
34 #define F2FS_MOUNT_BG_GC 0x00000001
35 #define F2FS_MOUNT_DISABLE_ROLL_FORWARD 0x00000002
36 #define F2FS_MOUNT_DISCARD 0x00000004
37 #define F2FS_MOUNT_NOHEAP 0x00000008
38 #define F2FS_MOUNT_XATTR_USER 0x00000010
39 #define F2FS_MOUNT_POSIX_ACL 0x00000020
40 #define F2FS_MOUNT_DISABLE_EXT_IDENTIFY 0x00000040
41 #define F2FS_MOUNT_INLINE_XATTR 0x00000080
43 #define clear_opt(sbi, option) (sbi->mount_opt.opt &= ~F2FS_MOUNT_##option)
44 #define set_opt(sbi, option) (sbi->mount_opt.opt |= F2FS_MOUNT_##option)
45 #define test_opt(sbi, option) (sbi->mount_opt.opt & F2FS_MOUNT_##option)
47 #define ver_after(a, b) (typecheck(unsigned long long, a) && \
48 typecheck(unsigned long long, b) && \
49 ((long long)((a) - (b)) > 0))
51 typedef u32 block_t
; /*
52 * should not change u32, since it is the on-disk block
53 * address format, __le32.
57 struct f2fs_mount_info
{
61 #define CRCPOLY_LE 0xedb88320
63 static inline __u32
f2fs_crc32(void *buf
, size_t len
)
65 unsigned char *p
= (unsigned char *)buf
;
66 __u32 crc
= F2FS_SUPER_MAGIC
;
71 for (i
= 0; i
< 8; i
++)
72 crc
= (crc
>> 1) ^ ((crc
& 1) ? CRCPOLY_LE
: 0);
77 static inline bool f2fs_crc_valid(__u32 blk_crc
, void *buf
, size_t buf_size
)
79 return f2fs_crc32(buf
, buf_size
) == blk_crc
;
83 * For checkpoint manager
90 /* for the list of orphan inodes */
91 struct orphan_inode_entry
{
92 struct list_head list
; /* list head */
93 nid_t ino
; /* inode number */
96 /* for the list of directory inodes */
97 struct dir_inode_entry
{
98 struct list_head list
; /* list head */
99 struct inode
*inode
; /* vfs inode pointer */
102 /* for the list of blockaddresses to be discarded */
103 struct discard_entry
{
104 struct list_head list
; /* list head */
105 block_t blkaddr
; /* block address to be discarded */
106 int len
; /* # of consecutive blocks of the discard */
109 /* for the list of fsync inodes, used only during recovery */
110 struct fsync_inode_entry
{
111 struct list_head list
; /* list head */
112 struct inode
*inode
; /* vfs inode pointer */
113 block_t blkaddr
; /* block address locating the last inode */
116 #define nats_in_cursum(sum) (le16_to_cpu(sum->n_nats))
117 #define sits_in_cursum(sum) (le16_to_cpu(sum->n_sits))
119 #define nat_in_journal(sum, i) (sum->nat_j.entries[i].ne)
120 #define nid_in_journal(sum, i) (sum->nat_j.entries[i].nid)
121 #define sit_in_journal(sum, i) (sum->sit_j.entries[i].se)
122 #define segno_in_journal(sum, i) (sum->sit_j.entries[i].segno)
124 static inline int update_nats_in_cursum(struct f2fs_summary_block
*rs
, int i
)
126 int before
= nats_in_cursum(rs
);
127 rs
->n_nats
= cpu_to_le16(before
+ i
);
131 static inline int update_sits_in_cursum(struct f2fs_summary_block
*rs
, int i
)
133 int before
= sits_in_cursum(rs
);
134 rs
->n_sits
= cpu_to_le16(before
+ i
);
141 #define F2FS_IOC_GETFLAGS FS_IOC_GETFLAGS
142 #define F2FS_IOC_SETFLAGS FS_IOC_SETFLAGS
144 #if defined(__KERNEL__) && defined(CONFIG_COMPAT)
146 * ioctl commands in 32 bit emulation
148 #define F2FS_IOC32_GETFLAGS FS_IOC32_GETFLAGS
149 #define F2FS_IOC32_SETFLAGS FS_IOC32_SETFLAGS
153 * For INODE and NODE manager
156 * XATTR_NODE_OFFSET stores xattrs to one node block per file keeping -1
157 * as its node offset to distinguish from index node blocks.
158 * But some bits are used to mark the node block.
160 #define XATTR_NODE_OFFSET ((((unsigned int)-1) << OFFSET_BIT_SHIFT) \
163 ALLOC_NODE
, /* allocate a new node page if needed */
164 LOOKUP_NODE
, /* look up a node without readahead */
166 * look up a node with readahead called
167 * by get_datablock_ro.
171 #define F2FS_LINK_MAX 32000 /* maximum link count per file */
173 /* for in-memory extent cache entry */
174 #define F2FS_MIN_EXTENT_LEN 16 /* minimum extent length */
177 rwlock_t ext_lock
; /* rwlock for consistency */
178 unsigned int fofs
; /* start offset in a file */
179 u32 blk_addr
; /* start block address of the extent */
180 unsigned int len
; /* length of the extent */
184 * i_advise uses FADVISE_XXX_BIT. We can add additional hints later.
186 #define FADVISE_COLD_BIT 0x01
187 #define FADVISE_LOST_PINO_BIT 0x02
189 struct f2fs_inode_info
{
190 struct inode vfs_inode
; /* serve a vfs inode */
191 unsigned long i_flags
; /* keep an inode flags for ioctl */
192 unsigned char i_advise
; /* use to give file attribute hints */
193 unsigned int i_current_depth
; /* use only in directory structure */
194 unsigned int i_pino
; /* parent inode number */
195 umode_t i_acl_mode
; /* keep file acl mode temporarily */
197 /* Use below internally in f2fs*/
198 unsigned long flags
; /* use to pass per-file flags */
199 atomic_t dirty_dents
; /* # of dirty dentry pages */
200 f2fs_hash_t chash
; /* hash value of given file name */
201 unsigned int clevel
; /* maximum level of given file name */
202 nid_t i_xattr_nid
; /* node id that contains xattrs */
203 unsigned long long xattr_ver
; /* cp version of xattr modification */
204 struct extent_info ext
; /* in-memory extent cache entry */
207 static inline void get_extent_info(struct extent_info
*ext
,
208 struct f2fs_extent i_ext
)
210 write_lock(&ext
->ext_lock
);
211 ext
->fofs
= le32_to_cpu(i_ext
.fofs
);
212 ext
->blk_addr
= le32_to_cpu(i_ext
.blk_addr
);
213 ext
->len
= le32_to_cpu(i_ext
.len
);
214 write_unlock(&ext
->ext_lock
);
217 static inline void set_raw_extent(struct extent_info
*ext
,
218 struct f2fs_extent
*i_ext
)
220 read_lock(&ext
->ext_lock
);
221 i_ext
->fofs
= cpu_to_le32(ext
->fofs
);
222 i_ext
->blk_addr
= cpu_to_le32(ext
->blk_addr
);
223 i_ext
->len
= cpu_to_le32(ext
->len
);
224 read_unlock(&ext
->ext_lock
);
227 struct f2fs_nm_info
{
228 block_t nat_blkaddr
; /* base disk address of NAT */
229 nid_t max_nid
; /* maximum possible node ids */
230 nid_t next_scan_nid
; /* the next nid to be scanned */
232 /* NAT cache management */
233 struct radix_tree_root nat_root
;/* root of the nat entry cache */
234 rwlock_t nat_tree_lock
; /* protect nat_tree_lock */
235 unsigned int nat_cnt
; /* the # of cached nat entries */
236 struct list_head nat_entries
; /* cached nat entry list (clean) */
237 struct list_head dirty_nat_entries
; /* cached nat entry list (dirty) */
239 /* free node ids management */
240 struct list_head free_nid_list
; /* a list for free nids */
241 spinlock_t free_nid_list_lock
; /* protect free nid list */
242 unsigned int fcnt
; /* the number of free node id */
243 struct mutex build_lock
; /* lock for build free nids */
246 char *nat_bitmap
; /* NAT bitmap pointer */
247 int bitmap_size
; /* bitmap size */
251 * this structure is used as one of function parameters.
252 * all the information are dedicated to a given direct node block determined
253 * by the data offset in a file.
255 struct dnode_of_data
{
256 struct inode
*inode
; /* vfs inode pointer */
257 struct page
*inode_page
; /* its inode page, NULL is possible */
258 struct page
*node_page
; /* cached direct node page */
259 nid_t nid
; /* node id of the direct node block */
260 unsigned int ofs_in_node
; /* data offset in the node page */
261 bool inode_page_locked
; /* inode page is locked or not */
262 block_t data_blkaddr
; /* block address of the node block */
265 static inline void set_new_dnode(struct dnode_of_data
*dn
, struct inode
*inode
,
266 struct page
*ipage
, struct page
*npage
, nid_t nid
)
268 memset(dn
, 0, sizeof(*dn
));
270 dn
->inode_page
= ipage
;
271 dn
->node_page
= npage
;
278 * By default, there are 6 active log areas across the whole main area.
279 * When considering hot and cold data separation to reduce cleaning overhead,
280 * we split 3 for data logs and 3 for node logs as hot, warm, and cold types,
282 * In the current design, you should not change the numbers intentionally.
283 * Instead, as a mount option such as active_logs=x, you can use 2, 4, and 6
284 * logs individually according to the underlying devices. (default: 6)
285 * Just in case, on-disk layout covers maximum 16 logs that consist of 8 for
286 * data and 8 for node logs.
288 #define NR_CURSEG_DATA_TYPE (3)
289 #define NR_CURSEG_NODE_TYPE (3)
290 #define NR_CURSEG_TYPE (NR_CURSEG_DATA_TYPE + NR_CURSEG_NODE_TYPE)
293 CURSEG_HOT_DATA
= 0, /* directory entry blocks */
294 CURSEG_WARM_DATA
, /* data blocks */
295 CURSEG_COLD_DATA
, /* multimedia or GCed data blocks */
296 CURSEG_HOT_NODE
, /* direct node blocks of directory files */
297 CURSEG_WARM_NODE
, /* direct node blocks of normal files */
298 CURSEG_COLD_NODE
, /* indirect node blocks */
302 struct f2fs_sm_info
{
303 struct sit_info
*sit_info
; /* whole segment information */
304 struct free_segmap_info
*free_info
; /* free segment information */
305 struct dirty_seglist_info
*dirty_info
; /* dirty segment information */
306 struct curseg_info
*curseg_array
; /* active segment information */
308 struct list_head wblist_head
; /* list of under-writeback pages */
309 spinlock_t wblist_lock
; /* lock for checkpoint */
311 block_t seg0_blkaddr
; /* block address of 0'th segment */
312 block_t main_blkaddr
; /* start block address of main area */
313 block_t ssa_blkaddr
; /* start block address of SSA area */
315 unsigned int segment_count
; /* total # of segments */
316 unsigned int main_segments
; /* # of segments in main area */
317 unsigned int reserved_segments
; /* # of reserved segments */
318 unsigned int ovp_segments
; /* # of overprovision segments */
320 /* a threshold to reclaim prefree segments */
321 unsigned int rec_prefree_segments
;
323 /* for small discard management */
324 struct list_head discard_list
; /* 4KB discard list */
325 int nr_discards
; /* # of discards in the list */
326 int max_discards
; /* max. discards to be issued */
333 * COUNT_TYPE for monitoring
335 * f2fs monitors the number of several block types such as on-writeback,
336 * dirty dentry blocks, dirty node blocks, and dirty meta blocks.
347 * The below are the page types of bios used in submti_bio().
348 * The available types are:
349 * DATA User data pages. It operates as async mode.
350 * NODE Node pages. It operates as async mode.
351 * META FS metadata pages such as SIT, NAT, CP.
352 * NR_PAGE_TYPE The number of page types.
353 * META_FLUSH Make sure the previous pages are written
354 * with waiting the bio's completion
355 * ... Only can be used with META.
357 #define PAGE_TYPE_OF_BIO(type) ((type) > META ? META : (type))
366 struct f2fs_bio_info
{
367 struct bio
*bio
; /* bios to merge */
368 sector_t last_block_in_bio
; /* last block number */
369 struct mutex io_mutex
; /* mutex for bio */
372 struct f2fs_sb_info
{
373 struct super_block
*sb
; /* pointer to VFS super block */
374 struct proc_dir_entry
*s_proc
; /* proc entry */
375 struct buffer_head
*raw_super_buf
; /* buffer head of raw sb */
376 struct f2fs_super_block
*raw_super
; /* raw super block pointer */
377 int s_dirty
; /* dirty flag for checkpoint */
379 /* for node-related operations */
380 struct f2fs_nm_info
*nm_info
; /* node manager */
381 struct inode
*node_inode
; /* cache node blocks */
383 /* for segment-related operations */
384 struct f2fs_sm_info
*sm_info
; /* segment manager */
386 /* for bio operations */
387 struct f2fs_bio_info read_io
; /* for read bios */
388 struct f2fs_bio_info write_io
[NR_PAGE_TYPE
]; /* for write bios */
391 struct f2fs_checkpoint
*ckpt
; /* raw checkpoint pointer */
392 struct inode
*meta_inode
; /* cache meta blocks */
393 struct mutex cp_mutex
; /* checkpoint procedure lock */
394 struct rw_semaphore cp_rwsem
; /* blocking FS operations */
395 struct mutex node_write
; /* locking node writes */
396 struct mutex writepages
; /* mutex for writepages() */
397 bool por_doing
; /* recovery is doing or not */
398 bool on_build_free_nids
; /* build_free_nids is doing */
399 wait_queue_head_t cp_wait
;
401 /* for orphan inode management */
402 struct list_head orphan_inode_list
; /* orphan inode list */
403 struct mutex orphan_inode_mutex
; /* for orphan inode list */
404 unsigned int n_orphans
; /* # of orphan inodes */
406 /* for directory inode management */
407 struct list_head dir_inode_list
; /* dir inode list */
408 spinlock_t dir_inode_lock
; /* for dir inode list lock */
410 /* basic file system units */
411 unsigned int log_sectors_per_block
; /* log2 sectors per block */
412 unsigned int log_blocksize
; /* log2 block size */
413 unsigned int blocksize
; /* block size */
414 unsigned int root_ino_num
; /* root inode number*/
415 unsigned int node_ino_num
; /* node inode number*/
416 unsigned int meta_ino_num
; /* meta inode number*/
417 unsigned int log_blocks_per_seg
; /* log2 blocks per segment */
418 unsigned int blocks_per_seg
; /* blocks per segment */
419 unsigned int segs_per_sec
; /* segments per section */
420 unsigned int secs_per_zone
; /* sections per zone */
421 unsigned int total_sections
; /* total section count */
422 unsigned int total_node_count
; /* total node block count */
423 unsigned int total_valid_node_count
; /* valid node block count */
424 unsigned int total_valid_inode_count
; /* valid inode count */
425 int active_logs
; /* # of active logs */
427 block_t user_block_count
; /* # of user blocks */
428 block_t total_valid_block_count
; /* # of valid blocks */
429 block_t alloc_valid_block_count
; /* # of allocated blocks */
430 block_t last_valid_block_count
; /* for recovery */
431 u32 s_next_generation
; /* for NFS support */
432 atomic_t nr_pages
[NR_COUNT_TYPE
]; /* # of pages, see count_type */
434 struct f2fs_mount_info mount_opt
; /* mount options */
436 /* for cleaning operations */
437 struct mutex gc_mutex
; /* mutex for GC */
438 struct f2fs_gc_kthread
*gc_thread
; /* GC thread */
439 unsigned int cur_victim_sec
; /* current victim section num */
442 * for stat information.
443 * one is for the LFS mode, and the other is for the SSR mode.
445 #ifdef CONFIG_F2FS_STAT_FS
446 struct f2fs_stat_info
*stat_info
; /* FS status information */
447 unsigned int segment_count
[2]; /* # of allocated segments */
448 unsigned int block_count
[2]; /* # of allocated blocks */
449 int total_hit_ext
, read_hit_ext
; /* extent cache hit ratio */
450 int bg_gc
; /* background gc calls */
451 unsigned int n_dirty_dirs
; /* # of dir inodes */
453 unsigned int last_victim
[2]; /* last victim segment # */
454 spinlock_t stat_lock
; /* lock for stat operations */
456 /* For sysfs suppport */
457 struct kobject s_kobj
;
458 struct completion s_kobj_unregister
;
464 static inline struct f2fs_inode_info
*F2FS_I(struct inode
*inode
)
466 return container_of(inode
, struct f2fs_inode_info
, vfs_inode
);
469 static inline struct f2fs_sb_info
*F2FS_SB(struct super_block
*sb
)
471 return sb
->s_fs_info
;
474 static inline struct f2fs_super_block
*F2FS_RAW_SUPER(struct f2fs_sb_info
*sbi
)
476 return (struct f2fs_super_block
*)(sbi
->raw_super
);
479 static inline struct f2fs_checkpoint
*F2FS_CKPT(struct f2fs_sb_info
*sbi
)
481 return (struct f2fs_checkpoint
*)(sbi
->ckpt
);
484 static inline struct f2fs_node
*F2FS_NODE(struct page
*page
)
486 return (struct f2fs_node
*)page_address(page
);
489 static inline struct f2fs_nm_info
*NM_I(struct f2fs_sb_info
*sbi
)
491 return (struct f2fs_nm_info
*)(sbi
->nm_info
);
494 static inline struct f2fs_sm_info
*SM_I(struct f2fs_sb_info
*sbi
)
496 return (struct f2fs_sm_info
*)(sbi
->sm_info
);
499 static inline struct sit_info
*SIT_I(struct f2fs_sb_info
*sbi
)
501 return (struct sit_info
*)(SM_I(sbi
)->sit_info
);
504 static inline struct free_segmap_info
*FREE_I(struct f2fs_sb_info
*sbi
)
506 return (struct free_segmap_info
*)(SM_I(sbi
)->free_info
);
509 static inline struct dirty_seglist_info
*DIRTY_I(struct f2fs_sb_info
*sbi
)
511 return (struct dirty_seglist_info
*)(SM_I(sbi
)->dirty_info
);
514 static inline void F2FS_SET_SB_DIRT(struct f2fs_sb_info
*sbi
)
519 static inline void F2FS_RESET_SB_DIRT(struct f2fs_sb_info
*sbi
)
524 static inline unsigned long long cur_cp_version(struct f2fs_checkpoint
*cp
)
526 return le64_to_cpu(cp
->checkpoint_ver
);
529 static inline bool is_set_ckpt_flags(struct f2fs_checkpoint
*cp
, unsigned int f
)
531 unsigned int ckpt_flags
= le32_to_cpu(cp
->ckpt_flags
);
532 return ckpt_flags
& f
;
535 static inline void set_ckpt_flags(struct f2fs_checkpoint
*cp
, unsigned int f
)
537 unsigned int ckpt_flags
= le32_to_cpu(cp
->ckpt_flags
);
539 cp
->ckpt_flags
= cpu_to_le32(ckpt_flags
);
542 static inline void clear_ckpt_flags(struct f2fs_checkpoint
*cp
, unsigned int f
)
544 unsigned int ckpt_flags
= le32_to_cpu(cp
->ckpt_flags
);
546 cp
->ckpt_flags
= cpu_to_le32(ckpt_flags
);
549 static inline void f2fs_lock_op(struct f2fs_sb_info
*sbi
)
551 down_read(&sbi
->cp_rwsem
);
554 static inline void f2fs_unlock_op(struct f2fs_sb_info
*sbi
)
556 up_read(&sbi
->cp_rwsem
);
559 static inline void f2fs_lock_all(struct f2fs_sb_info
*sbi
)
561 f2fs_down_write(&sbi
->cp_rwsem
, &sbi
->cp_mutex
);
564 static inline void f2fs_unlock_all(struct f2fs_sb_info
*sbi
)
566 up_write(&sbi
->cp_rwsem
);
570 * Check whether the given nid is within node id range.
572 static inline int check_nid_range(struct f2fs_sb_info
*sbi
, nid_t nid
)
574 WARN_ON((nid
>= NM_I(sbi
)->max_nid
));
575 if (nid
>= NM_I(sbi
)->max_nid
)
580 #define F2FS_DEFAULT_ALLOCATED_BLOCKS 1
583 * Check whether the inode has blocks or not
585 static inline int F2FS_HAS_BLOCKS(struct inode
*inode
)
587 if (F2FS_I(inode
)->i_xattr_nid
)
588 return (inode
->i_blocks
> F2FS_DEFAULT_ALLOCATED_BLOCKS
+ 1);
590 return (inode
->i_blocks
> F2FS_DEFAULT_ALLOCATED_BLOCKS
);
593 static inline bool inc_valid_block_count(struct f2fs_sb_info
*sbi
,
594 struct inode
*inode
, blkcnt_t count
)
596 block_t valid_block_count
;
598 spin_lock(&sbi
->stat_lock
);
600 sbi
->total_valid_block_count
+ (block_t
)count
;
601 if (valid_block_count
> sbi
->user_block_count
) {
602 spin_unlock(&sbi
->stat_lock
);
605 inode
->i_blocks
+= count
;
606 sbi
->total_valid_block_count
= valid_block_count
;
607 sbi
->alloc_valid_block_count
+= (block_t
)count
;
608 spin_unlock(&sbi
->stat_lock
);
612 static inline void dec_valid_block_count(struct f2fs_sb_info
*sbi
,
616 spin_lock(&sbi
->stat_lock
);
617 f2fs_bug_on(sbi
->total_valid_block_count
< (block_t
) count
);
618 f2fs_bug_on(inode
->i_blocks
< count
);
619 inode
->i_blocks
-= count
;
620 sbi
->total_valid_block_count
-= (block_t
)count
;
621 spin_unlock(&sbi
->stat_lock
);
624 static inline void inc_page_count(struct f2fs_sb_info
*sbi
, int count_type
)
626 atomic_inc(&sbi
->nr_pages
[count_type
]);
627 F2FS_SET_SB_DIRT(sbi
);
630 static inline void inode_inc_dirty_dents(struct inode
*inode
)
632 atomic_inc(&F2FS_I(inode
)->dirty_dents
);
635 static inline void dec_page_count(struct f2fs_sb_info
*sbi
, int count_type
)
637 atomic_dec(&sbi
->nr_pages
[count_type
]);
640 static inline void inode_dec_dirty_dents(struct inode
*inode
)
642 atomic_dec(&F2FS_I(inode
)->dirty_dents
);
645 static inline int get_pages(struct f2fs_sb_info
*sbi
, int count_type
)
647 return atomic_read(&sbi
->nr_pages
[count_type
]);
650 static inline int get_blocktype_secs(struct f2fs_sb_info
*sbi
, int block_type
)
652 unsigned int pages_per_sec
= sbi
->segs_per_sec
*
653 (1 << sbi
->log_blocks_per_seg
);
654 return ((get_pages(sbi
, block_type
) + pages_per_sec
- 1)
655 >> sbi
->log_blocks_per_seg
) / sbi
->segs_per_sec
;
658 static inline block_t
valid_user_blocks(struct f2fs_sb_info
*sbi
)
661 spin_lock(&sbi
->stat_lock
);
662 ret
= sbi
->total_valid_block_count
;
663 spin_unlock(&sbi
->stat_lock
);
667 static inline unsigned long __bitmap_size(struct f2fs_sb_info
*sbi
, int flag
)
669 struct f2fs_checkpoint
*ckpt
= F2FS_CKPT(sbi
);
671 /* return NAT or SIT bitmap */
672 if (flag
== NAT_BITMAP
)
673 return le32_to_cpu(ckpt
->nat_ver_bitmap_bytesize
);
674 else if (flag
== SIT_BITMAP
)
675 return le32_to_cpu(ckpt
->sit_ver_bitmap_bytesize
);
680 static inline void *__bitmap_ptr(struct f2fs_sb_info
*sbi
, int flag
)
682 struct f2fs_checkpoint
*ckpt
= F2FS_CKPT(sbi
);
683 int offset
= (flag
== NAT_BITMAP
) ?
684 le32_to_cpu(ckpt
->sit_ver_bitmap_bytesize
) : 0;
685 return &ckpt
->sit_nat_version_bitmap
+ offset
;
688 static inline block_t
__start_cp_addr(struct f2fs_sb_info
*sbi
)
691 struct f2fs_checkpoint
*ckpt
= F2FS_CKPT(sbi
);
692 unsigned long long ckpt_version
= cur_cp_version(ckpt
);
694 start_addr
= le32_to_cpu(F2FS_RAW_SUPER(sbi
)->cp_blkaddr
);
697 * odd numbered checkpoint should at cp segment 0
698 * and even segent must be at cp segment 1
700 if (!(ckpt_version
& 1))
701 start_addr
+= sbi
->blocks_per_seg
;
706 static inline block_t
__start_sum_addr(struct f2fs_sb_info
*sbi
)
708 return le32_to_cpu(F2FS_CKPT(sbi
)->cp_pack_start_sum
);
711 static inline bool inc_valid_node_count(struct f2fs_sb_info
*sbi
,
714 block_t valid_block_count
;
715 unsigned int valid_node_count
;
717 spin_lock(&sbi
->stat_lock
);
719 valid_block_count
= sbi
->total_valid_block_count
+ 1;
720 if (valid_block_count
> sbi
->user_block_count
) {
721 spin_unlock(&sbi
->stat_lock
);
725 valid_node_count
= sbi
->total_valid_node_count
+ 1;
726 if (valid_node_count
> sbi
->total_node_count
) {
727 spin_unlock(&sbi
->stat_lock
);
734 sbi
->alloc_valid_block_count
++;
735 sbi
->total_valid_node_count
++;
736 sbi
->total_valid_block_count
++;
737 spin_unlock(&sbi
->stat_lock
);
742 static inline void dec_valid_node_count(struct f2fs_sb_info
*sbi
,
745 spin_lock(&sbi
->stat_lock
);
747 f2fs_bug_on(!sbi
->total_valid_block_count
);
748 f2fs_bug_on(!sbi
->total_valid_node_count
);
749 f2fs_bug_on(!inode
->i_blocks
);
752 sbi
->total_valid_node_count
--;
753 sbi
->total_valid_block_count
--;
755 spin_unlock(&sbi
->stat_lock
);
758 static inline unsigned int valid_node_count(struct f2fs_sb_info
*sbi
)
761 spin_lock(&sbi
->stat_lock
);
762 ret
= sbi
->total_valid_node_count
;
763 spin_unlock(&sbi
->stat_lock
);
767 static inline void inc_valid_inode_count(struct f2fs_sb_info
*sbi
)
769 spin_lock(&sbi
->stat_lock
);
770 f2fs_bug_on(sbi
->total_valid_inode_count
== sbi
->total_node_count
);
771 sbi
->total_valid_inode_count
++;
772 spin_unlock(&sbi
->stat_lock
);
775 static inline int dec_valid_inode_count(struct f2fs_sb_info
*sbi
)
777 spin_lock(&sbi
->stat_lock
);
778 f2fs_bug_on(!sbi
->total_valid_inode_count
);
779 sbi
->total_valid_inode_count
--;
780 spin_unlock(&sbi
->stat_lock
);
784 static inline unsigned int valid_inode_count(struct f2fs_sb_info
*sbi
)
787 spin_lock(&sbi
->stat_lock
);
788 ret
= sbi
->total_valid_inode_count
;
789 spin_unlock(&sbi
->stat_lock
);
793 static inline void f2fs_put_page(struct page
*page
, int unlock
)
795 if (!page
|| IS_ERR(page
))
799 f2fs_bug_on(!PageLocked(page
));
802 page_cache_release(page
);
805 static inline void f2fs_put_dnode(struct dnode_of_data
*dn
)
808 f2fs_put_page(dn
->node_page
, 1);
809 if (dn
->inode_page
&& dn
->node_page
!= dn
->inode_page
)
810 f2fs_put_page(dn
->inode_page
, 0);
811 dn
->node_page
= NULL
;
812 dn
->inode_page
= NULL
;
815 static inline struct kmem_cache
*f2fs_kmem_cache_create(const char *name
,
816 size_t size
, void (*ctor
)(void *))
818 return kmem_cache_create(name
, size
, 0, SLAB_RECLAIM_ACCOUNT
, ctor
);
821 static inline void *f2fs_kmem_cache_alloc(struct kmem_cache
*cachep
,
826 entry
= kmem_cache_alloc(cachep
, flags
);
835 #define RAW_IS_INODE(p) ((p)->footer.nid == (p)->footer.ino)
837 static inline bool IS_INODE(struct page
*page
)
839 struct f2fs_node
*p
= F2FS_NODE(page
);
840 return RAW_IS_INODE(p
);
843 static inline __le32
*blkaddr_in_node(struct f2fs_node
*node
)
845 return RAW_IS_INODE(node
) ? node
->i
.i_addr
: node
->dn
.addr
;
848 static inline block_t
datablock_addr(struct page
*node_page
,
851 struct f2fs_node
*raw_node
;
853 raw_node
= F2FS_NODE(node_page
);
854 addr_array
= blkaddr_in_node(raw_node
);
855 return le32_to_cpu(addr_array
[offset
]);
858 static inline int f2fs_test_bit(unsigned int nr
, char *addr
)
863 mask
= 1 << (7 - (nr
& 0x07));
867 static inline int f2fs_set_bit(unsigned int nr
, char *addr
)
873 mask
= 1 << (7 - (nr
& 0x07));
879 static inline int f2fs_clear_bit(unsigned int nr
, char *addr
)
885 mask
= 1 << (7 - (nr
& 0x07));
891 /* used for f2fs_inode_info->flags */
893 FI_NEW_INODE
, /* indicate newly allocated inode */
894 FI_DIRTY_INODE
, /* indicate inode is dirty or not */
895 FI_INC_LINK
, /* need to increment i_nlink */
896 FI_ACL_MODE
, /* indicate acl mode */
897 FI_NO_ALLOC
, /* should not allocate any blocks */
898 FI_UPDATE_DIR
, /* should update inode block for consistency */
899 FI_DELAY_IPUT
, /* used for the recovery */
900 FI_NO_EXTENT
, /* not to use the extent cache */
901 FI_INLINE_XATTR
, /* used for inline xattr */
904 static inline void set_inode_flag(struct f2fs_inode_info
*fi
, int flag
)
906 set_bit(flag
, &fi
->flags
);
909 static inline int is_inode_flag_set(struct f2fs_inode_info
*fi
, int flag
)
911 return test_bit(flag
, &fi
->flags
);
914 static inline void clear_inode_flag(struct f2fs_inode_info
*fi
, int flag
)
916 clear_bit(flag
, &fi
->flags
);
919 static inline void set_acl_inode(struct f2fs_inode_info
*fi
, umode_t mode
)
921 fi
->i_acl_mode
= mode
;
922 set_inode_flag(fi
, FI_ACL_MODE
);
925 static inline int cond_clear_inode_flag(struct f2fs_inode_info
*fi
, int flag
)
927 if (is_inode_flag_set(fi
, FI_ACL_MODE
)) {
928 clear_inode_flag(fi
, FI_ACL_MODE
);
934 static inline void get_inline_info(struct f2fs_inode_info
*fi
,
935 struct f2fs_inode
*ri
)
937 if (ri
->i_inline
& F2FS_INLINE_XATTR
)
938 set_inode_flag(fi
, FI_INLINE_XATTR
);
941 static inline void set_raw_inline(struct f2fs_inode_info
*fi
,
942 struct f2fs_inode
*ri
)
946 if (is_inode_flag_set(fi
, FI_INLINE_XATTR
))
947 ri
->i_inline
|= F2FS_INLINE_XATTR
;
950 static inline unsigned int addrs_per_inode(struct f2fs_inode_info
*fi
)
952 if (is_inode_flag_set(fi
, FI_INLINE_XATTR
))
953 return DEF_ADDRS_PER_INODE
- F2FS_INLINE_XATTR_ADDRS
;
954 return DEF_ADDRS_PER_INODE
;
957 static inline void *inline_xattr_addr(struct page
*page
)
959 struct f2fs_inode
*ri
;
960 ri
= (struct f2fs_inode
*)page_address(page
);
961 return (void *)&(ri
->i_addr
[DEF_ADDRS_PER_INODE
-
962 F2FS_INLINE_XATTR_ADDRS
]);
965 static inline int inline_xattr_size(struct inode
*inode
)
967 if (is_inode_flag_set(F2FS_I(inode
), FI_INLINE_XATTR
))
968 return F2FS_INLINE_XATTR_ADDRS
<< 2;
973 static inline int f2fs_readonly(struct super_block
*sb
)
975 return sb
->s_flags
& MS_RDONLY
;
981 int f2fs_sync_file(struct file
*, loff_t
, loff_t
, int);
982 void truncate_data_blocks(struct dnode_of_data
*);
983 void f2fs_truncate(struct inode
*);
984 int f2fs_getattr(struct vfsmount
*, struct dentry
*, struct kstat
*);
985 int f2fs_setattr(struct dentry
*, struct iattr
*);
986 int truncate_hole(struct inode
*, pgoff_t
, pgoff_t
);
987 int truncate_data_blocks_range(struct dnode_of_data
*, int);
988 long f2fs_ioctl(struct file
*, unsigned int, unsigned long);
989 long f2fs_compat_ioctl(struct file
*, unsigned int, unsigned long);
994 void f2fs_set_inode_flags(struct inode
*);
995 struct inode
*f2fs_iget(struct super_block
*, unsigned long);
996 int try_to_free_nats(struct f2fs_sb_info
*, int);
997 void update_inode(struct inode
*, struct page
*);
998 int update_inode_page(struct inode
*);
999 int f2fs_write_inode(struct inode
*, struct writeback_control
*);
1000 void f2fs_evict_inode(struct inode
*);
1005 struct dentry
*f2fs_get_parent(struct dentry
*child
);
1010 struct f2fs_dir_entry
*f2fs_find_entry(struct inode
*, struct qstr
*,
1012 struct f2fs_dir_entry
*f2fs_parent_dir(struct inode
*, struct page
**);
1013 ino_t
f2fs_inode_by_name(struct inode
*, struct qstr
*);
1014 void f2fs_set_link(struct inode
*, struct f2fs_dir_entry
*,
1015 struct page
*, struct inode
*);
1016 int update_dent_inode(struct inode
*, const struct qstr
*);
1017 int __f2fs_add_link(struct inode
*, const struct qstr
*, struct inode
*);
1018 void f2fs_delete_entry(struct f2fs_dir_entry
*, struct page
*, struct inode
*);
1019 int f2fs_make_empty(struct inode
*, struct inode
*);
1020 bool f2fs_empty_dir(struct inode
*);
1022 static inline int f2fs_add_link(struct dentry
*dentry
, struct inode
*inode
)
1024 return __f2fs_add_link(dentry
->d_parent
->d_inode
, &dentry
->d_name
,
1031 int f2fs_sync_fs(struct super_block
*, int);
1032 extern __printf(3, 4)
1033 void f2fs_msg(struct super_block
*, const char *, const char *, ...);
1038 f2fs_hash_t
f2fs_dentry_hash(const char *, size_t);
1043 struct dnode_of_data
;
1046 int is_checkpointed_node(struct f2fs_sb_info
*, nid_t
);
1047 void get_node_info(struct f2fs_sb_info
*, nid_t
, struct node_info
*);
1048 int get_dnode_of_data(struct dnode_of_data
*, pgoff_t
, int);
1049 int truncate_inode_blocks(struct inode
*, pgoff_t
);
1050 int truncate_xattr_node(struct inode
*, struct page
*);
1051 int wait_on_node_pages_writeback(struct f2fs_sb_info
*, nid_t
);
1052 void remove_inode_page(struct inode
*);
1053 struct page
*new_inode_page(struct inode
*, const struct qstr
*);
1054 struct page
*new_node_page(struct dnode_of_data
*, unsigned int, struct page
*);
1055 void ra_node_page(struct f2fs_sb_info
*, nid_t
);
1056 struct page
*get_node_page(struct f2fs_sb_info
*, pgoff_t
);
1057 struct page
*get_node_page_ra(struct page
*, int);
1058 void sync_inode_page(struct dnode_of_data
*);
1059 int sync_node_pages(struct f2fs_sb_info
*, nid_t
, struct writeback_control
*);
1060 bool alloc_nid(struct f2fs_sb_info
*, nid_t
*);
1061 void alloc_nid_done(struct f2fs_sb_info
*, nid_t
);
1062 void alloc_nid_failed(struct f2fs_sb_info
*, nid_t
);
1063 void recover_node_page(struct f2fs_sb_info
*, struct page
*,
1064 struct f2fs_summary
*, struct node_info
*, block_t
);
1065 int recover_inode_page(struct f2fs_sb_info
*, struct page
*);
1066 int restore_node_summary(struct f2fs_sb_info
*, unsigned int,
1067 struct f2fs_summary_block
*);
1068 void flush_nat_entries(struct f2fs_sb_info
*);
1069 int build_node_manager(struct f2fs_sb_info
*);
1070 void destroy_node_manager(struct f2fs_sb_info
*);
1071 int __init
create_node_manager_caches(void);
1072 void destroy_node_manager_caches(void);
1077 void f2fs_balance_fs(struct f2fs_sb_info
*);
1078 void f2fs_balance_fs_bg(struct f2fs_sb_info
*);
1079 void invalidate_blocks(struct f2fs_sb_info
*, block_t
);
1080 void clear_prefree_segments(struct f2fs_sb_info
*);
1081 int npages_for_summary_flush(struct f2fs_sb_info
*);
1082 void allocate_new_segments(struct f2fs_sb_info
*);
1083 struct page
*get_sum_page(struct f2fs_sb_info
*, unsigned int);
1084 struct bio
*f2fs_bio_alloc(struct block_device
*, int);
1085 void f2fs_submit_bio(struct f2fs_sb_info
*, enum page_type
, bool);
1086 void f2fs_wait_on_page_writeback(struct page
*, enum page_type
, bool);
1087 void write_meta_page(struct f2fs_sb_info
*, struct page
*);
1088 void write_node_page(struct f2fs_sb_info
*, struct page
*, unsigned int,
1089 block_t
, block_t
*);
1090 void write_data_page(struct inode
*, struct page
*, struct dnode_of_data
*,
1091 block_t
, block_t
*);
1092 void rewrite_data_page(struct f2fs_sb_info
*, struct page
*, block_t
);
1093 void recover_data_page(struct f2fs_sb_info
*, struct page
*,
1094 struct f2fs_summary
*, block_t
, block_t
);
1095 void rewrite_node_page(struct f2fs_sb_info
*, struct page
*,
1096 struct f2fs_summary
*, block_t
, block_t
);
1097 void write_data_summaries(struct f2fs_sb_info
*, block_t
);
1098 void write_node_summaries(struct f2fs_sb_info
*, block_t
);
1099 int lookup_journal_in_cursum(struct f2fs_summary_block
*,
1100 int, unsigned int, int);
1101 void flush_sit_entries(struct f2fs_sb_info
*);
1102 int build_segment_manager(struct f2fs_sb_info
*);
1103 void destroy_segment_manager(struct f2fs_sb_info
*);
1104 int __init
create_segment_manager_caches(void);
1105 void destroy_segment_manager_caches(void);
1110 struct page
*grab_meta_page(struct f2fs_sb_info
*, pgoff_t
);
1111 struct page
*get_meta_page(struct f2fs_sb_info
*, pgoff_t
);
1112 long sync_meta_pages(struct f2fs_sb_info
*, enum page_type
, long);
1113 int acquire_orphan_inode(struct f2fs_sb_info
*);
1114 void release_orphan_inode(struct f2fs_sb_info
*);
1115 void add_orphan_inode(struct f2fs_sb_info
*, nid_t
);
1116 void remove_orphan_inode(struct f2fs_sb_info
*, nid_t
);
1117 int recover_orphan_inodes(struct f2fs_sb_info
*);
1118 int get_valid_checkpoint(struct f2fs_sb_info
*);
1119 void set_dirty_dir_page(struct inode
*, struct page
*);
1120 void add_dirty_dir_inode(struct inode
*);
1121 void remove_dirty_dir_inode(struct inode
*);
1122 struct inode
*check_dirty_dir_inode(struct f2fs_sb_info
*, nid_t
);
1123 void sync_dirty_dir_inodes(struct f2fs_sb_info
*);
1124 void write_checkpoint(struct f2fs_sb_info
*, bool);
1125 void init_orphan_info(struct f2fs_sb_info
*);
1126 int __init
create_checkpoint_caches(void);
1127 void destroy_checkpoint_caches(void);
1132 int reserve_new_block(struct dnode_of_data
*);
1133 void update_extent_cache(block_t
, struct dnode_of_data
*);
1134 struct page
*find_data_page(struct inode
*, pgoff_t
, bool);
1135 struct page
*get_lock_data_page(struct inode
*, pgoff_t
);
1136 struct page
*get_new_data_page(struct inode
*, struct page
*, pgoff_t
, bool);
1137 int f2fs_readpage(struct f2fs_sb_info
*, struct page
*, block_t
, int);
1138 void f2fs_submit_read_bio(struct f2fs_sb_info
*, int);
1139 void submit_read_page(struct f2fs_sb_info
*, struct page
*, block_t
, int);
1140 int do_write_data_page(struct page
*);
1145 int start_gc_thread(struct f2fs_sb_info
*);
1146 void stop_gc_thread(struct f2fs_sb_info
*);
1147 block_t
start_bidx_of_node(unsigned int, struct f2fs_inode_info
*);
1148 int f2fs_gc(struct f2fs_sb_info
*);
1149 void build_gc_manager(struct f2fs_sb_info
*);
1150 int __init
create_gc_caches(void);
1151 void destroy_gc_caches(void);
1156 int recover_fsync_data(struct f2fs_sb_info
*);
1157 bool space_for_roll_forward(struct f2fs_sb_info
*);
1162 #ifdef CONFIG_F2FS_STAT_FS
1163 struct f2fs_stat_info
{
1164 struct list_head stat_list
;
1165 struct f2fs_sb_info
*sbi
;
1166 struct mutex stat_lock
;
1167 int all_area_segs
, sit_area_segs
, nat_area_segs
, ssa_area_segs
;
1168 int main_area_segs
, main_area_sections
, main_area_zones
;
1169 int hit_ext
, total_ext
;
1170 int ndirty_node
, ndirty_dent
, ndirty_dirs
, ndirty_meta
;
1171 int nats
, sits
, fnids
;
1172 int total_count
, utilization
;
1174 unsigned int valid_count
, valid_node_count
, valid_inode_count
;
1175 unsigned int bimodal
, avg_vblocks
;
1176 int util_free
, util_valid
, util_invalid
;
1177 int rsvd_segs
, overp_segs
;
1178 int dirty_count
, node_pages
, meta_pages
;
1179 int prefree_count
, call_count
;
1180 int tot_segs
, node_segs
, data_segs
, free_segs
, free_secs
;
1181 int tot_blks
, data_blks
, node_blks
;
1182 int curseg
[NR_CURSEG_TYPE
];
1183 int cursec
[NR_CURSEG_TYPE
];
1184 int curzone
[NR_CURSEG_TYPE
];
1186 unsigned int segment_count
[2];
1187 unsigned int block_count
[2];
1188 unsigned base_mem
, cache_mem
;
1191 static inline struct f2fs_stat_info
*F2FS_STAT(struct f2fs_sb_info
*sbi
)
1193 return (struct f2fs_stat_info
*)sbi
->stat_info
;
1196 #define stat_inc_call_count(si) ((si)->call_count++)
1197 #define stat_inc_bggc_count(sbi) ((sbi)->bg_gc++)
1198 #define stat_inc_dirty_dir(sbi) ((sbi)->n_dirty_dirs++)
1199 #define stat_dec_dirty_dir(sbi) ((sbi)->n_dirty_dirs--)
1200 #define stat_inc_total_hit(sb) ((F2FS_SB(sb))->total_hit_ext++)
1201 #define stat_inc_read_hit(sb) ((F2FS_SB(sb))->read_hit_ext++)
1202 #define stat_inc_seg_type(sbi, curseg) \
1203 ((sbi)->segment_count[(curseg)->alloc_type]++)
1204 #define stat_inc_block_count(sbi, curseg) \
1205 ((sbi)->block_count[(curseg)->alloc_type]++)
1207 #define stat_inc_seg_count(sbi, type) \
1209 struct f2fs_stat_info *si = F2FS_STAT(sbi); \
1211 if (type == SUM_TYPE_DATA) \
1217 #define stat_inc_tot_blk_count(si, blks) \
1218 (si->tot_blks += (blks))
1220 #define stat_inc_data_blk_count(sbi, blks) \
1222 struct f2fs_stat_info *si = F2FS_STAT(sbi); \
1223 stat_inc_tot_blk_count(si, blks); \
1224 si->data_blks += (blks); \
1227 #define stat_inc_node_blk_count(sbi, blks) \
1229 struct f2fs_stat_info *si = F2FS_STAT(sbi); \
1230 stat_inc_tot_blk_count(si, blks); \
1231 si->node_blks += (blks); \
1234 int f2fs_build_stats(struct f2fs_sb_info
*);
1235 void f2fs_destroy_stats(struct f2fs_sb_info
*);
1236 void __init
f2fs_create_root_stats(void);
1237 void f2fs_destroy_root_stats(void);
1239 #define stat_inc_call_count(si)
1240 #define stat_inc_bggc_count(si)
1241 #define stat_inc_dirty_dir(sbi)
1242 #define stat_dec_dirty_dir(sbi)
1243 #define stat_inc_total_hit(sb)
1244 #define stat_inc_read_hit(sb)
1245 #define stat_inc_seg_type(sbi, curseg)
1246 #define stat_inc_block_count(sbi, curseg)
1247 #define stat_inc_seg_count(si, type)
1248 #define stat_inc_tot_blk_count(si, blks)
1249 #define stat_inc_data_blk_count(si, blks)
1250 #define stat_inc_node_blk_count(sbi, blks)
1252 static inline int f2fs_build_stats(struct f2fs_sb_info
*sbi
) { return 0; }
1253 static inline void f2fs_destroy_stats(struct f2fs_sb_info
*sbi
) { }
1254 static inline void __init
f2fs_create_root_stats(void) { }
1255 static inline void f2fs_destroy_root_stats(void) { }
1258 extern const struct file_operations f2fs_dir_operations
;
1259 extern const struct file_operations f2fs_file_operations
;
1260 extern const struct inode_operations f2fs_file_inode_operations
;
1261 extern const struct address_space_operations f2fs_dblock_aops
;
1262 extern const struct address_space_operations f2fs_node_aops
;
1263 extern const struct address_space_operations f2fs_meta_aops
;
1264 extern const struct inode_operations f2fs_dir_inode_operations
;
1265 extern const struct inode_operations f2fs_symlink_inode_operations
;
1266 extern const struct inode_operations f2fs_special_inode_operations
;