4 * Copyright (c) 2012 Samsung Electronics Co., Ltd.
5 * http://www.samsung.com/
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License version 2 as
9 * published by the Free Software Foundation.
12 #include <linux/f2fs_fs.h>
13 #include <linux/buffer_head.h>
14 #include <linux/backing-dev.h>
15 #include <linux/writeback.h>
21 #include <trace/events/f2fs.h>
23 void f2fs_mark_inode_dirty_sync(struct inode
*inode
, bool sync
)
25 if (is_inode_flag_set(inode
, FI_NEW_INODE
))
28 if (f2fs_inode_dirtied(inode
, sync
))
31 mark_inode_dirty_sync(inode
);
34 void f2fs_set_inode_flags(struct inode
*inode
)
36 unsigned int flags
= F2FS_I(inode
)->i_flags
;
37 unsigned int new_fl
= 0;
39 if (flags
& FS_SYNC_FL
)
41 if (flags
& FS_APPEND_FL
)
43 if (flags
& FS_IMMUTABLE_FL
)
44 new_fl
|= S_IMMUTABLE
;
45 if (flags
& FS_NOATIME_FL
)
47 if (flags
& FS_DIRSYNC_FL
)
49 if (f2fs_encrypted_inode(inode
))
50 new_fl
|= S_ENCRYPTED
;
51 inode_set_flags(inode
, new_fl
,
52 S_SYNC
|S_APPEND
|S_IMMUTABLE
|S_NOATIME
|S_DIRSYNC
|
56 static void __get_inode_rdev(struct inode
*inode
, struct f2fs_inode
*ri
)
58 int extra_size
= get_extra_isize(inode
);
60 if (S_ISCHR(inode
->i_mode
) || S_ISBLK(inode
->i_mode
) ||
61 S_ISFIFO(inode
->i_mode
) || S_ISSOCK(inode
->i_mode
)) {
62 if (ri
->i_addr
[extra_size
])
63 inode
->i_rdev
= old_decode_dev(
64 le32_to_cpu(ri
->i_addr
[extra_size
]));
66 inode
->i_rdev
= new_decode_dev(
67 le32_to_cpu(ri
->i_addr
[extra_size
+ 1]));
71 static bool __written_first_block(struct f2fs_inode
*ri
)
73 block_t addr
= le32_to_cpu(ri
->i_addr
[offset_in_addr(ri
)]);
75 if (addr
!= NEW_ADDR
&& addr
!= NULL_ADDR
)
80 static void __set_inode_rdev(struct inode
*inode
, struct f2fs_inode
*ri
)
82 int extra_size
= get_extra_isize(inode
);
84 if (S_ISCHR(inode
->i_mode
) || S_ISBLK(inode
->i_mode
)) {
85 if (old_valid_dev(inode
->i_rdev
)) {
86 ri
->i_addr
[extra_size
] =
87 cpu_to_le32(old_encode_dev(inode
->i_rdev
));
88 ri
->i_addr
[extra_size
+ 1] = 0;
90 ri
->i_addr
[extra_size
] = 0;
91 ri
->i_addr
[extra_size
+ 1] =
92 cpu_to_le32(new_encode_dev(inode
->i_rdev
));
93 ri
->i_addr
[extra_size
+ 2] = 0;
98 static void __recover_inline_status(struct inode
*inode
, struct page
*ipage
)
100 void *inline_data
= inline_data_addr(inode
, ipage
);
101 __le32
*start
= inline_data
;
102 __le32
*end
= start
+ MAX_INLINE_DATA(inode
) / sizeof(__le32
);
104 while (start
< end
) {
106 f2fs_wait_on_page_writeback(ipage
, NODE
, true);
108 set_inode_flag(inode
, FI_DATA_EXIST
);
109 set_raw_inline(inode
, F2FS_INODE(ipage
));
110 set_page_dirty(ipage
);
117 static bool f2fs_enable_inode_chksum(struct f2fs_sb_info
*sbi
, struct page
*page
)
119 struct f2fs_inode
*ri
= &F2FS_NODE(page
)->i
;
120 int extra_isize
= le32_to_cpu(ri
->i_extra_isize
);
122 if (!f2fs_sb_has_inode_chksum(sbi
->sb
))
125 if (!RAW_IS_INODE(F2FS_NODE(page
)) || !(ri
->i_inline
& F2FS_EXTRA_ATTR
))
128 if (!F2FS_FITS_IN_INODE(ri
, extra_isize
, i_inode_checksum
))
134 static __u32
f2fs_inode_chksum(struct f2fs_sb_info
*sbi
, struct page
*page
)
136 struct f2fs_node
*node
= F2FS_NODE(page
);
137 struct f2fs_inode
*ri
= &node
->i
;
138 __le32 ino
= node
->footer
.ino
;
139 __le32 gen
= ri
->i_generation
;
140 __u32 chksum
, chksum_seed
;
142 unsigned int offset
= offsetof(struct f2fs_inode
, i_inode_checksum
);
143 unsigned int cs_size
= sizeof(dummy_cs
);
145 chksum
= f2fs_chksum(sbi
, sbi
->s_chksum_seed
, (__u8
*)&ino
,
147 chksum_seed
= f2fs_chksum(sbi
, chksum
, (__u8
*)&gen
, sizeof(gen
));
149 chksum
= f2fs_chksum(sbi
, chksum_seed
, (__u8
*)ri
, offset
);
150 chksum
= f2fs_chksum(sbi
, chksum
, (__u8
*)&dummy_cs
, cs_size
);
152 chksum
= f2fs_chksum(sbi
, chksum
, (__u8
*)ri
+ offset
,
153 F2FS_BLKSIZE
- offset
);
157 bool f2fs_inode_chksum_verify(struct f2fs_sb_info
*sbi
, struct page
*page
)
159 struct f2fs_inode
*ri
;
160 __u32 provided
, calculated
;
162 if (!f2fs_enable_inode_chksum(sbi
, page
) ||
163 PageDirty(page
) || PageWriteback(page
))
166 ri
= &F2FS_NODE(page
)->i
;
167 provided
= le32_to_cpu(ri
->i_inode_checksum
);
168 calculated
= f2fs_inode_chksum(sbi
, page
);
170 if (provided
!= calculated
)
171 f2fs_msg(sbi
->sb
, KERN_WARNING
,
172 "checksum invalid, ino = %x, %x vs. %x",
173 ino_of_node(page
), provided
, calculated
);
175 return provided
== calculated
;
178 void f2fs_inode_chksum_set(struct f2fs_sb_info
*sbi
, struct page
*page
)
180 struct f2fs_inode
*ri
= &F2FS_NODE(page
)->i
;
182 if (!f2fs_enable_inode_chksum(sbi
, page
))
185 ri
->i_inode_checksum
= cpu_to_le32(f2fs_inode_chksum(sbi
, page
));
188 static int do_read_inode(struct inode
*inode
)
190 struct f2fs_sb_info
*sbi
= F2FS_I_SB(inode
);
191 struct f2fs_inode_info
*fi
= F2FS_I(inode
);
192 struct page
*node_page
;
193 struct f2fs_inode
*ri
;
196 /* Check if ino is within scope */
197 if (check_nid_range(sbi
, inode
->i_ino
)) {
198 f2fs_msg(inode
->i_sb
, KERN_ERR
, "bad inode number: %lu",
199 (unsigned long) inode
->i_ino
);
204 node_page
= get_node_page(sbi
, inode
->i_ino
);
205 if (IS_ERR(node_page
))
206 return PTR_ERR(node_page
);
208 ri
= F2FS_INODE(node_page
);
210 inode
->i_mode
= le16_to_cpu(ri
->i_mode
);
211 i_uid_write(inode
, le32_to_cpu(ri
->i_uid
));
212 i_gid_write(inode
, le32_to_cpu(ri
->i_gid
));
213 set_nlink(inode
, le32_to_cpu(ri
->i_links
));
214 inode
->i_size
= le64_to_cpu(ri
->i_size
);
215 inode
->i_blocks
= SECTOR_FROM_BLOCK(le64_to_cpu(ri
->i_blocks
) - 1);
217 inode
->i_atime
.tv_sec
= le64_to_cpu(ri
->i_atime
);
218 inode
->i_ctime
.tv_sec
= le64_to_cpu(ri
->i_ctime
);
219 inode
->i_mtime
.tv_sec
= le64_to_cpu(ri
->i_mtime
);
220 inode
->i_atime
.tv_nsec
= le32_to_cpu(ri
->i_atime_nsec
);
221 inode
->i_ctime
.tv_nsec
= le32_to_cpu(ri
->i_ctime_nsec
);
222 inode
->i_mtime
.tv_nsec
= le32_to_cpu(ri
->i_mtime_nsec
);
223 inode
->i_generation
= le32_to_cpu(ri
->i_generation
);
225 fi
->i_current_depth
= le32_to_cpu(ri
->i_current_depth
);
226 fi
->i_xattr_nid
= le32_to_cpu(ri
->i_xattr_nid
);
227 fi
->i_flags
= le32_to_cpu(ri
->i_flags
);
229 fi
->i_advise
= ri
->i_advise
;
230 fi
->i_pino
= le32_to_cpu(ri
->i_pino
);
231 fi
->i_dir_level
= ri
->i_dir_level
;
233 if (f2fs_init_extent_tree(inode
, &ri
->i_ext
))
234 set_page_dirty(node_page
);
236 get_inline_info(inode
, ri
);
238 fi
->i_extra_isize
= f2fs_has_extra_attr(inode
) ?
239 le16_to_cpu(ri
->i_extra_isize
) : 0;
241 if (f2fs_sb_has_flexible_inline_xattr(sbi
->sb
)) {
242 f2fs_bug_on(sbi
, !f2fs_has_extra_attr(inode
));
243 fi
->i_inline_xattr_size
= le16_to_cpu(ri
->i_inline_xattr_size
);
244 } else if (f2fs_has_inline_xattr(inode
) ||
245 f2fs_has_inline_dentry(inode
)) {
246 fi
->i_inline_xattr_size
= DEFAULT_INLINE_XATTR_ADDRS
;
250 * Previous inline data or directory always reserved 200 bytes
251 * in inode layout, even if inline_xattr is disabled. In order
252 * to keep inline_dentry's structure for backward compatibility,
253 * we get the space back only from inline_data.
255 fi
->i_inline_xattr_size
= 0;
258 /* check data exist */
259 if (f2fs_has_inline_data(inode
) && !f2fs_exist_data(inode
))
260 __recover_inline_status(inode
, node_page
);
262 /* get rdev by using inline_info */
263 __get_inode_rdev(inode
, ri
);
265 if (__written_first_block(ri
))
266 set_inode_flag(inode
, FI_FIRST_BLOCK_WRITTEN
);
268 if (!need_inode_block_update(sbi
, inode
->i_ino
))
269 fi
->last_disk_size
= inode
->i_size
;
271 if (fi
->i_flags
& FS_PROJINHERIT_FL
)
272 set_inode_flag(inode
, FI_PROJ_INHERIT
);
274 if (f2fs_has_extra_attr(inode
) && f2fs_sb_has_project_quota(sbi
->sb
) &&
275 F2FS_FITS_IN_INODE(ri
, fi
->i_extra_isize
, i_projid
))
276 i_projid
= (projid_t
)le32_to_cpu(ri
->i_projid
);
278 i_projid
= F2FS_DEF_PROJID
;
279 fi
->i_projid
= make_kprojid(&init_user_ns
, i_projid
);
281 if (f2fs_has_extra_attr(inode
) && f2fs_sb_has_inode_crtime(sbi
->sb
) &&
282 F2FS_FITS_IN_INODE(ri
, fi
->i_extra_isize
, i_crtime
)) {
283 fi
->i_crtime
.tv_sec
= le64_to_cpu(ri
->i_crtime
);
284 fi
->i_crtime
.tv_nsec
= le32_to_cpu(ri
->i_crtime_nsec
);
287 f2fs_put_page(node_page
, 1);
289 stat_inc_inline_xattr(inode
);
290 stat_inc_inline_inode(inode
);
291 stat_inc_inline_dir(inode
);
296 struct inode
*f2fs_iget(struct super_block
*sb
, unsigned long ino
)
298 struct f2fs_sb_info
*sbi
= F2FS_SB(sb
);
302 inode
= iget_locked(sb
, ino
);
304 return ERR_PTR(-ENOMEM
);
306 if (!(inode
->i_state
& I_NEW
)) {
307 trace_f2fs_iget(inode
);
310 if (ino
== F2FS_NODE_INO(sbi
) || ino
== F2FS_META_INO(sbi
))
313 ret
= do_read_inode(inode
);
317 if (ino
== F2FS_NODE_INO(sbi
)) {
318 inode
->i_mapping
->a_ops
= &f2fs_node_aops
;
319 mapping_set_gfp_mask(inode
->i_mapping
, GFP_F2FS_ZERO
);
320 } else if (ino
== F2FS_META_INO(sbi
)) {
321 inode
->i_mapping
->a_ops
= &f2fs_meta_aops
;
322 mapping_set_gfp_mask(inode
->i_mapping
, GFP_F2FS_ZERO
);
323 } else if (S_ISREG(inode
->i_mode
)) {
324 inode
->i_op
= &f2fs_file_inode_operations
;
325 inode
->i_fop
= &f2fs_file_operations
;
326 inode
->i_mapping
->a_ops
= &f2fs_dblock_aops
;
327 } else if (S_ISDIR(inode
->i_mode
)) {
328 inode
->i_op
= &f2fs_dir_inode_operations
;
329 inode
->i_fop
= &f2fs_dir_operations
;
330 inode
->i_mapping
->a_ops
= &f2fs_dblock_aops
;
331 mapping_set_gfp_mask(inode
->i_mapping
, GFP_F2FS_HIGH_ZERO
);
332 } else if (S_ISLNK(inode
->i_mode
)) {
333 if (f2fs_encrypted_inode(inode
))
334 inode
->i_op
= &f2fs_encrypted_symlink_inode_operations
;
336 inode
->i_op
= &f2fs_symlink_inode_operations
;
337 inode_nohighmem(inode
);
338 inode
->i_mapping
->a_ops
= &f2fs_dblock_aops
;
339 } else if (S_ISCHR(inode
->i_mode
) || S_ISBLK(inode
->i_mode
) ||
340 S_ISFIFO(inode
->i_mode
) || S_ISSOCK(inode
->i_mode
)) {
341 inode
->i_op
= &f2fs_special_inode_operations
;
342 init_special_inode(inode
, inode
->i_mode
, inode
->i_rdev
);
347 f2fs_set_inode_flags(inode
);
348 unlock_new_inode(inode
);
349 trace_f2fs_iget(inode
);
354 trace_f2fs_iget_exit(inode
, ret
);
358 struct inode
*f2fs_iget_retry(struct super_block
*sb
, unsigned long ino
)
362 inode
= f2fs_iget(sb
, ino
);
364 if (PTR_ERR(inode
) == -ENOMEM
) {
365 congestion_wait(BLK_RW_ASYNC
, HZ
/50);
372 void update_inode(struct inode
*inode
, struct page
*node_page
)
374 struct f2fs_inode
*ri
;
375 struct extent_tree
*et
= F2FS_I(inode
)->extent_tree
;
377 f2fs_wait_on_page_writeback(node_page
, NODE
, true);
378 set_page_dirty(node_page
);
380 f2fs_inode_synced(inode
);
382 ri
= F2FS_INODE(node_page
);
384 ri
->i_mode
= cpu_to_le16(inode
->i_mode
);
385 ri
->i_advise
= F2FS_I(inode
)->i_advise
;
386 ri
->i_uid
= cpu_to_le32(i_uid_read(inode
));
387 ri
->i_gid
= cpu_to_le32(i_gid_read(inode
));
388 ri
->i_links
= cpu_to_le32(inode
->i_nlink
);
389 ri
->i_size
= cpu_to_le64(i_size_read(inode
));
390 ri
->i_blocks
= cpu_to_le64(SECTOR_TO_BLOCK(inode
->i_blocks
) + 1);
393 read_lock(&et
->lock
);
394 set_raw_extent(&et
->largest
, &ri
->i_ext
);
395 read_unlock(&et
->lock
);
397 memset(&ri
->i_ext
, 0, sizeof(ri
->i_ext
));
399 set_raw_inline(inode
, ri
);
401 ri
->i_atime
= cpu_to_le64(inode
->i_atime
.tv_sec
);
402 ri
->i_ctime
= cpu_to_le64(inode
->i_ctime
.tv_sec
);
403 ri
->i_mtime
= cpu_to_le64(inode
->i_mtime
.tv_sec
);
404 ri
->i_atime_nsec
= cpu_to_le32(inode
->i_atime
.tv_nsec
);
405 ri
->i_ctime_nsec
= cpu_to_le32(inode
->i_ctime
.tv_nsec
);
406 ri
->i_mtime_nsec
= cpu_to_le32(inode
->i_mtime
.tv_nsec
);
407 ri
->i_current_depth
= cpu_to_le32(F2FS_I(inode
)->i_current_depth
);
408 ri
->i_xattr_nid
= cpu_to_le32(F2FS_I(inode
)->i_xattr_nid
);
409 ri
->i_flags
= cpu_to_le32(F2FS_I(inode
)->i_flags
);
410 ri
->i_pino
= cpu_to_le32(F2FS_I(inode
)->i_pino
);
411 ri
->i_generation
= cpu_to_le32(inode
->i_generation
);
412 ri
->i_dir_level
= F2FS_I(inode
)->i_dir_level
;
414 if (f2fs_has_extra_attr(inode
)) {
415 ri
->i_extra_isize
= cpu_to_le16(F2FS_I(inode
)->i_extra_isize
);
417 if (f2fs_sb_has_flexible_inline_xattr(F2FS_I_SB(inode
)->sb
))
418 ri
->i_inline_xattr_size
=
419 cpu_to_le16(F2FS_I(inode
)->i_inline_xattr_size
);
421 if (f2fs_sb_has_project_quota(F2FS_I_SB(inode
)->sb
) &&
422 F2FS_FITS_IN_INODE(ri
, F2FS_I(inode
)->i_extra_isize
,
426 i_projid
= from_kprojid(&init_user_ns
,
427 F2FS_I(inode
)->i_projid
);
428 ri
->i_projid
= cpu_to_le32(i_projid
);
431 if (f2fs_sb_has_inode_crtime(F2FS_I_SB(inode
)->sb
) &&
432 F2FS_FITS_IN_INODE(ri
, F2FS_I(inode
)->i_extra_isize
,
435 cpu_to_le64(F2FS_I(inode
)->i_crtime
.tv_sec
);
437 cpu_to_le32(F2FS_I(inode
)->i_crtime
.tv_nsec
);
441 __set_inode_rdev(inode
, ri
);
442 set_cold_node(inode
, node_page
);
445 if (inode
->i_nlink
== 0)
446 clear_inline_node(node_page
);
450 void update_inode_page(struct inode
*inode
)
452 struct f2fs_sb_info
*sbi
= F2FS_I_SB(inode
);
453 struct page
*node_page
;
455 node_page
= get_node_page(sbi
, inode
->i_ino
);
456 if (IS_ERR(node_page
)) {
457 int err
= PTR_ERR(node_page
);
458 if (err
== -ENOMEM
) {
461 } else if (err
!= -ENOENT
) {
462 f2fs_stop_checkpoint(sbi
, false);
466 update_inode(inode
, node_page
);
467 f2fs_put_page(node_page
, 1);
470 int f2fs_write_inode(struct inode
*inode
, struct writeback_control
*wbc
)
472 struct f2fs_sb_info
*sbi
= F2FS_I_SB(inode
);
474 if (inode
->i_ino
== F2FS_NODE_INO(sbi
) ||
475 inode
->i_ino
== F2FS_META_INO(sbi
))
478 if (!is_inode_flag_set(inode
, FI_DIRTY_INODE
))
482 * We need to balance fs here to prevent from producing dirty node pages
483 * during the urgent cleaning time when runing out of free sections.
485 update_inode_page(inode
);
486 if (wbc
&& wbc
->nr_to_write
)
487 f2fs_balance_fs(sbi
, true);
492 * Called at the last iput() if i_nlink is zero
494 void f2fs_evict_inode(struct inode
*inode
)
496 struct f2fs_sb_info
*sbi
= F2FS_I_SB(inode
);
497 nid_t xnid
= F2FS_I(inode
)->i_xattr_nid
;
500 /* some remained atomic pages should discarded */
501 if (f2fs_is_atomic_file(inode
))
502 drop_inmem_pages(inode
);
504 trace_f2fs_evict_inode(inode
);
505 truncate_inode_pages_final(&inode
->i_data
);
507 if (inode
->i_ino
== F2FS_NODE_INO(sbi
) ||
508 inode
->i_ino
== F2FS_META_INO(sbi
))
511 f2fs_bug_on(sbi
, get_dirty_pages(inode
));
512 remove_dirty_inode(inode
);
514 f2fs_destroy_extent_tree(inode
);
516 if (inode
->i_nlink
|| is_bad_inode(inode
))
519 dquot_initialize(inode
);
521 remove_ino_entry(sbi
, inode
->i_ino
, APPEND_INO
);
522 remove_ino_entry(sbi
, inode
->i_ino
, UPDATE_INO
);
523 remove_ino_entry(sbi
, inode
->i_ino
, FLUSH_INO
);
525 sb_start_intwrite(inode
->i_sb
);
526 set_inode_flag(inode
, FI_NO_ALLOC
);
527 i_size_write(inode
, 0);
529 if (F2FS_HAS_BLOCKS(inode
))
530 err
= f2fs_truncate(inode
);
532 #ifdef CONFIG_F2FS_FAULT_INJECTION
533 if (time_to_inject(sbi
, FAULT_EVICT_INODE
)) {
534 f2fs_show_injection_info(FAULT_EVICT_INODE
);
540 err
= remove_inode_page(inode
);
546 /* give more chances, if ENOMEM case */
547 if (err
== -ENOMEM
) {
553 update_inode_page(inode
);
554 dquot_free_inode(inode
);
555 sb_end_intwrite(inode
->i_sb
);
559 stat_dec_inline_xattr(inode
);
560 stat_dec_inline_dir(inode
);
561 stat_dec_inline_inode(inode
);
563 if (likely(!is_set_ckpt_flags(sbi
, CP_ERROR_FLAG
)))
564 f2fs_bug_on(sbi
, is_inode_flag_set(inode
, FI_DIRTY_INODE
));
566 f2fs_inode_synced(inode
);
568 /* ino == 0, if f2fs_new_inode() was failed t*/
570 invalidate_mapping_pages(NODE_MAPPING(sbi
), inode
->i_ino
,
573 invalidate_mapping_pages(NODE_MAPPING(sbi
), xnid
, xnid
);
574 if (inode
->i_nlink
) {
575 if (is_inode_flag_set(inode
, FI_APPEND_WRITE
))
576 add_ino_entry(sbi
, inode
->i_ino
, APPEND_INO
);
577 if (is_inode_flag_set(inode
, FI_UPDATE_WRITE
))
578 add_ino_entry(sbi
, inode
->i_ino
, UPDATE_INO
);
580 if (is_inode_flag_set(inode
, FI_FREE_NID
)) {
581 alloc_nid_failed(sbi
, inode
->i_ino
);
582 clear_inode_flag(inode
, FI_FREE_NID
);
584 f2fs_bug_on(sbi
, err
&&
585 !exist_written_data(sbi
, inode
->i_ino
, ORPHAN_INO
));
588 fscrypt_put_encryption_info(inode
);
592 /* caller should call f2fs_lock_op() */
593 void handle_failed_inode(struct inode
*inode
)
595 struct f2fs_sb_info
*sbi
= F2FS_I_SB(inode
);
599 * clear nlink of inode in order to release resource of inode
605 * we must call this to avoid inode being remained as dirty, resulting
606 * in a panic when flushing dirty inodes in gdirty_list.
608 update_inode_page(inode
);
609 f2fs_inode_synced(inode
);
611 /* don't make bad inode, since it becomes a regular file. */
612 unlock_new_inode(inode
);
615 * Note: we should add inode to orphan list before f2fs_unlock_op()
616 * so we can prevent losing this orphan when encoutering checkpoint
617 * and following suddenly power-off.
619 get_node_info(sbi
, inode
->i_ino
, &ni
);
621 if (ni
.blk_addr
!= NULL_ADDR
) {
622 int err
= acquire_orphan_inode(sbi
);
624 set_sbi_flag(sbi
, SBI_NEED_FSCK
);
625 f2fs_msg(sbi
->sb
, KERN_WARNING
,
626 "Too many orphan inodes, run fsck to fix.");
628 add_orphan_inode(inode
);
630 alloc_nid_done(sbi
, inode
->i_ino
);
632 set_inode_flag(inode
, FI_FREE_NID
);
637 /* iput will drop the inode object */