libceph: redo callbacks and factor out MOSDOpReply decoding
[linux/fpc-iii.git] / fs / f2fs / inode.c
blobcb269c46ac254ff6f508f9bd21a79028d3ae754e
1 /*
2 * fs/f2fs/inode.c
4 * Copyright (c) 2012 Samsung Electronics Co., Ltd.
5 * http://www.samsung.com/
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License version 2 as
9 * published by the Free Software Foundation.
11 #include <linux/fs.h>
12 #include <linux/f2fs_fs.h>
13 #include <linux/buffer_head.h>
14 #include <linux/writeback.h>
16 #include "f2fs.h"
17 #include "node.h"
19 #include <trace/events/f2fs.h>
21 void f2fs_set_inode_flags(struct inode *inode)
23 unsigned int flags = F2FS_I(inode)->i_flags;
24 unsigned int new_fl = 0;
26 if (flags & FS_SYNC_FL)
27 new_fl |= S_SYNC;
28 if (flags & FS_APPEND_FL)
29 new_fl |= S_APPEND;
30 if (flags & FS_IMMUTABLE_FL)
31 new_fl |= S_IMMUTABLE;
32 if (flags & FS_NOATIME_FL)
33 new_fl |= S_NOATIME;
34 if (flags & FS_DIRSYNC_FL)
35 new_fl |= S_DIRSYNC;
36 inode_set_flags(inode, new_fl,
37 S_SYNC|S_APPEND|S_IMMUTABLE|S_NOATIME|S_DIRSYNC);
40 static void __get_inode_rdev(struct inode *inode, struct f2fs_inode *ri)
42 if (S_ISCHR(inode->i_mode) || S_ISBLK(inode->i_mode) ||
43 S_ISFIFO(inode->i_mode) || S_ISSOCK(inode->i_mode)) {
44 if (ri->i_addr[0])
45 inode->i_rdev =
46 old_decode_dev(le32_to_cpu(ri->i_addr[0]));
47 else
48 inode->i_rdev =
49 new_decode_dev(le32_to_cpu(ri->i_addr[1]));
53 static bool __written_first_block(struct f2fs_inode *ri)
55 block_t addr = le32_to_cpu(ri->i_addr[0]);
57 if (addr != NEW_ADDR && addr != NULL_ADDR)
58 return true;
59 return false;
62 static void __set_inode_rdev(struct inode *inode, struct f2fs_inode *ri)
64 if (S_ISCHR(inode->i_mode) || S_ISBLK(inode->i_mode)) {
65 if (old_valid_dev(inode->i_rdev)) {
66 ri->i_addr[0] =
67 cpu_to_le32(old_encode_dev(inode->i_rdev));
68 ri->i_addr[1] = 0;
69 } else {
70 ri->i_addr[0] = 0;
71 ri->i_addr[1] =
72 cpu_to_le32(new_encode_dev(inode->i_rdev));
73 ri->i_addr[2] = 0;
78 static void __recover_inline_status(struct inode *inode, struct page *ipage)
80 void *inline_data = inline_data_addr(ipage);
81 __le32 *start = inline_data;
82 __le32 *end = start + MAX_INLINE_DATA / sizeof(__le32);
84 while (start < end) {
85 if (*start++) {
86 f2fs_wait_on_page_writeback(ipage, NODE, true);
88 set_inode_flag(F2FS_I(inode), FI_DATA_EXIST);
89 set_raw_inline(F2FS_I(inode), F2FS_INODE(ipage));
90 set_page_dirty(ipage);
91 return;
94 return;
97 static int do_read_inode(struct inode *inode)
99 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
100 struct f2fs_inode_info *fi = F2FS_I(inode);
101 struct page *node_page;
102 struct f2fs_inode *ri;
104 /* Check if ino is within scope */
105 if (check_nid_range(sbi, inode->i_ino)) {
106 f2fs_msg(inode->i_sb, KERN_ERR, "bad inode number: %lu",
107 (unsigned long) inode->i_ino);
108 WARN_ON(1);
109 return -EINVAL;
112 node_page = get_node_page(sbi, inode->i_ino);
113 if (IS_ERR(node_page))
114 return PTR_ERR(node_page);
116 ri = F2FS_INODE(node_page);
118 inode->i_mode = le16_to_cpu(ri->i_mode);
119 i_uid_write(inode, le32_to_cpu(ri->i_uid));
120 i_gid_write(inode, le32_to_cpu(ri->i_gid));
121 set_nlink(inode, le32_to_cpu(ri->i_links));
122 inode->i_size = le64_to_cpu(ri->i_size);
123 inode->i_blocks = le64_to_cpu(ri->i_blocks);
125 inode->i_atime.tv_sec = le64_to_cpu(ri->i_atime);
126 inode->i_ctime.tv_sec = le64_to_cpu(ri->i_ctime);
127 inode->i_mtime.tv_sec = le64_to_cpu(ri->i_mtime);
128 inode->i_atime.tv_nsec = le32_to_cpu(ri->i_atime_nsec);
129 inode->i_ctime.tv_nsec = le32_to_cpu(ri->i_ctime_nsec);
130 inode->i_mtime.tv_nsec = le32_to_cpu(ri->i_mtime_nsec);
131 inode->i_generation = le32_to_cpu(ri->i_generation);
133 fi->i_current_depth = le32_to_cpu(ri->i_current_depth);
134 fi->i_xattr_nid = le32_to_cpu(ri->i_xattr_nid);
135 fi->i_flags = le32_to_cpu(ri->i_flags);
136 fi->flags = 0;
137 fi->i_advise = ri->i_advise;
138 fi->i_pino = le32_to_cpu(ri->i_pino);
139 fi->i_dir_level = ri->i_dir_level;
141 if (f2fs_init_extent_tree(inode, &ri->i_ext))
142 set_page_dirty(node_page);
144 get_inline_info(fi, ri);
146 /* check data exist */
147 if (f2fs_has_inline_data(inode) && !f2fs_exist_data(inode))
148 __recover_inline_status(inode, node_page);
150 /* get rdev by using inline_info */
151 __get_inode_rdev(inode, ri);
153 if (__written_first_block(ri))
154 set_inode_flag(F2FS_I(inode), FI_FIRST_BLOCK_WRITTEN);
156 f2fs_put_page(node_page, 1);
158 stat_inc_inline_xattr(inode);
159 stat_inc_inline_inode(inode);
160 stat_inc_inline_dir(inode);
162 return 0;
165 struct inode *f2fs_iget(struct super_block *sb, unsigned long ino)
167 struct f2fs_sb_info *sbi = F2FS_SB(sb);
168 struct inode *inode;
169 int ret = 0;
171 inode = iget_locked(sb, ino);
172 if (!inode)
173 return ERR_PTR(-ENOMEM);
175 if (!(inode->i_state & I_NEW)) {
176 trace_f2fs_iget(inode);
177 return inode;
179 if (ino == F2FS_NODE_INO(sbi) || ino == F2FS_META_INO(sbi))
180 goto make_now;
182 ret = do_read_inode(inode);
183 if (ret)
184 goto bad_inode;
185 make_now:
186 if (ino == F2FS_NODE_INO(sbi)) {
187 inode->i_mapping->a_ops = &f2fs_node_aops;
188 mapping_set_gfp_mask(inode->i_mapping, GFP_F2FS_ZERO);
189 } else if (ino == F2FS_META_INO(sbi)) {
190 inode->i_mapping->a_ops = &f2fs_meta_aops;
191 mapping_set_gfp_mask(inode->i_mapping, GFP_F2FS_ZERO);
192 } else if (S_ISREG(inode->i_mode)) {
193 inode->i_op = &f2fs_file_inode_operations;
194 inode->i_fop = &f2fs_file_operations;
195 inode->i_mapping->a_ops = &f2fs_dblock_aops;
196 } else if (S_ISDIR(inode->i_mode)) {
197 inode->i_op = &f2fs_dir_inode_operations;
198 inode->i_fop = &f2fs_dir_operations;
199 inode->i_mapping->a_ops = &f2fs_dblock_aops;
200 mapping_set_gfp_mask(inode->i_mapping, GFP_F2FS_HIGH_ZERO);
201 } else if (S_ISLNK(inode->i_mode)) {
202 if (f2fs_encrypted_inode(inode))
203 inode->i_op = &f2fs_encrypted_symlink_inode_operations;
204 else
205 inode->i_op = &f2fs_symlink_inode_operations;
206 inode_nohighmem(inode);
207 inode->i_mapping->a_ops = &f2fs_dblock_aops;
208 } else if (S_ISCHR(inode->i_mode) || S_ISBLK(inode->i_mode) ||
209 S_ISFIFO(inode->i_mode) || S_ISSOCK(inode->i_mode)) {
210 inode->i_op = &f2fs_special_inode_operations;
211 init_special_inode(inode, inode->i_mode, inode->i_rdev);
212 } else {
213 ret = -EIO;
214 goto bad_inode;
216 unlock_new_inode(inode);
217 trace_f2fs_iget(inode);
218 return inode;
220 bad_inode:
221 iget_failed(inode);
222 trace_f2fs_iget_exit(inode, ret);
223 return ERR_PTR(ret);
226 int update_inode(struct inode *inode, struct page *node_page)
228 struct f2fs_inode *ri;
230 f2fs_wait_on_page_writeback(node_page, NODE, true);
232 ri = F2FS_INODE(node_page);
234 ri->i_mode = cpu_to_le16(inode->i_mode);
235 ri->i_advise = F2FS_I(inode)->i_advise;
236 ri->i_uid = cpu_to_le32(i_uid_read(inode));
237 ri->i_gid = cpu_to_le32(i_gid_read(inode));
238 ri->i_links = cpu_to_le32(inode->i_nlink);
239 ri->i_size = cpu_to_le64(i_size_read(inode));
240 ri->i_blocks = cpu_to_le64(inode->i_blocks);
242 if (F2FS_I(inode)->extent_tree)
243 set_raw_extent(&F2FS_I(inode)->extent_tree->largest,
244 &ri->i_ext);
245 else
246 memset(&ri->i_ext, 0, sizeof(ri->i_ext));
247 set_raw_inline(F2FS_I(inode), ri);
249 ri->i_atime = cpu_to_le64(inode->i_atime.tv_sec);
250 ri->i_ctime = cpu_to_le64(inode->i_ctime.tv_sec);
251 ri->i_mtime = cpu_to_le64(inode->i_mtime.tv_sec);
252 ri->i_atime_nsec = cpu_to_le32(inode->i_atime.tv_nsec);
253 ri->i_ctime_nsec = cpu_to_le32(inode->i_ctime.tv_nsec);
254 ri->i_mtime_nsec = cpu_to_le32(inode->i_mtime.tv_nsec);
255 ri->i_current_depth = cpu_to_le32(F2FS_I(inode)->i_current_depth);
256 ri->i_xattr_nid = cpu_to_le32(F2FS_I(inode)->i_xattr_nid);
257 ri->i_flags = cpu_to_le32(F2FS_I(inode)->i_flags);
258 ri->i_pino = cpu_to_le32(F2FS_I(inode)->i_pino);
259 ri->i_generation = cpu_to_le32(inode->i_generation);
260 ri->i_dir_level = F2FS_I(inode)->i_dir_level;
262 __set_inode_rdev(inode, ri);
263 set_cold_node(inode, node_page);
264 clear_inode_flag(F2FS_I(inode), FI_DIRTY_INODE);
266 /* deleted inode */
267 if (inode->i_nlink == 0)
268 clear_inline_node(node_page);
270 return set_page_dirty(node_page);
273 int update_inode_page(struct inode *inode)
275 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
276 struct page *node_page;
277 int ret = 0;
278 retry:
279 node_page = get_node_page(sbi, inode->i_ino);
280 if (IS_ERR(node_page)) {
281 int err = PTR_ERR(node_page);
282 if (err == -ENOMEM) {
283 cond_resched();
284 goto retry;
285 } else if (err != -ENOENT) {
286 f2fs_stop_checkpoint(sbi);
288 return 0;
290 ret = update_inode(inode, node_page);
291 f2fs_put_page(node_page, 1);
292 return ret;
295 int f2fs_write_inode(struct inode *inode, struct writeback_control *wbc)
297 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
299 if (inode->i_ino == F2FS_NODE_INO(sbi) ||
300 inode->i_ino == F2FS_META_INO(sbi))
301 return 0;
303 if (!is_inode_flag_set(F2FS_I(inode), FI_DIRTY_INODE))
304 return 0;
307 * We need to balance fs here to prevent from producing dirty node pages
308 * during the urgent cleaning time when runing out of free sections.
310 if (update_inode_page(inode))
311 f2fs_balance_fs(sbi, true);
312 return 0;
316 * Called at the last iput() if i_nlink is zero
318 void f2fs_evict_inode(struct inode *inode)
320 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
321 struct f2fs_inode_info *fi = F2FS_I(inode);
322 nid_t xnid = fi->i_xattr_nid;
323 int err = 0;
325 /* some remained atomic pages should discarded */
326 if (f2fs_is_atomic_file(inode))
327 drop_inmem_pages(inode);
329 trace_f2fs_evict_inode(inode);
330 truncate_inode_pages_final(&inode->i_data);
332 if (inode->i_ino == F2FS_NODE_INO(sbi) ||
333 inode->i_ino == F2FS_META_INO(sbi))
334 goto out_clear;
336 f2fs_bug_on(sbi, get_dirty_pages(inode));
337 remove_dirty_inode(inode);
339 f2fs_destroy_extent_tree(inode);
341 if (inode->i_nlink || is_bad_inode(inode))
342 goto no_delete;
344 sb_start_intwrite(inode->i_sb);
345 set_inode_flag(fi, FI_NO_ALLOC);
346 i_size_write(inode, 0);
348 if (F2FS_HAS_BLOCKS(inode))
349 err = f2fs_truncate(inode, true);
351 if (!err) {
352 f2fs_lock_op(sbi);
353 err = remove_inode_page(inode);
354 f2fs_unlock_op(sbi);
357 sb_end_intwrite(inode->i_sb);
358 no_delete:
359 stat_dec_inline_xattr(inode);
360 stat_dec_inline_dir(inode);
361 stat_dec_inline_inode(inode);
363 invalidate_mapping_pages(NODE_MAPPING(sbi), inode->i_ino, inode->i_ino);
364 if (xnid)
365 invalidate_mapping_pages(NODE_MAPPING(sbi), xnid, xnid);
366 if (is_inode_flag_set(fi, FI_APPEND_WRITE))
367 add_ino_entry(sbi, inode->i_ino, APPEND_INO);
368 if (is_inode_flag_set(fi, FI_UPDATE_WRITE))
369 add_ino_entry(sbi, inode->i_ino, UPDATE_INO);
370 if (is_inode_flag_set(fi, FI_FREE_NID)) {
371 if (err && err != -ENOENT)
372 alloc_nid_done(sbi, inode->i_ino);
373 else
374 alloc_nid_failed(sbi, inode->i_ino);
375 clear_inode_flag(fi, FI_FREE_NID);
378 if (err && err != -ENOENT) {
379 if (!exist_written_data(sbi, inode->i_ino, ORPHAN_INO)) {
381 * get here because we failed to release resource
382 * of inode previously, reminder our user to run fsck
383 * for fixing.
385 set_sbi_flag(sbi, SBI_NEED_FSCK);
386 f2fs_msg(sbi->sb, KERN_WARNING,
387 "inode (ino:%lu) resource leak, run fsck "
388 "to fix this issue!", inode->i_ino);
391 out_clear:
392 fscrypt_put_encryption_info(inode, NULL);
393 clear_inode(inode);
396 /* caller should call f2fs_lock_op() */
397 void handle_failed_inode(struct inode *inode)
399 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
400 int err = 0;
402 clear_nlink(inode);
403 make_bad_inode(inode);
404 unlock_new_inode(inode);
406 i_size_write(inode, 0);
407 if (F2FS_HAS_BLOCKS(inode))
408 err = f2fs_truncate(inode, false);
410 if (!err)
411 err = remove_inode_page(inode);
414 * if we skip truncate_node in remove_inode_page bacause we failed
415 * before, it's better to find another way to release resource of
416 * this inode (e.g. valid block count, node block or nid). Here we
417 * choose to add this inode to orphan list, so that we can call iput
418 * for releasing in orphan recovery flow.
420 * Note: we should add inode to orphan list before f2fs_unlock_op()
421 * so we can prevent losing this orphan when encoutering checkpoint
422 * and following suddenly power-off.
424 if (err && err != -ENOENT) {
425 err = acquire_orphan_inode(sbi);
426 if (!err)
427 add_orphan_inode(sbi, inode->i_ino);
430 set_inode_flag(F2FS_I(inode), FI_FREE_NID);
431 f2fs_unlock_op(sbi);
433 /* iput will drop the inode object */
434 iput(inode);