f2fs: inject to produce some orphan inodes
[linux-2.6/btrfs-unstable.git] / fs / f2fs / inode.c
blob11cb60af815d5531f5ef76a8d857b31005aa40d4
1 /*
2 * fs/f2fs/inode.c
4 * Copyright (c) 2012 Samsung Electronics Co., Ltd.
5 * http://www.samsung.com/
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License version 2 as
9 * published by the Free Software Foundation.
11 #include <linux/fs.h>
12 #include <linux/f2fs_fs.h>
13 #include <linux/buffer_head.h>
14 #include <linux/writeback.h>
16 #include "f2fs.h"
17 #include "node.h"
19 #include <trace/events/f2fs.h>
21 void f2fs_set_inode_flags(struct inode *inode)
23 unsigned int flags = F2FS_I(inode)->i_flags;
24 unsigned int new_fl = 0;
26 if (flags & FS_SYNC_FL)
27 new_fl |= S_SYNC;
28 if (flags & FS_APPEND_FL)
29 new_fl |= S_APPEND;
30 if (flags & FS_IMMUTABLE_FL)
31 new_fl |= S_IMMUTABLE;
32 if (flags & FS_NOATIME_FL)
33 new_fl |= S_NOATIME;
34 if (flags & FS_DIRSYNC_FL)
35 new_fl |= S_DIRSYNC;
36 inode_set_flags(inode, new_fl,
37 S_SYNC|S_APPEND|S_IMMUTABLE|S_NOATIME|S_DIRSYNC);
38 mark_inode_dirty_sync(inode);
41 static void __get_inode_rdev(struct inode *inode, struct f2fs_inode *ri)
43 if (S_ISCHR(inode->i_mode) || S_ISBLK(inode->i_mode) ||
44 S_ISFIFO(inode->i_mode) || S_ISSOCK(inode->i_mode)) {
45 if (ri->i_addr[0])
46 inode->i_rdev =
47 old_decode_dev(le32_to_cpu(ri->i_addr[0]));
48 else
49 inode->i_rdev =
50 new_decode_dev(le32_to_cpu(ri->i_addr[1]));
54 static bool __written_first_block(struct f2fs_inode *ri)
56 block_t addr = le32_to_cpu(ri->i_addr[0]);
58 if (addr != NEW_ADDR && addr != NULL_ADDR)
59 return true;
60 return false;
63 static void __set_inode_rdev(struct inode *inode, struct f2fs_inode *ri)
65 if (S_ISCHR(inode->i_mode) || S_ISBLK(inode->i_mode)) {
66 if (old_valid_dev(inode->i_rdev)) {
67 ri->i_addr[0] =
68 cpu_to_le32(old_encode_dev(inode->i_rdev));
69 ri->i_addr[1] = 0;
70 } else {
71 ri->i_addr[0] = 0;
72 ri->i_addr[1] =
73 cpu_to_le32(new_encode_dev(inode->i_rdev));
74 ri->i_addr[2] = 0;
79 static void __recover_inline_status(struct inode *inode, struct page *ipage)
81 void *inline_data = inline_data_addr(ipage);
82 __le32 *start = inline_data;
83 __le32 *end = start + MAX_INLINE_DATA / sizeof(__le32);
85 while (start < end) {
86 if (*start++) {
87 f2fs_wait_on_page_writeback(ipage, NODE, true);
89 set_inode_flag(inode, FI_DATA_EXIST);
90 set_raw_inline(inode, F2FS_INODE(ipage));
91 set_page_dirty(ipage);
92 return;
95 return;
98 static int do_read_inode(struct inode *inode)
100 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
101 struct f2fs_inode_info *fi = F2FS_I(inode);
102 struct page *node_page;
103 struct f2fs_inode *ri;
105 /* Check if ino is within scope */
106 if (check_nid_range(sbi, inode->i_ino)) {
107 f2fs_msg(inode->i_sb, KERN_ERR, "bad inode number: %lu",
108 (unsigned long) inode->i_ino);
109 WARN_ON(1);
110 return -EINVAL;
113 node_page = get_node_page(sbi, inode->i_ino);
114 if (IS_ERR(node_page))
115 return PTR_ERR(node_page);
117 ri = F2FS_INODE(node_page);
119 inode->i_mode = le16_to_cpu(ri->i_mode);
120 i_uid_write(inode, le32_to_cpu(ri->i_uid));
121 i_gid_write(inode, le32_to_cpu(ri->i_gid));
122 set_nlink(inode, le32_to_cpu(ri->i_links));
123 inode->i_size = le64_to_cpu(ri->i_size);
124 inode->i_blocks = le64_to_cpu(ri->i_blocks);
126 inode->i_atime.tv_sec = le64_to_cpu(ri->i_atime);
127 inode->i_ctime.tv_sec = le64_to_cpu(ri->i_ctime);
128 inode->i_mtime.tv_sec = le64_to_cpu(ri->i_mtime);
129 inode->i_atime.tv_nsec = le32_to_cpu(ri->i_atime_nsec);
130 inode->i_ctime.tv_nsec = le32_to_cpu(ri->i_ctime_nsec);
131 inode->i_mtime.tv_nsec = le32_to_cpu(ri->i_mtime_nsec);
132 inode->i_generation = le32_to_cpu(ri->i_generation);
134 fi->i_current_depth = le32_to_cpu(ri->i_current_depth);
135 fi->i_xattr_nid = le32_to_cpu(ri->i_xattr_nid);
136 fi->i_flags = le32_to_cpu(ri->i_flags);
137 fi->flags = 0;
138 fi->i_advise = ri->i_advise;
139 fi->i_pino = le32_to_cpu(ri->i_pino);
140 fi->i_dir_level = ri->i_dir_level;
142 if (f2fs_init_extent_tree(inode, &ri->i_ext))
143 set_page_dirty(node_page);
145 get_inline_info(inode, ri);
147 /* check data exist */
148 if (f2fs_has_inline_data(inode) && !f2fs_exist_data(inode))
149 __recover_inline_status(inode, node_page);
151 /* get rdev by using inline_info */
152 __get_inode_rdev(inode, ri);
154 if (__written_first_block(ri))
155 set_inode_flag(inode, FI_FIRST_BLOCK_WRITTEN);
157 if (!need_inode_block_update(sbi, inode->i_ino))
158 fi->last_disk_size = inode->i_size;
160 f2fs_put_page(node_page, 1);
162 stat_inc_inline_xattr(inode);
163 stat_inc_inline_inode(inode);
164 stat_inc_inline_dir(inode);
166 return 0;
169 struct inode *f2fs_iget(struct super_block *sb, unsigned long ino)
171 struct f2fs_sb_info *sbi = F2FS_SB(sb);
172 struct inode *inode;
173 int ret = 0;
175 inode = iget_locked(sb, ino);
176 if (!inode)
177 return ERR_PTR(-ENOMEM);
179 if (!(inode->i_state & I_NEW)) {
180 trace_f2fs_iget(inode);
181 return inode;
183 if (ino == F2FS_NODE_INO(sbi) || ino == F2FS_META_INO(sbi))
184 goto make_now;
186 ret = do_read_inode(inode);
187 if (ret)
188 goto bad_inode;
189 make_now:
190 if (ino == F2FS_NODE_INO(sbi)) {
191 inode->i_mapping->a_ops = &f2fs_node_aops;
192 mapping_set_gfp_mask(inode->i_mapping, GFP_F2FS_ZERO);
193 } else if (ino == F2FS_META_INO(sbi)) {
194 inode->i_mapping->a_ops = &f2fs_meta_aops;
195 mapping_set_gfp_mask(inode->i_mapping, GFP_F2FS_ZERO);
196 } else if (S_ISREG(inode->i_mode)) {
197 inode->i_op = &f2fs_file_inode_operations;
198 inode->i_fop = &f2fs_file_operations;
199 inode->i_mapping->a_ops = &f2fs_dblock_aops;
200 } else if (S_ISDIR(inode->i_mode)) {
201 inode->i_op = &f2fs_dir_inode_operations;
202 inode->i_fop = &f2fs_dir_operations;
203 inode->i_mapping->a_ops = &f2fs_dblock_aops;
204 mapping_set_gfp_mask(inode->i_mapping, GFP_F2FS_HIGH_ZERO);
205 } else if (S_ISLNK(inode->i_mode)) {
206 if (f2fs_encrypted_inode(inode))
207 inode->i_op = &f2fs_encrypted_symlink_inode_operations;
208 else
209 inode->i_op = &f2fs_symlink_inode_operations;
210 inode_nohighmem(inode);
211 inode->i_mapping->a_ops = &f2fs_dblock_aops;
212 } else if (S_ISCHR(inode->i_mode) || S_ISBLK(inode->i_mode) ||
213 S_ISFIFO(inode->i_mode) || S_ISSOCK(inode->i_mode)) {
214 inode->i_op = &f2fs_special_inode_operations;
215 init_special_inode(inode, inode->i_mode, inode->i_rdev);
216 } else {
217 ret = -EIO;
218 goto bad_inode;
220 unlock_new_inode(inode);
221 trace_f2fs_iget(inode);
222 return inode;
224 bad_inode:
225 iget_failed(inode);
226 trace_f2fs_iget_exit(inode, ret);
227 return ERR_PTR(ret);
230 int update_inode(struct inode *inode, struct page *node_page)
232 struct f2fs_inode *ri;
234 f2fs_wait_on_page_writeback(node_page, NODE, true);
236 ri = F2FS_INODE(node_page);
238 ri->i_mode = cpu_to_le16(inode->i_mode);
239 ri->i_advise = F2FS_I(inode)->i_advise;
240 ri->i_uid = cpu_to_le32(i_uid_read(inode));
241 ri->i_gid = cpu_to_le32(i_gid_read(inode));
242 ri->i_links = cpu_to_le32(inode->i_nlink);
243 ri->i_size = cpu_to_le64(i_size_read(inode));
244 ri->i_blocks = cpu_to_le64(inode->i_blocks);
246 if (F2FS_I(inode)->extent_tree)
247 set_raw_extent(&F2FS_I(inode)->extent_tree->largest,
248 &ri->i_ext);
249 else
250 memset(&ri->i_ext, 0, sizeof(ri->i_ext));
251 set_raw_inline(inode, ri);
253 ri->i_atime = cpu_to_le64(inode->i_atime.tv_sec);
254 ri->i_ctime = cpu_to_le64(inode->i_ctime.tv_sec);
255 ri->i_mtime = cpu_to_le64(inode->i_mtime.tv_sec);
256 ri->i_atime_nsec = cpu_to_le32(inode->i_atime.tv_nsec);
257 ri->i_ctime_nsec = cpu_to_le32(inode->i_ctime.tv_nsec);
258 ri->i_mtime_nsec = cpu_to_le32(inode->i_mtime.tv_nsec);
259 ri->i_current_depth = cpu_to_le32(F2FS_I(inode)->i_current_depth);
260 ri->i_xattr_nid = cpu_to_le32(F2FS_I(inode)->i_xattr_nid);
261 ri->i_flags = cpu_to_le32(F2FS_I(inode)->i_flags);
262 ri->i_pino = cpu_to_le32(F2FS_I(inode)->i_pino);
263 ri->i_generation = cpu_to_le32(inode->i_generation);
264 ri->i_dir_level = F2FS_I(inode)->i_dir_level;
266 __set_inode_rdev(inode, ri);
267 set_cold_node(inode, node_page);
268 f2fs_inode_synced(inode);
270 /* deleted inode */
271 if (inode->i_nlink == 0)
272 clear_inline_node(node_page);
274 return set_page_dirty(node_page);
277 int update_inode_page(struct inode *inode)
279 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
280 struct page *node_page;
281 int ret = 0;
282 retry:
283 node_page = get_node_page(sbi, inode->i_ino);
284 if (IS_ERR(node_page)) {
285 int err = PTR_ERR(node_page);
286 if (err == -ENOMEM) {
287 cond_resched();
288 goto retry;
289 } else if (err != -ENOENT) {
290 f2fs_stop_checkpoint(sbi, false);
292 f2fs_inode_synced(inode);
293 return 0;
295 ret = update_inode(inode, node_page);
296 f2fs_put_page(node_page, 1);
297 return ret;
300 int f2fs_write_inode(struct inode *inode, struct writeback_control *wbc)
302 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
304 if (inode->i_ino == F2FS_NODE_INO(sbi) ||
305 inode->i_ino == F2FS_META_INO(sbi))
306 return 0;
308 if (!is_inode_flag_set(inode, FI_DIRTY_INODE))
309 return 0;
312 * We need to balance fs here to prevent from producing dirty node pages
313 * during the urgent cleaning time when runing out of free sections.
315 if (update_inode_page(inode))
316 f2fs_balance_fs(sbi, true);
317 return 0;
321 * Called at the last iput() if i_nlink is zero
323 void f2fs_evict_inode(struct inode *inode)
325 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
326 nid_t xnid = F2FS_I(inode)->i_xattr_nid;
327 int err = 0;
329 /* some remained atomic pages should discarded */
330 if (f2fs_is_atomic_file(inode))
331 drop_inmem_pages(inode);
333 trace_f2fs_evict_inode(inode);
334 truncate_inode_pages_final(&inode->i_data);
336 if (inode->i_ino == F2FS_NODE_INO(sbi) ||
337 inode->i_ino == F2FS_META_INO(sbi))
338 goto out_clear;
340 f2fs_bug_on(sbi, get_dirty_pages(inode));
341 remove_dirty_inode(inode);
343 f2fs_destroy_extent_tree(inode);
345 if (inode->i_nlink || is_bad_inode(inode))
346 goto no_delete;
348 #ifdef CONFIG_F2FS_FAULT_INJECTION
349 if (time_to_inject(FAULT_EVICT_INODE))
350 goto no_delete;
351 #endif
353 sb_start_intwrite(inode->i_sb);
354 set_inode_flag(inode, FI_NO_ALLOC);
355 i_size_write(inode, 0);
356 retry:
357 if (F2FS_HAS_BLOCKS(inode))
358 err = f2fs_truncate(inode, true);
360 if (!err) {
361 f2fs_lock_op(sbi);
362 err = remove_inode_page(inode);
363 f2fs_unlock_op(sbi);
366 /* give more chances, if ENOMEM case */
367 if (err == -ENOMEM) {
368 err = 0;
369 goto retry;
372 if (err)
373 update_inode_page(inode);
374 sb_end_intwrite(inode->i_sb);
375 no_delete:
376 stat_dec_inline_xattr(inode);
377 stat_dec_inline_dir(inode);
378 stat_dec_inline_inode(inode);
380 invalidate_mapping_pages(NODE_MAPPING(sbi), inode->i_ino, inode->i_ino);
381 if (xnid)
382 invalidate_mapping_pages(NODE_MAPPING(sbi), xnid, xnid);
383 if (is_inode_flag_set(inode, FI_APPEND_WRITE))
384 add_ino_entry(sbi, inode->i_ino, APPEND_INO);
385 if (is_inode_flag_set(inode, FI_UPDATE_WRITE))
386 add_ino_entry(sbi, inode->i_ino, UPDATE_INO);
387 if (is_inode_flag_set(inode, FI_FREE_NID)) {
388 alloc_nid_failed(sbi, inode->i_ino);
389 clear_inode_flag(inode, FI_FREE_NID);
391 f2fs_bug_on(sbi, err &&
392 !exist_written_data(sbi, inode->i_ino, ORPHAN_INO));
393 out_clear:
394 fscrypt_put_encryption_info(inode, NULL);
396 f2fs_bug_on(sbi, is_inode_flag_set(inode, FI_DIRTY_INODE));
397 clear_inode(inode);
400 /* caller should call f2fs_lock_op() */
401 void handle_failed_inode(struct inode *inode)
403 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
404 struct node_info ni;
406 /* don't make bad inode, since it becomes a regular file. */
407 unlock_new_inode(inode);
410 * Note: we should add inode to orphan list before f2fs_unlock_op()
411 * so we can prevent losing this orphan when encoutering checkpoint
412 * and following suddenly power-off.
414 get_node_info(sbi, inode->i_ino, &ni);
416 if (ni.blk_addr != NULL_ADDR) {
417 int err = acquire_orphan_inode(sbi);
418 if (err) {
419 set_sbi_flag(sbi, SBI_NEED_FSCK);
420 f2fs_msg(sbi->sb, KERN_WARNING,
421 "Too many orphan inodes, run fsck to fix.");
422 } else {
423 add_orphan_inode(sbi, inode->i_ino);
425 alloc_nid_done(sbi, inode->i_ino);
426 } else {
427 set_inode_flag(inode, FI_FREE_NID);
430 f2fs_unlock_op(sbi);
432 /* iput will drop the inode object */
433 iput(inode);