f2fs: revisit inline_data to avoid data races and potential bugs
[GitHub/exynos8895/android_kernel_samsung_universal8895.git] / fs / f2fs / inode.c
CommitLineData
0a8165d7 1/*
19f99cee
JK
2 * fs/f2fs/inode.c
3 *
4 * Copyright (c) 2012 Samsung Electronics Co., Ltd.
5 * http://www.samsung.com/
6 *
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License version 2 as
9 * published by the Free Software Foundation.
10 */
11#include <linux/fs.h>
12#include <linux/f2fs_fs.h>
13#include <linux/buffer_head.h>
14#include <linux/writeback.h>
8abfb36a 15#include <linux/bitops.h>
19f99cee
JK
16
17#include "f2fs.h"
18#include "node.h"
19
a2a4a7e4
NJ
20#include <trace/events/f2fs.h>
21
19f99cee
JK
22void f2fs_set_inode_flags(struct inode *inode)
23{
24 unsigned int flags = F2FS_I(inode)->i_flags;
8abfb36a 25 unsigned int new_fl = 0;
19f99cee
JK
26
27 if (flags & FS_SYNC_FL)
8abfb36a 28 new_fl |= S_SYNC;
19f99cee 29 if (flags & FS_APPEND_FL)
8abfb36a 30 new_fl |= S_APPEND;
19f99cee 31 if (flags & FS_IMMUTABLE_FL)
8abfb36a 32 new_fl |= S_IMMUTABLE;
19f99cee 33 if (flags & FS_NOATIME_FL)
8abfb36a 34 new_fl |= S_NOATIME;
19f99cee 35 if (flags & FS_DIRSYNC_FL)
8abfb36a
ZZ
36 new_fl |= S_DIRSYNC;
37 set_mask_bits(&inode->i_flags,
38 S_SYNC|S_APPEND|S_IMMUTABLE|S_NOATIME|S_DIRSYNC, new_fl);
19f99cee
JK
39}
40
3d1e3807
JK
41static void __get_inode_rdev(struct inode *inode, struct f2fs_inode *ri)
42{
43 if (S_ISCHR(inode->i_mode) || S_ISBLK(inode->i_mode) ||
44 S_ISFIFO(inode->i_mode) || S_ISSOCK(inode->i_mode)) {
45 if (ri->i_addr[0])
6c311ec6
CF
46 inode->i_rdev =
47 old_decode_dev(le32_to_cpu(ri->i_addr[0]));
3d1e3807 48 else
6c311ec6
CF
49 inode->i_rdev =
50 new_decode_dev(le32_to_cpu(ri->i_addr[1]));
3d1e3807
JK
51 }
52}
53
54static void __set_inode_rdev(struct inode *inode, struct f2fs_inode *ri)
55{
56 if (S_ISCHR(inode->i_mode) || S_ISBLK(inode->i_mode)) {
57 if (old_valid_dev(inode->i_rdev)) {
6c311ec6
CF
58 ri->i_addr[0] =
59 cpu_to_le32(old_encode_dev(inode->i_rdev));
3d1e3807
JK
60 ri->i_addr[1] = 0;
61 } else {
62 ri->i_addr[0] = 0;
6c311ec6
CF
63 ri->i_addr[1] =
64 cpu_to_le32(new_encode_dev(inode->i_rdev));
3d1e3807
JK
65 ri->i_addr[2] = 0;
66 }
67 }
68}
69
b3d208f9
JK
70static int __recover_inline_status(struct inode *inode, struct page *ipage)
71{
72 void *inline_data = inline_data_addr(ipage);
73 struct f2fs_inode *ri;
74 void *zbuf;
75
76 zbuf = kzalloc(MAX_INLINE_DATA, GFP_NOFS);
77 if (!zbuf)
78 return -ENOMEM;
79
80 if (!memcmp(zbuf, inline_data, MAX_INLINE_DATA)) {
81 kfree(zbuf);
82 return 0;
83 }
84 kfree(zbuf);
85
86 f2fs_wait_on_page_writeback(ipage, NODE);
87 set_inode_flag(F2FS_I(inode), FI_DATA_EXIST);
88
89 ri = F2FS_INODE(ipage);
90 set_raw_inline(F2FS_I(inode), ri);
91 set_page_dirty(ipage);
92 return 0;
93}
94
19f99cee
JK
95static int do_read_inode(struct inode *inode)
96{
4081363f 97 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
19f99cee
JK
98 struct f2fs_inode_info *fi = F2FS_I(inode);
99 struct page *node_page;
19f99cee 100 struct f2fs_inode *ri;
b3d208f9 101 int err = 0;
19f99cee
JK
102
103 /* Check if ino is within scope */
064e0823
NJ
104 if (check_nid_range(sbi, inode->i_ino)) {
105 f2fs_msg(inode->i_sb, KERN_ERR, "bad inode number: %lu",
106 (unsigned long) inode->i_ino);
d6b7d4b3 107 WARN_ON(1);
064e0823
NJ
108 return -EINVAL;
109 }
19f99cee
JK
110
111 node_page = get_node_page(sbi, inode->i_ino);
112 if (IS_ERR(node_page))
113 return PTR_ERR(node_page);
114
58bfaf44 115 ri = F2FS_INODE(node_page);
19f99cee
JK
116
117 inode->i_mode = le16_to_cpu(ri->i_mode);
118 i_uid_write(inode, le32_to_cpu(ri->i_uid));
119 i_gid_write(inode, le32_to_cpu(ri->i_gid));
120 set_nlink(inode, le32_to_cpu(ri->i_links));
121 inode->i_size = le64_to_cpu(ri->i_size);
122 inode->i_blocks = le64_to_cpu(ri->i_blocks);
123
124 inode->i_atime.tv_sec = le64_to_cpu(ri->i_atime);
125 inode->i_ctime.tv_sec = le64_to_cpu(ri->i_ctime);
126 inode->i_mtime.tv_sec = le64_to_cpu(ri->i_mtime);
127 inode->i_atime.tv_nsec = le32_to_cpu(ri->i_atime_nsec);
128 inode->i_ctime.tv_nsec = le32_to_cpu(ri->i_ctime_nsec);
129 inode->i_mtime.tv_nsec = le32_to_cpu(ri->i_mtime_nsec);
130 inode->i_generation = le32_to_cpu(ri->i_generation);
131
132 fi->i_current_depth = le32_to_cpu(ri->i_current_depth);
133 fi->i_xattr_nid = le32_to_cpu(ri->i_xattr_nid);
134 fi->i_flags = le32_to_cpu(ri->i_flags);
135 fi->flags = 0;
19f99cee 136 fi->i_advise = ri->i_advise;
6666e6aa 137 fi->i_pino = le32_to_cpu(ri->i_pino);
38431545 138 fi->i_dir_level = ri->i_dir_level;
3d1e3807 139
19f99cee 140 get_extent_info(&fi->ext, ri->i_ext);
444c580f 141 get_inline_info(fi, ri);
3d1e3807 142
b3d208f9
JK
143 /* check data exist */
144 if (f2fs_has_inline_data(inode) && !f2fs_exist_data(inode))
145 err = __recover_inline_status(inode, node_page);
146
3d1e3807
JK
147 /* get rdev by using inline_info */
148 __get_inode_rdev(inode, ri);
149
19f99cee 150 f2fs_put_page(node_page, 1);
b3d208f9 151 return err;
19f99cee
JK
152}
153
154struct inode *f2fs_iget(struct super_block *sb, unsigned long ino)
155{
156 struct f2fs_sb_info *sbi = F2FS_SB(sb);
157 struct inode *inode;
a2a4a7e4 158 int ret = 0;
19f99cee
JK
159
160 inode = iget_locked(sb, ino);
161 if (!inode)
162 return ERR_PTR(-ENOMEM);
a2a4a7e4
NJ
163
164 if (!(inode->i_state & I_NEW)) {
165 trace_f2fs_iget(inode);
19f99cee 166 return inode;
a2a4a7e4 167 }
19f99cee
JK
168 if (ino == F2FS_NODE_INO(sbi) || ino == F2FS_META_INO(sbi))
169 goto make_now;
170
171 ret = do_read_inode(inode);
172 if (ret)
173 goto bad_inode;
19f99cee
JK
174make_now:
175 if (ino == F2FS_NODE_INO(sbi)) {
176 inode->i_mapping->a_ops = &f2fs_node_aops;
177 mapping_set_gfp_mask(inode->i_mapping, GFP_F2FS_ZERO);
178 } else if (ino == F2FS_META_INO(sbi)) {
179 inode->i_mapping->a_ops = &f2fs_meta_aops;
180 mapping_set_gfp_mask(inode->i_mapping, GFP_F2FS_ZERO);
181 } else if (S_ISREG(inode->i_mode)) {
182 inode->i_op = &f2fs_file_inode_operations;
183 inode->i_fop = &f2fs_file_operations;
184 inode->i_mapping->a_ops = &f2fs_dblock_aops;
185 } else if (S_ISDIR(inode->i_mode)) {
186 inode->i_op = &f2fs_dir_inode_operations;
187 inode->i_fop = &f2fs_dir_operations;
188 inode->i_mapping->a_ops = &f2fs_dblock_aops;
a78186eb 189 mapping_set_gfp_mask(inode->i_mapping, GFP_F2FS_HIGH_ZERO);
19f99cee
JK
190 } else if (S_ISLNK(inode->i_mode)) {
191 inode->i_op = &f2fs_symlink_inode_operations;
192 inode->i_mapping->a_ops = &f2fs_dblock_aops;
193 } else if (S_ISCHR(inode->i_mode) || S_ISBLK(inode->i_mode) ||
194 S_ISFIFO(inode->i_mode) || S_ISSOCK(inode->i_mode)) {
195 inode->i_op = &f2fs_special_inode_operations;
196 init_special_inode(inode, inode->i_mode, inode->i_rdev);
197 } else {
198 ret = -EIO;
199 goto bad_inode;
200 }
201 unlock_new_inode(inode);
e7a2bf22 202 stat_inc_inline_inode(inode);
3289c061 203 stat_inc_inline_dir(inode);
a2a4a7e4 204 trace_f2fs_iget(inode);
19f99cee
JK
205 return inode;
206
207bad_inode:
208 iget_failed(inode);
a2a4a7e4 209 trace_f2fs_iget_exit(inode, ret);
19f99cee
JK
210 return ERR_PTR(ret);
211}
212
213void update_inode(struct inode *inode, struct page *node_page)
214{
19f99cee
JK
215 struct f2fs_inode *ri;
216
5514f0aa 217 f2fs_wait_on_page_writeback(node_page, NODE);
19f99cee 218
58bfaf44 219 ri = F2FS_INODE(node_page);
19f99cee
JK
220
221 ri->i_mode = cpu_to_le16(inode->i_mode);
222 ri->i_advise = F2FS_I(inode)->i_advise;
223 ri->i_uid = cpu_to_le32(i_uid_read(inode));
224 ri->i_gid = cpu_to_le32(i_gid_read(inode));
225 ri->i_links = cpu_to_le32(inode->i_nlink);
226 ri->i_size = cpu_to_le64(i_size_read(inode));
227 ri->i_blocks = cpu_to_le64(inode->i_blocks);
228 set_raw_extent(&F2FS_I(inode)->ext, &ri->i_ext);
444c580f 229 set_raw_inline(F2FS_I(inode), ri);
19f99cee
JK
230
231 ri->i_atime = cpu_to_le64(inode->i_atime.tv_sec);
232 ri->i_ctime = cpu_to_le64(inode->i_ctime.tv_sec);
233 ri->i_mtime = cpu_to_le64(inode->i_mtime.tv_sec);
234 ri->i_atime_nsec = cpu_to_le32(inode->i_atime.tv_nsec);
235 ri->i_ctime_nsec = cpu_to_le32(inode->i_ctime.tv_nsec);
236 ri->i_mtime_nsec = cpu_to_le32(inode->i_mtime.tv_nsec);
237 ri->i_current_depth = cpu_to_le32(F2FS_I(inode)->i_current_depth);
238 ri->i_xattr_nid = cpu_to_le32(F2FS_I(inode)->i_xattr_nid);
239 ri->i_flags = cpu_to_le32(F2FS_I(inode)->i_flags);
6666e6aa 240 ri->i_pino = cpu_to_le32(F2FS_I(inode)->i_pino);
19f99cee 241 ri->i_generation = cpu_to_le32(inode->i_generation);
38431545 242 ri->i_dir_level = F2FS_I(inode)->i_dir_level;
7d79e75f 243
3d1e3807 244 __set_inode_rdev(inode, ri);
398b1ac5 245 set_cold_node(inode, node_page);
19f99cee 246 set_page_dirty(node_page);
3d1e3807 247
b3783873 248 clear_inode_flag(F2FS_I(inode), FI_DIRTY_INODE);
19f99cee
JK
249}
250
744602cf 251void update_inode_page(struct inode *inode)
19f99cee 252{
4081363f 253 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
19f99cee 254 struct page *node_page;
744602cf 255retry:
19f99cee 256 node_page = get_node_page(sbi, inode->i_ino);
744602cf
JK
257 if (IS_ERR(node_page)) {
258 int err = PTR_ERR(node_page);
259 if (err == -ENOMEM) {
260 cond_resched();
261 goto retry;
262 } else if (err != -ENOENT) {
263 f2fs_stop_checkpoint(sbi);
264 }
265 return;
266 }
19f99cee
JK
267 update_inode(inode, node_page);
268 f2fs_put_page(node_page, 1);
19f99cee
JK
269}
270
39936837
JK
271int f2fs_write_inode(struct inode *inode, struct writeback_control *wbc)
272{
4081363f 273 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
39936837
JK
274
275 if (inode->i_ino == F2FS_NODE_INO(sbi) ||
276 inode->i_ino == F2FS_META_INO(sbi))
277 return 0;
278
b3783873
JK
279 if (!is_inode_flag_set(F2FS_I(inode), FI_DIRTY_INODE))
280 return 0;
281
39936837
JK
282 /*
283 * We need to lock here to prevent from producing dirty node pages
284 * during the urgent cleaning time when runing out of free sections.
285 */
e479556b 286 f2fs_lock_op(sbi);
744602cf 287 update_inode_page(inode);
e479556b 288 f2fs_unlock_op(sbi);
92c4342f
JX
289
290 if (wbc)
291 f2fs_balance_fs(sbi);
292
744602cf 293 return 0;
39936837
JK
294}
295
0a8165d7 296/*
19f99cee
JK
297 * Called at the last iput() if i_nlink is zero
298 */
299void f2fs_evict_inode(struct inode *inode)
300{
4081363f 301 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
002a41ca 302 nid_t xnid = F2FS_I(inode)->i_xattr_nid;
19f99cee 303
88b88a66 304 /* some remained atomic pages should discarded */
02a1335f 305 if (f2fs_is_atomic_file(inode) || f2fs_is_volatile_file(inode))
88b88a66
JK
306 commit_inmem_pages(inode, true);
307
a2a4a7e4 308 trace_f2fs_evict_inode(inode);
91b0abe3 309 truncate_inode_pages_final(&inode->i_data);
19f99cee
JK
310
311 if (inode->i_ino == F2FS_NODE_INO(sbi) ||
312 inode->i_ino == F2FS_META_INO(sbi))
dbf20cb2 313 goto out_clear;
19f99cee 314
a7ffdbe2 315 f2fs_bug_on(sbi, get_dirty_pages(inode));
19f99cee
JK
316 remove_dirty_dir_inode(inode);
317
318 if (inode->i_nlink || is_bad_inode(inode))
319 goto no_delete;
320
d6212a5f 321 sb_start_intwrite(inode->i_sb);
19f99cee
JK
322 set_inode_flag(F2FS_I(inode), FI_NO_ALLOC);
323 i_size_write(inode, 0);
324
325 if (F2FS_HAS_BLOCKS(inode))
326 f2fs_truncate(inode);
327
e479556b 328 f2fs_lock_op(sbi);
19f99cee 329 remove_inode_page(inode);
e479556b 330 f2fs_unlock_op(sbi);
39936837 331
d6212a5f 332 sb_end_intwrite(inode->i_sb);
19f99cee 333no_delete:
3289c061 334 stat_dec_inline_dir(inode);
e7a2bf22 335 stat_dec_inline_inode(inode);
8198899b 336 invalidate_mapping_pages(NODE_MAPPING(sbi), inode->i_ino, inode->i_ino);
002a41ca
CY
337 if (xnid)
338 invalidate_mapping_pages(NODE_MAPPING(sbi), xnid, xnid);
fff04f90
JK
339 if (is_inode_flag_set(F2FS_I(inode), FI_APPEND_WRITE))
340 add_dirty_inode(sbi, inode->i_ino, APPEND_INO);
341 if (is_inode_flag_set(F2FS_I(inode), FI_UPDATE_WRITE))
342 add_dirty_inode(sbi, inode->i_ino, UPDATE_INO);
dbf20cb2
CY
343out_clear:
344 clear_inode(inode);
19f99cee 345}
44c16156
JK
346
347/* caller should call f2fs_lock_op() */
348void handle_failed_inode(struct inode *inode)
349{
350 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
351
352 clear_nlink(inode);
353 make_bad_inode(inode);
354 unlock_new_inode(inode);
355
356 i_size_write(inode, 0);
357 if (F2FS_HAS_BLOCKS(inode))
358 f2fs_truncate(inode);
359
360 remove_inode_page(inode);
44c16156 361
b3d208f9 362 clear_inode_flag(F2FS_I(inode), FI_INLINE_DATA);
3289c061 363 clear_inode_flag(F2FS_I(inode), FI_INLINE_DENTRY);
44c16156
JK
364 alloc_nid_failed(sbi, inode->i_ino);
365 f2fs_unlock_op(sbi);
366
367 /* iput will drop the inode object */
368 iput(inode);
369}