block: remove QUEUE_FLAG_DISCARD
[linux-block.git] / fs / f2fs / file.c
CommitLineData
7c1a000d 1// SPDX-License-Identifier: GPL-2.0
0a8165d7 2/*
fbfa2cc5
JK
3 * fs/f2fs/file.c
4 *
5 * Copyright (c) 2012 Samsung Electronics Co., Ltd.
6 * http://www.samsung.com/
fbfa2cc5
JK
7 */
8#include <linux/fs.h>
9#include <linux/f2fs_fs.h>
10#include <linux/stat.h>
11#include <linux/buffer_head.h>
12#include <linux/writeback.h>
ae51fb31 13#include <linux/blkdev.h>
fbfa2cc5
JK
14#include <linux/falloc.h>
15#include <linux/types.h>
e9750824 16#include <linux/compat.h>
fbfa2cc5
JK
17#include <linux/uaccess.h>
18#include <linux/mount.h>
7f7670fe 19#include <linux/pagevec.h>
dc91de78 20#include <linux/uio.h>
8da4b8c4 21#include <linux/uuid.h>
4dd6f977 22#include <linux/file.h>
4507847c 23#include <linux/nls.h>
9af84648 24#include <linux/sched/signal.h>
9b1bb01c 25#include <linux/fileattr.h>
0f6b56ec 26#include <linux/fadvise.h>
a1e09b03 27#include <linux/iomap.h>
fbfa2cc5
JK
28
29#include "f2fs.h"
30#include "node.h"
31#include "segment.h"
32#include "xattr.h"
33#include "acl.h"
c1c1b583 34#include "gc.h"
52118743 35#include "iostat.h"
a2a4a7e4 36#include <trace/events/f2fs.h>
fa4320ce 37#include <uapi/linux/f2fs.h>
fbfa2cc5 38
ea4d479b 39static vm_fault_t f2fs_filemap_fault(struct vm_fault *vmf)
5a3a2d83
QS
40{
41 struct inode *inode = file_inode(vmf->vma->vm_file);
ea4d479b 42 vm_fault_t ret;
5a3a2d83 43
ea4d479b 44 ret = filemap_fault(vmf);
8b83ac81
CY
45 if (!ret)
46 f2fs_update_iostat(F2FS_I_SB(inode), APP_MAPPED_READ_IO,
47 F2FS_BLKSIZE);
48
d7648343
CY
49 trace_f2fs_filemap_fault(inode, vmf->pgoff, (unsigned long)ret);
50
ea4d479b 51 return ret;
5a3a2d83
QS
52}
53
/*
 * f2fs_vm_page_mkwrite - handle the first write access to a mapped page
 * @vmf: fault descriptor; vmf->page is the page about to become writable
 *
 * Refuses the fault with SIGBUS for immutable inodes and for inodes whose
 * compressed blocks were released.  Otherwise it converts inline data,
 * reserves a block for the page (skipped when the page belongs to a
 * compressed cluster), waits for writeback, zeroes the part of the page
 * beyond i_size and marks the page dirty.
 *
 * Return: block_page_mkwrite_return() applied to the errno collected in err,
 * or VM_FAULT_SIGBUS for the two early rejections.
 */
ea4d479b 54static vm_fault_t f2fs_vm_page_mkwrite(struct vm_fault *vmf)
fbfa2cc5
JK
55{
56 struct page *page = vmf->page;
11bac800 57 struct inode *inode = file_inode(vmf->vma->vm_file);
4081363f 58 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
bdf03299 59 struct dnode_of_data dn;
4c8ff709
CY
60 bool need_alloc = true;
61 int err = 0;
fbfa2cc5 62
e0fcd015
CY
63 if (unlikely(IS_IMMUTABLE(inode)))
64 return VM_FAULT_SIGBUS;
65
c6140415
JK
66 if (is_inode_flag_set(inode, FI_COMPRESS_RELEASED))
67 return VM_FAULT_SIGBUS;
68
1f227a3e
JK
69 if (unlikely(f2fs_cp_error(sbi))) {
70 err = -EIO;
71 goto err;
72 }
73
00e09c0b
CY
74 if (!f2fs_is_checkpoint_ready(sbi)) {
75 err = -ENOSPC;
955ebcd3 76 goto err;
00e09c0b 77 }
1f227a3e 78
c8e43d55
CY
79 err = f2fs_convert_inline_inode(inode);
80 if (err)
81 goto err;
82
4c8ff709
CY
83#ifdef CONFIG_F2FS_FS_COMPRESSION
84 if (f2fs_compressed_file(inode)) {
85 int ret = f2fs_is_compressed_cluster(inode, page->index);
86
87 if (ret < 0) {
88 err = ret;
89 goto err;
90 } else if (ret) {
4c8ff709
CY
/* page sits in a compressed cluster: skip the block reservation below */
91 need_alloc = false;
92 }
93 }
94#endif
bdf03299 95 /* should do out of any locked page */
4c8ff709
CY
96 if (need_alloc)
97 f2fs_balance_fs(sbi, true);
bdf03299 98
fbfa2cc5 99 sb_start_pagefault(inode->i_sb);
b3d208f9
JK
100
101 f2fs_bug_on(sbi, f2fs_has_inline_data(inode));
b067ba1f 102
11bac800 103 file_update_time(vmf->vma->vm_file);
edc6d01b 104 filemap_invalidate_lock_shared(inode->i_mapping);
fbfa2cc5 105 lock_page(page);
/*
 * Fail with -EFAULT if the page no longer belongs to this mapping, starts
 * beyond i_size, or is not uptodate.
 */
6bacf52f 106 if (unlikely(page->mapping != inode->i_mapping ||
9851e6e1 107 page_offset(page) > i_size_read(inode) ||
6bacf52f 108 !PageUptodate(page))) {
fbfa2cc5
JK
109 unlock_page(page);
110 err = -EFAULT;
5a3a2d83 111 goto out_sem;
fbfa2cc5
JK
112 }
113
4c8ff709
CY
114 if (need_alloc) {
115 /* block allocation */
0ef81833 116 f2fs_do_map_lock(sbi, F2FS_GET_BLOCK_PRE_AIO, true);
4c8ff709
CY
117 set_new_dnode(&dn, inode, NULL, NULL, 0);
118 err = f2fs_get_block(&dn, page->index);
0ef81833 119 f2fs_do_map_lock(sbi, F2FS_GET_BLOCK_PRE_AIO, false);
39a86958
CY
120 }
121
06c7540f
CY
122#ifdef CONFIG_F2FS_FS_COMPRESSION
123 if (!need_alloc) {
/*
 * No allocation: only look the dnode up.  NOTE(review): presumably this
 * fills dn.data_blkaddr, which is read further down - confirm.
 */
124 set_new_dnode(&dn, inode, NULL, NULL, 0);
125 err = f2fs_get_dnode_of_data(&dn, page->index, LOOKUP_NODE);
126 f2fs_put_dnode(&dn);
127 }
128#endif
129 if (err) {
130 unlock_page(page);
131 goto out_sem;
39a86958
CY
132 }
133
bae0ee7a 134 f2fs_wait_on_page_writeback(page, DATA, false, true);
39a86958
CY
135
136 /* wait for GCed page writeback via META_MAPPING */
137 f2fs_wait_on_block_writeback(inode, dn.data_blkaddr);
138
fbfa2cc5
JK
139 /*
140 * check to see if the page is mapped already (no holes)
141 */
142 if (PageMappedToDisk(page))
39a86958 143 goto out_sem;
fbfa2cc5
JK
144
145 /* page is wholly or partially inside EOF */
09cbfeaf 146 if (((loff_t)(page->index + 1) << PAGE_SHIFT) >
9edcdabf 147 i_size_read(inode)) {
193bea1d 148 loff_t offset;
f11e98bd 149
09cbfeaf
KS
/* zero the tail of the page, starting at the in-page offset of i_size */
150 offset = i_size_read(inode) & ~PAGE_MASK;
151 zero_user_segment(page, offset, PAGE_SIZE);
fbfa2cc5
JK
152 }
153 set_page_dirty(page);
237c0790
JK
154 if (!PageUptodate(page))
155 SetPageUptodate(page);
fbfa2cc5 156
b0af6d49 157 f2fs_update_iostat(sbi, APP_MAPPED_IO, F2FS_BLKSIZE);
c75f2feb 158 f2fs_update_time(sbi, REQ_TIME);
b0af6d49 159
e943a10d 160 trace_f2fs_vm_page_mkwrite(page, DATA);
/* out_sem: drop the invalidate lock and end the pagefault section */
5a3a2d83 161out_sem:
edc6d01b 162 filemap_invalidate_unlock_shared(inode->i_mapping);
39a86958 163
fbfa2cc5 164 sb_end_pagefault(inode->i_sb);
/* err: reached directly by the checks made before sb_start_pagefault() */
1f227a3e 165err:
fbfa2cc5
JK
166 return block_page_mkwrite_return(err);
167}
168
169static const struct vm_operations_struct f2fs_file_vm_ops = {
5a3a2d83 170 .fault = f2fs_filemap_fault,
f1820361 171 .map_pages = filemap_map_pages,
692bb55d 172 .page_mkwrite = f2fs_vm_page_mkwrite,
fbfa2cc5
JK
173};
174
354a3399
JK
175static int get_parent_ino(struct inode *inode, nid_t *pino)
176{
177 struct dentry *dentry;
178
84c9c2de
EB
179 /*
180 * Make sure to get the non-deleted alias. The alias associated with
181 * the open file descriptor being fsync()'ed may be deleted already.
182 */
183 dentry = d_find_alias(inode);
354a3399
JK
184 if (!dentry)
185 return 0;
186
f0947e5c
JK
187 *pino = parent_ino(dentry);
188 dput(dentry);
354a3399
JK
189 return 1;
190}
191
a5fd5050 192static inline enum cp_reason_type need_do_checkpoint(struct inode *inode)
9d1589ef 193{
4081363f 194 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
a5fd5050 195 enum cp_reason_type cp_reason = CP_NO_NEEDED;
9d1589ef 196
a5fd5050
CY
197 if (!S_ISREG(inode->i_mode))
198 cp_reason = CP_NON_REGULAR;
4c8ff709
CY
199 else if (f2fs_compressed_file(inode))
200 cp_reason = CP_COMPRESSED;
a5fd5050
CY
201 else if (inode->i_nlink != 1)
202 cp_reason = CP_HARDLINK;
bbf156f7 203 else if (is_sbi_flag_set(sbi, SBI_NEED_CP))
a5fd5050 204 cp_reason = CP_SB_NEED_CP;
9d1589ef 205 else if (file_wrong_pino(inode))
a5fd5050 206 cp_reason = CP_WRONG_PINO;
4d57b86d 207 else if (!f2fs_space_for_roll_forward(sbi))
a5fd5050 208 cp_reason = CP_NO_SPC_ROLL;
4d57b86d 209 else if (!f2fs_is_checkpointed_node(sbi, F2FS_I(inode)->i_pino))
a5fd5050 210 cp_reason = CP_NODE_NEED_CP;
d5053a34 211 else if (test_opt(sbi, FASTBOOT))
a5fd5050 212 cp_reason = CP_FASTBOOT_MODE;
63189b78 213 else if (F2FS_OPTION(sbi).active_logs == 2)
a5fd5050 214 cp_reason = CP_SPEC_LOG_NUM;
63189b78 215 else if (F2FS_OPTION(sbi).fsync_mode == FSYNC_MODE_STRICT &&
4d57b86d
CY
216 f2fs_need_dentry_mark(sbi, inode->i_ino) &&
217 f2fs_exist_written_data(sbi, F2FS_I(inode)->i_pino,
218 TRANS_DIR_INO))
0a007b97 219 cp_reason = CP_RECOVER_DIR;
9d1589ef 220
a5fd5050 221 return cp_reason;
9d1589ef
CY
222}
223
9c7bb702
CL
224static bool need_inode_page_update(struct f2fs_sb_info *sbi, nid_t ino)
225{
226 struct page *i = find_get_page(NODE_MAPPING(sbi), ino);
227 bool ret = false;
228 /* But we need to avoid that there are some inode updates */
4d57b86d 229 if ((i && PageDirty(i)) || f2fs_need_inode_block_update(sbi, ino))
9c7bb702
CL
230 ret = true;
231 f2fs_put_page(i, 0);
232 return ret;
233}
234
51455b19
CL
235static void try_to_fix_pino(struct inode *inode)
236{
237 struct f2fs_inode_info *fi = F2FS_I(inode);
238 nid_t pino;
239
e4544b63 240 f2fs_down_write(&fi->i_sem);
51455b19
CL
241 if (file_wrong_pino(inode) && inode->i_nlink == 1 &&
242 get_parent_ino(inode, &pino)) {
205b9822 243 f2fs_i_pino_write(inode, pino);
51455b19 244 file_got_pino(inode);
51455b19 245 }
e4544b63 246 f2fs_up_write(&fi->i_sem);
51455b19
CL
247}
248
608514de
JK
/*
 * f2fs_do_sync_file - common implementation behind fsync()/fdatasync()
 * @file:     file to synchronise
 * @start:    first byte of the range passed to file_write_and_wait_range()
 * @end:      last byte of that range
 * @datasync: non-zero for fdatasync() semantics
 * @atomic:   true when node write ordering is enough and the function need
 *            not wait for node writeback (see the comment before the
 *            "!atomic" wait below)
 *
 * Writes back the data range, then either triggers a checkpoint (when
 * need_do_checkpoint() gives a reason) or writes the inode's node pages and
 * optionally issues a flush.
 *
 * Return: 0 on success or a negative errno.
 */
249static int f2fs_do_sync_file(struct file *file, loff_t start, loff_t end,
250 int datasync, bool atomic)
fbfa2cc5
JK
251{
252 struct inode *inode = file->f_mapping->host;
4081363f 253 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
2403c155 254 nid_t ino = inode->i_ino;
fbfa2cc5 255 int ret = 0;
a5fd5050 256 enum cp_reason_type cp_reason = 0;
fbfa2cc5 257 struct writeback_control wbc = {
c81bf1c8 258 .sync_mode = WB_SYNC_ALL,
fbfa2cc5
JK
259 .nr_to_write = LONG_MAX,
260 .for_reclaim = 0,
261 };
50fa53ec 262 unsigned int seq_id = 0;
fbfa2cc5 263
/* nothing to sync on a read-only filesystem */
dddd3d65 264 if (unlikely(f2fs_readonly(inode->i_sb)))
1fa95b0b
NJ
265 return 0;
266
a2a4a7e4 267 trace_f2fs_sync_file_enter(inode);
ea1aa12c 268
/* directories skip the data writeback and go straight to the node path */
b61ac5b7
YH
269 if (S_ISDIR(inode->i_mode))
270 goto go_write;
271
ea1aa12c 272 /* if fdatasync is triggered, let's do in-place-update */
c46a155b 273 if (datasync || get_dirty_pages(inode) <= SM_I(sbi)->min_fsync_blocks)
91942321 274 set_inode_flag(inode, FI_NEED_IPU);
3b49c9a1 275 ret = file_write_and_wait_range(file, start, end);
91942321 276 clear_inode_flag(inode, FI_NEED_IPU);
c1ce1b02 277
/* stop here on a writeback error or when checkpointing is disabled */
dddd3d65 278 if (ret || is_sbi_flag_set(sbi, SBI_CP_DISABLED)) {
a5fd5050 279 trace_f2fs_sync_file_exit(inode, cp_reason, datasync, ret);
fbfa2cc5 280 return ret;
a2a4a7e4 281 }
fbfa2cc5 282
9c7bb702 283 /* if the inode is dirty, let's recover all the time */
281518c6 284 if (!f2fs_skip_inode_update(inode, datasync)) {
2286c020 285 f2fs_write_inode(inode, NULL);
9c7bb702
CL
286 goto go_write;
287 }
288
6d99ba41
JK
289 /*
290 * if there is no written data, don't waste time to write recovery info.
291 */
91942321 292 if (!is_inode_flag_set(inode, FI_APPEND_WRITE) &&
4d57b86d 293 !f2fs_exist_written_data(sbi, ino, APPEND_INO)) {
19c9c466 294
9c7bb702
CL
295 /* it may call write_inode just prior to fsync */
296 if (need_inode_page_update(sbi, ino))
19c9c466 297 goto go_write;
19c9c466 298
91942321 299 if (is_inode_flag_set(inode, FI_UPDATE_WRITE) ||
4d57b86d 300 f2fs_exist_written_data(sbi, ino, UPDATE_INO))
6d99ba41
JK
301 goto flush_out;
302 goto out;
27879915
CY
303 } else {
304 /*
305 * for OPU case, during fsync(), node can be persisted before
306 * data when lower device doesn't support write barrier, result
307 * in data corruption after SPO.
308 * So for strict fsync mode, force to use atomic write semantics
309 * to keep write order in between data/node and last node to
310 * avoid potential data corruption.
311 */
312 if (F2FS_OPTION(sbi).fsync_mode ==
313 FSYNC_MODE_STRICT && !atomic)
314 atomic = true;
6d99ba41 315 }
19c9c466 316go_write:
e5d2385e
JK
317 /*
318 * Both of fdatasync() and fsync() are able to be recovered from
319 * sudden-power-off.
320 */
e4544b63 321 f2fs_down_read(&F2FS_I(inode)->i_sem);
a5fd5050 322 cp_reason = need_do_checkpoint(inode);
e4544b63 323 f2fs_up_read(&F2FS_I(inode)->i_sem);
d928bfbf 324
a5fd5050 325 if (cp_reason) {
fbfa2cc5
JK
326 /* all the dirty node pages should be flushed for POR */
327 ret = f2fs_sync_fs(inode->i_sb, 1);
d928bfbf 328
51455b19
CL
329 /*
330 * We've secured consistency through sync_fs. Following pino
331 * will be used only for fsynced inodes after checkpoint.
332 */
333 try_to_fix_pino(inode);
91942321
JK
334 clear_inode_flag(inode, FI_APPEND_WRITE);
335 clear_inode_flag(inode, FI_UPDATE_WRITE);
51455b19
CL
336 goto out;
337 }
/* sync_nodes: re-entered from below while the inode block needs updating */
88bd02c9 338sync_nodes:
c29fd0c0 339 atomic_inc(&sbi->wb_sync_req[NODE]);
50fa53ec 340 ret = f2fs_fsync_node_pages(sbi, inode, &wbc, atomic, &seq_id);
c29fd0c0 341 atomic_dec(&sbi->wb_sync_req[NODE]);
c267ec15
JK
342 if (ret)
343 goto out;
51455b19 344
871f599f 345 /* if cp_error was enabled, we should avoid infinite loop */
6d5a1495
CY
346 if (unlikely(f2fs_cp_error(sbi))) {
347 ret = -EIO;
871f599f 348 goto out;
6d5a1495 349 }
871f599f 350
4d57b86d 351 if (f2fs_need_inode_block_update(sbi, ino)) {
7c45729a 352 f2fs_mark_inode_dirty_sync(inode, true);
51455b19
CL
353 f2fs_write_inode(inode, NULL);
354 goto sync_nodes;
fbfa2cc5 355 }
51455b19 356
b6a245eb
JK
357 /*
358 * If it's atomic_write, it's just fine to keep write ordering. So
359 * here we don't need to wait for node write completion, since we use
360 * node chain which serializes node blocks. If one of node writes are
361 * reordered, we can see simply broken chain, resulting in stopping
362 * roll-forward recovery. It means we'll recover all or none node blocks
363 * given fsync mark.
364 */
365 if (!atomic) {
50fa53ec 366 ret = f2fs_wait_on_node_pages_writeback(sbi, seq_id);
b6a245eb
JK
367 if (ret)
368 goto out;
369 }
51455b19
CL
370
371 /* once recovery info is written, don't need to track this */
4d57b86d 372 f2fs_remove_ino_entry(sbi, ino, APPEND_INO);
91942321 373 clear_inode_flag(inode, FI_APPEND_WRITE);
51455b19 374flush_out:
/* issue a flush unless the write was atomic or fsync_mode is nobarrier */
d6290814 375 if (!atomic && F2FS_OPTION(sbi).fsync_mode != FSYNC_MODE_NOBARRIER)
39d787be 376 ret = f2fs_issue_flush(sbi, inode->i_ino);
3f06252f 377 if (!ret) {
4d57b86d 378 f2fs_remove_ino_entry(sbi, ino, UPDATE_INO);
3f06252f 379 clear_inode_flag(inode, FI_UPDATE_WRITE);
4d57b86d 380 f2fs_remove_ino_entry(sbi, ino, FLUSH_INO);
3f06252f 381 }
d0239e1b 382 f2fs_update_time(sbi, REQ_TIME);
fbfa2cc5 383out:
a5fd5050 384 trace_f2fs_sync_file_exit(inode, cp_reason, datasync, ret);
fbfa2cc5
JK
385 return ret;
386}
387
608514de
JK
388int f2fs_sync_file(struct file *file, loff_t start, loff_t end, int datasync)
389{
1f227a3e
JK
390 if (unlikely(f2fs_cp_error(F2FS_I_SB(file_inode(file)))))
391 return -EIO;
608514de
JK
392 return f2fs_do_sync_file(file, start, end, datasync, false);
393}
394
4cb03fec
MWO
395static bool __found_offset(struct address_space *mapping, block_t blkaddr,
396 pgoff_t index, int whence)
7f7670fe
JK
397{
398 switch (whence) {
399 case SEEK_DATA:
4cb03fec
MWO
400 if (__is_valid_data_blkaddr(blkaddr))
401 return true;
402 if (blkaddr == NEW_ADDR &&
403 xa_get_mark(&mapping->i_pages, index, PAGECACHE_TAG_DIRTY))
7f7670fe
JK
404 return true;
405 break;
406 case SEEK_HOLE:
407 if (blkaddr == NULL_ADDR)
408 return true;
409 break;
410 }
411 return false;
412}
413
267378d4
CY
414static loff_t f2fs_seek_block(struct file *file, loff_t offset, int whence)
415{
416 struct inode *inode = file->f_mapping->host;
417 loff_t maxbytes = inode->i_sb->s_maxbytes;
418 struct dnode_of_data dn;
4cb03fec 419 pgoff_t pgofs, end_offset;
7f7670fe
JK
420 loff_t data_ofs = offset;
421 loff_t isize;
267378d4
CY
422 int err = 0;
423
5955102c 424 inode_lock(inode);
267378d4
CY
425
426 isize = i_size_read(inode);
427 if (offset >= isize)
428 goto fail;
429
430 /* handle inline data case */
7a6e59d7
CY
431 if (f2fs_has_inline_data(inode)) {
432 if (whence == SEEK_HOLE) {
433 data_ofs = isize;
434 goto found;
435 } else if (whence == SEEK_DATA) {
436 data_ofs = offset;
437 goto found;
438 }
267378d4
CY
439 }
440
09cbfeaf 441 pgofs = (pgoff_t)(offset >> PAGE_SHIFT);
267378d4 442
09cbfeaf 443 for (; data_ofs < isize; data_ofs = (loff_t)pgofs << PAGE_SHIFT) {
267378d4 444 set_new_dnode(&dn, inode, NULL, NULL, 0);
4d57b86d 445 err = f2fs_get_dnode_of_data(&dn, pgofs, LOOKUP_NODE);
267378d4
CY
446 if (err && err != -ENOENT) {
447 goto fail;
448 } else if (err == -ENOENT) {
e1c42045 449 /* direct node does not exists */
267378d4 450 if (whence == SEEK_DATA) {
4d57b86d 451 pgofs = f2fs_get_next_page_offset(&dn, pgofs);
267378d4
CY
452 continue;
453 } else {
454 goto found;
455 }
456 }
457
81ca7350 458 end_offset = ADDRS_PER_PAGE(dn.node_page, inode);
267378d4
CY
459
460 /* find data/hole in dnode block */
461 for (; dn.ofs_in_node < end_offset;
462 dn.ofs_in_node++, pgofs++,
09cbfeaf 463 data_ofs = (loff_t)pgofs << PAGE_SHIFT) {
267378d4 464 block_t blkaddr;
f11e98bd 465
a2ced1ce 466 blkaddr = f2fs_data_blkaddr(&dn);
267378d4 467
c9b60788
CY
468 if (__is_valid_data_blkaddr(blkaddr) &&
469 !f2fs_is_valid_blkaddr(F2FS_I_SB(inode),
93770ab7 470 blkaddr, DATA_GENERIC_ENHANCE)) {
c9b60788
CY
471 f2fs_put_dnode(&dn);
472 goto fail;
473 }
474
4cb03fec 475 if (__found_offset(file->f_mapping, blkaddr,
e1da7872 476 pgofs, whence)) {
267378d4
CY
477 f2fs_put_dnode(&dn);
478 goto found;
479 }
480 }
481 f2fs_put_dnode(&dn);
482 }
483
484 if (whence == SEEK_DATA)
485 goto fail;
267378d4 486found:
fe369bc8
JK
487 if (whence == SEEK_HOLE && data_ofs > isize)
488 data_ofs = isize;
5955102c 489 inode_unlock(inode);
267378d4
CY
490 return vfs_setpos(file, data_ofs, maxbytes);
491fail:
5955102c 492 inode_unlock(inode);
267378d4
CY
493 return -ENXIO;
494}
495
496static loff_t f2fs_llseek(struct file *file, loff_t offset, int whence)
497{
498 struct inode *inode = file->f_mapping->host;
499 loff_t maxbytes = inode->i_sb->s_maxbytes;
500
6d1451bf
CX
501 if (f2fs_compressed_file(inode))
502 maxbytes = max_file_blocks(inode) << F2FS_BLKSIZE_BITS;
503
267378d4
CY
504 switch (whence) {
505 case SEEK_SET:
506 case SEEK_CUR:
507 case SEEK_END:
508 return generic_file_llseek_size(file, offset, whence,
509 maxbytes, i_size_read(inode));
510 case SEEK_DATA:
511 case SEEK_HOLE:
0b4c5afd
JK
512 if (offset < 0)
513 return -ENXIO;
267378d4
CY
514 return f2fs_seek_block(file, offset, whence);
515 }
516
517 return -EINVAL;
518}
519
fbfa2cc5
JK
520static int f2fs_file_mmap(struct file *file, struct vm_area_struct *vma)
521{
b3d208f9
JK
522 struct inode *inode = file_inode(file);
523
1f227a3e
JK
524 if (unlikely(f2fs_cp_error(F2FS_I_SB(inode))))
525 return -EIO;
526
4c8ff709
CY
527 if (!f2fs_is_compress_backend_ready(inode))
528 return -EOPNOTSUPP;
529
fbfa2cc5
JK
530 file_accessed(file);
531 vma->vm_ops = &f2fs_file_vm_ops;
4c8ff709 532 set_inode_flag(inode, FI_MMAP_FILE);
fbfa2cc5
JK
533 return 0;
534}
535
fcc85a4d
JK
536static int f2fs_file_open(struct inode *inode, struct file *filp)
537{
2e168c82 538 int err = fscrypt_file_open(inode, filp);
fcc85a4d 539
95ae251f
EB
540 if (err)
541 return err;
542
4c8ff709
CY
543 if (!f2fs_is_compress_backend_ready(inode))
544 return -EOPNOTSUPP;
545
95ae251f 546 err = fsverity_file_open(inode, filp);
2e168c82
EB
547 if (err)
548 return err;
b91050a8
HL
549
550 filp->f_mode |= FMODE_NOWAIT;
551
0abd675e 552 return dquot_file_open(inode, filp);
fcc85a4d
JK
553}
554
4d57b86d 555void f2fs_truncate_data_blocks_range(struct dnode_of_data *dn, int count)
fbfa2cc5 556{
4081363f 557 struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode);
fbfa2cc5 558 struct f2fs_node *raw_node;
19b2c30d 559 int nr_free = 0, ofs = dn->ofs_in_node, len = count;
fbfa2cc5 560 __le32 *addr;
7a2af766 561 int base = 0;
4c8ff709
CY
562 bool compressed_cluster = false;
563 int cluster_index = 0, valid_blocks = 0;
564 int cluster_size = F2FS_I(dn->inode)->i_cluster_size;
c2759eba 565 bool released = !atomic_read(&F2FS_I(dn->inode)->i_compr_blocks);
7a2af766
CY
566
567 if (IS_INODE(dn->node_page) && f2fs_has_extra_attr(dn->inode))
568 base = get_extra_isize(dn->inode);
fbfa2cc5 569
45590710 570 raw_node = F2FS_NODE(dn->node_page);
7a2af766 571 addr = blkaddr_in_node(raw_node) + base + ofs;
fbfa2cc5 572
4c8ff709
CY
573 /* Assumption: truncateion starts with cluster */
574 for (; count > 0; count--, addr++, dn->ofs_in_node++, cluster_index++) {
fbfa2cc5 575 block_t blkaddr = le32_to_cpu(*addr);
f11e98bd 576
4c8ff709
CY
577 if (f2fs_compressed_file(dn->inode) &&
578 !(cluster_index & (cluster_size - 1))) {
579 if (compressed_cluster)
580 f2fs_i_compr_blocks_update(dn->inode,
581 valid_blocks, false);
582 compressed_cluster = (blkaddr == COMPRESS_ADDR);
583 valid_blocks = 0;
584 }
585
fbfa2cc5
JK
586 if (blkaddr == NULL_ADDR)
587 continue;
588
e1509cf2 589 dn->data_blkaddr = NULL_ADDR;
4d57b86d 590 f2fs_set_data_blkaddr(dn);
c9b60788 591
4c8ff709
CY
592 if (__is_valid_data_blkaddr(blkaddr)) {
593 if (!f2fs_is_valid_blkaddr(sbi, blkaddr,
93770ab7 594 DATA_GENERIC_ENHANCE))
4c8ff709
CY
595 continue;
596 if (compressed_cluster)
597 valid_blocks++;
598 }
c9b60788 599
3c6c2beb 600 if (dn->ofs_in_node == 0 && IS_INODE(dn->node_page))
91942321 601 clear_inode_flag(dn->inode, FI_FIRST_BLOCK_WRITTEN);
4c8ff709
CY
602
603 f2fs_invalidate_blocks(sbi, blkaddr);
ef8d563f
CY
604
605 if (!released || blkaddr != COMPRESS_ADDR)
606 nr_free++;
fbfa2cc5 607 }
19b2c30d 608
4c8ff709
CY
609 if (compressed_cluster)
610 f2fs_i_compr_blocks_update(dn->inode, valid_blocks, false);
611
fbfa2cc5 612 if (nr_free) {
19b2c30d
CY
613 pgoff_t fofs;
614 /*
615 * once we invalidate valid blkaddr in range [ofs, ofs + count],
616 * we will invalidate all blkaddr in the whole range.
617 */
4d57b86d 618 fofs = f2fs_start_bidx_of_node(ofs_of_node(dn->node_page),
81ca7350 619 dn->inode) + ofs;
19b2c30d 620 f2fs_update_extent_cache_range(dn, fofs, 0, len);
d7cc950b 621 dec_valid_block_count(sbi, dn->inode, nr_free);
fbfa2cc5
JK
622 }
623 dn->ofs_in_node = ofs;
51dd6249 624
d0239e1b 625 f2fs_update_time(sbi, REQ_TIME);
51dd6249
NJ
626 trace_f2fs_truncate_data_blocks_range(dn->inode, dn->nid,
627 dn->ofs_in_node, nr_free);
fbfa2cc5
JK
628}
629
4d57b86d 630void f2fs_truncate_data_blocks(struct dnode_of_data *dn)
fbfa2cc5 631{
d02a6e61 632 f2fs_truncate_data_blocks_range(dn, ADDRS_PER_BLOCK(dn->inode));
fbfa2cc5
JK
633}
634
0bfcfcca 635static int truncate_partial_data_page(struct inode *inode, u64 from,
43f3eae1 636 bool cache_only)
fbfa2cc5 637{
193bea1d 638 loff_t offset = from & (PAGE_SIZE - 1);
09cbfeaf 639 pgoff_t index = from >> PAGE_SHIFT;
43f3eae1 640 struct address_space *mapping = inode->i_mapping;
fbfa2cc5
JK
641 struct page *page;
642
43f3eae1 643 if (!offset && !cache_only)
b3d208f9 644 return 0;
fbfa2cc5 645
43f3eae1 646 if (cache_only) {
34b5d5c2 647 page = find_lock_page(mapping, index);
43f3eae1
JK
648 if (page && PageUptodate(page))
649 goto truncate_out;
650 f2fs_put_page(page, 1);
b3d208f9 651 return 0;
43f3eae1 652 }
fbfa2cc5 653
4d57b86d 654 page = f2fs_get_lock_data_page(inode, index, true);
43f3eae1 655 if (IS_ERR(page))
a78aaa2c 656 return PTR_ERR(page) == -ENOENT ? 0 : PTR_ERR(page);
43f3eae1 657truncate_out:
bae0ee7a 658 f2fs_wait_on_page_writeback(page, DATA, true, true);
09cbfeaf 659 zero_user(page, offset, PAGE_SIZE - offset);
a9bcf9bc
JK
660
661 /* An encrypted inode should have a key and truncate the last page. */
62230e0d 662 f2fs_bug_on(F2FS_I_SB(inode), cache_only && IS_ENCRYPTED(inode));
a9bcf9bc 663 if (!cache_only)
0bfcfcca 664 set_page_dirty(page);
fbfa2cc5 665 f2fs_put_page(page, 1);
b3d208f9 666 return 0;
fbfa2cc5
JK
667}
668
3265d3db 669int f2fs_do_truncate_blocks(struct inode *inode, u64 from, bool lock)
fbfa2cc5 670{
4081363f 671 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
fbfa2cc5
JK
672 struct dnode_of_data dn;
673 pgoff_t free_from;
9ffe0fb5 674 int count = 0, err = 0;
b3d208f9 675 struct page *ipage;
0bfcfcca 676 bool truncate_page = false;
fbfa2cc5 677
51dd6249
NJ
678 trace_f2fs_truncate_blocks_enter(inode, from);
679
df033caf 680 free_from = (pgoff_t)F2FS_BLK_ALIGN(from);
fbfa2cc5 681
6d1451bf 682 if (free_from >= max_file_blocks(inode))
09210c97
CY
683 goto free_partial;
684
764aa3e9 685 if (lock)
c42d28ce 686 f2fs_lock_op(sbi);
9ffe0fb5 687
4d57b86d 688 ipage = f2fs_get_node_page(sbi, inode->i_ino);
b3d208f9
JK
689 if (IS_ERR(ipage)) {
690 err = PTR_ERR(ipage);
691 goto out;
692 }
693
694 if (f2fs_has_inline_data(inode)) {
4d57b86d 695 f2fs_truncate_inline_inode(inode, ipage, from);
b3d208f9 696 f2fs_put_page(ipage, 1);
0bfcfcca 697 truncate_page = true;
b3d208f9
JK
698 goto out;
699 }
700
701 set_new_dnode(&dn, inode, ipage, NULL, 0);
4d57b86d 702 err = f2fs_get_dnode_of_data(&dn, free_from, LOOKUP_NODE_RA);
fbfa2cc5
JK
703 if (err) {
704 if (err == -ENOENT)
705 goto free_next;
b3d208f9 706 goto out;
1ce86bf6
JK
707 }
708
81ca7350 709 count = ADDRS_PER_PAGE(dn.node_page, inode);
fbfa2cc5
JK
710
711 count -= dn.ofs_in_node;
9850cf4a 712 f2fs_bug_on(sbi, count < 0);
39936837 713
fbfa2cc5 714 if (dn.ofs_in_node || IS_INODE(dn.node_page)) {
4d57b86d 715 f2fs_truncate_data_blocks_range(&dn, count);
fbfa2cc5
JK
716 free_from += count;
717 }
718
719 f2fs_put_dnode(&dn);
720free_next:
4d57b86d 721 err = f2fs_truncate_inode_blocks(inode, free_from);
764d2c80
JK
722out:
723 if (lock)
c42d28ce 724 f2fs_unlock_op(sbi);
09210c97 725free_partial:
b3d208f9
JK
726 /* lastly zero out the first data page */
727 if (!err)
0bfcfcca 728 err = truncate_partial_data_page(inode, from, truncate_page);
fbfa2cc5 729
51dd6249 730 trace_f2fs_truncate_blocks_exit(inode, err);
fbfa2cc5
JK
731 return err;
732}
733
4c8ff709
CY
734int f2fs_truncate_blocks(struct inode *inode, u64 from, bool lock)
735{
736 u64 free_from = from;
3265d3db 737 int err;
4c8ff709 738
3265d3db 739#ifdef CONFIG_F2FS_FS_COMPRESSION
4c8ff709
CY
740 /*
741 * for compressed file, only support cluster size
742 * aligned truncation.
743 */
4fec3fc0
CY
744 if (f2fs_compressed_file(inode))
745 free_from = round_up(from,
746 F2FS_I(inode)->i_cluster_size << PAGE_SHIFT);
3265d3db
CY
747#endif
748
749 err = f2fs_do_truncate_blocks(inode, free_from, lock);
750 if (err)
751 return err;
752
753#ifdef CONFIG_F2FS_FS_COMPRESSION
4a4fc043
FC
754 /*
755 * For compressed file, after release compress blocks, don't allow write
756 * direct, but we should allow write direct after truncate to zero.
757 */
758 if (f2fs_compressed_file(inode) && !free_from
759 && is_inode_flag_set(inode, FI_COMPRESS_RELEASED))
760 clear_inode_flag(inode, FI_COMPRESS_RELEASED);
761
17d7648d 762 if (from != free_from) {
3265d3db 763 err = f2fs_truncate_partial_cluster(inode, from, lock);
17d7648d
CY
764 if (err)
765 return err;
766 }
3265d3db 767#endif
4c8ff709 768
17d7648d 769 return 0;
4c8ff709
CY
770}
771
9a449e9c 772int f2fs_truncate(struct inode *inode)
fbfa2cc5 773{
b0154891
CY
774 int err;
775
1f227a3e
JK
776 if (unlikely(f2fs_cp_error(F2FS_I_SB(inode))))
777 return -EIO;
778
fbfa2cc5
JK
779 if (!(S_ISREG(inode->i_mode) || S_ISDIR(inode->i_mode) ||
780 S_ISLNK(inode->i_mode)))
b0154891 781 return 0;
fbfa2cc5 782
51dd6249
NJ
783 trace_f2fs_truncate(inode);
784
14b44d23 785 if (time_to_inject(F2FS_I_SB(inode), FAULT_TRUNCATE)) {
c45d6002 786 f2fs_show_injection_info(F2FS_I_SB(inode), FAULT_TRUNCATE);
14b44d23
JK
787 return -EIO;
788 }
7fa750a1 789
10a26878 790 err = f2fs_dquot_initialize(inode);
25fb04db
YC
791 if (err)
792 return err;
793
92dffd01 794 /* we should check inline_data size */
b9d777b8 795 if (!f2fs_may_inline_data(inode)) {
b0154891
CY
796 err = f2fs_convert_inline_inode(inode);
797 if (err)
798 return err;
92dffd01
JK
799 }
800
c42d28ce 801 err = f2fs_truncate_blocks(inode, i_size_read(inode), true);
b0154891
CY
802 if (err)
803 return err;
804
078cd827 805 inode->i_mtime = inode->i_ctime = current_time(inode);
7c45729a 806 f2fs_mark_inode_dirty_sync(inode, false);
b0154891 807 return 0;
fbfa2cc5
JK
808}
809
549c7297
CB
810int f2fs_getattr(struct user_namespace *mnt_userns, const struct path *path,
811 struct kstat *stat, u32 request_mask, unsigned int query_flags)
fbfa2cc5 812{
a528d35e 813 struct inode *inode = d_inode(path->dentry);
1c6d8ee4 814 struct f2fs_inode_info *fi = F2FS_I(inode);
d13732cc 815 struct f2fs_inode *ri = NULL;
1c6d8ee4
CY
816 unsigned int flags;
817
1c1d35df 818 if (f2fs_has_extra_attr(inode) &&
7beb01f7 819 f2fs_sb_has_inode_crtime(F2FS_I_SB(inode)) &&
1c1d35df
CY
820 F2FS_FITS_IN_INODE(ri, fi->i_extra_isize, i_crtime)) {
821 stat->result_mask |= STATX_BTIME;
822 stat->btime.tv_sec = fi->i_crtime.tv_sec;
823 stat->btime.tv_nsec = fi->i_crtime.tv_nsec;
824 }
825
36098557 826 flags = fi->i_flags;
fd26725f
CY
827 if (flags & F2FS_COMPR_FL)
828 stat->attributes |= STATX_ATTR_COMPRESSED;
59c84408 829 if (flags & F2FS_APPEND_FL)
1c6d8ee4 830 stat->attributes |= STATX_ATTR_APPEND;
62230e0d 831 if (IS_ENCRYPTED(inode))
1c6d8ee4 832 stat->attributes |= STATX_ATTR_ENCRYPTED;
59c84408 833 if (flags & F2FS_IMMUTABLE_FL)
1c6d8ee4 834 stat->attributes |= STATX_ATTR_IMMUTABLE;
59c84408 835 if (flags & F2FS_NODUMP_FL)
1c6d8ee4 836 stat->attributes |= STATX_ATTR_NODUMP;
924e3194
EB
837 if (IS_VERITY(inode))
838 stat->attributes |= STATX_ATTR_VERITY;
1c6d8ee4 839
fd26725f
CY
840 stat->attributes_mask |= (STATX_ATTR_COMPRESSED |
841 STATX_ATTR_APPEND |
1c6d8ee4
CY
842 STATX_ATTR_ENCRYPTED |
843 STATX_ATTR_IMMUTABLE |
924e3194
EB
844 STATX_ATTR_NODUMP |
845 STATX_ATTR_VERITY);
1c6d8ee4 846
984fc4e7 847 generic_fillattr(mnt_userns, inode, stat);
5b4267d1
JK
848
849 /* we need to show initial sectors used for inline_data/dentries */
850 if ((S_ISREG(inode->i_mode) && f2fs_has_inline_data(inode)) ||
851 f2fs_has_inline_dentry(inode))
852 stat->blocks += (stat->size + 511) >> 9;
853
fbfa2cc5
JK
854 return 0;
855}
856
#ifdef CONFIG_F2FS_FS_POSIX_ACL
/*
 * Copy the attributes selected by attr->ia_valid into @inode.
 *
 * A new mode is not written to i_mode directly but handed to
 * set_acl_inode(); S_ISGID is dropped from it first when the caller is
 * neither in the inode's group nor capable of CAP_FSETID.
 */
static void __setattr_copy(struct user_namespace *mnt_userns,
			   struct inode *inode, const struct iattr *attr)
{
	const unsigned int valid = attr->ia_valid;
	umode_t mode;

	if (valid & ATTR_UID)
		inode->i_uid = attr->ia_uid;
	if (valid & ATTR_GID)
		inode->i_gid = attr->ia_gid;
	if (valid & ATTR_ATIME)
		inode->i_atime = attr->ia_atime;
	if (valid & ATTR_MTIME)
		inode->i_mtime = attr->ia_mtime;
	if (valid & ATTR_CTIME)
		inode->i_ctime = attr->ia_ctime;

	if (!(valid & ATTR_MODE))
		return;

	mode = attr->ia_mode;
	if (!in_group_p(i_gid_into_mnt(mnt_userns, inode)) &&
	    !capable_wrt_inode_uidgid(mnt_userns, inode, CAP_FSETID))
		mode &= ~S_ISGID;
	set_acl_inode(inode, mode);
}
#else
/* without POSIX ACL support the generic helper is used as is */
#define __setattr_copy setattr_copy
#endif
885
549c7297
CB
/*
 * f2fs_setattr - change attributes of the inode behind @dentry
 * @mnt_userns: user namespace of the mount
 * @dentry:     dentry whose inode is modified
 * @attr:       requested changes (ia_valid selects the fields)
 *
 * After the permission and preparation checks, owner changes are applied
 * together with the quota transfer under f2fs_lock_op(), size changes go
 * through truncate_setsize() (plus f2fs_truncate() when not growing), and
 * the remaining fields are copied with __setattr_copy().
 *
 * Return: 0 on success or a negative errno.  Note that an error from
 * posix_acl_chmod() is returned only after the inode has been marked dirty.
 */
886int f2fs_setattr(struct user_namespace *mnt_userns, struct dentry *dentry,
887 struct iattr *attr)
fbfa2cc5 888{
2b0143b5 889 struct inode *inode = d_inode(dentry);
fbfa2cc5
JK
890 int err;
891
1f227a3e
JK
892 if (unlikely(f2fs_cp_error(F2FS_I_SB(inode))))
893 return -EIO;
894
e0fcd015
CY
895 if (unlikely(IS_IMMUTABLE(inode)))
896 return -EPERM;
897
/* append-only inodes may not change mode, owner or explicitly set times */
898 if (unlikely(IS_APPEND(inode) &&
899 (attr->ia_valid & (ATTR_MODE | ATTR_UID |
900 ATTR_GID | ATTR_TIMES_SET))))
901 return -EPERM;
902
4c8ff709
CY
903 if ((attr->ia_valid & ATTR_SIZE) &&
904 !f2fs_is_compress_backend_ready(inode))
905 return -EOPNOTSUPP;
906
984fc4e7 907 err = setattr_prepare(mnt_userns, dentry, attr);
fbfa2cc5
JK
908 if (err)
909 return err;
910
20bb2479
EB
911 err = fscrypt_prepare_setattr(dentry, attr);
912 if (err)
913 return err;
914
95ae251f
EB
915 err = fsverity_prepare_setattr(dentry, attr);
916 if (err)
917 return err;
918
0abd675e 919 if (is_quota_modification(inode, attr)) {
10a26878 920 err = f2fs_dquot_initialize(inode);
0abd675e
CY
921 if (err)
922 return err;
923 }
/* owner or group really changes: transfer the quota along with it */
924 if ((attr->ia_valid & ATTR_UID &&
925 !uid_eq(attr->ia_uid, inode->i_uid)) ||
926 (attr->ia_valid & ATTR_GID &&
927 !gid_eq(attr->ia_gid, inode->i_gid))) {
af033b2a 928 f2fs_lock_op(F2FS_I_SB(inode));
0abd675e 929 err = dquot_transfer(inode, attr);
af033b2a
CY
930 if (err) {
931 set_sbi_flag(F2FS_I_SB(inode),
932 SBI_QUOTA_NEED_REPAIR);
933 f2fs_unlock_op(F2FS_I_SB(inode));
0abd675e 934 return err;
af033b2a
CY
935 }
936 /*
937 * update uid/gid under lock_op(), so that dquot and inode can
938 * be updated atomically.
939 */
940 if (attr->ia_valid & ATTR_UID)
941 inode->i_uid = attr->ia_uid;
942 if (attr->ia_valid & ATTR_GID)
943 inode->i_gid = attr->ia_gid;
944 f2fs_mark_inode_dirty_sync(inode, true);
945 f2fs_unlock_op(F2FS_I_SB(inode));
0abd675e
CY
946 }
947
09db6a2e 948 if (attr->ia_valid & ATTR_SIZE) {
cfb9a34d
JK
949 loff_t old_size = i_size_read(inode);
950
951 if (attr->ia_size > MAX_INLINE_DATA(inode)) {
952 /*
953 * should convert inline inode before i_size_write to
954 * keep smaller than inline_data size with inline flag.
955 */
956 err = f2fs_convert_inline_inode(inode);
957 if (err)
958 return err;
959 }
a33c1502 960
e4544b63 961 f2fs_down_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
edc6d01b 962 filemap_invalidate_lock(inode->i_mapping);
a33c1502
CY
963
964 truncate_setsize(inode, attr->ia_size);
965
cfb9a34d 966 if (attr->ia_size <= old_size)
9a449e9c 967 err = f2fs_truncate(inode);
a33c1502
CY
968 /*
969 * do not trim all blocks after i_size if target size is
970 * larger than i_size.
971 */
edc6d01b 972 filemap_invalidate_unlock(inode->i_mapping);
e4544b63 973 f2fs_up_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
a33c1502
CY
974 if (err)
975 return err;
0cab80ee 976
/* record the new size as last_disk_size, under i_size_lock */
c10c9820 977 spin_lock(&F2FS_I(inode)->i_size_lock);
cfb9a34d 978 inode->i_mtime = inode->i_ctime = current_time(inode);
a0d00fad 979 F2FS_I(inode)->last_disk_size = i_size_read(inode);
c10c9820 980 spin_unlock(&F2FS_I(inode)->i_size_lock);
fbfa2cc5
JK
981 }
982
984fc4e7 983 __setattr_copy(mnt_userns, inode, attr);
fbfa2cc5
JK
984
985 if (attr->ia_valid & ATTR_MODE) {
984fc4e7 986 err = posix_acl_chmod(mnt_userns, inode, f2fs_get_inode_mode(inode));
17232e83
CY
987
/* commit the staged ACL mode only if posix_acl_chmod() succeeded */
988 if (is_inode_flag_set(inode, FI_ACL_MODE)) {
989 if (!err)
990 inode->i_mode = F2FS_I(inode)->i_acl_mode;
91942321 991 clear_inode_flag(inode, FI_ACL_MODE);
fbfa2cc5
JK
992 }
993 }
994
c0ed4405 995 /* file size may changed here */
ca597bdd 996 f2fs_mark_inode_dirty_sync(inode, true);
15d04354
JK
997
998 /* inode change will produce dirty node pages flushed by checkpoint */
999 f2fs_balance_fs(F2FS_I_SB(inode), true);
1000
fbfa2cc5
JK
1001 return err;
1002}
1003
1004const struct inode_operations f2fs_file_inode_operations = {
1005 .getattr = f2fs_getattr,
1006 .setattr = f2fs_setattr,
1007 .get_acl = f2fs_get_acl,
a6dda0e6 1008 .set_acl = f2fs_set_acl,
fbfa2cc5 1009 .listxattr = f2fs_listxattr,
9ab70134 1010 .fiemap = f2fs_fiemap,
9b1bb01c
MS
1011 .fileattr_get = f2fs_fileattr_get,
1012 .fileattr_set = f2fs_fileattr_set,
fbfa2cc5
JK
1013};
1014
6394328a 1015static int fill_zero(struct inode *inode, pgoff_t index,
fbfa2cc5
JK
1016 loff_t start, loff_t len)
1017{
4081363f 1018 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
fbfa2cc5
JK
1019 struct page *page;
1020
1021 if (!len)
6394328a 1022 return 0;
fbfa2cc5 1023
2c4db1a6 1024 f2fs_balance_fs(sbi, true);
bd43df02 1025
e479556b 1026 f2fs_lock_op(sbi);
4d57b86d 1027 page = f2fs_get_new_data_page(inode, NULL, index, false);
e479556b 1028 f2fs_unlock_op(sbi);
fbfa2cc5 1029
6394328a
CY
1030 if (IS_ERR(page))
1031 return PTR_ERR(page);
1032
bae0ee7a 1033 f2fs_wait_on_page_writeback(page, DATA, true, true);
6394328a
CY
1034 zero_user(page, start, len);
1035 set_page_dirty(page);
1036 f2fs_put_page(page, 1);
1037 return 0;
fbfa2cc5
JK
1038}
1039
4d57b86d 1040int f2fs_truncate_hole(struct inode *inode, pgoff_t pg_start, pgoff_t pg_end)
fbfa2cc5 1041{
fbfa2cc5
JK
1042 int err;
1043
ea58711e 1044 while (pg_start < pg_end) {
fbfa2cc5 1045 struct dnode_of_data dn;
ea58711e 1046 pgoff_t end_offset, count;
9eaeba70 1047
fbfa2cc5 1048 set_new_dnode(&dn, inode, NULL, NULL, 0);
4d57b86d 1049 err = f2fs_get_dnode_of_data(&dn, pg_start, LOOKUP_NODE);
fbfa2cc5 1050 if (err) {
ea58711e 1051 if (err == -ENOENT) {
4d57b86d
CY
1052 pg_start = f2fs_get_next_page_offset(&dn,
1053 pg_start);
fbfa2cc5 1054 continue;
ea58711e 1055 }
fbfa2cc5
JK
1056 return err;
1057 }
1058
81ca7350 1059 end_offset = ADDRS_PER_PAGE(dn.node_page, inode);
ea58711e
CY
1060 count = min(end_offset - dn.ofs_in_node, pg_end - pg_start);
1061
1062 f2fs_bug_on(F2FS_I_SB(inode), count == 0 || count > end_offset);
1063
4d57b86d 1064 f2fs_truncate_data_blocks_range(&dn, count);
fbfa2cc5 1065 f2fs_put_dnode(&dn);
ea58711e
CY
1066
1067 pg_start += count;
fbfa2cc5
JK
1068 }
1069 return 0;
1070}
1071
a66c7b2f 1072static int punch_hole(struct inode *inode, loff_t offset, loff_t len)
fbfa2cc5
JK
1073{
1074 pgoff_t pg_start, pg_end;
1075 loff_t off_start, off_end;
b9d777b8 1076 int ret;
fbfa2cc5 1077
b9d777b8
JK
1078 ret = f2fs_convert_inline_inode(inode);
1079 if (ret)
1080 return ret;
9ffe0fb5 1081
09cbfeaf
KS
1082 pg_start = ((unsigned long long) offset) >> PAGE_SHIFT;
1083 pg_end = ((unsigned long long) offset + len) >> PAGE_SHIFT;
fbfa2cc5 1084
09cbfeaf
KS
1085 off_start = offset & (PAGE_SIZE - 1);
1086 off_end = (offset + len) & (PAGE_SIZE - 1);
fbfa2cc5
JK
1087
1088 if (pg_start == pg_end) {
6394328a 1089 ret = fill_zero(inode, pg_start, off_start,
fbfa2cc5 1090 off_end - off_start);
6394328a
CY
1091 if (ret)
1092 return ret;
fbfa2cc5 1093 } else {
6394328a
CY
1094 if (off_start) {
1095 ret = fill_zero(inode, pg_start++, off_start,
09cbfeaf 1096 PAGE_SIZE - off_start);
6394328a
CY
1097 if (ret)
1098 return ret;
1099 }
1100 if (off_end) {
1101 ret = fill_zero(inode, pg_end, 0, off_end);
1102 if (ret)
1103 return ret;
1104 }
fbfa2cc5
JK
1105
1106 if (pg_start < pg_end) {
fbfa2cc5 1107 loff_t blk_start, blk_end;
4081363f 1108 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
1127a3d4 1109
2c4db1a6 1110 f2fs_balance_fs(sbi, true);
fbfa2cc5 1111
09cbfeaf
KS
1112 blk_start = (loff_t)pg_start << PAGE_SHIFT;
1113 blk_end = (loff_t)pg_end << PAGE_SHIFT;
a33c1502 1114
e4544b63 1115 f2fs_down_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
6abaa83c 1116 filemap_invalidate_lock(inode->i_mapping);
a33c1502 1117
c8dc3047 1118 truncate_pagecache_range(inode, blk_start, blk_end - 1);
39936837 1119
e479556b 1120 f2fs_lock_op(sbi);
4d57b86d 1121 ret = f2fs_truncate_hole(inode, pg_start, pg_end);
e479556b 1122 f2fs_unlock_op(sbi);
a33c1502 1123
6abaa83c 1124 filemap_invalidate_unlock(inode->i_mapping);
e4544b63 1125 f2fs_up_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
fbfa2cc5
JK
1126 }
1127 }
1128
fbfa2cc5
JK
1129 return ret;
1130}
1131
0a2aa8fb
JK
1132static int __read_out_blkaddrs(struct inode *inode, block_t *blkaddr,
1133 int *do_replace, pgoff_t off, pgoff_t len)
b4ace337
CY
1134{
1135 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
1136 struct dnode_of_data dn;
0a2aa8fb 1137 int ret, done, i;
ecbaa406 1138
0a2aa8fb 1139next_dnode:
6e2c64ad 1140 set_new_dnode(&dn, inode, NULL, NULL, 0);
4d57b86d 1141 ret = f2fs_get_dnode_of_data(&dn, off, LOOKUP_NODE_RA);
6e2c64ad
JK
1142 if (ret && ret != -ENOENT) {
1143 return ret;
1144 } else if (ret == -ENOENT) {
0a2aa8fb
JK
1145 if (dn.max_level == 0)
1146 return -ENOENT;
4c8ff709
CY
1147 done = min((pgoff_t)ADDRS_PER_BLOCK(inode) -
1148 dn.ofs_in_node, len);
0a2aa8fb
JK
1149 blkaddr += done;
1150 do_replace += done;
1151 goto next;
1152 }
1153
1154 done = min((pgoff_t)ADDRS_PER_PAGE(dn.node_page, inode) -
1155 dn.ofs_in_node, len);
1156 for (i = 0; i < done; i++, blkaddr++, do_replace++, dn.ofs_in_node++) {
a2ced1ce 1157 *blkaddr = f2fs_data_blkaddr(&dn);
93770ab7
CY
1158
1159 if (__is_valid_data_blkaddr(*blkaddr) &&
1160 !f2fs_is_valid_blkaddr(sbi, *blkaddr,
1161 DATA_GENERIC_ENHANCE)) {
1162 f2fs_put_dnode(&dn);
10f966bb 1163 return -EFSCORRUPTED;
93770ab7
CY
1164 }
1165
4d57b86d 1166 if (!f2fs_is_checkpointed_data(sbi, *blkaddr)) {
0a2aa8fb 1167
b0332a0f 1168 if (f2fs_lfs_mode(sbi)) {
0a2aa8fb 1169 f2fs_put_dnode(&dn);
fd114ab2 1170 return -EOPNOTSUPP;
0a2aa8fb
JK
1171 }
1172
6e2c64ad 1173 /* do not invalidate this block address */
f28b3434 1174 f2fs_update_data_blkaddr(&dn, NULL_ADDR);
0a2aa8fb 1175 *do_replace = 1;
b4ace337 1176 }
6e2c64ad 1177 }
0a2aa8fb
JK
1178 f2fs_put_dnode(&dn);
1179next:
1180 len -= done;
1181 off += done;
1182 if (len)
1183 goto next_dnode;
1184 return 0;
1185}
b4ace337 1186
0a2aa8fb
JK
1187static int __roll_back_blkaddrs(struct inode *inode, block_t *blkaddr,
1188 int *do_replace, pgoff_t off, int len)
1189{
1190 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
1191 struct dnode_of_data dn;
1192 int ret, i;
b4ace337 1193
0a2aa8fb
JK
1194 for (i = 0; i < len; i++, do_replace++, blkaddr++) {
1195 if (*do_replace == 0)
1196 continue;
b4ace337 1197
0a2aa8fb 1198 set_new_dnode(&dn, inode, NULL, NULL, 0);
4d57b86d 1199 ret = f2fs_get_dnode_of_data(&dn, off + i, LOOKUP_NODE_RA);
0a2aa8fb
JK
1200 if (ret) {
1201 dec_valid_block_count(sbi, inode, 1);
4d57b86d 1202 f2fs_invalidate_blocks(sbi, *blkaddr);
0a2aa8fb
JK
1203 } else {
1204 f2fs_update_data_blkaddr(&dn, *blkaddr);
36abef4e 1205 }
0a2aa8fb
JK
1206 f2fs_put_dnode(&dn);
1207 }
1208 return 0;
1209}
1210
1211static int __clone_blkaddrs(struct inode *src_inode, struct inode *dst_inode,
1212 block_t *blkaddr, int *do_replace,
1213 pgoff_t src, pgoff_t dst, pgoff_t len, bool full)
1214{
1215 struct f2fs_sb_info *sbi = F2FS_I_SB(src_inode);
1216 pgoff_t i = 0;
1217 int ret;
36abef4e 1218
0a2aa8fb
JK
1219 while (i < len) {
1220 if (blkaddr[i] == NULL_ADDR && !full) {
1221 i++;
1222 continue;
6e2c64ad 1223 }
b4ace337 1224
0a2aa8fb
JK
1225 if (do_replace[i] || blkaddr[i] == NULL_ADDR) {
1226 struct dnode_of_data dn;
1227 struct node_info ni;
1228 size_t new_size;
1229 pgoff_t ilen;
b4ace337 1230
0a2aa8fb 1231 set_new_dnode(&dn, dst_inode, NULL, NULL, 0);
4d57b86d 1232 ret = f2fs_get_dnode_of_data(&dn, dst + i, ALLOC_NODE);
0a2aa8fb
JK
1233 if (ret)
1234 return ret;
b4ace337 1235
a9419b63 1236 ret = f2fs_get_node_info(sbi, dn.nid, &ni, false);
7735730d
CY
1237 if (ret) {
1238 f2fs_put_dnode(&dn);
1239 return ret;
1240 }
1241
0a2aa8fb
JK
1242 ilen = min((pgoff_t)
1243 ADDRS_PER_PAGE(dn.node_page, dst_inode) -
1244 dn.ofs_in_node, len - i);
1245 do {
a2ced1ce 1246 dn.data_blkaddr = f2fs_data_blkaddr(&dn);
4d57b86d 1247 f2fs_truncate_data_blocks_range(&dn, 1);
0a2aa8fb
JK
1248
1249 if (do_replace[i]) {
1250 f2fs_i_blocks_write(src_inode,
0abd675e 1251 1, false, false);
0a2aa8fb 1252 f2fs_i_blocks_write(dst_inode,
0abd675e 1253 1, true, false);
0a2aa8fb
JK
1254 f2fs_replace_block(sbi, &dn, dn.data_blkaddr,
1255 blkaddr[i], ni.version, true, false);
1256
1257 do_replace[i] = 0;
1258 }
1259 dn.ofs_in_node++;
1260 i++;
1f0d5c91 1261 new_size = (loff_t)(dst + i) << PAGE_SHIFT;
0a2aa8fb
JK
1262 if (dst_inode->i_size < new_size)
1263 f2fs_i_size_write(dst_inode, new_size);
e87f7329 1264 } while (--ilen && (do_replace[i] || blkaddr[i] == NULL_ADDR));
6e2c64ad 1265
0a2aa8fb
JK
1266 f2fs_put_dnode(&dn);
1267 } else {
1268 struct page *psrc, *pdst;
1269
4d57b86d
CY
1270 psrc = f2fs_get_lock_data_page(src_inode,
1271 src + i, true);
0a2aa8fb
JK
1272 if (IS_ERR(psrc))
1273 return PTR_ERR(psrc);
4d57b86d 1274 pdst = f2fs_get_new_data_page(dst_inode, NULL, dst + i,
0a2aa8fb
JK
1275 true);
1276 if (IS_ERR(pdst)) {
1277 f2fs_put_page(psrc, 1);
1278 return PTR_ERR(pdst);
1279 }
1280 f2fs_copy_page(psrc, pdst);
1281 set_page_dirty(pdst);
1282 f2fs_put_page(pdst, 1);
6e2c64ad 1283 f2fs_put_page(psrc, 1);
b4ace337 1284
4d57b86d
CY
1285 ret = f2fs_truncate_hole(src_inode,
1286 src + i, src + i + 1);
0a2aa8fb
JK
1287 if (ret)
1288 return ret;
1289 i++;
1290 }
6e2c64ad
JK
1291 }
1292 return 0;
0a2aa8fb 1293}
b4ace337 1294
0a2aa8fb
JK
1295static int __exchange_data_block(struct inode *src_inode,
1296 struct inode *dst_inode, pgoff_t src, pgoff_t dst,
363cad7f 1297 pgoff_t len, bool full)
0a2aa8fb
JK
1298{
1299 block_t *src_blkaddr;
1300 int *do_replace;
363cad7f 1301 pgoff_t olen;
0a2aa8fb
JK
1302 int ret;
1303
363cad7f 1304 while (len) {
d02a6e61 1305 olen = min((pgoff_t)4 * ADDRS_PER_BLOCK(src_inode), len);
0a2aa8fb 1306
628b3d14 1307 src_blkaddr = f2fs_kvzalloc(F2FS_I_SB(src_inode),
9d2a789c 1308 array_size(olen, sizeof(block_t)),
4f4460c0 1309 GFP_NOFS);
363cad7f
JK
1310 if (!src_blkaddr)
1311 return -ENOMEM;
0a2aa8fb 1312
628b3d14 1313 do_replace = f2fs_kvzalloc(F2FS_I_SB(src_inode),
9d2a789c 1314 array_size(olen, sizeof(int)),
4f4460c0 1315 GFP_NOFS);
363cad7f
JK
1316 if (!do_replace) {
1317 kvfree(src_blkaddr);
1318 return -ENOMEM;
1319 }
0a2aa8fb 1320
363cad7f
JK
1321 ret = __read_out_blkaddrs(src_inode, src_blkaddr,
1322 do_replace, src, olen);
1323 if (ret)
1324 goto roll_back;
0a2aa8fb 1325
363cad7f
JK
1326 ret = __clone_blkaddrs(src_inode, dst_inode, src_blkaddr,
1327 do_replace, src, dst, olen, full);
1328 if (ret)
1329 goto roll_back;
1330
1331 src += olen;
1332 dst += olen;
1333 len -= olen;
1334
1335 kvfree(src_blkaddr);
1336 kvfree(do_replace);
1337 }
0a2aa8fb
JK
1338 return 0;
1339
1340roll_back:
9fd62605 1341 __roll_back_blkaddrs(src_inode, src_blkaddr, do_replace, src, olen);
0a2aa8fb
JK
1342 kvfree(src_blkaddr);
1343 kvfree(do_replace);
6e2c64ad
JK
1344 return ret;
1345}
b4ace337 1346
6f8d4455 1347static int f2fs_do_collapse(struct inode *inode, loff_t offset, loff_t len)
6e2c64ad
JK
1348{
1349 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
f91108b8 1350 pgoff_t nrpages = DIV_ROUND_UP(i_size_read(inode), PAGE_SIZE);
6f8d4455
JK
1351 pgoff_t start = offset >> PAGE_SHIFT;
1352 pgoff_t end = (offset + len) >> PAGE_SHIFT;
0a2aa8fb 1353 int ret;
6e2c64ad 1354
0a2aa8fb 1355 f2fs_balance_fs(sbi, true);
5f281fab 1356
6f8d4455 1357 /* avoid gc operation during block exchange */
e4544b63 1358 f2fs_down_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
edc6d01b 1359 filemap_invalidate_lock(inode->i_mapping);
5f281fab 1360
6f8d4455
JK
1361 f2fs_lock_op(sbi);
1362 f2fs_drop_extent_tree(inode);
1363 truncate_pagecache(inode, offset);
0a2aa8fb
JK
1364 ret = __exchange_data_block(inode, inode, end, start, nrpages - end, true);
1365 f2fs_unlock_op(sbi);
6f8d4455 1366
edc6d01b 1367 filemap_invalidate_unlock(inode->i_mapping);
e4544b63 1368 f2fs_up_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
b4ace337
CY
1369 return ret;
1370}
1371
1372static int f2fs_collapse_range(struct inode *inode, loff_t offset, loff_t len)
1373{
b4ace337
CY
1374 loff_t new_size;
1375 int ret;
1376
b4ace337
CY
1377 if (offset + len >= i_size_read(inode))
1378 return -EINVAL;
1379
1380 /* collapse range should be aligned to block size of f2fs. */
1381 if (offset & (F2FS_BLKSIZE - 1) || len & (F2FS_BLKSIZE - 1))
1382 return -EINVAL;
1383
b9d777b8
JK
1384 ret = f2fs_convert_inline_inode(inode);
1385 if (ret)
1386 return ret;
97a7b2c2 1387
b4ace337
CY
1388 /* write out all dirty pages from offset */
1389 ret = filemap_write_and_wait_range(inode->i_mapping, offset, LLONG_MAX);
1390 if (ret)
6f8d4455 1391 return ret;
b4ace337 1392
6f8d4455 1393 ret = f2fs_do_collapse(inode, offset, len);
b4ace337 1394 if (ret)
6f8d4455 1395 return ret;
b4ace337 1396
6e2c64ad 1397 /* write out all moved pages, if possible */
edc6d01b 1398 filemap_invalidate_lock(inode->i_mapping);
6e2c64ad
JK
1399 filemap_write_and_wait_range(inode->i_mapping, offset, LLONG_MAX);
1400 truncate_pagecache(inode, offset);
1401
b4ace337 1402 new_size = i_size_read(inode) - len;
c42d28ce 1403 ret = f2fs_truncate_blocks(inode, new_size, true);
edc6d01b 1404 filemap_invalidate_unlock(inode->i_mapping);
b4ace337 1405 if (!ret)
fc9581c8 1406 f2fs_i_size_write(inode, new_size);
b4ace337
CY
1407 return ret;
1408}
1409
6e961949
CY
1410static int f2fs_do_zero_range(struct dnode_of_data *dn, pgoff_t start,
1411 pgoff_t end)
1412{
1413 struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode);
1414 pgoff_t index = start;
1415 unsigned int ofs_in_node = dn->ofs_in_node;
1416 blkcnt_t count = 0;
1417 int ret;
1418
1419 for (; index < end; index++, dn->ofs_in_node++) {
a2ced1ce 1420 if (f2fs_data_blkaddr(dn) == NULL_ADDR)
6e961949
CY
1421 count++;
1422 }
1423
1424 dn->ofs_in_node = ofs_in_node;
4d57b86d 1425 ret = f2fs_reserve_new_blocks(dn, count);
6e961949
CY
1426 if (ret)
1427 return ret;
1428
1429 dn->ofs_in_node = ofs_in_node;
1430 for (index = start; index < end; index++, dn->ofs_in_node++) {
a2ced1ce 1431 dn->data_blkaddr = f2fs_data_blkaddr(dn);
6e961949 1432 /*
4d57b86d 1433 * f2fs_reserve_new_blocks will not guarantee entire block
6e961949
CY
1434 * allocation.
1435 */
1436 if (dn->data_blkaddr == NULL_ADDR) {
1437 ret = -ENOSPC;
1438 break;
1439 }
1440 if (dn->data_blkaddr != NEW_ADDR) {
4d57b86d 1441 f2fs_invalidate_blocks(sbi, dn->data_blkaddr);
6e961949 1442 dn->data_blkaddr = NEW_ADDR;
4d57b86d 1443 f2fs_set_data_blkaddr(dn);
6e961949
CY
1444 }
1445 }
1446
1447 f2fs_update_extent_cache_range(dn, start, 0, index - start);
1448
1449 return ret;
1450}
1451
75cd4e09
CY
1452static int f2fs_zero_range(struct inode *inode, loff_t offset, loff_t len,
1453 int mode)
1454{
1455 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
1456 struct address_space *mapping = inode->i_mapping;
1457 pgoff_t index, pg_start, pg_end;
1458 loff_t new_size = i_size_read(inode);
1459 loff_t off_start, off_end;
1460 int ret = 0;
1461
75cd4e09
CY
1462 ret = inode_newsize_ok(inode, (len + offset));
1463 if (ret)
1464 return ret;
1465
b9d777b8
JK
1466 ret = f2fs_convert_inline_inode(inode);
1467 if (ret)
1468 return ret;
75cd4e09
CY
1469
1470 ret = filemap_write_and_wait_range(mapping, offset, offset + len - 1);
1471 if (ret)
6f8d4455 1472 return ret;
75cd4e09 1473
09cbfeaf
KS
1474 pg_start = ((unsigned long long) offset) >> PAGE_SHIFT;
1475 pg_end = ((unsigned long long) offset + len) >> PAGE_SHIFT;
75cd4e09 1476
09cbfeaf
KS
1477 off_start = offset & (PAGE_SIZE - 1);
1478 off_end = (offset + len) & (PAGE_SIZE - 1);
75cd4e09
CY
1479
1480 if (pg_start == pg_end) {
6394328a
CY
1481 ret = fill_zero(inode, pg_start, off_start,
1482 off_end - off_start);
1483 if (ret)
6f8d4455 1484 return ret;
6394328a 1485
75cd4e09
CY
1486 new_size = max_t(loff_t, new_size, offset + len);
1487 } else {
1488 if (off_start) {
6394328a 1489 ret = fill_zero(inode, pg_start++, off_start,
09cbfeaf 1490 PAGE_SIZE - off_start);
6394328a 1491 if (ret)
6f8d4455 1492 return ret;
6394328a 1493
75cd4e09 1494 new_size = max_t(loff_t, new_size,
09cbfeaf 1495 (loff_t)pg_start << PAGE_SHIFT);
75cd4e09
CY
1496 }
1497
6e961949 1498 for (index = pg_start; index < pg_end;) {
75cd4e09 1499 struct dnode_of_data dn;
6e961949
CY
1500 unsigned int end_offset;
1501 pgoff_t end;
75cd4e09 1502
e4544b63 1503 f2fs_down_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
edc6d01b 1504 filemap_invalidate_lock(mapping);
c7079853
CY
1505
1506 truncate_pagecache_range(inode,
1507 (loff_t)index << PAGE_SHIFT,
1508 ((loff_t)pg_end << PAGE_SHIFT) - 1);
1509
75cd4e09
CY
1510 f2fs_lock_op(sbi);
1511
6e961949 1512 set_new_dnode(&dn, inode, NULL, NULL, 0);
4d57b86d 1513 ret = f2fs_get_dnode_of_data(&dn, index, ALLOC_NODE);
75cd4e09
CY
1514 if (ret) {
1515 f2fs_unlock_op(sbi);
edc6d01b 1516 filemap_invalidate_unlock(mapping);
e4544b63 1517 f2fs_up_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
75cd4e09
CY
1518 goto out;
1519 }
1520
6e961949
CY
1521 end_offset = ADDRS_PER_PAGE(dn.node_page, inode);
1522 end = min(pg_end, end_offset - dn.ofs_in_node + index);
1523
1524 ret = f2fs_do_zero_range(&dn, index, end);
75cd4e09 1525 f2fs_put_dnode(&dn);
c7079853 1526
75cd4e09 1527 f2fs_unlock_op(sbi);
edc6d01b 1528 filemap_invalidate_unlock(mapping);
e4544b63 1529 f2fs_up_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
9434fcde
CY
1530
1531 f2fs_balance_fs(sbi, dn.node_changed);
1532
6e961949
CY
1533 if (ret)
1534 goto out;
75cd4e09 1535
6e961949 1536 index = end;
75cd4e09 1537 new_size = max_t(loff_t, new_size,
6e961949 1538 (loff_t)index << PAGE_SHIFT);
75cd4e09
CY
1539 }
1540
1541 if (off_end) {
6394328a
CY
1542 ret = fill_zero(inode, pg_end, 0, off_end);
1543 if (ret)
1544 goto out;
1545
75cd4e09
CY
1546 new_size = max_t(loff_t, new_size, offset + len);
1547 }
1548 }
1549
1550out:
17cd07ae
CY
1551 if (new_size > i_size_read(inode)) {
1552 if (mode & FALLOC_FL_KEEP_SIZE)
1553 file_set_keep_isize(inode);
1554 else
1555 f2fs_i_size_write(inode, new_size);
1556 }
75cd4e09
CY
1557 return ret;
1558}
1559
f62185d0
CY
1560static int f2fs_insert_range(struct inode *inode, loff_t offset, loff_t len)
1561{
1562 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
edc6d01b 1563 struct address_space *mapping = inode->i_mapping;
0a2aa8fb 1564 pgoff_t nr, pg_start, pg_end, delta, idx;
f62185d0 1565 loff_t new_size;
6e2c64ad 1566 int ret = 0;
f62185d0 1567
f62185d0 1568 new_size = i_size_read(inode) + len;
46e82fb1
KM
1569 ret = inode_newsize_ok(inode, new_size);
1570 if (ret)
1571 return ret;
f62185d0
CY
1572
1573 if (offset >= i_size_read(inode))
1574 return -EINVAL;
1575
1576 /* insert range should be aligned to block size of f2fs. */
1577 if (offset & (F2FS_BLKSIZE - 1) || len & (F2FS_BLKSIZE - 1))
1578 return -EINVAL;
1579
b9d777b8
JK
1580 ret = f2fs_convert_inline_inode(inode);
1581 if (ret)
1582 return ret;
97a7b2c2 1583
2c4db1a6 1584 f2fs_balance_fs(sbi, true);
2a340760 1585
edc6d01b 1586 filemap_invalidate_lock(mapping);
c42d28ce 1587 ret = f2fs_truncate_blocks(inode, i_size_read(inode), true);
edc6d01b 1588 filemap_invalidate_unlock(mapping);
f62185d0 1589 if (ret)
6f8d4455 1590 return ret;
f62185d0
CY
1591
1592 /* write out all dirty pages from offset */
edc6d01b 1593 ret = filemap_write_and_wait_range(mapping, offset, LLONG_MAX);
f62185d0 1594 if (ret)
6f8d4455 1595 return ret;
f62185d0 1596
09cbfeaf
KS
1597 pg_start = offset >> PAGE_SHIFT;
1598 pg_end = (offset + len) >> PAGE_SHIFT;
f62185d0 1599 delta = pg_end - pg_start;
f91108b8 1600 idx = DIV_ROUND_UP(i_size_read(inode), PAGE_SIZE);
0a2aa8fb 1601
6f8d4455 1602 /* avoid gc operation during block exchange */
e4544b63 1603 f2fs_down_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
edc6d01b 1604 filemap_invalidate_lock(mapping);
6f8d4455
JK
1605 truncate_pagecache(inode, offset);
1606
0a2aa8fb
JK
1607 while (!ret && idx > pg_start) {
1608 nr = idx - pg_start;
1609 if (nr > delta)
1610 nr = delta;
1611 idx -= nr;
f62185d0 1612
f62185d0 1613 f2fs_lock_op(sbi);
5f281fab
JK
1614 f2fs_drop_extent_tree(inode);
1615
0a2aa8fb
JK
1616 ret = __exchange_data_block(inode, inode, idx,
1617 idx + delta, nr, false);
f62185d0
CY
1618 f2fs_unlock_op(sbi);
1619 }
edc6d01b 1620 filemap_invalidate_unlock(mapping);
e4544b63 1621 f2fs_up_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
f62185d0 1622
6e2c64ad 1623 /* write out all moved pages, if possible */
edc6d01b
JK
1624 filemap_invalidate_lock(mapping);
1625 filemap_write_and_wait_range(mapping, offset, LLONG_MAX);
6e2c64ad 1626 truncate_pagecache(inode, offset);
edc6d01b 1627 filemap_invalidate_unlock(mapping);
6e2c64ad
JK
1628
1629 if (!ret)
fc9581c8 1630 f2fs_i_size_write(inode, new_size);
f62185d0
CY
1631 return ret;
1632}
1633
fbfa2cc5
JK
1634static int expand_inode_data(struct inode *inode, loff_t offset,
1635 loff_t len, int mode)
1636{
4081363f 1637 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
d5097be5 1638 struct f2fs_map_blocks map = { .m_next_pgofs = NULL,
f9d6d059
CY
1639 .m_next_extent = NULL, .m_seg_type = NO_CHECK_TYPE,
1640 .m_may_create = true };
88f2cfc5 1641 pgoff_t pg_start, pg_end;
fbfa2cc5 1642 loff_t new_size = i_size_read(inode);
e12dd7bd 1643 loff_t off_end;
88f2cfc5 1644 block_t expanded = 0;
a7de6086 1645 int err;
fbfa2cc5 1646
a7de6086
JK
1647 err = inode_newsize_ok(inode, (len + offset));
1648 if (err)
1649 return err;
fbfa2cc5 1650
a7de6086
JK
1651 err = f2fs_convert_inline_inode(inode);
1652 if (err)
1653 return err;
9e09fc85 1654
2c4db1a6 1655 f2fs_balance_fs(sbi, true);
2a340760 1656
88f2cfc5 1657 pg_start = ((unsigned long long)offset) >> PAGE_SHIFT;
e12dd7bd 1658 pg_end = ((unsigned long long)offset + len) >> PAGE_SHIFT;
09cbfeaf 1659 off_end = (offset + len) & (PAGE_SIZE - 1);
fbfa2cc5 1660
88f2cfc5
CY
1661 map.m_lblk = pg_start;
1662 map.m_len = pg_end - pg_start;
e12dd7bd
JK
1663 if (off_end)
1664 map.m_len++;
ead43275 1665
f5a53edc
JK
1666 if (!map.m_len)
1667 return 0;
1668
1669 if (f2fs_is_pinned_file(inode)) {
e1175f02
CY
1670 block_t sec_blks = BLKS_PER_SEC(sbi);
1671 block_t sec_len = roundup(map.m_len, sec_blks);
f5a53edc 1672
e1175f02 1673 map.m_len = sec_blks;
f5a53edc
JK
1674next_alloc:
1675 if (has_not_enough_free_secs(sbi, 0,
1676 GET_SEC_FROM_SEG(sbi, overprovision_segments(sbi)))) {
e4544b63 1677 f2fs_down_write(&sbi->gc_lock);
7dede886 1678 err = f2fs_gc(sbi, true, false, false, NULL_SEGNO);
f5a53edc
JK
1679 if (err && err != -ENODATA && err != -EAGAIN)
1680 goto out_err;
1681 }
1682
e4544b63 1683 f2fs_down_write(&sbi->pin_sem);
fd612648
DJ
1684
1685 f2fs_lock_op(sbi);
509f1010 1686 f2fs_allocate_new_section(sbi, CURSEG_COLD_DATA_PINNED, false);
fd612648
DJ
1687 f2fs_unlock_op(sbi);
1688
d0b9e42a 1689 map.m_seg_type = CURSEG_COLD_DATA_PINNED;
f5a53edc 1690 err = f2fs_map_blocks(inode, &map, 1, F2FS_GET_BLOCK_PRE_DIO);
d4dd19ec 1691 file_dont_truncate(inode);
d0b9e42a 1692
e4544b63 1693 f2fs_up_write(&sbi->pin_sem);
cad3836f 1694
88f2cfc5 1695 expanded += map.m_len;
e1175f02 1696 sec_len -= map.m_len;
f5a53edc 1697 map.m_lblk += map.m_len;
e1175f02 1698 if (!err && sec_len)
f5a53edc
JK
1699 goto next_alloc;
1700
88f2cfc5 1701 map.m_len = expanded;
f5a53edc
JK
1702 } else {
1703 err = f2fs_map_blocks(inode, &map, 1, F2FS_GET_BLOCK_PRE_AIO);
88f2cfc5 1704 expanded = map.m_len;
f5a53edc
JK
1705 }
1706out_err:
a7de6086 1707 if (err) {
e12dd7bd 1708 pgoff_t last_off;
fbfa2cc5 1709
88f2cfc5 1710 if (!expanded)
a7de6086 1711 return err;
98397ff3 1712
88f2cfc5 1713 last_off = pg_start + expanded - 1;
e12dd7bd
JK
1714
1715 /* update new size to the failed position */
1061fd48 1716 new_size = (last_off == pg_end) ? offset + len :
e12dd7bd
JK
1717 (loff_t)(last_off + 1) << PAGE_SHIFT;
1718 } else {
1719 new_size = ((loff_t)pg_end << PAGE_SHIFT) + off_end;
fbfa2cc5
JK
1720 }
1721
e8ed90a6
CY
1722 if (new_size > i_size_read(inode)) {
1723 if (mode & FALLOC_FL_KEEP_SIZE)
1724 file_set_keep_isize(inode);
1725 else
1726 f2fs_i_size_write(inode, new_size);
1727 }
fbfa2cc5 1728
a7de6086 1729 return err;
fbfa2cc5
JK
1730}
1731
1732static long f2fs_fallocate(struct file *file, int mode,
1733 loff_t offset, loff_t len)
1734{
6131ffaa 1735 struct inode *inode = file_inode(file);
587c0a42 1736 long ret = 0;
fbfa2cc5 1737
1f227a3e
JK
1738 if (unlikely(f2fs_cp_error(F2FS_I_SB(inode))))
1739 return -EIO;
00e09c0b
CY
1740 if (!f2fs_is_checkpoint_ready(F2FS_I_SB(inode)))
1741 return -ENOSPC;
4c8ff709
CY
1742 if (!f2fs_is_compress_backend_ready(inode))
1743 return -EOPNOTSUPP;
1f227a3e 1744
c998012b
CY
1745 /* f2fs only support ->fallocate for regular file */
1746 if (!S_ISREG(inode->i_mode))
1747 return -EINVAL;
1748
62230e0d 1749 if (IS_ENCRYPTED(inode) &&
f62185d0 1750 (mode & (FALLOC_FL_COLLAPSE_RANGE | FALLOC_FL_INSERT_RANGE)))
fcc85a4d
JK
1751 return -EOPNOTSUPP;
1752
5fed0be8
JK
1753 /*
1754 * Pinned file should not support partial trucation since the block
1755 * can be used by applications.
1756 */
1757 if ((f2fs_compressed_file(inode) || f2fs_is_pinned_file(inode)) &&
4c8ff709
CY
1758 (mode & (FALLOC_FL_PUNCH_HOLE | FALLOC_FL_COLLAPSE_RANGE |
1759 FALLOC_FL_ZERO_RANGE | FALLOC_FL_INSERT_RANGE)))
1760 return -EOPNOTSUPP;
1761
b4ace337 1762 if (mode & ~(FALLOC_FL_KEEP_SIZE | FALLOC_FL_PUNCH_HOLE |
f62185d0
CY
1763 FALLOC_FL_COLLAPSE_RANGE | FALLOC_FL_ZERO_RANGE |
1764 FALLOC_FL_INSERT_RANGE))
fbfa2cc5
JK
1765 return -EOPNOTSUPP;
1766
5955102c 1767 inode_lock(inode);
3375f696 1768
587c0a42
TY
1769 if (mode & FALLOC_FL_PUNCH_HOLE) {
1770 if (offset >= inode->i_size)
1771 goto out;
1772
a66c7b2f 1773 ret = punch_hole(inode, offset, len);
b4ace337
CY
1774 } else if (mode & FALLOC_FL_COLLAPSE_RANGE) {
1775 ret = f2fs_collapse_range(inode, offset, len);
75cd4e09
CY
1776 } else if (mode & FALLOC_FL_ZERO_RANGE) {
1777 ret = f2fs_zero_range(inode, offset, len, mode);
f62185d0
CY
1778 } else if (mode & FALLOC_FL_INSERT_RANGE) {
1779 ret = f2fs_insert_range(inode, offset, len);
b4ace337 1780 } else {
fbfa2cc5 1781 ret = expand_inode_data(inode, offset, len, mode);
b4ace337 1782 }
fbfa2cc5 1783
3af60a49 1784 if (!ret) {
078cd827 1785 inode->i_mtime = inode->i_ctime = current_time(inode);
7c45729a 1786 f2fs_mark_inode_dirty_sync(inode, false);
d0239e1b 1787 f2fs_update_time(F2FS_I_SB(inode), REQ_TIME);
3af60a49 1788 }
3375f696 1789
587c0a42 1790out:
5955102c 1791 inode_unlock(inode);
3375f696 1792
c01e2853 1793 trace_f2fs_fallocate(inode, mode, offset, len, ret);
fbfa2cc5
JK
1794 return ret;
1795}
1796
1e84371f
JK
1797static int f2fs_release_file(struct inode *inode, struct file *filp)
1798{
de5307e4
JK
1799 /*
1800 * f2fs_relase_file is called at every close calls. So we should
1801 * not drop any inmemory pages by close called by other process.
1802 */
1803 if (!(filp->f_mode & FMODE_WRITE) ||
1804 atomic_read(&inode->i_writecount) != 1)
1805 return 0;
1806
1e84371f
JK
1807 /* some remained atomic pages should discarded */
1808 if (f2fs_is_atomic_file(inode))
4d57b86d 1809 f2fs_drop_inmem_pages(inode);
1e84371f 1810 if (f2fs_is_volatile_file(inode)) {
91942321 1811 set_inode_flag(inode, FI_DROP_CACHE);
1e84371f 1812 filemap_fdatawrite(inode->i_mapping);
91942321 1813 clear_inode_flag(inode, FI_DROP_CACHE);
dfa74280
CY
1814 clear_inode_flag(inode, FI_VOLATILE_FILE);
1815 stat_dec_volatile_write(inode);
1e84371f
JK
1816 }
1817 return 0;
1818}
1819
7a10f017 1820static int f2fs_file_flush(struct file *file, fl_owner_t id)
fbfa2cc5 1821{
7a10f017
JK
1822 struct inode *inode = file_inode(file);
1823
1824 /*
1825 * If the process doing a transaction is crashed, we should do
1826 * roll-back. Otherwise, other reader/write can see corrupted database
1827 * until all the writers close its file. Since this should be done
1828 * before dropping file lock, it needs to do in ->flush.
1829 */
1830 if (f2fs_is_atomic_file(inode) &&
1831 F2FS_I(inode)->inmem_task == current)
4d57b86d 1832 f2fs_drop_inmem_pages(inode);
7a10f017 1833 return 0;
fbfa2cc5
JK
1834}
1835
36098557 1836static int f2fs_setflags_common(struct inode *inode, u32 iflags, u32 mask)
2c1d0305
CY
1837{
1838 struct f2fs_inode_info *fi = F2FS_I(inode);
99eabb91
JK
1839 u32 masked_flags = fi->i_flags & mask;
1840
a7531039
JK
1841 /* mask can be shrunk by flags_valid selector */
1842 iflags &= mask;
2c1d0305
CY
1843
1844 /* Is it quota file? Do not allow user to mess with it */
1845 if (IS_NOQUOTA(inode))
1846 return -EPERM;
1847
99eabb91 1848 if ((iflags ^ masked_flags) & F2FS_CASEFOLD_FL) {
2c2eb7a3
DR
1849 if (!f2fs_sb_has_casefold(F2FS_I_SB(inode)))
1850 return -EOPNOTSUPP;
1851 if (!f2fs_empty_dir(inode))
1852 return -ENOTEMPTY;
1853 }
1854
4c8ff709
CY
1855 if (iflags & (F2FS_COMPR_FL | F2FS_NOCOMP_FL)) {
1856 if (!f2fs_sb_has_compression(F2FS_I_SB(inode)))
1857 return -EOPNOTSUPP;
1858 if ((iflags & F2FS_COMPR_FL) && (iflags & F2FS_NOCOMP_FL))
1859 return -EINVAL;
1860 }
1861
99eabb91 1862 if ((iflags ^ masked_flags) & F2FS_COMPR_FL) {
aa576970 1863 if (masked_flags & F2FS_COMPR_FL) {
78134d03 1864 if (!f2fs_disable_compressed_file(inode))
2536ac68
CY
1865 return -EINVAL;
1866 }
4c8ff709
CY
1867 if (iflags & F2FS_NOCOMP_FL)
1868 return -EINVAL;
1869 if (iflags & F2FS_COMPR_FL) {
4c8ff709
CY
1870 if (!f2fs_may_compress(inode))
1871 return -EINVAL;
519a5a2f
CY
1872 if (S_ISREG(inode->i_mode) && inode->i_size)
1873 return -EINVAL;
4c8ff709
CY
1874
1875 set_compress_context(inode);
1876 }
1877 }
99eabb91
JK
1878 if ((iflags ^ masked_flags) & F2FS_NOCOMP_FL) {
1879 if (masked_flags & F2FS_COMPR_FL)
4c8ff709
CY
1880 return -EINVAL;
1881 }
1882
d5e5efa2 1883 fi->i_flags = iflags | (fi->i_flags & ~mask);
4c8ff709
CY
1884 f2fs_bug_on(F2FS_I_SB(inode), (fi->i_flags & F2FS_COMPR_FL) &&
1885 (fi->i_flags & F2FS_NOCOMP_FL));
2c1d0305 1886
59c84408 1887 if (fi->i_flags & F2FS_PROJINHERIT_FL)
2c1d0305
CY
1888 set_inode_flag(inode, FI_PROJ_INHERIT);
1889 else
1890 clear_inode_flag(inode, FI_PROJ_INHERIT);
1891
1892 inode->i_ctime = current_time(inode);
1893 f2fs_set_inode_flags(inode);
b32e0190 1894 f2fs_mark_inode_dirty_sync(inode, true);
2c1d0305
CY
1895 return 0;
1896}
1897
9b1bb01c 1898/* FS_IOC_[GS]ETFLAGS and FS_IOC_FS[GS]ETXATTR support */
36098557
EB
1899
1900/*
1901 * To make a new on-disk f2fs i_flag gettable via FS_IOC_GETFLAGS, add an entry
1902 * for it to f2fs_fsflags_map[], and add its FS_*_FL equivalent to
1903 * F2FS_GETTABLE_FS_FL. To also make it settable via FS_IOC_SETFLAGS, also add
1904 * its FS_*_FL equivalent to F2FS_SETTABLE_FS_FL.
9b1bb01c
MS
1905 *
1906 * Translating flags to fsx_flags value used by FS_IOC_FSGETXATTR and
1907 * FS_IOC_FSSETXATTR is done by the VFS.
36098557
EB
1908 */
1909
1910static const struct {
1911 u32 iflag;
1912 u32 fsflag;
1913} f2fs_fsflags_map[] = {
4c8ff709 1914 { F2FS_COMPR_FL, FS_COMPR_FL },
36098557
EB
1915 { F2FS_SYNC_FL, FS_SYNC_FL },
1916 { F2FS_IMMUTABLE_FL, FS_IMMUTABLE_FL },
1917 { F2FS_APPEND_FL, FS_APPEND_FL },
1918 { F2FS_NODUMP_FL, FS_NODUMP_FL },
1919 { F2FS_NOATIME_FL, FS_NOATIME_FL },
4c8ff709 1920 { F2FS_NOCOMP_FL, FS_NOCOMP_FL },
36098557
EB
1921 { F2FS_INDEX_FL, FS_INDEX_FL },
1922 { F2FS_DIRSYNC_FL, FS_DIRSYNC_FL },
1923 { F2FS_PROJINHERIT_FL, FS_PROJINHERIT_FL },
2c2eb7a3 1924 { F2FS_CASEFOLD_FL, FS_CASEFOLD_FL },
36098557
EB
1925};
1926
/* Mask of the FS_*_FL bits that are gettable via FS_IOC_GETFLAGS. */
#define F2FS_GETTABLE_FS_FL						\
	(FS_COMPR_FL | FS_SYNC_FL | FS_IMMUTABLE_FL | FS_APPEND_FL |	\
	 FS_NODUMP_FL | FS_NOATIME_FL | FS_NOCOMP_FL | FS_INDEX_FL |	\
	 FS_DIRSYNC_FL | FS_PROJINHERIT_FL | FS_ENCRYPT_FL |		\
	 FS_INLINE_DATA_FL | FS_NOCOW_FL | FS_VERITY_FL |		\
	 FS_CASEFOLD_FL)
36098557
EB
1943
/* Mask of the FS_*_FL bits that are settable via FS_IOC_SETFLAGS. */
#define F2FS_SETTABLE_FS_FL						\
	(FS_COMPR_FL | FS_SYNC_FL | FS_IMMUTABLE_FL | FS_APPEND_FL |	\
	 FS_NODUMP_FL | FS_NOATIME_FL | FS_NOCOMP_FL | FS_DIRSYNC_FL |	\
	 FS_PROJINHERIT_FL | FS_CASEFOLD_FL)
36098557
EB
1955
1956/* Convert f2fs on-disk i_flags to FS_IOC_{GET,SET}FLAGS flags */
1957static inline u32 f2fs_iflags_to_fsflags(u32 iflags)
1958{
1959 u32 fsflags = 0;
1960 int i;
1961
1962 for (i = 0; i < ARRAY_SIZE(f2fs_fsflags_map); i++)
1963 if (iflags & f2fs_fsflags_map[i].iflag)
1964 fsflags |= f2fs_fsflags_map[i].fsflag;
1965
1966 return fsflags;
1967}
1968
1969/* Convert FS_IOC_{GET,SET}FLAGS flags to f2fs on-disk i_flags */
1970static inline u32 f2fs_fsflags_to_iflags(u32 fsflags)
1971{
1972 u32 iflags = 0;
1973 int i;
1974
1975 for (i = 0; i < ARRAY_SIZE(f2fs_fsflags_map); i++)
1976 if (fsflags & f2fs_fsflags_map[i].fsflag)
1977 iflags |= f2fs_fsflags_map[i].iflag;
1978
1979 return iflags;
1980}
1981
d49f3e89
CY
1982static int f2fs_ioc_getversion(struct file *filp, unsigned long arg)
1983{
1984 struct inode *inode = file_inode(filp);
1985
1986 return put_user(inode->i_generation, (int __user *)arg);
1987}
1988
88b88a66
JK
1989static int f2fs_ioc_start_atomic_write(struct file *filp)
1990{
1991 struct inode *inode = file_inode(filp);
984fc4e7 1992 struct user_namespace *mnt_userns = file_mnt_user_ns(filp);
743b620c
JK
1993 struct f2fs_inode_info *fi = F2FS_I(inode);
1994 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
f4c9c743 1995 int ret;
88b88a66 1996
984fc4e7 1997 if (!inode_owner_or_capable(mnt_userns, inode))
88b88a66
JK
1998 return -EACCES;
1999
e811898c
JK
2000 if (!S_ISREG(inode->i_mode))
2001 return -EINVAL;
2002
038d0698
CY
2003 if (filp->f_flags & O_DIRECT)
2004 return -EINVAL;
2005
7fb17fe4
CY
2006 ret = mnt_want_write_file(filp);
2007 if (ret)
2008 return ret;
2009
0fac558b
CY
2010 inode_lock(inode);
2011
9b56adcf
FC
2012 if (!f2fs_disable_compressed_file(inode)) {
2013 ret = -EINVAL;
2014 goto out;
2015 }
4c8ff709 2016
455e3a58
JK
2017 if (f2fs_is_atomic_file(inode)) {
2018 if (is_inode_flag_set(inode, FI_ATOMIC_REVOKE_REQUEST))
2019 ret = -EINVAL;
7fb17fe4 2020 goto out;
455e3a58 2021 }
88b88a66 2022
f4c9c743
CY
2023 ret = f2fs_convert_inline_inode(inode);
2024 if (ret)
7fb17fe4 2025 goto out;
88b88a66 2026
e4544b63 2027 f2fs_down_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
6f8d4455 2028
31867b23
JK
2029 /*
2030 * Should wait end_io to count F2FS_WB_CP_DATA correctly by
2031 * f2fs_is_atomic_file.
2032 */
2033 if (get_dirty_pages(inode))
dcbb4c10
JP
2034 f2fs_warn(F2FS_I_SB(inode), "Unexpected flush for atomic writes: ino=%lu, npages=%u",
2035 inode->i_ino, get_dirty_pages(inode));
c27753d6 2036 ret = filemap_write_and_wait_range(inode->i_mapping, 0, LLONG_MAX);
6f8d4455 2037 if (ret) {
e4544b63 2038 f2fs_up_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
684ca7e5 2039 goto out;
6f8d4455 2040 }
31867b23 2041
743b620c
JK
2042 spin_lock(&sbi->inode_lock[ATOMIC_FILE]);
2043 if (list_empty(&fi->inmem_ilist))
2044 list_add_tail(&fi->inmem_ilist, &sbi->inode_list[ATOMIC_FILE]);
677017d1 2045 sbi->atomic_files++;
743b620c
JK
2046 spin_unlock(&sbi->inode_lock[ATOMIC_FILE]);
2047
2048 /* add inode in inmem_list first and set atomic_file */
054afda9 2049 set_inode_flag(inode, FI_ATOMIC_FILE);
2ef79ecb 2050 clear_inode_flag(inode, FI_ATOMIC_REVOKE_REQUEST);
e4544b63 2051 f2fs_up_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
684ca7e5 2052
6f8d4455 2053 f2fs_update_time(F2FS_I_SB(inode), REQ_TIME);
7a10f017 2054 F2FS_I(inode)->inmem_task = current;
26a28a0c 2055 stat_update_max_atomic_write(inode);
684ca7e5 2056out:
0fac558b 2057 inode_unlock(inode);
7fb17fe4 2058 mnt_drop_write_file(filp);
c27753d6 2059 return ret;
88b88a66
JK
2060}
2061
2062static int f2fs_ioc_commit_atomic_write(struct file *filp)
2063{
2064 struct inode *inode = file_inode(filp);
984fc4e7 2065 struct user_namespace *mnt_userns = file_mnt_user_ns(filp);
88b88a66
JK
2066 int ret;
2067
984fc4e7 2068 if (!inode_owner_or_capable(mnt_userns, inode))
88b88a66
JK
2069 return -EACCES;
2070
2071 ret = mnt_want_write_file(filp);
2072 if (ret)
2073 return ret;
2074
6f8d4455 2075 f2fs_balance_fs(F2FS_I_SB(inode), true);
0fac558b 2076
6f8d4455 2077 inode_lock(inode);
1dc0f899 2078
b169c3c5
CY
2079 if (f2fs_is_volatile_file(inode)) {
2080 ret = -EINVAL;
7fb17fe4 2081 goto err_out;
b169c3c5 2082 }
7fb17fe4 2083
6282adbf 2084 if (f2fs_is_atomic_file(inode)) {
4d57b86d 2085 ret = f2fs_commit_inmem_pages(inode);
5fe45743 2086 if (ret)
edb27dee 2087 goto err_out;
5fe45743 2088
26a28a0c 2089 ret = f2fs_do_sync_file(filp, 0, LLONG_MAX, 0, true);
743b620c
JK
2090 if (!ret)
2091 f2fs_drop_inmem_pages(inode);
26a28a0c 2092 } else {
774e1b78 2093 ret = f2fs_do_sync_file(filp, 0, LLONG_MAX, 1, false);
6282adbf 2094 }
edb27dee 2095err_out:
2ef79ecb
CY
2096 if (is_inode_flag_set(inode, FI_ATOMIC_REVOKE_REQUEST)) {
2097 clear_inode_flag(inode, FI_ATOMIC_REVOKE_REQUEST);
2098 ret = -EINVAL;
2099 }
0fac558b 2100 inode_unlock(inode);
88b88a66
JK
2101 mnt_drop_write_file(filp);
2102 return ret;
2103}
2104
02a1335f
JK
2105static int f2fs_ioc_start_volatile_write(struct file *filp)
2106{
2107 struct inode *inode = file_inode(filp);
984fc4e7 2108 struct user_namespace *mnt_userns = file_mnt_user_ns(filp);
f4c9c743 2109 int ret;
02a1335f 2110
984fc4e7 2111 if (!inode_owner_or_capable(mnt_userns, inode))
02a1335f
JK
2112 return -EACCES;
2113
8ff0971f
CY
2114 if (!S_ISREG(inode->i_mode))
2115 return -EINVAL;
2116
7fb17fe4
CY
2117 ret = mnt_want_write_file(filp);
2118 if (ret)
2119 return ret;
2120
0fac558b
CY
2121 inode_lock(inode);
2122
1e84371f 2123 if (f2fs_is_volatile_file(inode))
7fb17fe4 2124 goto out;
1e84371f 2125
f4c9c743
CY
2126 ret = f2fs_convert_inline_inode(inode);
2127 if (ret)
7fb17fe4 2128 goto out;
b3d208f9 2129
648d50ba
CY
2130 stat_inc_volatile_write(inode);
2131 stat_update_max_volatile_write(inode);
2132
91942321 2133 set_inode_flag(inode, FI_VOLATILE_FILE);
d0239e1b 2134 f2fs_update_time(F2FS_I_SB(inode), REQ_TIME);
7fb17fe4 2135out:
0fac558b 2136 inode_unlock(inode);
7fb17fe4
CY
2137 mnt_drop_write_file(filp);
2138 return ret;
02a1335f
JK
2139}
2140
1e84371f
JK
2141static int f2fs_ioc_release_volatile_write(struct file *filp)
2142{
2143 struct inode *inode = file_inode(filp);
984fc4e7 2144 struct user_namespace *mnt_userns = file_mnt_user_ns(filp);
7fb17fe4 2145 int ret;
1e84371f 2146
984fc4e7 2147 if (!inode_owner_or_capable(mnt_userns, inode))
1e84371f
JK
2148 return -EACCES;
2149
7fb17fe4
CY
2150 ret = mnt_want_write_file(filp);
2151 if (ret)
2152 return ret;
2153
0fac558b
CY
2154 inode_lock(inode);
2155
1e84371f 2156 if (!f2fs_is_volatile_file(inode))
7fb17fe4 2157 goto out;
1e84371f 2158
7fb17fe4
CY
2159 if (!f2fs_is_first_block_written(inode)) {
2160 ret = truncate_partial_data_page(inode, 0, true);
2161 goto out;
2162 }
3c6c2beb 2163
7fb17fe4
CY
2164 ret = punch_hole(inode, 0, F2FS_BLKSIZE);
2165out:
0fac558b 2166 inode_unlock(inode);
7fb17fe4
CY
2167 mnt_drop_write_file(filp);
2168 return ret;
1e84371f
JK
2169}
2170
2171static int f2fs_ioc_abort_volatile_write(struct file *filp)
2172{
2173 struct inode *inode = file_inode(filp);
984fc4e7 2174 struct user_namespace *mnt_userns = file_mnt_user_ns(filp);
1e84371f
JK
2175 int ret;
2176
984fc4e7 2177 if (!inode_owner_or_capable(mnt_userns, inode))
1e84371f
JK
2178 return -EACCES;
2179
2180 ret = mnt_want_write_file(filp);
2181 if (ret)
2182 return ret;
2183
0fac558b
CY
2184 inode_lock(inode);
2185
26dc3d44 2186 if (f2fs_is_atomic_file(inode))
4d57b86d 2187 f2fs_drop_inmem_pages(inode);
732d5648 2188 if (f2fs_is_volatile_file(inode)) {
91942321 2189 clear_inode_flag(inode, FI_VOLATILE_FILE);
648d50ba 2190 stat_dec_volatile_write(inode);
608514de 2191 ret = f2fs_do_sync_file(filp, 0, LLONG_MAX, 0, true);
732d5648 2192 }
de6a8ec9 2193
455e3a58
JK
2194 clear_inode_flag(inode, FI_ATOMIC_REVOKE_REQUEST);
2195
0fac558b
CY
2196 inode_unlock(inode);
2197
1e84371f 2198 mnt_drop_write_file(filp);
d0239e1b 2199 f2fs_update_time(F2FS_I_SB(inode), REQ_TIME);
1e84371f
JK
2200 return ret;
2201}
2202
1abff93d
JK
2203static int f2fs_ioc_shutdown(struct file *filp, unsigned long arg)
2204{
2205 struct inode *inode = file_inode(filp);
2206 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
2207 struct super_block *sb = sbi->sb;
2208 __u32 in;
2a96d8ad 2209 int ret = 0;
1abff93d
JK
2210
2211 if (!capable(CAP_SYS_ADMIN))
2212 return -EPERM;
2213
2214 if (get_user(in, (__u32 __user *)arg))
2215 return -EFAULT;
2216
60b2b4ee
ST
2217 if (in != F2FS_GOING_DOWN_FULLSYNC) {
2218 ret = mnt_want_write_file(filp);
8626441f
CY
2219 if (ret) {
2220 if (ret == -EROFS) {
2221 ret = 0;
2222 f2fs_stop_checkpoint(sbi, false);
2223 set_sbi_flag(sbi, SBI_IS_SHUTDOWN);
2224 trace_f2fs_shutdown(sbi, in, ret);
2225 }
60b2b4ee 2226 return ret;
8626441f 2227 }
60b2b4ee 2228 }
7fb17fe4 2229
1abff93d
JK
2230 switch (in) {
2231 case F2FS_GOING_DOWN_FULLSYNC:
040f04bd
CH
2232 ret = freeze_bdev(sb->s_bdev);
2233 if (ret)
d027c484 2234 goto out;
040f04bd
CH
2235 f2fs_stop_checkpoint(sbi, false);
2236 set_sbi_flag(sbi, SBI_IS_SHUTDOWN);
2237 thaw_bdev(sb->s_bdev);
1abff93d
JK
2238 break;
2239 case F2FS_GOING_DOWN_METASYNC:
2240 /* do checkpoint only */
d027c484
CY
2241 ret = f2fs_sync_fs(sb, 1);
2242 if (ret)
2243 goto out;
38f91ca8 2244 f2fs_stop_checkpoint(sbi, false);
83a3bfdb 2245 set_sbi_flag(sbi, SBI_IS_SHUTDOWN);
1abff93d
JK
2246 break;
2247 case F2FS_GOING_DOWN_NOSYNC:
38f91ca8 2248 f2fs_stop_checkpoint(sbi, false);
83a3bfdb 2249 set_sbi_flag(sbi, SBI_IS_SHUTDOWN);
1abff93d 2250 break;
c912a829 2251 case F2FS_GOING_DOWN_METAFLUSH:
4d57b86d 2252 f2fs_sync_meta_pages(sbi, META, LONG_MAX, FS_META_IO);
38f91ca8 2253 f2fs_stop_checkpoint(sbi, false);
83a3bfdb 2254 set_sbi_flag(sbi, SBI_IS_SHUTDOWN);
c912a829 2255 break;
0cd6d9b0
JK
2256 case F2FS_GOING_DOWN_NEED_FSCK:
2257 set_sbi_flag(sbi, SBI_NEED_FSCK);
db610a64
JK
2258 set_sbi_flag(sbi, SBI_CP_DISABLED_QUICK);
2259 set_sbi_flag(sbi, SBI_IS_DIRTY);
0cd6d9b0
JK
2260 /* do checkpoint only */
2261 ret = f2fs_sync_fs(sb, 1);
db610a64 2262 goto out;
1abff93d 2263 default:
7fb17fe4
CY
2264 ret = -EINVAL;
2265 goto out;
1abff93d 2266 }
7950e9ac 2267
4d57b86d
CY
2268 f2fs_stop_gc_thread(sbi);
2269 f2fs_stop_discard_thread(sbi);
7950e9ac 2270
4d57b86d 2271 f2fs_drop_discard_cmd(sbi);
7950e9ac
CY
2272 clear_opt(sbi, DISCARD);
2273
d0239e1b 2274 f2fs_update_time(sbi, REQ_TIME);
7fb17fe4 2275out:
60b2b4ee
ST
2276 if (in != F2FS_GOING_DOWN_FULLSYNC)
2277 mnt_drop_write_file(filp);
559e87c4
CY
2278
2279 trace_f2fs_shutdown(sbi, in, ret);
2280
7fb17fe4 2281 return ret;
1abff93d
JK
2282}
2283
52656e6c
JK
2284static int f2fs_ioc_fitrim(struct file *filp, unsigned long arg)
2285{
2286 struct inode *inode = file_inode(filp);
2287 struct super_block *sb = inode->i_sb;
2288 struct request_queue *q = bdev_get_queue(sb->s_bdev);
2289 struct fstrim_range range;
2290 int ret;
4b2fecc8 2291
52656e6c
JK
2292 if (!capable(CAP_SYS_ADMIN))
2293 return -EPERM;
4b2fecc8 2294
7d20c8ab 2295 if (!f2fs_hw_support_discard(F2FS_SB(sb)))
52656e6c 2296 return -EOPNOTSUPP;
4b2fecc8 2297
52656e6c
JK
2298 if (copy_from_user(&range, (struct fstrim_range __user *)arg,
2299 sizeof(range)))
2300 return -EFAULT;
4b2fecc8 2301
7fb17fe4
CY
2302 ret = mnt_want_write_file(filp);
2303 if (ret)
2304 return ret;
2305
52656e6c
JK
2306 range.minlen = max((unsigned int)range.minlen,
2307 q->limits.discard_granularity);
2308 ret = f2fs_trim_fs(F2FS_SB(sb), &range);
7fb17fe4 2309 mnt_drop_write_file(filp);
52656e6c
JK
2310 if (ret < 0)
2311 return ret;
4b2fecc8 2312
52656e6c
JK
2313 if (copy_to_user((struct fstrim_range __user *)arg, &range,
2314 sizeof(range)))
2315 return -EFAULT;
d0239e1b 2316 f2fs_update_time(F2FS_I_SB(inode), REQ_TIME);
52656e6c
JK
2317 return 0;
2318}
2319
f424f664
JK
2320static bool uuid_is_nonzero(__u8 u[16])
2321{
2322 int i;
2323
2324 for (i = 0; i < 16; i++)
2325 if (u[i])
2326 return true;
2327 return false;
2328}
2329
2330static int f2fs_ioc_set_encryption_policy(struct file *filp, unsigned long arg)
2331{
f424f664
JK
2332 struct inode *inode = file_inode(filp);
2333
7beb01f7 2334 if (!f2fs_sb_has_encrypt(F2FS_I_SB(inode)))
ead710b7
CY
2335 return -EOPNOTSUPP;
2336
d0239e1b 2337 f2fs_update_time(F2FS_I_SB(inode), REQ_TIME);
7fb17fe4 2338
db717d8e 2339 return fscrypt_ioctl_set_policy(filp, (const void __user *)arg);
f424f664
JK
2340}
2341
2342static int f2fs_ioc_get_encryption_policy(struct file *filp, unsigned long arg)
2343{
7beb01f7 2344 if (!f2fs_sb_has_encrypt(F2FS_I_SB(file_inode(filp))))
ead710b7 2345 return -EOPNOTSUPP;
db717d8e 2346 return fscrypt_ioctl_get_policy(filp, (void __user *)arg);
f424f664
JK
2347}
2348
2349static int f2fs_ioc_get_encryption_pwsalt(struct file *filp, unsigned long arg)
2350{
2351 struct inode *inode = file_inode(filp);
2352 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
2353 int err;
2354
7beb01f7 2355 if (!f2fs_sb_has_encrypt(sbi))
f424f664
JK
2356 return -EOPNOTSUPP;
2357
f424f664
JK
2358 err = mnt_want_write_file(filp);
2359 if (err)
2360 return err;
2361
e4544b63 2362 f2fs_down_write(&sbi->sb_lock);
d0d3f1b3
CY
2363
2364 if (uuid_is_nonzero(sbi->raw_super->encrypt_pw_salt))
2365 goto got_it;
2366
f424f664
JK
2367 /* update superblock with uuid */
2368 generate_random_uuid(sbi->raw_super->encrypt_pw_salt);
2369
c5bda1c8 2370 err = f2fs_commit_super(sbi, false);
f424f664
JK
2371 if (err) {
2372 /* undo new data */
2373 memset(sbi->raw_super->encrypt_pw_salt, 0, 16);
d0d3f1b3 2374 goto out_err;
f424f664
JK
2375 }
2376got_it:
2377 if (copy_to_user((__u8 __user *)arg, sbi->raw_super->encrypt_pw_salt,
2378 16))
d0d3f1b3
CY
2379 err = -EFAULT;
2380out_err:
e4544b63 2381 f2fs_up_write(&sbi->sb_lock);
d0d3f1b3
CY
2382 mnt_drop_write_file(filp);
2383 return err;
f424f664
JK
2384}
2385
8ce589c7
EB
2386static int f2fs_ioc_get_encryption_policy_ex(struct file *filp,
2387 unsigned long arg)
2388{
2389 if (!f2fs_sb_has_encrypt(F2FS_I_SB(file_inode(filp))))
2390 return -EOPNOTSUPP;
2391
2392 return fscrypt_ioctl_get_policy_ex(filp, (void __user *)arg);
2393}
2394
2395static int f2fs_ioc_add_encryption_key(struct file *filp, unsigned long arg)
2396{
2397 if (!f2fs_sb_has_encrypt(F2FS_I_SB(file_inode(filp))))
2398 return -EOPNOTSUPP;
2399
2400 return fscrypt_ioctl_add_key(filp, (void __user *)arg);
2401}
2402
2403static int f2fs_ioc_remove_encryption_key(struct file *filp, unsigned long arg)
2404{
2405 if (!f2fs_sb_has_encrypt(F2FS_I_SB(file_inode(filp))))
2406 return -EOPNOTSUPP;
2407
2408 return fscrypt_ioctl_remove_key(filp, (void __user *)arg);
2409}
2410
2411static int f2fs_ioc_remove_encryption_key_all_users(struct file *filp,
2412 unsigned long arg)
2413{
2414 if (!f2fs_sb_has_encrypt(F2FS_I_SB(file_inode(filp))))
2415 return -EOPNOTSUPP;
2416
2417 return fscrypt_ioctl_remove_key_all_users(filp, (void __user *)arg);
2418}
2419
2420static int f2fs_ioc_get_encryption_key_status(struct file *filp,
2421 unsigned long arg)
2422{
2423 if (!f2fs_sb_has_encrypt(F2FS_I_SB(file_inode(filp))))
2424 return -EOPNOTSUPP;
2425
2426 return fscrypt_ioctl_get_key_status(filp, (void __user *)arg);
2427}
2428
ee446e1a
EB
2429static int f2fs_ioc_get_encryption_nonce(struct file *filp, unsigned long arg)
2430{
2431 if (!f2fs_sb_has_encrypt(F2FS_I_SB(file_inode(filp))))
2432 return -EOPNOTSUPP;
2433
2434 return fscrypt_ioctl_get_nonce(filp, (void __user *)arg);
2435}
2436
c1c1b583
CY
2437static int f2fs_ioc_gc(struct file *filp, unsigned long arg)
2438{
2439 struct inode *inode = file_inode(filp);
2440 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
d530d4d8 2441 __u32 sync;
7fb17fe4 2442 int ret;
c1c1b583
CY
2443
2444 if (!capable(CAP_SYS_ADMIN))
2445 return -EPERM;
2446
d530d4d8 2447 if (get_user(sync, (__u32 __user *)arg))
c1c1b583
CY
2448 return -EFAULT;
2449
d530d4d8
CY
2450 if (f2fs_readonly(sbi->sb))
2451 return -EROFS;
c1c1b583 2452
7fb17fe4
CY
2453 ret = mnt_want_write_file(filp);
2454 if (ret)
2455 return ret;
2456
d530d4d8 2457 if (!sync) {
e4544b63 2458 if (!f2fs_down_write_trylock(&sbi->gc_lock)) {
7fb17fe4
CY
2459 ret = -EBUSY;
2460 goto out;
2461 }
d530d4d8 2462 } else {
e4544b63 2463 f2fs_down_write(&sbi->gc_lock);
c1c1b583
CY
2464 }
2465
7dede886 2466 ret = f2fs_gc(sbi, sync, true, false, NULL_SEGNO);
7fb17fe4
CY
2467out:
2468 mnt_drop_write_file(filp);
2469 return ret;
c1c1b583
CY
2470}
2471
34178b1b 2472static int __f2fs_ioc_gc_range(struct file *filp, struct f2fs_gc_range *range)
34dc77ad 2473{
34178b1b 2474 struct f2fs_sb_info *sbi = F2FS_I_SB(file_inode(filp));
34dc77ad
JK
2475 u64 end;
2476 int ret;
2477
2478 if (!capable(CAP_SYS_ADMIN))
2479 return -EPERM;
34dc77ad
JK
2480 if (f2fs_readonly(sbi->sb))
2481 return -EROFS;
2482
34178b1b
CY
2483 end = range->start + range->len;
2484 if (end < range->start || range->start < MAIN_BLKADDR(sbi) ||
fbbf7799 2485 end >= MAX_BLKADDR(sbi))
b82f6e34 2486 return -EINVAL;
b82f6e34 2487
34dc77ad
JK
2488 ret = mnt_want_write_file(filp);
2489 if (ret)
2490 return ret;
2491
34dc77ad 2492do_more:
34178b1b 2493 if (!range->sync) {
e4544b63 2494 if (!f2fs_down_write_trylock(&sbi->gc_lock)) {
34dc77ad
JK
2495 ret = -EBUSY;
2496 goto out;
2497 }
2498 } else {
e4544b63 2499 f2fs_down_write(&sbi->gc_lock);
34dc77ad
JK
2500 }
2501
7dede886
CY
2502 ret = f2fs_gc(sbi, range->sync, true, false,
2503 GET_SEGNO(sbi, range->start));
97767500
QZ
2504 if (ret) {
2505 if (ret == -EBUSY)
2506 ret = -EAGAIN;
2507 goto out;
2508 }
34178b1b
CY
2509 range->start += BLKS_PER_SEC(sbi);
2510 if (range->start <= end)
34dc77ad
JK
2511 goto do_more;
2512out:
2513 mnt_drop_write_file(filp);
2514 return ret;
2515}
2516
34178b1b
CY
2517static int f2fs_ioc_gc_range(struct file *filp, unsigned long arg)
2518{
2519 struct f2fs_gc_range range;
2520
2521 if (copy_from_user(&range, (struct f2fs_gc_range __user *)arg,
2522 sizeof(range)))
2523 return -EFAULT;
2524 return __f2fs_ioc_gc_range(filp, &range);
2525}
2526
059c0648 2527static int f2fs_ioc_write_checkpoint(struct file *filp, unsigned long arg)
456b88e4
CY
2528{
2529 struct inode *inode = file_inode(filp);
2530 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
7fb17fe4 2531 int ret;
456b88e4
CY
2532
2533 if (!capable(CAP_SYS_ADMIN))
2534 return -EPERM;
2535
2536 if (f2fs_readonly(sbi->sb))
2537 return -EROFS;
2538
4354994f 2539 if (unlikely(is_sbi_flag_set(sbi, SBI_CP_DISABLED))) {
dcbb4c10 2540 f2fs_info(sbi, "Skipping Checkpoint. Checkpoints currently disabled.");
4354994f
DR
2541 return -EINVAL;
2542 }
2543
7fb17fe4
CY
2544 ret = mnt_want_write_file(filp);
2545 if (ret)
2546 return ret;
2547
2548 ret = f2fs_sync_fs(sbi->sb, 1);
2549
2550 mnt_drop_write_file(filp);
2551 return ret;
456b88e4
CY
2552}
2553
d323d005
CY
2554static int f2fs_defragment_range(struct f2fs_sb_info *sbi,
2555 struct file *filp,
2556 struct f2fs_defragment *range)
2557{
2558 struct inode *inode = file_inode(filp);
f3d98e74 2559 struct f2fs_map_blocks map = { .m_next_extent = NULL,
5f029c04 2560 .m_seg_type = NO_CHECK_TYPE,
f4f0b677 2561 .m_may_create = false };
1061fd48 2562 struct extent_info ei = {0, 0, 0};
f3d98e74 2563 pgoff_t pg_start, pg_end, next_pgofs;
3519e3f9 2564 unsigned int blk_per_seg = sbi->blocks_per_seg;
d323d005 2565 unsigned int total = 0, sec_num;
d323d005
CY
2566 block_t blk_end = 0;
2567 bool fragmented = false;
2568 int err;
2569
09cbfeaf
KS
2570 pg_start = range->start >> PAGE_SHIFT;
2571 pg_end = (range->start + range->len) >> PAGE_SHIFT;
d323d005 2572
2c4db1a6 2573 f2fs_balance_fs(sbi, true);
d323d005 2574
5955102c 2575 inode_lock(inode);
d323d005 2576
1018a546
CY
2577 /* if in-place-update policy is enabled, don't waste time here */
2578 set_inode_flag(inode, FI_OPU_WRITE);
2579 if (f2fs_should_update_inplace(inode, NULL)) {
2580 err = -EINVAL;
2581 goto out;
2582 }
2583
d323d005
CY
2584 /* writeback all dirty pages in the range */
2585 err = filemap_write_and_wait_range(inode->i_mapping, range->start,
d8fe4f0e 2586 range->start + range->len - 1);
d323d005
CY
2587 if (err)
2588 goto out;
2589
2590 /*
2591 * lookup mapping info in extent cache, skip defragmenting if physical
2592 * block addresses are continuous.
2593 */
2594 if (f2fs_lookup_extent_cache(inode, pg_start, &ei)) {
2595 if (ei.fofs + ei.len >= pg_end)
2596 goto out;
2597 }
2598
2599 map.m_lblk = pg_start;
f3d98e74 2600 map.m_next_pgofs = &next_pgofs;
d323d005
CY
2601
2602 /*
2603 * lookup mapping info in dnode page cache, skip defragmenting if all
2604 * physical block addresses are continuous even if there are hole(s)
2605 * in logical blocks.
2606 */
2607 while (map.m_lblk < pg_end) {
a1c1e9b7 2608 map.m_len = pg_end - map.m_lblk;
f2220c7f 2609 err = f2fs_map_blocks(inode, &map, 0, F2FS_GET_BLOCK_DEFAULT);
d323d005
CY
2610 if (err)
2611 goto out;
2612
2613 if (!(map.m_flags & F2FS_MAP_FLAGS)) {
f3d98e74 2614 map.m_lblk = next_pgofs;
d323d005
CY
2615 continue;
2616 }
2617
25a912e5 2618 if (blk_end && blk_end != map.m_pblk)
d323d005 2619 fragmented = true;
25a912e5
CY
2620
2621 /* record total count of block that we're going to move */
2622 total += map.m_len;
2623
d323d005
CY
2624 blk_end = map.m_pblk + map.m_len;
2625
2626 map.m_lblk += map.m_len;
d323d005
CY
2627 }
2628
d3a1a0e1
CY
2629 if (!fragmented) {
2630 total = 0;
d323d005 2631 goto out;
d3a1a0e1 2632 }
d323d005 2633
f91108b8 2634 sec_num = DIV_ROUND_UP(total, BLKS_PER_SEC(sbi));
d323d005
CY
2635
2636 /*
2637 * make sure there are enough free section for LFS allocation, this can
2638 * avoid defragment running in SSR mode when free section are allocated
2639 * intensively
2640 */
7f3037a5 2641 if (has_not_enough_free_secs(sbi, 0, sec_num)) {
d323d005
CY
2642 err = -EAGAIN;
2643 goto out;
2644 }
2645
25a912e5
CY
2646 map.m_lblk = pg_start;
2647 map.m_len = pg_end - pg_start;
2648 total = 0;
2649
d323d005
CY
2650 while (map.m_lblk < pg_end) {
2651 pgoff_t idx;
2652 int cnt = 0;
2653
2654do_map:
a1c1e9b7 2655 map.m_len = pg_end - map.m_lblk;
f2220c7f 2656 err = f2fs_map_blocks(inode, &map, 0, F2FS_GET_BLOCK_DEFAULT);
d323d005
CY
2657 if (err)
2658 goto clear_out;
2659
2660 if (!(map.m_flags & F2FS_MAP_FLAGS)) {
f3d98e74 2661 map.m_lblk = next_pgofs;
d3a1a0e1 2662 goto check;
d323d005
CY
2663 }
2664
1018a546 2665 set_inode_flag(inode, FI_SKIP_WRITES);
d323d005
CY
2666
2667 idx = map.m_lblk;
2668 while (idx < map.m_lblk + map.m_len && cnt < blk_per_seg) {
2669 struct page *page;
2670
4d57b86d 2671 page = f2fs_get_lock_data_page(inode, idx, true);
d323d005
CY
2672 if (IS_ERR(page)) {
2673 err = PTR_ERR(page);
2674 goto clear_out;
2675 }
2676
2677 set_page_dirty(page);
2678 f2fs_put_page(page, 1);
2679
2680 idx++;
2681 cnt++;
2682 total++;
2683 }
2684
2685 map.m_lblk = idx;
d3a1a0e1
CY
2686check:
2687 if (map.m_lblk < pg_end && cnt < blk_per_seg)
d323d005
CY
2688 goto do_map;
2689
1018a546 2690 clear_inode_flag(inode, FI_SKIP_WRITES);
d323d005
CY
2691
2692 err = filemap_fdatawrite(inode->i_mapping);
2693 if (err)
2694 goto out;
2695 }
2696clear_out:
1018a546 2697 clear_inode_flag(inode, FI_SKIP_WRITES);
d323d005 2698out:
1018a546 2699 clear_inode_flag(inode, FI_OPU_WRITE);
5955102c 2700 inode_unlock(inode);
d323d005 2701 if (!err)
09cbfeaf 2702 range->len = (u64)total << PAGE_SHIFT;
d323d005
CY
2703 return err;
2704}
2705
2706static int f2fs_ioc_defragment(struct file *filp, unsigned long arg)
2707{
2708 struct inode *inode = file_inode(filp);
2709 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
2710 struct f2fs_defragment range;
2711 int err;
2712
2713 if (!capable(CAP_SYS_ADMIN))
2714 return -EPERM;
2715
7eab0c0d 2716 if (!S_ISREG(inode->i_mode) || f2fs_is_atomic_file(inode))
d323d005
CY
2717 return -EINVAL;
2718
d7563861
KM
2719 if (f2fs_readonly(sbi->sb))
2720 return -EROFS;
d323d005
CY
2721
2722 if (copy_from_user(&range, (struct f2fs_defragment __user *)arg,
d7563861
KM
2723 sizeof(range)))
2724 return -EFAULT;
d323d005
CY
2725
2726 /* verify alignment of offset & size */
d7563861
KM
2727 if (range.start & (F2FS_BLKSIZE - 1) || range.len & (F2FS_BLKSIZE - 1))
2728 return -EINVAL;
d323d005 2729
1941d7bc 2730 if (unlikely((range.start + range.len) >> PAGE_SHIFT >
6d1451bf 2731 max_file_blocks(inode)))
d7563861
KM
2732 return -EINVAL;
2733
2734 err = mnt_want_write_file(filp);
2735 if (err)
2736 return err;
1941d7bc 2737
d323d005 2738 err = f2fs_defragment_range(sbi, filp, &range);
d7563861
KM
2739 mnt_drop_write_file(filp);
2740
d0239e1b 2741 f2fs_update_time(sbi, REQ_TIME);
d323d005 2742 if (err < 0)
d7563861 2743 return err;
d323d005
CY
2744
2745 if (copy_to_user((struct f2fs_defragment __user *)arg, &range,
2746 sizeof(range)))
d7563861
KM
2747 return -EFAULT;
2748
2749 return 0;
d323d005
CY
2750}
2751
4dd6f977
JK
2752static int f2fs_move_file_range(struct file *file_in, loff_t pos_in,
2753 struct file *file_out, loff_t pos_out, size_t len)
2754{
2755 struct inode *src = file_inode(file_in);
2756 struct inode *dst = file_inode(file_out);
2757 struct f2fs_sb_info *sbi = F2FS_I_SB(src);
2758 size_t olen = len, dst_max_i_size = 0;
2759 size_t dst_osize;
2760 int ret;
2761
2762 if (file_in->f_path.mnt != file_out->f_path.mnt ||
2763 src->i_sb != dst->i_sb)
2764 return -EXDEV;
2765
2766 if (unlikely(f2fs_readonly(src->i_sb)))
2767 return -EROFS;
2768
fe8494bf
CY
2769 if (!S_ISREG(src->i_mode) || !S_ISREG(dst->i_mode))
2770 return -EINVAL;
4dd6f977 2771
62230e0d 2772 if (IS_ENCRYPTED(src) || IS_ENCRYPTED(dst))
4dd6f977
JK
2773 return -EOPNOTSUPP;
2774
aad1383c
DR
2775 if (pos_out < 0 || pos_in < 0)
2776 return -EINVAL;
2777
d95fd91c
FL
2778 if (src == dst) {
2779 if (pos_in == pos_out)
2780 return 0;
2781 if (pos_out > pos_in && pos_out < pos_in + len)
2782 return -EINVAL;
2783 }
2784
4dd6f977 2785 inode_lock(src);
20a3d61d 2786 if (src != dst) {
bb06664a
CY
2787 ret = -EBUSY;
2788 if (!inode_trylock(dst))
2789 goto out;
20a3d61d 2790 }
4dd6f977
JK
2791
2792 ret = -EINVAL;
2793 if (pos_in + len > src->i_size || pos_in + len < pos_in)
2794 goto out_unlock;
2795 if (len == 0)
2796 olen = len = src->i_size - pos_in;
2797 if (pos_in + len == src->i_size)
2798 len = ALIGN(src->i_size, F2FS_BLKSIZE) - pos_in;
2799 if (len == 0) {
2800 ret = 0;
2801 goto out_unlock;
2802 }
2803
2804 dst_osize = dst->i_size;
2805 if (pos_out + olen > dst->i_size)
2806 dst_max_i_size = pos_out + olen;
2807
2808 /* verify the end result is block aligned */
2809 if (!IS_ALIGNED(pos_in, F2FS_BLKSIZE) ||
2810 !IS_ALIGNED(pos_in + len, F2FS_BLKSIZE) ||
2811 !IS_ALIGNED(pos_out, F2FS_BLKSIZE))
2812 goto out_unlock;
2813
2814 ret = f2fs_convert_inline_inode(src);
2815 if (ret)
2816 goto out_unlock;
2817
2818 ret = f2fs_convert_inline_inode(dst);
2819 if (ret)
2820 goto out_unlock;
2821
2822 /* write out all dirty pages from offset */
2823 ret = filemap_write_and_wait_range(src->i_mapping,
2824 pos_in, pos_in + len);
2825 if (ret)
2826 goto out_unlock;
2827
2828 ret = filemap_write_and_wait_range(dst->i_mapping,
2829 pos_out, pos_out + len);
2830 if (ret)
2831 goto out_unlock;
2832
2833 f2fs_balance_fs(sbi, true);
6f8d4455 2834
e4544b63 2835 f2fs_down_write(&F2FS_I(src)->i_gc_rwsem[WRITE]);
6f8d4455
JK
2836 if (src != dst) {
2837 ret = -EBUSY;
e4544b63 2838 if (!f2fs_down_write_trylock(&F2FS_I(dst)->i_gc_rwsem[WRITE]))
6f8d4455
JK
2839 goto out_src;
2840 }
2841
4dd6f977 2842 f2fs_lock_op(sbi);
61e4da11
FL
2843 ret = __exchange_data_block(src, dst, pos_in >> F2FS_BLKSIZE_BITS,
2844 pos_out >> F2FS_BLKSIZE_BITS,
2845 len >> F2FS_BLKSIZE_BITS, false);
4dd6f977
JK
2846
2847 if (!ret) {
2848 if (dst_max_i_size)
2849 f2fs_i_size_write(dst, dst_max_i_size);
2850 else if (dst_osize != dst->i_size)
2851 f2fs_i_size_write(dst, dst_osize);
2852 }
2853 f2fs_unlock_op(sbi);
6f8d4455
JK
2854
2855 if (src != dst)
e4544b63 2856 f2fs_up_write(&F2FS_I(dst)->i_gc_rwsem[WRITE]);
6f8d4455 2857out_src:
e4544b63 2858 f2fs_up_write(&F2FS_I(src)->i_gc_rwsem[WRITE]);
6f8d4455
JK
2859out_unlock:
2860 if (src != dst)
4dd6f977 2861 inode_unlock(dst);
20a3d61d 2862out:
4dd6f977
JK
2863 inode_unlock(src);
2864 return ret;
2865}
2866
34178b1b
CY
2867static int __f2fs_ioc_move_range(struct file *filp,
2868 struct f2fs_move_range *range)
4dd6f977 2869{
4dd6f977
JK
2870 struct fd dst;
2871 int err;
2872
2873 if (!(filp->f_mode & FMODE_READ) ||
2874 !(filp->f_mode & FMODE_WRITE))
2875 return -EBADF;
2876
34178b1b 2877 dst = fdget(range->dst_fd);
4dd6f977
JK
2878 if (!dst.file)
2879 return -EBADF;
2880
2881 if (!(dst.file->f_mode & FMODE_WRITE)) {
2882 err = -EBADF;
2883 goto err_out;
2884 }
2885
2886 err = mnt_want_write_file(filp);
2887 if (err)
2888 goto err_out;
2889
34178b1b
CY
2890 err = f2fs_move_file_range(filp, range->pos_in, dst.file,
2891 range->pos_out, range->len);
4dd6f977
JK
2892
2893 mnt_drop_write_file(filp);
4dd6f977
JK
2894err_out:
2895 fdput(dst);
2896 return err;
2897}
2898
34178b1b
CY
2899static int f2fs_ioc_move_range(struct file *filp, unsigned long arg)
2900{
2901 struct f2fs_move_range range;
2902
2903 if (copy_from_user(&range, (struct f2fs_move_range __user *)arg,
2904 sizeof(range)))
2905 return -EFAULT;
2906 return __f2fs_ioc_move_range(filp, &range);
2907}
2908
e066b83c
JK
2909static int f2fs_ioc_flush_device(struct file *filp, unsigned long arg)
2910{
2911 struct inode *inode = file_inode(filp);
2912 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
2913 struct sit_info *sm = SIT_I(sbi);
2914 unsigned int start_segno = 0, end_segno = 0;
2915 unsigned int dev_start_segno = 0, dev_end_segno = 0;
2916 struct f2fs_flush_device range;
2917 int ret;
2918
2919 if (!capable(CAP_SYS_ADMIN))
2920 return -EPERM;
2921
2922 if (f2fs_readonly(sbi->sb))
2923 return -EROFS;
2924
4354994f
DR
2925 if (unlikely(is_sbi_flag_set(sbi, SBI_CP_DISABLED)))
2926 return -EINVAL;
2927
e066b83c
JK
2928 if (copy_from_user(&range, (struct f2fs_flush_device __user *)arg,
2929 sizeof(range)))
2930 return -EFAULT;
2931
0916878d 2932 if (!f2fs_is_multi_device(sbi) || sbi->s_ndevs - 1 <= range.dev_num ||
2c70c5e3 2933 __is_large_section(sbi)) {
dcbb4c10
JP
2934 f2fs_warn(sbi, "Can't flush %u in %d for segs_per_sec %u != 1",
2935 range.dev_num, sbi->s_ndevs, sbi->segs_per_sec);
e066b83c
JK
2936 return -EINVAL;
2937 }
2938
2939 ret = mnt_want_write_file(filp);
2940 if (ret)
2941 return ret;
2942
2943 if (range.dev_num != 0)
2944 dev_start_segno = GET_SEGNO(sbi, FDEV(range.dev_num).start_blk);
2945 dev_end_segno = GET_SEGNO(sbi, FDEV(range.dev_num).end_blk);
2946
2947 start_segno = sm->last_victim[FLUSH_DEVICE];
2948 if (start_segno < dev_start_segno || start_segno >= dev_end_segno)
2949 start_segno = dev_start_segno;
2950 end_segno = min(start_segno + range.segments, dev_end_segno);
2951
2952 while (start_segno < end_segno) {
e4544b63 2953 if (!f2fs_down_write_trylock(&sbi->gc_lock)) {
e066b83c
JK
2954 ret = -EBUSY;
2955 goto out;
2956 }
2957 sm->last_victim[GC_CB] = end_segno + 1;
2958 sm->last_victim[GC_GREEDY] = end_segno + 1;
2959 sm->last_victim[ALLOC_NEXT] = end_segno + 1;
7dede886 2960 ret = f2fs_gc(sbi, true, true, true, start_segno);
e066b83c
JK
2961 if (ret == -EAGAIN)
2962 ret = 0;
2963 else if (ret < 0)
2964 break;
2965 start_segno++;
2966 }
2967out:
2968 mnt_drop_write_file(filp);
2969 return ret;
2970}
2971
e65ef207
JK
2972static int f2fs_ioc_get_features(struct file *filp, unsigned long arg)
2973{
2974 struct inode *inode = file_inode(filp);
2975 u32 sb_feature = le32_to_cpu(F2FS_I_SB(inode)->raw_super->feature);
2976
2977 /* Must validate to set it with SQLite behavior in Android. */
2978 sb_feature |= F2FS_FEATURE_ATOMIC_WRITE;
2979
2980 return put_user(sb_feature, (u32 __user *)arg);
2981}
e066b83c 2982
2c1d0305 2983#ifdef CONFIG_QUOTA
78130819
CY
2984int f2fs_transfer_project_quota(struct inode *inode, kprojid_t kprojid)
2985{
2986 struct dquot *transfer_to[MAXQUOTAS] = {};
2987 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
2988 struct super_block *sb = sbi->sb;
2989 int err = 0;
2990
2991 transfer_to[PRJQUOTA] = dqget(sb, make_kqid_projid(kprojid));
2992 if (!IS_ERR(transfer_to[PRJQUOTA])) {
2993 err = __dquot_transfer(inode, transfer_to);
2994 if (err)
2995 set_sbi_flag(sbi, SBI_QUOTA_NEED_REPAIR);
2996 dqput(transfer_to[PRJQUOTA]);
2997 }
2998 return err;
2999}
3000
9b1bb01c 3001static int f2fs_ioc_setproject(struct inode *inode, __u32 projid)
2c1d0305 3002{
2c1d0305
CY
3003 struct f2fs_inode_info *fi = F2FS_I(inode);
3004 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
d13732cc 3005 struct f2fs_inode *ri = NULL;
2c1d0305
CY
3006 kprojid_t kprojid;
3007 int err;
3008
7beb01f7 3009 if (!f2fs_sb_has_project_quota(sbi)) {
2c1d0305
CY
3010 if (projid != F2FS_DEF_PROJID)
3011 return -EOPNOTSUPP;
3012 else
3013 return 0;
3014 }
3015
3016 if (!f2fs_has_extra_attr(inode))
3017 return -EOPNOTSUPP;
3018
3019 kprojid = make_kprojid(&init_user_ns, (projid_t)projid);
3020
3021 if (projid_eq(kprojid, F2FS_I(inode)->i_projid))
3022 return 0;
3023
2c1d0305 3024 err = -EPERM;
2c1d0305
CY
3025 /* Is it quota file? Do not allow user to mess with it */
3026 if (IS_NOQUOTA(inode))
c8e92757 3027 return err;
2c1d0305 3028
d13732cc
JY
3029 if (!F2FS_FITS_IN_INODE(ri, fi->i_extra_isize, i_projid))
3030 return -EOVERFLOW;
2c1d0305 3031
10a26878 3032 err = f2fs_dquot_initialize(inode);
c22aecd7 3033 if (err)
c8e92757 3034 return err;
2c1d0305 3035
78130819
CY
3036 f2fs_lock_op(sbi);
3037 err = f2fs_transfer_project_quota(inode, kprojid);
3038 if (err)
3039 goto out_unlock;
2c1d0305
CY
3040
3041 F2FS_I(inode)->i_projid = kprojid;
3042 inode->i_ctime = current_time(inode);
2c1d0305 3043 f2fs_mark_inode_dirty_sync(inode, true);
78130819
CY
3044out_unlock:
3045 f2fs_unlock_op(sbi);
2c1d0305
CY
3046 return err;
3047}
3048#else
78130819
CY
3049int f2fs_transfer_project_quota(struct inode *inode, kprojid_t kprojid)
3050{
3051 return 0;
3052}
3053
9b1bb01c 3054static int f2fs_ioc_setproject(struct inode *inode, __u32 projid)
2c1d0305
CY
3055{
3056 if (projid != F2FS_DEF_PROJID)
3057 return -EOPNOTSUPP;
3058 return 0;
3059}
3060#endif
3061
9b1bb01c 3062int f2fs_fileattr_get(struct dentry *dentry, struct fileattr *fa)
2c1d0305 3063{
9b1bb01c 3064 struct inode *inode = d_inode(dentry);
2c1d0305 3065 struct f2fs_inode_info *fi = F2FS_I(inode);
9b1bb01c 3066 u32 fsflags = f2fs_iflags_to_fsflags(fi->i_flags);
2c1d0305 3067
9b1bb01c
MS
3068 if (IS_ENCRYPTED(inode))
3069 fsflags |= FS_ENCRYPT_FL;
3070 if (IS_VERITY(inode))
3071 fsflags |= FS_VERITY_FL;
3072 if (f2fs_has_inline_data(inode) || f2fs_has_inline_dentry(inode))
3073 fsflags |= FS_INLINE_DATA_FL;
3074 if (is_inode_flag_set(inode, FI_PIN_FILE))
3075 fsflags |= FS_NOCOW_FL;
3076
3077 fileattr_fill_flags(fa, fsflags & F2FS_GETTABLE_FS_FL);
2c1d0305 3078
7beb01f7 3079 if (f2fs_sb_has_project_quota(F2FS_I_SB(inode)))
6fc93c4e 3080 fa->fsx_projid = from_kprojid(&init_user_ns, fi->i_projid);
2c1d0305 3081
c8e92757
WS
3082 return 0;
3083}
3084
9b1bb01c
MS
3085int f2fs_fileattr_set(struct user_namespace *mnt_userns,
3086 struct dentry *dentry, struct fileattr *fa)
2c1d0305 3087{
9b1bb01c
MS
3088 struct inode *inode = d_inode(dentry);
3089 u32 fsflags = fa->flags, mask = F2FS_SETTABLE_FS_FL;
36098557 3090 u32 iflags;
2c1d0305
CY
3091 int err;
3092
9b1bb01c
MS
3093 if (unlikely(f2fs_cp_error(F2FS_I_SB(inode))))
3094 return -EIO;
3095 if (!f2fs_is_checkpoint_ready(F2FS_I_SB(inode)))
3096 return -ENOSPC;
3097 if (fsflags & ~F2FS_GETTABLE_FS_FL)
2c1d0305 3098 return -EOPNOTSUPP;
9b1bb01c
MS
3099 fsflags &= F2FS_SETTABLE_FS_FL;
3100 if (!fa->flags_valid)
3101 mask &= FS_COMMON_FL;
2c1d0305 3102
9b1bb01c 3103 iflags = f2fs_fsflags_to_iflags(fsflags);
36098557 3104 if (f2fs_mask_flags(inode->i_mode, iflags) != iflags)
2c1d0305
CY
3105 return -EOPNOTSUPP;
3106
9b1bb01c
MS
3107 err = f2fs_setflags_common(inode, iflags, f2fs_fsflags_to_iflags(mask));
3108 if (!err)
3109 err = f2fs_ioc_setproject(inode, fa->fsx_projid);
2c1d0305 3110
c8e92757 3111 return err;
2c1d0305 3112}
e066b83c 3113
1ad71a27
JK
3114int f2fs_pin_file_control(struct inode *inode, bool inc)
3115{
3116 struct f2fs_inode_info *fi = F2FS_I(inode);
3117 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
3118
3119 /* Use i_gc_failures for normal file as a risk signal. */
3120 if (inc)
2ef79ecb
CY
3121 f2fs_i_gc_failures_write(inode,
3122 fi->i_gc_failures[GC_FAILURE_PIN] + 1);
1ad71a27 3123
2ef79ecb 3124 if (fi->i_gc_failures[GC_FAILURE_PIN] > sbi->gc_pin_file_threshold) {
dcbb4c10
JP
3125 f2fs_warn(sbi, "%s: Enable GC = ino %lx after %x GC trials",
3126 __func__, inode->i_ino,
3127 fi->i_gc_failures[GC_FAILURE_PIN]);
1ad71a27
JK
3128 clear_inode_flag(inode, FI_PIN_FILE);
3129 return -EAGAIN;
3130 }
3131 return 0;
3132}
3133
3134static int f2fs_ioc_set_pin_file(struct file *filp, unsigned long arg)
3135{
3136 struct inode *inode = file_inode(filp);
3137 __u32 pin;
3138 int ret = 0;
3139
1ad71a27
JK
3140 if (get_user(pin, (__u32 __user *)arg))
3141 return -EFAULT;
3142
3143 if (!S_ISREG(inode->i_mode))
3144 return -EINVAL;
3145
3146 if (f2fs_readonly(F2FS_I_SB(inode)->sb))
3147 return -EROFS;
3148
3149 ret = mnt_want_write_file(filp);
3150 if (ret)
3151 return ret;
3152
3153 inode_lock(inode);
3154
3155 if (!pin) {
3156 clear_inode_flag(inode, FI_PIN_FILE);
30933364 3157 f2fs_i_gc_failures_write(inode, 0);
1ad71a27
JK
3158 goto done;
3159 }
3160
19bdba52
JK
3161 if (f2fs_should_update_outplace(inode, NULL)) {
3162 ret = -EINVAL;
3163 goto out;
3164 }
3165
1ad71a27
JK
3166 if (f2fs_pin_file_control(inode, false)) {
3167 ret = -EAGAIN;
3168 goto out;
3169 }
4c8ff709 3170
1ad71a27
JK
3171 ret = f2fs_convert_inline_inode(inode);
3172 if (ret)
3173 goto out;
3174
78134d03 3175 if (!f2fs_disable_compressed_file(inode)) {
4c8ff709
CY
3176 ret = -EOPNOTSUPP;
3177 goto out;
3178 }
3179
1ad71a27 3180 set_inode_flag(inode, FI_PIN_FILE);
2ef79ecb 3181 ret = F2FS_I(inode)->i_gc_failures[GC_FAILURE_PIN];
1ad71a27
JK
3182done:
3183 f2fs_update_time(F2FS_I_SB(inode), REQ_TIME);
3184out:
3185 inode_unlock(inode);
3186 mnt_drop_write_file(filp);
3187 return ret;
3188}
3189
3190static int f2fs_ioc_get_pin_file(struct file *filp, unsigned long arg)
3191{
3192 struct inode *inode = file_inode(filp);
3193 __u32 pin = 0;
3194
3195 if (is_inode_flag_set(inode, FI_PIN_FILE))
2ef79ecb 3196 pin = F2FS_I(inode)->i_gc_failures[GC_FAILURE_PIN];
1ad71a27
JK
3197 return put_user(pin, (u32 __user *)arg);
3198}
3199
c4020b2d
CY
3200int f2fs_precache_extents(struct inode *inode)
3201{
3202 struct f2fs_inode_info *fi = F2FS_I(inode);
3203 struct f2fs_map_blocks map;
3204 pgoff_t m_next_extent;
3205 loff_t end;
3206 int err;
3207
3208 if (is_inode_flag_set(inode, FI_NO_EXTENT))
3209 return -EOPNOTSUPP;
3210
3211 map.m_lblk = 0;
3212 map.m_next_pgofs = NULL;
3213 map.m_next_extent = &m_next_extent;
3214 map.m_seg_type = NO_CHECK_TYPE;
f4f0b677 3215 map.m_may_create = false;
6d1451bf 3216 end = max_file_blocks(inode);
c4020b2d
CY
3217
3218 while (map.m_lblk < end) {
3219 map.m_len = end - map.m_lblk;
3220
e4544b63 3221 f2fs_down_write(&fi->i_gc_rwsem[WRITE]);
c4020b2d 3222 err = f2fs_map_blocks(inode, &map, 0, F2FS_GET_BLOCK_PRECACHE);
e4544b63 3223 f2fs_up_write(&fi->i_gc_rwsem[WRITE]);
c4020b2d
CY
3224 if (err)
3225 return err;
3226
3227 map.m_lblk = m_next_extent;
3228 }
3229
4f55dc2a 3230 return 0;
c4020b2d
CY
3231}
3232
/* ioctl entry point: precache the extents of the file's inode; @arg is unused. */
static int f2fs_ioc_precache_extents(struct file *filp, unsigned long arg)
{
	struct inode *inode = file_inode(filp);

	return f2fs_precache_extents(inode);
}
3237
04f0b2ea
QS
3238static int f2fs_ioc_resize_fs(struct file *filp, unsigned long arg)
3239{
3240 struct f2fs_sb_info *sbi = F2FS_I_SB(file_inode(filp));
3241 __u64 block_count;
04f0b2ea
QS
3242
3243 if (!capable(CAP_SYS_ADMIN))
3244 return -EPERM;
3245
3246 if (f2fs_readonly(sbi->sb))
3247 return -EROFS;
3248
3249 if (copy_from_user(&block_count, (void __user *)arg,
3250 sizeof(block_count)))
3251 return -EFAULT;
3252
b4b10061 3253 return f2fs_resize_fs(sbi, block_count);
04f0b2ea
QS
3254}
3255
95ae251f
EB
3256static int f2fs_ioc_enable_verity(struct file *filp, unsigned long arg)
3257{
3258 struct inode *inode = file_inode(filp);
3259
3260 f2fs_update_time(F2FS_I_SB(inode), REQ_TIME);
3261
3262 if (!f2fs_sb_has_verity(F2FS_I_SB(inode))) {
3263 f2fs_warn(F2FS_I_SB(inode),
833dcd35 3264 "Can't enable fs-verity on inode %lu: the verity feature is not enabled on this filesystem",
95ae251f
EB
3265 inode->i_ino);
3266 return -EOPNOTSUPP;
3267 }
3268
3269 return fsverity_ioctl_enable(filp, (const void __user *)arg);
3270}
3271
3272static int f2fs_ioc_measure_verity(struct file *filp, unsigned long arg)
3273{
3274 if (!f2fs_sb_has_verity(F2FS_I_SB(file_inode(filp))))
3275 return -EOPNOTSUPP;
3276
3277 return fsverity_ioctl_measure(filp, (void __user *)arg);
3278}
3279
e17fe657
EB
3280static int f2fs_ioc_read_verity_metadata(struct file *filp, unsigned long arg)
3281{
3282 if (!f2fs_sb_has_verity(F2FS_I_SB(file_inode(filp))))
3283 return -EOPNOTSUPP;
3284
3285 return fsverity_ioctl_read_metadata(filp, (const void __user *)arg);
3286}
3287
3357af8f 3288static int f2fs_ioc_getfslabel(struct file *filp, unsigned long arg)
4507847c
CY
3289{
3290 struct inode *inode = file_inode(filp);
3291 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
3292 char *vbuf;
3293 int count;
3294 int err = 0;
3295
3296 vbuf = f2fs_kzalloc(sbi, MAX_VOLUME_NAME, GFP_KERNEL);
3297 if (!vbuf)
3298 return -ENOMEM;
3299
e4544b63 3300 f2fs_down_read(&sbi->sb_lock);
4507847c
CY
3301 count = utf16s_to_utf8s(sbi->raw_super->volume_name,
3302 ARRAY_SIZE(sbi->raw_super->volume_name),
3303 UTF16_LITTLE_ENDIAN, vbuf, MAX_VOLUME_NAME);
e4544b63 3304 f2fs_up_read(&sbi->sb_lock);
4507847c
CY
3305
3306 if (copy_to_user((char __user *)arg, vbuf,
3307 min(FSLABEL_MAX, count)))
3308 err = -EFAULT;
3309
c8eb7024 3310 kfree(vbuf);
4507847c
CY
3311 return err;
3312}
3313
3357af8f 3314static int f2fs_ioc_setfslabel(struct file *filp, unsigned long arg)
4507847c
CY
3315{
3316 struct inode *inode = file_inode(filp);
3317 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
3318 char *vbuf;
3319 int err = 0;
3320
3321 if (!capable(CAP_SYS_ADMIN))
3322 return -EPERM;
3323
3324 vbuf = strndup_user((const char __user *)arg, FSLABEL_MAX);
3325 if (IS_ERR(vbuf))
3326 return PTR_ERR(vbuf);
3327
3328 err = mnt_want_write_file(filp);
3329 if (err)
3330 goto out;
3331
e4544b63 3332 f2fs_down_write(&sbi->sb_lock);
4507847c
CY
3333
3334 memset(sbi->raw_super->volume_name, 0,
3335 sizeof(sbi->raw_super->volume_name));
3336 utf8s_to_utf16s(vbuf, strlen(vbuf), UTF16_LITTLE_ENDIAN,
3337 sbi->raw_super->volume_name,
3338 ARRAY_SIZE(sbi->raw_super->volume_name));
3339
3340 err = f2fs_commit_super(sbi, false);
3341
e4544b63 3342 f2fs_up_write(&sbi->sb_lock);
4507847c
CY
3343
3344 mnt_drop_write_file(filp);
3345out:
3346 kfree(vbuf);
3347 return err;
3348}
3349
439dfb10
CY
3350static int f2fs_get_compress_blocks(struct file *filp, unsigned long arg)
3351{
3352 struct inode *inode = file_inode(filp);
3353 __u64 blocks;
3354
3355 if (!f2fs_sb_has_compression(F2FS_I_SB(inode)))
3356 return -EOPNOTSUPP;
3357
3358 if (!f2fs_compressed_file(inode))
3359 return -EINVAL;
3360
c2759eba 3361 blocks = atomic_read(&F2FS_I(inode)->i_compr_blocks);
439dfb10
CY
3362 return put_user(blocks, (u64 __user *)arg);
3363}
3364
ef8d563f
CY
3365static int release_compress_blocks(struct dnode_of_data *dn, pgoff_t count)
3366{
3367 struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode);
3368 unsigned int released_blocks = 0;
3369 int cluster_size = F2FS_I(dn->inode)->i_cluster_size;
3370 block_t blkaddr;
3371 int i;
3372
3373 for (i = 0; i < count; i++) {
3374 blkaddr = data_blkaddr(dn->inode, dn->node_page,
3375 dn->ofs_in_node + i);
3376
3377 if (!__is_valid_data_blkaddr(blkaddr))
3378 continue;
3379 if (unlikely(!f2fs_is_valid_blkaddr(sbi, blkaddr,
3380 DATA_GENERIC_ENHANCE)))
3381 return -EFSCORRUPTED;
3382 }
3383
3384 while (count) {
3385 int compr_blocks = 0;
3386
3387 for (i = 0; i < cluster_size; i++, dn->ofs_in_node++) {
3388 blkaddr = f2fs_data_blkaddr(dn);
3389
3390 if (i == 0) {
3391 if (blkaddr == COMPRESS_ADDR)
3392 continue;
3393 dn->ofs_in_node += cluster_size;
3394 goto next;
3395 }
3396
3397 if (__is_valid_data_blkaddr(blkaddr))
3398 compr_blocks++;
3399
3400 if (blkaddr != NEW_ADDR)
3401 continue;
3402
3403 dn->data_blkaddr = NULL_ADDR;
3404 f2fs_set_data_blkaddr(dn);
3405 }
3406
3407 f2fs_i_compr_blocks_update(dn->inode, compr_blocks, false);
3408 dec_valid_block_count(sbi, dn->inode,
3409 cluster_size - compr_blocks);
3410
3411 released_blocks += cluster_size - compr_blocks;
3412next:
3413 count -= cluster_size;
3414 }
3415
3416 return released_blocks;
3417}
3418
3419static int f2fs_release_compress_blocks(struct file *filp, unsigned long arg)
3420{
3421 struct inode *inode = file_inode(filp);
3422 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
3423 pgoff_t page_idx = 0, last_idx;
3424 unsigned int released_blocks = 0;
3425 int ret;
3426 int writecount;
3427
3428 if (!f2fs_sb_has_compression(F2FS_I_SB(inode)))
3429 return -EOPNOTSUPP;
3430
3431 if (!f2fs_compressed_file(inode))
3432 return -EINVAL;
3433
3434 if (f2fs_readonly(sbi->sb))
3435 return -EROFS;
3436
3437 ret = mnt_want_write_file(filp);
3438 if (ret)
3439 return ret;
3440
3441 f2fs_balance_fs(F2FS_I_SB(inode), true);
3442
3443 inode_lock(inode);
3444
3445 writecount = atomic_read(&inode->i_writecount);
8c8cf26a
DJ
3446 if ((filp->f_mode & FMODE_WRITE && writecount != 1) ||
3447 (!(filp->f_mode & FMODE_WRITE) && writecount)) {
ef8d563f
CY
3448 ret = -EBUSY;
3449 goto out;
3450 }
3451
c6140415 3452 if (is_inode_flag_set(inode, FI_COMPRESS_RELEASED)) {
ef8d563f
CY
3453 ret = -EINVAL;
3454 goto out;
3455 }
3456
3457 ret = filemap_write_and_wait_range(inode->i_mapping, 0, LLONG_MAX);
3458 if (ret)
3459 goto out;
3460
c6140415 3461 set_inode_flag(inode, FI_COMPRESS_RELEASED);
ef8d563f
CY
3462 inode->i_ctime = current_time(inode);
3463 f2fs_mark_inode_dirty_sync(inode, true);
3464
c2759eba 3465 if (!atomic_read(&F2FS_I(inode)->i_compr_blocks))
567c4bf5
DJ
3466 goto out;
3467
e4544b63 3468 f2fs_down_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
edc6d01b 3469 filemap_invalidate_lock(inode->i_mapping);
ef8d563f
CY
3470
3471 last_idx = DIV_ROUND_UP(i_size_read(inode), PAGE_SIZE);
3472
3473 while (page_idx < last_idx) {
3474 struct dnode_of_data dn;
3475 pgoff_t end_offset, count;
3476
3477 set_new_dnode(&dn, inode, NULL, NULL, 0);
3478 ret = f2fs_get_dnode_of_data(&dn, page_idx, LOOKUP_NODE);
3479 if (ret) {
3480 if (ret == -ENOENT) {
3481 page_idx = f2fs_get_next_page_offset(&dn,
3482 page_idx);
3483 ret = 0;
3484 continue;
3485 }
3486 break;
3487 }
3488
3489 end_offset = ADDRS_PER_PAGE(dn.node_page, inode);
3490 count = min(end_offset - dn.ofs_in_node, last_idx - page_idx);
4fec3fc0 3491 count = round_up(count, F2FS_I(inode)->i_cluster_size);
ef8d563f
CY
3492
3493 ret = release_compress_blocks(&dn, count);
3494
3495 f2fs_put_dnode(&dn);
3496
3497 if (ret < 0)
3498 break;
3499
3500 page_idx += count;
3501 released_blocks += ret;
3502 }
3503
edc6d01b 3504 filemap_invalidate_unlock(inode->i_mapping);
e4544b63 3505 f2fs_up_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
ef8d563f
CY
3506out:
3507 inode_unlock(inode);
3508
3509 mnt_drop_write_file(filp);
3510
3511 if (ret >= 0) {
3512 ret = put_user(released_blocks, (u64 __user *)arg);
c2759eba
DJ
3513 } else if (released_blocks &&
3514 atomic_read(&F2FS_I(inode)->i_compr_blocks)) {
ef8d563f
CY
3515 set_sbi_flag(sbi, SBI_NEED_FSCK);
3516 f2fs_warn(sbi, "%s: partial blocks were released i_ino=%lx "
c2759eba 3517 "iblocks=%llu, released=%u, compr_blocks=%u, "
ef8d563f
CY
3518 "run fsck to fix.",
3519 __func__, inode->i_ino, inode->i_blocks,
3520 released_blocks,
c2759eba 3521 atomic_read(&F2FS_I(inode)->i_compr_blocks));
ef8d563f
CY
3522 }
3523
3524 return ret;
3525}
3526
c75488fb
CY
3527static int reserve_compress_blocks(struct dnode_of_data *dn, pgoff_t count)
3528{
3529 struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode);
3530 unsigned int reserved_blocks = 0;
3531 int cluster_size = F2FS_I(dn->inode)->i_cluster_size;
3532 block_t blkaddr;
3533 int i;
3534
3535 for (i = 0; i < count; i++) {
3536 blkaddr = data_blkaddr(dn->inode, dn->node_page,
3537 dn->ofs_in_node + i);
3538
3539 if (!__is_valid_data_blkaddr(blkaddr))
3540 continue;
3541 if (unlikely(!f2fs_is_valid_blkaddr(sbi, blkaddr,
3542 DATA_GENERIC_ENHANCE)))
3543 return -EFSCORRUPTED;
3544 }
3545
3546 while (count) {
3547 int compr_blocks = 0;
3548 blkcnt_t reserved;
3549 int ret;
3550
3551 for (i = 0; i < cluster_size; i++, dn->ofs_in_node++) {
3552 blkaddr = f2fs_data_blkaddr(dn);
3553
3554 if (i == 0) {
3555 if (blkaddr == COMPRESS_ADDR)
3556 continue;
3557 dn->ofs_in_node += cluster_size;
3558 goto next;
3559 }
3560
3561 if (__is_valid_data_blkaddr(blkaddr)) {
3562 compr_blocks++;
3563 continue;
3564 }
3565
3566 dn->data_blkaddr = NEW_ADDR;
3567 f2fs_set_data_blkaddr(dn);
3568 }
3569
3570 reserved = cluster_size - compr_blocks;
3571 ret = inc_valid_block_count(sbi, dn->inode, &reserved);
3572 if (ret)
3573 return ret;
3574
3575 if (reserved != cluster_size - compr_blocks)
3576 return -ENOSPC;
3577
3578 f2fs_i_compr_blocks_update(dn->inode, compr_blocks, true);
3579
3580 reserved_blocks += reserved;
3581next:
3582 count -= cluster_size;
3583 }
3584
3585 return reserved_blocks;
3586}
3587
3588static int f2fs_reserve_compress_blocks(struct file *filp, unsigned long arg)
3589{
3590 struct inode *inode = file_inode(filp);
3591 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
3592 pgoff_t page_idx = 0, last_idx;
3593 unsigned int reserved_blocks = 0;
3594 int ret;
3595
3596 if (!f2fs_sb_has_compression(F2FS_I_SB(inode)))
3597 return -EOPNOTSUPP;
3598
3599 if (!f2fs_compressed_file(inode))
3600 return -EINVAL;
3601
3602 if (f2fs_readonly(sbi->sb))
3603 return -EROFS;
3604
3605 ret = mnt_want_write_file(filp);
3606 if (ret)
3607 return ret;
3608
c2759eba 3609 if (atomic_read(&F2FS_I(inode)->i_compr_blocks))
c75488fb
CY
3610 goto out;
3611
3612 f2fs_balance_fs(F2FS_I_SB(inode), true);
3613
3614 inode_lock(inode);
3615
c6140415 3616 if (!is_inode_flag_set(inode, FI_COMPRESS_RELEASED)) {
c75488fb
CY
3617 ret = -EINVAL;
3618 goto unlock_inode;
3619 }
3620
e4544b63 3621 f2fs_down_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
edc6d01b 3622 filemap_invalidate_lock(inode->i_mapping);
c75488fb
CY
3623
3624 last_idx = DIV_ROUND_UP(i_size_read(inode), PAGE_SIZE);
3625
3626 while (page_idx < last_idx) {
3627 struct dnode_of_data dn;
3628 pgoff_t end_offset, count;
3629
3630 set_new_dnode(&dn, inode, NULL, NULL, 0);
3631 ret = f2fs_get_dnode_of_data(&dn, page_idx, LOOKUP_NODE);
3632 if (ret) {
3633 if (ret == -ENOENT) {
3634 page_idx = f2fs_get_next_page_offset(&dn,
3635 page_idx);
3636 ret = 0;
3637 continue;
3638 }
3639 break;
3640 }
3641
3642 end_offset = ADDRS_PER_PAGE(dn.node_page, inode);
3643 count = min(end_offset - dn.ofs_in_node, last_idx - page_idx);
4fec3fc0 3644 count = round_up(count, F2FS_I(inode)->i_cluster_size);
c75488fb
CY
3645
3646 ret = reserve_compress_blocks(&dn, count);
3647
3648 f2fs_put_dnode(&dn);
3649
3650 if (ret < 0)
3651 break;
3652
3653 page_idx += count;
3654 reserved_blocks += ret;
3655 }
3656
edc6d01b 3657 filemap_invalidate_unlock(inode->i_mapping);
e4544b63 3658 f2fs_up_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
c75488fb
CY
3659
3660 if (ret >= 0) {
c6140415 3661 clear_inode_flag(inode, FI_COMPRESS_RELEASED);
c75488fb
CY
3662 inode->i_ctime = current_time(inode);
3663 f2fs_mark_inode_dirty_sync(inode, true);
3664 }
3665unlock_inode:
3666 inode_unlock(inode);
3667out:
3668 mnt_drop_write_file(filp);
3669
3670 if (ret >= 0) {
3671 ret = put_user(reserved_blocks, (u64 __user *)arg);
c2759eba
DJ
3672 } else if (reserved_blocks &&
3673 atomic_read(&F2FS_I(inode)->i_compr_blocks)) {
c75488fb
CY
3674 set_sbi_flag(sbi, SBI_NEED_FSCK);
3675 f2fs_warn(sbi, "%s: partial blocks were released i_ino=%lx "
c2759eba 3676 "iblocks=%llu, reserved=%u, compr_blocks=%u, "
c75488fb
CY
3677 "run fsck to fix.",
3678 __func__, inode->i_ino, inode->i_blocks,
3679 reserved_blocks,
c2759eba 3680 atomic_read(&F2FS_I(inode)->i_compr_blocks));
c75488fb
CY
3681 }
3682
3683 return ret;
3684}
3685
9af84648
DJ
3686static int f2fs_secure_erase(struct block_device *bdev, struct inode *inode,
3687 pgoff_t off, block_t block, block_t len, u32 flags)
3688{
3689 struct request_queue *q = bdev_get_queue(bdev);
3690 sector_t sector = SECTOR_FROM_BLOCK(block);
3691 sector_t nr_sects = SECTOR_FROM_BLOCK(len);
3692 int ret = 0;
3693
3694 if (!q)
3695 return -ENXIO;
3696
3697 if (flags & F2FS_TRIM_FILE_DISCARD)
3698 ret = blkdev_issue_discard(bdev, sector, nr_sects, GFP_NOFS,
3699 blk_queue_secure_erase(q) ?
3700 BLKDEV_DISCARD_SECURE : 0);
3701
3702 if (!ret && (flags & F2FS_TRIM_FILE_ZEROOUT)) {
3703 if (IS_ENCRYPTED(inode))
3704 ret = fscrypt_zeroout_range(inode, off, block, len);
3705 else
3706 ret = blkdev_issue_zeroout(bdev, sector, nr_sects,
3707 GFP_NOFS, 0);
3708 }
3709
3710 return ret;
3711}
3712
3713static int f2fs_sec_trim_file(struct file *filp, unsigned long arg)
3714{
3715 struct inode *inode = file_inode(filp);
3716 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
3717 struct address_space *mapping = inode->i_mapping;
3718 struct block_device *prev_bdev = NULL;
3719 struct f2fs_sectrim_range range;
3720 pgoff_t index, pg_end, prev_index = 0;
3721 block_t prev_block = 0, len = 0;
3722 loff_t end_addr;
3723 bool to_end = false;
3724 int ret = 0;
3725
3726 if (!(filp->f_mode & FMODE_WRITE))
3727 return -EBADF;
3728
3729 if (copy_from_user(&range, (struct f2fs_sectrim_range __user *)arg,
3730 sizeof(range)))
3731 return -EFAULT;
3732
3733 if (range.flags == 0 || (range.flags & ~F2FS_TRIM_FILE_MASK) ||
3734 !S_ISREG(inode->i_mode))
3735 return -EINVAL;
3736
3737 if (((range.flags & F2FS_TRIM_FILE_DISCARD) &&
3738 !f2fs_hw_support_discard(sbi)) ||
3739 ((range.flags & F2FS_TRIM_FILE_ZEROOUT) &&
3740 IS_ENCRYPTED(inode) && f2fs_is_multi_device(sbi)))
3741 return -EOPNOTSUPP;
3742
3743 file_start_write(filp);
3744 inode_lock(inode);
3745
3746 if (f2fs_is_atomic_file(inode) || f2fs_compressed_file(inode) ||
3747 range.start >= inode->i_size) {
3748 ret = -EINVAL;
3749 goto err;
3750 }
3751
3752 if (range.len == 0)
3753 goto err;
3754
3755 if (inode->i_size - range.start > range.len) {
3756 end_addr = range.start + range.len;
3757 } else {
3758 end_addr = range.len == (u64)-1 ?
3759 sbi->sb->s_maxbytes : inode->i_size;
3760 to_end = true;
3761 }
3762
3763 if (!IS_ALIGNED(range.start, F2FS_BLKSIZE) ||
3764 (!to_end && !IS_ALIGNED(end_addr, F2FS_BLKSIZE))) {
3765 ret = -EINVAL;
3766 goto err;
3767 }
3768
3769 index = F2FS_BYTES_TO_BLK(range.start);
3770 pg_end = DIV_ROUND_UP(end_addr, F2FS_BLKSIZE);
3771
3772 ret = f2fs_convert_inline_inode(inode);
3773 if (ret)
3774 goto err;
3775
e4544b63 3776 f2fs_down_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
edc6d01b 3777 filemap_invalidate_lock(mapping);
9af84648
DJ
3778
3779 ret = filemap_write_and_wait_range(mapping, range.start,
3780 to_end ? LLONG_MAX : end_addr - 1);
3781 if (ret)
3782 goto out;
3783
3784 truncate_inode_pages_range(mapping, range.start,
3785 to_end ? -1 : end_addr - 1);
3786
3787 while (index < pg_end) {
3788 struct dnode_of_data dn;
3789 pgoff_t end_offset, count;
3790 int i;
3791
3792 set_new_dnode(&dn, inode, NULL, NULL, 0);
3793 ret = f2fs_get_dnode_of_data(&dn, index, LOOKUP_NODE);
3794 if (ret) {
3795 if (ret == -ENOENT) {
3796 index = f2fs_get_next_page_offset(&dn, index);
3797 continue;
3798 }
3799 goto out;
3800 }
3801
3802 end_offset = ADDRS_PER_PAGE(dn.node_page, inode);
3803 count = min(end_offset - dn.ofs_in_node, pg_end - index);
3804 for (i = 0; i < count; i++, index++, dn.ofs_in_node++) {
3805 struct block_device *cur_bdev;
3806 block_t blkaddr = f2fs_data_blkaddr(&dn);
3807
3808 if (!__is_valid_data_blkaddr(blkaddr))
3809 continue;
3810
3811 if (!f2fs_is_valid_blkaddr(sbi, blkaddr,
3812 DATA_GENERIC_ENHANCE)) {
3813 ret = -EFSCORRUPTED;
3814 f2fs_put_dnode(&dn);
3815 goto out;
3816 }
3817
3818 cur_bdev = f2fs_target_device(sbi, blkaddr, NULL);
3819 if (f2fs_is_multi_device(sbi)) {
3820 int di = f2fs_target_device_index(sbi, blkaddr);
3821
3822 blkaddr -= FDEV(di).start_blk;
3823 }
3824
3825 if (len) {
3826 if (prev_bdev == cur_bdev &&
3827 index == prev_index + len &&
3828 blkaddr == prev_block + len) {
3829 len++;
3830 } else {
3831 ret = f2fs_secure_erase(prev_bdev,
3832 inode, prev_index, prev_block,
3833 len, range.flags);
3834 if (ret) {
3835 f2fs_put_dnode(&dn);
3836 goto out;
3837 }
3838
3839 len = 0;
3840 }
3841 }
3842
3843 if (!len) {
3844 prev_bdev = cur_bdev;
3845 prev_index = index;
3846 prev_block = blkaddr;
3847 len = 1;
3848 }
3849 }
3850
3851 f2fs_put_dnode(&dn);
3852
3853 if (fatal_signal_pending(current)) {
3854 ret = -EINTR;
3855 goto out;
3856 }
3857 cond_resched();
3858 }
3859
3860 if (len)
3861 ret = f2fs_secure_erase(prev_bdev, inode, prev_index,
3862 prev_block, len, range.flags);
3863out:
edc6d01b 3864 filemap_invalidate_unlock(mapping);
e4544b63 3865 f2fs_up_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
9af84648
DJ
3866err:
3867 inode_unlock(inode);
3868 file_end_write(filp);
3869
3870 return ret;
3871}
3872
9e2a5f8c 3873static int f2fs_ioc_get_compress_option(struct file *filp, unsigned long arg)
52656e6c 3874{
9e2a5f8c
DJ
3875 struct inode *inode = file_inode(filp);
3876 struct f2fs_comp_option option;
3877
3878 if (!f2fs_sb_has_compression(F2FS_I_SB(inode)))
3879 return -EOPNOTSUPP;
3880
3881 inode_lock_shared(inode);
3882
3883 if (!f2fs_compressed_file(inode)) {
3884 inode_unlock_shared(inode);
3885 return -ENODATA;
3886 }
3887
3888 option.algorithm = F2FS_I(inode)->i_compress_algorithm;
3889 option.log_cluster_size = F2FS_I(inode)->i_log_cluster_size;
3890
3891 inode_unlock_shared(inode);
3892
3893 if (copy_to_user((struct f2fs_comp_option __user *)arg, &option,
3894 sizeof(option)))
3895 return -EFAULT;
3896
3897 return 0;
3898}
3899
e1e8debe
DJ
3900static int f2fs_ioc_set_compress_option(struct file *filp, unsigned long arg)
3901{
3902 struct inode *inode = file_inode(filp);
3903 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
3904 struct f2fs_comp_option option;
3905 int ret = 0;
1f227a3e 3906
e1e8debe
DJ
3907 if (!f2fs_sb_has_compression(sbi))
3908 return -EOPNOTSUPP;
3909
3910 if (!(filp->f_mode & FMODE_WRITE))
3911 return -EBADF;
3912
3913 if (copy_from_user(&option, (struct f2fs_comp_option __user *)arg,
3914 sizeof(option)))
3915 return -EFAULT;
3916
3917 if (!f2fs_compressed_file(inode) ||
3918 option.log_cluster_size < MIN_COMPRESS_LOG_SIZE ||
3919 option.log_cluster_size > MAX_COMPRESS_LOG_SIZE ||
3920 option.algorithm >= COMPRESS_MAX)
3921 return -EINVAL;
3922
3923 file_start_write(filp);
3924 inode_lock(inode);
3925
3926 if (f2fs_is_mmap_file(inode) || get_dirty_pages(inode)) {
3927 ret = -EBUSY;
3928 goto out;
3929 }
3930
3931 if (inode->i_size != 0) {
3932 ret = -EFBIG;
3933 goto out;
3934 }
3935
3936 F2FS_I(inode)->i_compress_algorithm = option.algorithm;
3937 F2FS_I(inode)->i_log_cluster_size = option.log_cluster_size;
3938 F2FS_I(inode)->i_cluster_size = 1 << option.log_cluster_size;
3939 f2fs_mark_inode_dirty_sync(inode, true);
3940
3941 if (!f2fs_is_compress_backend_ready(inode))
3942 f2fs_warn(sbi, "compression algorithm is successfully set, "
3943 "but current kernel doesn't support this algorithm.");
3944out:
3945 inode_unlock(inode);
3946 file_end_write(filp);
3947
3948 return ret;
3949}
3950
5fdb322f
DJ
3951static int redirty_blocks(struct inode *inode, pgoff_t page_idx, int len)
3952{
fcd9ae4f 3953 DEFINE_READAHEAD(ractl, NULL, NULL, inode->i_mapping, page_idx);
5fdb322f
DJ
3954 struct address_space *mapping = inode->i_mapping;
3955 struct page *page;
3956 pgoff_t redirty_idx = page_idx;
3957 int i, page_len = 0, ret = 0;
3958
3959 page_cache_ra_unbounded(&ractl, len, 0);
3960
3961 for (i = 0; i < len; i++, page_idx++) {
3962 page = read_cache_page(mapping, page_idx, NULL, NULL);
3963 if (IS_ERR(page)) {
3964 ret = PTR_ERR(page);
3965 break;
3966 }
3967 page_len++;
3968 }
3969
3970 for (i = 0; i < page_len; i++, redirty_idx++) {
3971 page = find_lock_page(mapping, redirty_idx);
df0736d7
DJ
3972 if (!page) {
3973 ret = -ENOMEM;
3974 break;
3975 }
5fdb322f
DJ
3976 set_page_dirty(page);
3977 f2fs_put_page(page, 1);
3978 f2fs_put_page(page, 0);
3979 }
3980
3981 return ret;
3982}
3983
3984static int f2fs_ioc_decompress_file(struct file *filp, unsigned long arg)
3985{
3986 struct inode *inode = file_inode(filp);
3987 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
3988 struct f2fs_inode_info *fi = F2FS_I(inode);
3989 pgoff_t page_idx = 0, last_idx;
3990 unsigned int blk_per_seg = sbi->blocks_per_seg;
3991 int cluster_size = F2FS_I(inode)->i_cluster_size;
3992 int count, ret;
3993
3994 if (!f2fs_sb_has_compression(sbi) ||
3995 F2FS_OPTION(sbi).compress_mode != COMPR_MODE_USER)
3996 return -EOPNOTSUPP;
3997
3998 if (!(filp->f_mode & FMODE_WRITE))
3999 return -EBADF;
4000
4001 if (!f2fs_compressed_file(inode))
4002 return -EINVAL;
4003
4004 f2fs_balance_fs(F2FS_I_SB(inode), true);
4005
4006 file_start_write(filp);
4007 inode_lock(inode);
4008
4009 if (!f2fs_is_compress_backend_ready(inode)) {
4010 ret = -EOPNOTSUPP;
4011 goto out;
4012 }
4013
4014 if (f2fs_is_mmap_file(inode)) {
4015 ret = -EBUSY;
4016 goto out;
4017 }
4018
4019 ret = filemap_write_and_wait_range(inode->i_mapping, 0, LLONG_MAX);
4020 if (ret)
4021 goto out;
4022
4023 if (!atomic_read(&fi->i_compr_blocks))
4024 goto out;
4025
4026 last_idx = DIV_ROUND_UP(i_size_read(inode), PAGE_SIZE);
4027
4028 count = last_idx - page_idx;
4029 while (count) {
4030 int len = min(cluster_size, count);
4031
4032 ret = redirty_blocks(inode, page_idx, len);
4033 if (ret < 0)
4034 break;
4035
4036 if (get_dirty_pages(inode) >= blk_per_seg)
4037 filemap_fdatawrite(inode->i_mapping);
4038
4039 count -= len;
4040 page_idx += len;
4041 }
4042
4043 if (!ret)
4044 ret = filemap_write_and_wait_range(inode->i_mapping, 0,
4045 LLONG_MAX);
4046
4047 if (ret)
833dcd35
JP
4048 f2fs_warn(sbi, "%s: The file might be partially decompressed (errno=%d). Please delete the file.",
4049 __func__, ret);
5fdb322f
DJ
4050out:
4051 inode_unlock(inode);
4052 file_end_write(filp);
4053
4054 return ret;
4055}
4056
4057static int f2fs_ioc_compress_file(struct file *filp, unsigned long arg)
4058{
4059 struct inode *inode = file_inode(filp);
4060 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
4061 pgoff_t page_idx = 0, last_idx;
4062 unsigned int blk_per_seg = sbi->blocks_per_seg;
4063 int cluster_size = F2FS_I(inode)->i_cluster_size;
4064 int count, ret;
4065
4066 if (!f2fs_sb_has_compression(sbi) ||
4067 F2FS_OPTION(sbi).compress_mode != COMPR_MODE_USER)
4068 return -EOPNOTSUPP;
4069
4070 if (!(filp->f_mode & FMODE_WRITE))
4071 return -EBADF;
4072
4073 if (!f2fs_compressed_file(inode))
4074 return -EINVAL;
4075
4076 f2fs_balance_fs(F2FS_I_SB(inode), true);
4077
4078 file_start_write(filp);
4079 inode_lock(inode);
4080
4081 if (!f2fs_is_compress_backend_ready(inode)) {
4082 ret = -EOPNOTSUPP;
4083 goto out;
4084 }
4085
4086 if (f2fs_is_mmap_file(inode)) {
4087 ret = -EBUSY;
4088 goto out;
4089 }
4090
4091 ret = filemap_write_and_wait_range(inode->i_mapping, 0, LLONG_MAX);
4092 if (ret)
4093 goto out;
4094
4095 set_inode_flag(inode, FI_ENABLE_COMPRESS);
4096
4097 last_idx = DIV_ROUND_UP(i_size_read(inode), PAGE_SIZE);
4098
4099 count = last_idx - page_idx;
4100 while (count) {
4101 int len = min(cluster_size, count);
4102
4103 ret = redirty_blocks(inode, page_idx, len);
4104 if (ret < 0)
4105 break;
4106
4107 if (get_dirty_pages(inode) >= blk_per_seg)
4108 filemap_fdatawrite(inode->i_mapping);
4109
4110 count -= len;
4111 page_idx += len;
4112 }
4113
4114 if (!ret)
4115 ret = filemap_write_and_wait_range(inode->i_mapping, 0,
4116 LLONG_MAX);
4117
4118 clear_inode_flag(inode, FI_ENABLE_COMPRESS);
4119
4120 if (ret)
833dcd35
JP
4121 f2fs_warn(sbi, "%s: The file might be partially compressed (errno=%d). Please delete the file.",
4122 __func__, ret);
5fdb322f
DJ
4123out:
4124 inode_unlock(inode);
4125 file_end_write(filp);
4126
4127 return ret;
4128}
4129
34178b1b 4130static long __f2fs_ioctl(struct file *filp, unsigned int cmd, unsigned long arg)
52656e6c
JK
4131{
4132 switch (cmd) {
3357af8f 4133 case FS_IOC_GETVERSION:
d49f3e89 4134 return f2fs_ioc_getversion(filp, arg);
88b88a66
JK
4135 case F2FS_IOC_START_ATOMIC_WRITE:
4136 return f2fs_ioc_start_atomic_write(filp);
4137 case F2FS_IOC_COMMIT_ATOMIC_WRITE:
4138 return f2fs_ioc_commit_atomic_write(filp);
02a1335f
JK
4139 case F2FS_IOC_START_VOLATILE_WRITE:
4140 return f2fs_ioc_start_volatile_write(filp);
1e84371f
JK
4141 case F2FS_IOC_RELEASE_VOLATILE_WRITE:
4142 return f2fs_ioc_release_volatile_write(filp);
4143 case F2FS_IOC_ABORT_VOLATILE_WRITE:
4144 return f2fs_ioc_abort_volatile_write(filp);
1abff93d
JK
4145 case F2FS_IOC_SHUTDOWN:
4146 return f2fs_ioc_shutdown(filp, arg);
52656e6c
JK
4147 case FITRIM:
4148 return f2fs_ioc_fitrim(filp, arg);
3357af8f 4149 case FS_IOC_SET_ENCRYPTION_POLICY:
f424f664 4150 return f2fs_ioc_set_encryption_policy(filp, arg);
3357af8f 4151 case FS_IOC_GET_ENCRYPTION_POLICY:
f424f664 4152 return f2fs_ioc_get_encryption_policy(filp, arg);
3357af8f 4153 case FS_IOC_GET_ENCRYPTION_PWSALT:
f424f664 4154 return f2fs_ioc_get_encryption_pwsalt(filp, arg);
8ce589c7
EB
4155 case FS_IOC_GET_ENCRYPTION_POLICY_EX:
4156 return f2fs_ioc_get_encryption_policy_ex(filp, arg);
4157 case FS_IOC_ADD_ENCRYPTION_KEY:
4158 return f2fs_ioc_add_encryption_key(filp, arg);
4159 case FS_IOC_REMOVE_ENCRYPTION_KEY:
4160 return f2fs_ioc_remove_encryption_key(filp, arg);
4161 case FS_IOC_REMOVE_ENCRYPTION_KEY_ALL_USERS:
4162 return f2fs_ioc_remove_encryption_key_all_users(filp, arg);
4163 case FS_IOC_GET_ENCRYPTION_KEY_STATUS:
4164 return f2fs_ioc_get_encryption_key_status(filp, arg);
ee446e1a
EB
4165 case FS_IOC_GET_ENCRYPTION_NONCE:
4166 return f2fs_ioc_get_encryption_nonce(filp, arg);
c1c1b583
CY
4167 case F2FS_IOC_GARBAGE_COLLECT:
4168 return f2fs_ioc_gc(filp, arg);
34dc77ad
JK
4169 case F2FS_IOC_GARBAGE_COLLECT_RANGE:
4170 return f2fs_ioc_gc_range(filp, arg);
456b88e4 4171 case F2FS_IOC_WRITE_CHECKPOINT:
059c0648 4172 return f2fs_ioc_write_checkpoint(filp, arg);
d323d005
CY
4173 case F2FS_IOC_DEFRAGMENT:
4174 return f2fs_ioc_defragment(filp, arg);
4dd6f977
JK
4175 case F2FS_IOC_MOVE_RANGE:
4176 return f2fs_ioc_move_range(filp, arg);
e066b83c
JK
4177 case F2FS_IOC_FLUSH_DEVICE:
4178 return f2fs_ioc_flush_device(filp, arg);
e65ef207
JK
4179 case F2FS_IOC_GET_FEATURES:
4180 return f2fs_ioc_get_features(filp, arg);
1ad71a27
JK
4181 case F2FS_IOC_GET_PIN_FILE:
4182 return f2fs_ioc_get_pin_file(filp, arg);
4183 case F2FS_IOC_SET_PIN_FILE:
4184 return f2fs_ioc_set_pin_file(filp, arg);
c4020b2d
CY
4185 case F2FS_IOC_PRECACHE_EXTENTS:
4186 return f2fs_ioc_precache_extents(filp, arg);
04f0b2ea
QS
4187 case F2FS_IOC_RESIZE_FS:
4188 return f2fs_ioc_resize_fs(filp, arg);
95ae251f
EB
4189 case FS_IOC_ENABLE_VERITY:
4190 return f2fs_ioc_enable_verity(filp, arg);
4191 case FS_IOC_MEASURE_VERITY:
4192 return f2fs_ioc_measure_verity(filp, arg);
e17fe657
EB
4193 case FS_IOC_READ_VERITY_METADATA:
4194 return f2fs_ioc_read_verity_metadata(filp, arg);
3357af8f
EB
4195 case FS_IOC_GETFSLABEL:
4196 return f2fs_ioc_getfslabel(filp, arg);
4197 case FS_IOC_SETFSLABEL:
4198 return f2fs_ioc_setfslabel(filp, arg);
439dfb10
CY
4199 case F2FS_IOC_GET_COMPRESS_BLOCKS:
4200 return f2fs_get_compress_blocks(filp, arg);
ef8d563f
CY
4201 case F2FS_IOC_RELEASE_COMPRESS_BLOCKS:
4202 return f2fs_release_compress_blocks(filp, arg);
c75488fb
CY
4203 case F2FS_IOC_RESERVE_COMPRESS_BLOCKS:
4204 return f2fs_reserve_compress_blocks(filp, arg);
9af84648
DJ
4205 case F2FS_IOC_SEC_TRIM_FILE:
4206 return f2fs_sec_trim_file(filp, arg);
9e2a5f8c
DJ
4207 case F2FS_IOC_GET_COMPRESS_OPTION:
4208 return f2fs_ioc_get_compress_option(filp, arg);
e1e8debe
DJ
4209 case F2FS_IOC_SET_COMPRESS_OPTION:
4210 return f2fs_ioc_set_compress_option(filp, arg);
5fdb322f
DJ
4211 case F2FS_IOC_DECOMPRESS_FILE:
4212 return f2fs_ioc_decompress_file(filp, arg);
4213 case F2FS_IOC_COMPRESS_FILE:
4214 return f2fs_ioc_compress_file(filp, arg);
fbfa2cc5
JK
4215 default:
4216 return -ENOTTY;
4217 }
4218}
4219
34178b1b
CY
4220long f2fs_ioctl(struct file *filp, unsigned int cmd, unsigned long arg)
4221{
4222 if (unlikely(f2fs_cp_error(F2FS_I_SB(file_inode(filp)))))
4223 return -EIO;
4224 if (!f2fs_is_checkpoint_ready(F2FS_I_SB(file_inode(filp))))
4225 return -ENOSPC;
4226
4227 return __f2fs_ioctl(filp, cmd, arg);
4228}
4229
a1e09b03
EB
4230/*
4231 * Return %true if the given read or write request should use direct I/O, or
4232 * %false if it should use buffered I/O.
4233 */
4234static bool f2fs_should_use_dio(struct inode *inode, struct kiocb *iocb,
4235 struct iov_iter *iter)
4236{
4237 unsigned int align;
4238
4239 if (!(iocb->ki_flags & IOCB_DIRECT))
4240 return false;
4241
4242 if (f2fs_force_buffered_io(inode, iocb, iter))
4243 return false;
4244
4245 /*
4246 * Direct I/O not aligned to the disk's logical_block_size will be
4247 * attempted, but will fail with -EINVAL.
4248 *
4249 * f2fs additionally requires that direct I/O be aligned to the
4250 * filesystem block size, which is often a stricter requirement.
4251 * However, f2fs traditionally falls back to buffered I/O on requests
4252 * that are logical_block_size-aligned but not fs-block aligned.
4253 *
4254 * The below logic implements this behavior.
4255 */
4256 align = iocb->ki_pos | iov_iter_alignment(iter);
4257 if (!IS_ALIGNED(align, i_blocksize(inode)) &&
4258 IS_ALIGNED(align, bdev_logical_block_size(inode->i_sb->s_bdev)))
4259 return false;
4260
4261 return true;
4262}
4263
4264static int f2fs_dio_read_end_io(struct kiocb *iocb, ssize_t size, int error,
4265 unsigned int flags)
4266{
4267 struct f2fs_sb_info *sbi = F2FS_I_SB(file_inode(iocb->ki_filp));
4268
4269 dec_page_count(sbi, F2FS_DIO_READ);
4270 if (error)
4271 return error;
4272 f2fs_update_iostat(sbi, APP_DIRECT_READ_IO, size);
4273 return 0;
4274}
4275
4276static const struct iomap_dio_ops f2fs_iomap_dio_read_ops = {
4277 .end_io = f2fs_dio_read_end_io,
4278};
4279
4280static ssize_t f2fs_dio_read_iter(struct kiocb *iocb, struct iov_iter *to)
4c8ff709
CY
4281{
4282 struct file *file = iocb->ki_filp;
4283 struct inode *inode = file_inode(file);
a1e09b03
EB
4284 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
4285 struct f2fs_inode_info *fi = F2FS_I(inode);
4286 const loff_t pos = iocb->ki_pos;
4287 const size_t count = iov_iter_count(to);
4288 struct iomap_dio *dio;
4289 ssize_t ret;
4290
4291 if (count == 0)
4292 return 0; /* skip atime update */
4293
bd984c03 4294 trace_f2fs_direct_IO_enter(inode, iocb, count, READ);
a1e09b03
EB
4295
4296 if (iocb->ki_flags & IOCB_NOWAIT) {
e4544b63 4297 if (!f2fs_down_read_trylock(&fi->i_gc_rwsem[READ])) {
a1e09b03
EB
4298 ret = -EAGAIN;
4299 goto out;
4300 }
4301 } else {
e4544b63 4302 f2fs_down_read(&fi->i_gc_rwsem[READ]);
a1e09b03
EB
4303 }
4304
4305 /*
4306 * We have to use __iomap_dio_rw() and iomap_dio_complete() instead of
4307 * the higher-level function iomap_dio_rw() in order to ensure that the
4308 * F2FS_DIO_READ counter will be decremented correctly in all cases.
4309 */
4310 inc_page_count(sbi, F2FS_DIO_READ);
4311 dio = __iomap_dio_rw(iocb, to, &f2fs_iomap_ops,
4312 &f2fs_iomap_dio_read_ops, 0, 0);
4313 if (IS_ERR_OR_NULL(dio)) {
4314 ret = PTR_ERR_OR_ZERO(dio);
4315 if (ret != -EIOCBQUEUED)
4316 dec_page_count(sbi, F2FS_DIO_READ);
4317 } else {
4318 ret = iomap_dio_complete(dio);
4319 }
4320
e4544b63 4321 f2fs_up_read(&fi->i_gc_rwsem[READ]);
a1e09b03
EB
4322
4323 file_accessed(file);
4324out:
4325 trace_f2fs_direct_IO_exit(inode, pos, count, READ, ret);
4326 return ret;
4327}
4328
4329static ssize_t f2fs_file_read_iter(struct kiocb *iocb, struct iov_iter *to)
4330{
4331 struct inode *inode = file_inode(iocb->ki_filp);
4332 ssize_t ret;
4c8ff709
CY
4333
4334 if (!f2fs_is_compress_backend_ready(inode))
4335 return -EOPNOTSUPP;
4336
a1e09b03
EB
4337 if (f2fs_should_use_dio(inode, iocb, to))
4338 return f2fs_dio_read_iter(iocb, to);
8b83ac81 4339
a1e09b03 4340 ret = filemap_read(iocb, to, 0);
8b83ac81 4341 if (ret > 0)
a1e09b03 4342 f2fs_update_iostat(F2FS_I_SB(inode), APP_BUFFERED_READ_IO, ret);
8b83ac81 4343 return ret;
4c8ff709
CY
4344}
4345
a1e09b03
EB
4346static ssize_t f2fs_write_checks(struct kiocb *iocb, struct iov_iter *from)
4347{
4348 struct file *file = iocb->ki_filp;
4349 struct inode *inode = file_inode(file);
4350 ssize_t count;
4351 int err;
4352
4353 if (IS_IMMUTABLE(inode))
4354 return -EPERM;
4355
4356 if (is_inode_flag_set(inode, FI_COMPRESS_RELEASED))
4357 return -EPERM;
4358
4359 count = generic_write_checks(iocb, from);
4360 if (count <= 0)
4361 return count;
4362
4363 err = file_modified(file);
4364 if (err)
4365 return err;
4366 return count;
4367}
4368
3d697a4a
EB
4369/*
4370 * Preallocate blocks for a write request, if it is possible and helpful to do
4371 * so. Returns a positive number if blocks may have been preallocated, 0 if no
4372 * blocks were preallocated, or a negative errno value if something went
4373 * seriously wrong. Also sets FI_PREALLOCATED_ALL on the inode if *all* the
4374 * requested blocks (not just some of them) have been allocated.
4375 */
a1e09b03
EB
4376static int f2fs_preallocate_blocks(struct kiocb *iocb, struct iov_iter *iter,
4377 bool dio)
3d697a4a
EB
4378{
4379 struct inode *inode = file_inode(iocb->ki_filp);
4380 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
4381 const loff_t pos = iocb->ki_pos;
4382 const size_t count = iov_iter_count(iter);
4383 struct f2fs_map_blocks map = {};
3d697a4a
EB
4384 int flag;
4385 int ret;
4386
4387 /* If it will be an out-of-place direct write, don't bother. */
4388 if (dio && f2fs_lfs_mode(sbi))
4389 return 0;
d4dd19ec
JK
4390 /*
4391 * Don't preallocate holes aligned to DIO_SKIP_HOLES which turns into
4392 * buffered IO, if DIO meets any holes.
4393 */
4394 if (dio && i_size_read(inode) &&
4395 (F2FS_BYTES_TO_BLK(pos) < F2FS_BLK_ALIGN(i_size_read(inode))))
4396 return 0;
3d697a4a
EB
4397
4398 /* No-wait I/O can't allocate blocks. */
4399 if (iocb->ki_flags & IOCB_NOWAIT)
4400 return 0;
4401
4402 /* If it will be a short write, don't bother. */
4403 if (fault_in_iov_iter_readable(iter, count))
4404 return 0;
4405
4406 if (f2fs_has_inline_data(inode)) {
4407 /* If the data will fit inline, don't bother. */
4408 if (pos + count <= MAX_INLINE_DATA(inode))
4409 return 0;
4410 ret = f2fs_convert_inline_inode(inode);
4411 if (ret)
4412 return ret;
4413 }
4414
4415 /* Do not preallocate blocks that will be written partially in 4KB. */
4416 map.m_lblk = F2FS_BLK_ALIGN(pos);
4417 map.m_len = F2FS_BYTES_TO_BLK(pos + count);
4418 if (map.m_len > map.m_lblk)
4419 map.m_len -= map.m_lblk;
4420 else
4421 map.m_len = 0;
4422 map.m_may_create = true;
4423 if (dio) {
4424 map.m_seg_type = f2fs_rw_hint_to_seg_type(inode->i_write_hint);
4425 flag = F2FS_GET_BLOCK_PRE_DIO;
4426 } else {
4427 map.m_seg_type = NO_CHECK_TYPE;
4428 flag = F2FS_GET_BLOCK_PRE_AIO;
4429 }
4430
4431 ret = f2fs_map_blocks(inode, &map, 1, flag);
d4dd19ec
JK
4432 /* -ENOSPC|-EDQUOT are fine to report the number of allocated blocks. */
4433 if (ret < 0 && !((ret == -ENOSPC || ret == -EDQUOT) && map.m_len > 0))
3d697a4a
EB
4434 return ret;
4435 if (ret == 0)
4436 set_inode_flag(inode, FI_PREALLOCATED_ALL);
4437 return map.m_len;
4438}
4439
a1e09b03
EB
4440static ssize_t f2fs_buffered_write_iter(struct kiocb *iocb,
4441 struct iov_iter *from)
fcc85a4d 4442{
b439b103
JK
4443 struct file *file = iocb->ki_filp;
4444 struct inode *inode = file_inode(file);
a1e09b03
EB
4445 ssize_t ret;
4446
4447 if (iocb->ki_flags & IOCB_NOWAIT)
4448 return -EOPNOTSUPP;
4449
4450 current->backing_dev_info = inode_to_bdi(inode);
800ba295 4451 ret = generic_perform_write(iocb, from);
a1e09b03
EB
4452 current->backing_dev_info = NULL;
4453
4454 if (ret > 0) {
4455 iocb->ki_pos += ret;
4456 f2fs_update_iostat(F2FS_I_SB(inode), APP_BUFFERED_IO, ret);
4457 }
4458 return ret;
4459}
4460
4461static int f2fs_dio_write_end_io(struct kiocb *iocb, ssize_t size, int error,
4462 unsigned int flags)
4463{
4464 struct f2fs_sb_info *sbi = F2FS_I_SB(file_inode(iocb->ki_filp));
4465
4466 dec_page_count(sbi, F2FS_DIO_WRITE);
4467 if (error)
4468 return error;
4469 f2fs_update_iostat(sbi, APP_DIRECT_IO, size);
4470 return 0;
4471}
4472
4473static const struct iomap_dio_ops f2fs_iomap_dio_write_ops = {
4474 .end_io = f2fs_dio_write_end_io,
4475};
4476
4477static ssize_t f2fs_dio_write_iter(struct kiocb *iocb, struct iov_iter *from,
4478 bool *may_need_sync)
4479{
4480 struct file *file = iocb->ki_filp;
4481 struct inode *inode = file_inode(file);
4482 struct f2fs_inode_info *fi = F2FS_I(inode);
4483 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
4484 const bool do_opu = f2fs_lfs_mode(sbi);
a1e09b03
EB
4485 const loff_t pos = iocb->ki_pos;
4486 const ssize_t count = iov_iter_count(from);
a1e09b03
EB
4487 unsigned int dio_flags;
4488 struct iomap_dio *dio;
4489 ssize_t ret;
4490
bd984c03 4491 trace_f2fs_direct_IO_enter(inode, iocb, count, WRITE);
a1e09b03
EB
4492
4493 if (iocb->ki_flags & IOCB_NOWAIT) {
4494 /* f2fs_convert_inline_inode() and block allocation can block */
4495 if (f2fs_has_inline_data(inode) ||
4496 !f2fs_overwrite_io(inode, pos, count)) {
4497 ret = -EAGAIN;
4498 goto out;
4499 }
4500
e4544b63 4501 if (!f2fs_down_read_trylock(&fi->i_gc_rwsem[WRITE])) {
a1e09b03
EB
4502 ret = -EAGAIN;
4503 goto out;
4504 }
e4544b63
TM
4505 if (do_opu && !f2fs_down_read_trylock(&fi->i_gc_rwsem[READ])) {
4506 f2fs_up_read(&fi->i_gc_rwsem[WRITE]);
a1e09b03
EB
4507 ret = -EAGAIN;
4508 goto out;
4509 }
4510 } else {
4511 ret = f2fs_convert_inline_inode(inode);
4512 if (ret)
4513 goto out;
4514
e4544b63 4515 f2fs_down_read(&fi->i_gc_rwsem[WRITE]);
a1e09b03 4516 if (do_opu)
e4544b63 4517 f2fs_down_read(&fi->i_gc_rwsem[READ]);
a1e09b03 4518 }
a1e09b03
EB
4519
4520 /*
4521 * We have to use __iomap_dio_rw() and iomap_dio_complete() instead of
4522 * the higher-level function iomap_dio_rw() in order to ensure that the
4523 * F2FS_DIO_WRITE counter will be decremented correctly in all cases.
4524 */
4525 inc_page_count(sbi, F2FS_DIO_WRITE);
4526 dio_flags = 0;
4527 if (pos + count > inode->i_size)
4528 dio_flags |= IOMAP_DIO_FORCE_WAIT;
4529 dio = __iomap_dio_rw(iocb, from, &f2fs_iomap_ops,
4530 &f2fs_iomap_dio_write_ops, dio_flags, 0);
4531 if (IS_ERR_OR_NULL(dio)) {
4532 ret = PTR_ERR_OR_ZERO(dio);
4533 if (ret == -ENOTBLK)
4534 ret = 0;
4535 if (ret != -EIOCBQUEUED)
4536 dec_page_count(sbi, F2FS_DIO_WRITE);
4537 } else {
4538 ret = iomap_dio_complete(dio);
4539 }
4540
a1e09b03 4541 if (do_opu)
e4544b63
TM
4542 f2fs_up_read(&fi->i_gc_rwsem[READ]);
4543 f2fs_up_read(&fi->i_gc_rwsem[WRITE]);
a1e09b03
EB
4544
4545 if (ret < 0)
4546 goto out;
4547 if (pos + ret > inode->i_size)
4548 f2fs_i_size_write(inode, pos + ret);
4549 if (!do_opu)
4550 set_inode_flag(inode, FI_UPDATE_WRITE);
4551
4552 if (iov_iter_count(from)) {
4553 ssize_t ret2;
4554 loff_t bufio_start_pos = iocb->ki_pos;
4555
4556 /*
4557 * The direct write was partial, so we need to fall back to a
4558 * buffered write for the remainder.
4559 */
4560
4561 ret2 = f2fs_buffered_write_iter(iocb, from);
4562 if (iov_iter_count(from))
4563 f2fs_write_failed(inode, iocb->ki_pos);
4564 if (ret2 < 0)
4565 goto out;
4566
4567 /*
4568 * Ensure that the pagecache pages are written to disk and
4569 * invalidated to preserve the expected O_DIRECT semantics.
4570 */
4571 if (ret2 > 0) {
4572 loff_t bufio_end_pos = bufio_start_pos + ret2 - 1;
4573
4574 ret += ret2;
4575
4576 ret2 = filemap_write_and_wait_range(file->f_mapping,
4577 bufio_start_pos,
4578 bufio_end_pos);
4579 if (ret2 < 0)
4580 goto out;
4581 invalidate_mapping_pages(file->f_mapping,
4582 bufio_start_pos >> PAGE_SHIFT,
4583 bufio_end_pos >> PAGE_SHIFT);
4584 }
4585 } else {
4586 /* iomap_dio_rw() already handled the generic_write_sync(). */
4587 *may_need_sync = false;
4588 }
4589out:
4590 trace_f2fs_direct_IO_exit(inode, pos, count, WRITE, ret);
4591 return ret;
4592}
4593
4594static ssize_t f2fs_file_write_iter(struct kiocb *iocb, struct iov_iter *from)
4595{
4596 struct inode *inode = file_inode(iocb->ki_filp);
ccf7cf92
EB
4597 const loff_t orig_pos = iocb->ki_pos;
4598 const size_t orig_count = iov_iter_count(from);
3d697a4a 4599 loff_t target_size;
a1e09b03
EB
4600 bool dio;
4601 bool may_need_sync = true;
3d697a4a 4602 int preallocated;
b439b103 4603 ssize_t ret;
fcc85a4d 4604
126ce721
CY
4605 if (unlikely(f2fs_cp_error(F2FS_I_SB(inode)))) {
4606 ret = -EIO;
4607 goto out;
4608 }
1f227a3e 4609
7bd29358
CY
4610 if (!f2fs_is_compress_backend_ready(inode)) {
4611 ret = -EOPNOTSUPP;
4612 goto out;
4613 }
4c8ff709 4614
cb8434f1
GR
4615 if (iocb->ki_flags & IOCB_NOWAIT) {
4616 if (!inode_trylock(inode)) {
126ce721
CY
4617 ret = -EAGAIN;
4618 goto out;
4619 }
cb8434f1 4620 } else {
b91050a8
HL
4621 inode_lock(inode);
4622 }
4623
a1e09b03 4624 ret = f2fs_write_checks(iocb, from);
b31bf0f9
EB
4625 if (ret <= 0)
4626 goto out_unlock;
4627
a1e09b03
EB
4628 /* Determine whether we will do a direct write or a buffered write. */
4629 dio = f2fs_should_use_dio(inode, iocb, from);
3d697a4a 4630
b31bf0f9
EB
4631 /* Possibly preallocate the blocks for the write. */
4632 target_size = iocb->ki_pos + iov_iter_count(from);
a1e09b03 4633 preallocated = f2fs_preallocate_blocks(iocb, from, dio);
d4dd19ec 4634 if (preallocated < 0)
b31bf0f9 4635 ret = preallocated;
d4dd19ec 4636 else
a1e09b03
EB
4637 /* Do the actual write. */
4638 ret = dio ?
4639 f2fs_dio_write_iter(iocb, from, &may_need_sync):
4640 f2fs_buffered_write_iter(iocb, from);
dc7a10dd 4641
b31bf0f9 4642 /* Don't leave any preallocated blocks around past i_size. */
d4dd19ec 4643 if (preallocated && i_size_read(inode) < target_size) {
e4544b63 4644 f2fs_down_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
b31bf0f9 4645 filemap_invalidate_lock(inode->i_mapping);
d4dd19ec
JK
4646 if (!f2fs_truncate(inode))
4647 file_dont_truncate(inode);
b31bf0f9 4648 filemap_invalidate_unlock(inode->i_mapping);
e4544b63 4649 f2fs_up_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
d4dd19ec
JK
4650 } else {
4651 file_dont_truncate(inode);
b439b103 4652 }
b31bf0f9
EB
4653
4654 clear_inode_flag(inode, FI_PREALLOCATED_ALL);
3d697a4a 4655out_unlock:
b439b103 4656 inode_unlock(inode);
126ce721 4657out:
ccf7cf92 4658 trace_f2fs_file_write_iter(inode, orig_pos, orig_count, ret);
a1e09b03 4659 if (ret > 0 && may_need_sync)
e2592217 4660 ret = generic_write_sync(iocb, ret);
b439b103 4661 return ret;
fcc85a4d
JK
4662}
4663
0f6b56ec
DJ
4664static int f2fs_file_fadvise(struct file *filp, loff_t offset, loff_t len,
4665 int advice)
4666{
0f6b56ec
DJ
4667 struct address_space *mapping;
4668 struct backing_dev_info *bdi;
e64347ae
FC
4669 struct inode *inode = file_inode(filp);
4670 int err;
0f6b56ec
DJ
4671
4672 if (advice == POSIX_FADV_SEQUENTIAL) {
0f6b56ec
DJ
4673 if (S_ISFIFO(inode->i_mode))
4674 return -ESPIPE;
4675
4676 mapping = filp->f_mapping;
4677 if (!mapping || len < 0)
4678 return -EINVAL;
4679
4680 bdi = inode_to_bdi(mapping->host);
4681 filp->f_ra.ra_pages = bdi->ra_pages *
4682 F2FS_I_SB(inode)->seq_file_ra_mul;
4683 spin_lock(&filp->f_lock);
4684 filp->f_mode &= ~FMODE_RANDOM;
4685 spin_unlock(&filp->f_lock);
4686 return 0;
4687 }
4688
e64347ae
FC
4689 err = generic_fadvise(filp, offset, len, advice);
4690 if (!err && advice == POSIX_FADV_DONTNEED &&
4691 test_opt(F2FS_I_SB(inode), COMPRESS_CACHE) &&
4692 f2fs_compressed_file(inode))
4693 f2fs_invalidate_compress_pages(F2FS_I_SB(inode), inode->i_ino);
4694
4695 return err;
0f6b56ec
DJ
4696}
4697
e9750824 4698#ifdef CONFIG_COMPAT
34178b1b
CY
4699struct compat_f2fs_gc_range {
4700 u32 sync;
4701 compat_u64 start;
4702 compat_u64 len;
4703};
4704#define F2FS_IOC32_GARBAGE_COLLECT_RANGE _IOW(F2FS_IOCTL_MAGIC, 11,\
4705 struct compat_f2fs_gc_range)
4706
4707static int f2fs_compat_ioc_gc_range(struct file *file, unsigned long arg)
4708{
4709 struct compat_f2fs_gc_range __user *urange;
4710 struct f2fs_gc_range range;
4711 int err;
4712
4713 urange = compat_ptr(arg);
4714 err = get_user(range.sync, &urange->sync);
4715 err |= get_user(range.start, &urange->start);
4716 err |= get_user(range.len, &urange->len);
4717 if (err)
4718 return -EFAULT;
4719
4720 return __f2fs_ioc_gc_range(file, &range);
4721}
4722
4723struct compat_f2fs_move_range {
4724 u32 dst_fd;
4725 compat_u64 pos_in;
4726 compat_u64 pos_out;
4727 compat_u64 len;
4728};
4729#define F2FS_IOC32_MOVE_RANGE _IOWR(F2FS_IOCTL_MAGIC, 9, \
4730 struct compat_f2fs_move_range)
4731
4732static int f2fs_compat_ioc_move_range(struct file *file, unsigned long arg)
4733{
4734 struct compat_f2fs_move_range __user *urange;
4735 struct f2fs_move_range range;
4736 int err;
4737
4738 urange = compat_ptr(arg);
4739 err = get_user(range.dst_fd, &urange->dst_fd);
4740 err |= get_user(range.pos_in, &urange->pos_in);
4741 err |= get_user(range.pos_out, &urange->pos_out);
4742 err |= get_user(range.len, &urange->len);
4743 if (err)
4744 return -EFAULT;
4745
4746 return __f2fs_ioc_move_range(file, &range);
4747}
4748
e9750824
NJ
4749long f2fs_compat_ioctl(struct file *file, unsigned int cmd, unsigned long arg)
4750{
34178b1b
CY
4751 if (unlikely(f2fs_cp_error(F2FS_I_SB(file_inode(file)))))
4752 return -EIO;
4753 if (!f2fs_is_checkpoint_ready(F2FS_I_SB(file_inode(file))))
4754 return -ENOSPC;
4755
e9750824 4756 switch (cmd) {
3357af8f
EB
4757 case FS_IOC32_GETVERSION:
4758 cmd = FS_IOC_GETVERSION;
04ef4b62 4759 break;
34178b1b
CY
4760 case F2FS_IOC32_GARBAGE_COLLECT_RANGE:
4761 return f2fs_compat_ioc_gc_range(file, arg);
4762 case F2FS_IOC32_MOVE_RANGE:
4763 return f2fs_compat_ioc_move_range(file, arg);
04ef4b62
CY
4764 case F2FS_IOC_START_ATOMIC_WRITE:
4765 case F2FS_IOC_COMMIT_ATOMIC_WRITE:
4766 case F2FS_IOC_START_VOLATILE_WRITE:
4767 case F2FS_IOC_RELEASE_VOLATILE_WRITE:
4768 case F2FS_IOC_ABORT_VOLATILE_WRITE:
4769 case F2FS_IOC_SHUTDOWN:
314999dc 4770 case FITRIM:
3357af8f
EB
4771 case FS_IOC_SET_ENCRYPTION_POLICY:
4772 case FS_IOC_GET_ENCRYPTION_PWSALT:
4773 case FS_IOC_GET_ENCRYPTION_POLICY:
8ce589c7
EB
4774 case FS_IOC_GET_ENCRYPTION_POLICY_EX:
4775 case FS_IOC_ADD_ENCRYPTION_KEY:
4776 case FS_IOC_REMOVE_ENCRYPTION_KEY:
4777 case FS_IOC_REMOVE_ENCRYPTION_KEY_ALL_USERS:
4778 case FS_IOC_GET_ENCRYPTION_KEY_STATUS:
ee446e1a 4779 case FS_IOC_GET_ENCRYPTION_NONCE:
04ef4b62
CY
4780 case F2FS_IOC_GARBAGE_COLLECT:
4781 case F2FS_IOC_WRITE_CHECKPOINT:
4782 case F2FS_IOC_DEFRAGMENT:
e066b83c 4783 case F2FS_IOC_FLUSH_DEVICE:
e65ef207 4784 case F2FS_IOC_GET_FEATURES:
1ad71a27
JK
4785 case F2FS_IOC_GET_PIN_FILE:
4786 case F2FS_IOC_SET_PIN_FILE:
c4020b2d 4787 case F2FS_IOC_PRECACHE_EXTENTS:
04f0b2ea 4788 case F2FS_IOC_RESIZE_FS:
95ae251f
EB
4789 case FS_IOC_ENABLE_VERITY:
4790 case FS_IOC_MEASURE_VERITY:
e17fe657 4791 case FS_IOC_READ_VERITY_METADATA:
3357af8f
EB
4792 case FS_IOC_GETFSLABEL:
4793 case FS_IOC_SETFSLABEL:
439dfb10 4794 case F2FS_IOC_GET_COMPRESS_BLOCKS:
ef8d563f 4795 case F2FS_IOC_RELEASE_COMPRESS_BLOCKS:
c75488fb 4796 case F2FS_IOC_RESERVE_COMPRESS_BLOCKS:
9af84648 4797 case F2FS_IOC_SEC_TRIM_FILE:
9e2a5f8c 4798 case F2FS_IOC_GET_COMPRESS_OPTION:
e1e8debe 4799 case F2FS_IOC_SET_COMPRESS_OPTION:
5fdb322f
DJ
4800 case F2FS_IOC_DECOMPRESS_FILE:
4801 case F2FS_IOC_COMPRESS_FILE:
4dd6f977 4802 break;
e9750824
NJ
4803 default:
4804 return -ENOIOCTLCMD;
4805 }
34178b1b 4806 return __f2fs_ioctl(file, cmd, (unsigned long) compat_ptr(arg));
e9750824
NJ
4807}
4808#endif
4809
fbfa2cc5 4810const struct file_operations f2fs_file_operations = {
267378d4 4811 .llseek = f2fs_llseek,
4c8ff709 4812 .read_iter = f2fs_file_read_iter,
fcc85a4d
JK
4813 .write_iter = f2fs_file_write_iter,
4814 .open = f2fs_file_open,
12662234 4815 .release = f2fs_release_file,
fbfa2cc5 4816 .mmap = f2fs_file_mmap,
7a10f017 4817 .flush = f2fs_file_flush,
fbfa2cc5
JK
4818 .fsync = f2fs_sync_file,
4819 .fallocate = f2fs_fallocate,
4820 .unlocked_ioctl = f2fs_ioctl,
e9750824
NJ
4821#ifdef CONFIG_COMPAT
4822 .compat_ioctl = f2fs_compat_ioctl,
4823#endif
fbfa2cc5 4824 .splice_read = generic_file_splice_read,
8d020765 4825 .splice_write = iter_file_splice_write,
0f6b56ec 4826 .fadvise = f2fs_file_fadvise,
fbfa2cc5 4827};