]> git.ipfire.org Git - people/ms/linux.git/blame - fs/f2fs/data.c
f2fs: invalidate temporary meta page
[people/ms/linux.git] / fs / f2fs / data.c
CommitLineData
0a8165d7 1/*
eb47b800
JK
2 * fs/f2fs/data.c
3 *
4 * Copyright (c) 2012 Samsung Electronics Co., Ltd.
5 * http://www.samsung.com/
6 *
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License version 2 as
9 * published by the Free Software Foundation.
10 */
11#include <linux/fs.h>
12#include <linux/f2fs_fs.h>
13#include <linux/buffer_head.h>
14#include <linux/mpage.h>
15#include <linux/writeback.h>
16#include <linux/backing-dev.h>
8f46dcae 17#include <linux/pagevec.h>
eb47b800
JK
18#include <linux/blkdev.h>
19#include <linux/bio.h>
690e4a3e 20#include <linux/prefetch.h>
e2e40f2c 21#include <linux/uio.h>
f1e88660 22#include <linux/cleancache.h>
eb47b800
JK
23
24#include "f2fs.h"
25#include "node.h"
26#include "segment.h"
db9f7c1a 27#include "trace.h"
848753aa 28#include <trace/events/f2fs.h>
eb47b800 29
93dfe2ac
JK
30static void f2fs_read_end_io(struct bio *bio, int err)
31{
f568849e
LT
32 struct bio_vec *bvec;
33 int i;
93dfe2ac 34
4375a336
JK
35 if (f2fs_bio_encrypted(bio)) {
36 if (err) {
37 f2fs_release_crypto_ctx(bio->bi_private);
38 } else {
39 f2fs_end_io_crypto_work(bio->bi_private, bio);
40 return;
41 }
42 }
43
12377024
CY
44 bio_for_each_segment_all(bvec, bio, i) {
45 struct page *page = bvec->bv_page;
f1e88660
JK
46
47 if (!err) {
48 SetPageUptodate(page);
49 } else {
50 ClearPageUptodate(page);
51 SetPageError(page);
52 }
53 unlock_page(page);
54 }
f1e88660
JK
55 bio_put(bio);
56}
57
93dfe2ac
JK
58static void f2fs_write_end_io(struct bio *bio, int err)
59{
1b1f559f 60 struct f2fs_sb_info *sbi = bio->bi_private;
f568849e
LT
61 struct bio_vec *bvec;
62 int i;
93dfe2ac 63
f568849e 64 bio_for_each_segment_all(bvec, bio, i) {
93dfe2ac
JK
65 struct page *page = bvec->bv_page;
66
4375a336
JK
67 f2fs_restore_and_release_control_page(&page);
68
f568849e 69 if (unlikely(err)) {
cf779cab 70 set_page_dirty(page);
93dfe2ac 71 set_bit(AS_EIO, &page->mapping->flags);
744602cf 72 f2fs_stop_checkpoint(sbi);
93dfe2ac
JK
73 }
74 end_page_writeback(page);
75 dec_page_count(sbi, F2FS_WRITEBACK);
f568849e 76 }
93dfe2ac 77
93dfe2ac
JK
78 if (!get_pages(sbi, F2FS_WRITEBACK) &&
79 !list_empty(&sbi->cp_wait.task_list))
80 wake_up(&sbi->cp_wait);
81
82 bio_put(bio);
83}
84
940a6d34
GZ
85/*
86 * Low-level block read/write IO operations.
87 */
88static struct bio *__bio_alloc(struct f2fs_sb_info *sbi, block_t blk_addr,
89 int npages, bool is_read)
90{
91 struct bio *bio;
92
93 /* No failure on bio allocation */
94 bio = bio_alloc(GFP_NOIO, npages);
95
96 bio->bi_bdev = sbi->sb->s_bdev;
55cf9cb6 97 bio->bi_iter.bi_sector = SECTOR_FROM_BLOCK(blk_addr);
940a6d34 98 bio->bi_end_io = is_read ? f2fs_read_end_io : f2fs_write_end_io;
12377024 99 bio->bi_private = is_read ? NULL : sbi;
940a6d34
GZ
100
101 return bio;
102}
103
458e6197 104static void __submit_merged_bio(struct f2fs_bio_info *io)
93dfe2ac 105{
458e6197 106 struct f2fs_io_info *fio = &io->fio;
93dfe2ac
JK
107
108 if (!io->bio)
109 return;
110
6a8f8ca5 111 if (is_read_io(fio->rw))
2ace38e0 112 trace_f2fs_submit_read_bio(io->sbi->sb, fio, io->bio);
6a8f8ca5 113 else
2ace38e0 114 trace_f2fs_submit_write_bio(io->sbi->sb, fio, io->bio);
940a6d34 115
6a8f8ca5 116 submit_bio(fio->rw, io->bio);
93dfe2ac
JK
117 io->bio = NULL;
118}
119
120void f2fs_submit_merged_bio(struct f2fs_sb_info *sbi,
458e6197 121 enum page_type type, int rw)
93dfe2ac
JK
122{
123 enum page_type btype = PAGE_TYPE_OF_BIO(type);
124 struct f2fs_bio_info *io;
125
126 io = is_read_io(rw) ? &sbi->read_io : &sbi->write_io[btype];
127
df0f8dc0 128 down_write(&io->io_rwsem);
458e6197
JK
129
130 /* change META to META_FLUSH in the checkpoint procedure */
131 if (type >= META_FLUSH) {
132 io->fio.type = META_FLUSH;
0f7b2abd
JK
133 if (test_opt(sbi, NOBARRIER))
134 io->fio.rw = WRITE_FLUSH | REQ_META | REQ_PRIO;
135 else
136 io->fio.rw = WRITE_FLUSH_FUA | REQ_META | REQ_PRIO;
458e6197
JK
137 }
138 __submit_merged_bio(io);
df0f8dc0 139 up_write(&io->io_rwsem);
93dfe2ac
JK
140}
141
142/*
143 * Fill the locked page with data located in the block address.
144 * Return unlocked page.
145 */
05ca3632 146int f2fs_submit_page_bio(struct f2fs_io_info *fio)
93dfe2ac 147{
93dfe2ac 148 struct bio *bio;
4375a336 149 struct page *page = fio->encrypted_page ? fio->encrypted_page : fio->page;
93dfe2ac 150
2ace38e0 151 trace_f2fs_submit_page_bio(page, fio);
05ca3632 152 f2fs_trace_ios(fio, 0);
93dfe2ac
JK
153
154 /* Allocate a new bio */
05ca3632 155 bio = __bio_alloc(fio->sbi, fio->blk_addr, 1, is_read_io(fio->rw));
93dfe2ac
JK
156
157 if (bio_add_page(bio, page, PAGE_CACHE_SIZE, 0) < PAGE_CACHE_SIZE) {
158 bio_put(bio);
93dfe2ac
JK
159 return -EFAULT;
160 }
161
cf04e8eb 162 submit_bio(fio->rw, bio);
93dfe2ac
JK
163 return 0;
164}
165
05ca3632 166void f2fs_submit_page_mbio(struct f2fs_io_info *fio)
93dfe2ac 167{
05ca3632 168 struct f2fs_sb_info *sbi = fio->sbi;
458e6197 169 enum page_type btype = PAGE_TYPE_OF_BIO(fio->type);
93dfe2ac 170 struct f2fs_bio_info *io;
940a6d34 171 bool is_read = is_read_io(fio->rw);
4375a336 172 struct page *bio_page;
93dfe2ac 173
940a6d34 174 io = is_read ? &sbi->read_io : &sbi->write_io[btype];
93dfe2ac 175
cf04e8eb 176 verify_block_addr(sbi, fio->blk_addr);
93dfe2ac 177
df0f8dc0 178 down_write(&io->io_rwsem);
93dfe2ac 179
940a6d34 180 if (!is_read)
93dfe2ac
JK
181 inc_page_count(sbi, F2FS_WRITEBACK);
182
cf04e8eb 183 if (io->bio && (io->last_block_in_bio != fio->blk_addr - 1 ||
458e6197
JK
184 io->fio.rw != fio->rw))
185 __submit_merged_bio(io);
93dfe2ac
JK
186alloc_new:
187 if (io->bio == NULL) {
90a893c7 188 int bio_blocks = MAX_BIO_BLOCKS(sbi);
940a6d34 189
cf04e8eb 190 io->bio = __bio_alloc(sbi, fio->blk_addr, bio_blocks, is_read);
458e6197 191 io->fio = *fio;
93dfe2ac
JK
192 }
193
4375a336
JK
194 bio_page = fio->encrypted_page ? fio->encrypted_page : fio->page;
195
196 if (bio_add_page(io->bio, bio_page, PAGE_CACHE_SIZE, 0) <
93dfe2ac 197 PAGE_CACHE_SIZE) {
458e6197 198 __submit_merged_bio(io);
93dfe2ac
JK
199 goto alloc_new;
200 }
201
cf04e8eb 202 io->last_block_in_bio = fio->blk_addr;
05ca3632 203 f2fs_trace_ios(fio, 0);
93dfe2ac 204
df0f8dc0 205 up_write(&io->io_rwsem);
05ca3632 206 trace_f2fs_submit_page_mbio(fio->page, fio);
93dfe2ac
JK
207}
208
0a8165d7 209/*
eb47b800
JK
210 * Lock ordering for the change of data block address:
211 * ->data_page
212 * ->node_page
213 * update block addresses in the node page
214 */
216a620a 215void set_data_blkaddr(struct dnode_of_data *dn)
eb47b800
JK
216{
217 struct f2fs_node *rn;
218 __le32 *addr_array;
219 struct page *node_page = dn->node_page;
220 unsigned int ofs_in_node = dn->ofs_in_node;
221
5514f0aa 222 f2fs_wait_on_page_writeback(node_page, NODE);
eb47b800 223
45590710 224 rn = F2FS_NODE(node_page);
eb47b800
JK
225
226 /* Get physical address of data block */
227 addr_array = blkaddr_in_node(rn);
e1509cf2 228 addr_array[ofs_in_node] = cpu_to_le32(dn->data_blkaddr);
eb47b800
JK
229 set_page_dirty(node_page);
230}
231
232int reserve_new_block(struct dnode_of_data *dn)
233{
4081363f 234 struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode);
eb47b800 235
6bacf52f 236 if (unlikely(is_inode_flag_set(F2FS_I(dn->inode), FI_NO_ALLOC)))
eb47b800 237 return -EPERM;
cfb271d4 238 if (unlikely(!inc_valid_block_count(sbi, dn->inode, 1)))
eb47b800
JK
239 return -ENOSPC;
240
c01e2853
NJ
241 trace_f2fs_reserve_new_block(dn->inode, dn->nid, dn->ofs_in_node);
242
eb47b800 243 dn->data_blkaddr = NEW_ADDR;
216a620a 244 set_data_blkaddr(dn);
a18ff063 245 mark_inode_dirty(dn->inode);
eb47b800
JK
246 sync_inode_page(dn);
247 return 0;
248}
249
b600965c
HL
250int f2fs_reserve_block(struct dnode_of_data *dn, pgoff_t index)
251{
252 bool need_put = dn->inode_page ? false : true;
253 int err;
254
255 err = get_dnode_of_data(dn, index, ALLOC_NODE);
256 if (err)
257 return err;
a8865372 258
b600965c
HL
259 if (dn->data_blkaddr == NULL_ADDR)
260 err = reserve_new_block(dn);
a8865372 261 if (err || need_put)
b600965c
HL
262 f2fs_put_dnode(dn);
263 return err;
264}
265
43f3eae1 266struct page *get_read_data_page(struct inode *inode, pgoff_t index, int rw)
eb47b800 267{
eb47b800
JK
268 struct address_space *mapping = inode->i_mapping;
269 struct dnode_of_data dn;
270 struct page *page;
cb3bc9ee 271 struct extent_info ei;
eb47b800 272 int err;
cf04e8eb 273 struct f2fs_io_info fio = {
05ca3632 274 .sbi = F2FS_I_SB(inode),
cf04e8eb 275 .type = DATA,
43f3eae1 276 .rw = rw,
4375a336 277 .encrypted_page = NULL,
cf04e8eb 278 };
eb47b800 279
4375a336
JK
280 if (f2fs_encrypted_inode(inode) && S_ISREG(inode->i_mode))
281 return read_mapping_page(mapping, index, NULL);
282
9ac1349a 283 page = grab_cache_page(mapping, index);
650495de
JK
284 if (!page)
285 return ERR_PTR(-ENOMEM);
286
cb3bc9ee
CY
287 if (f2fs_lookup_extent_cache(inode, index, &ei)) {
288 dn.data_blkaddr = ei.blk + index - ei.fofs;
289 goto got_it;
290 }
291
eb47b800 292 set_new_dnode(&dn, inode, NULL, NULL, 0);
266e97a8 293 err = get_dnode_of_data(&dn, index, LOOKUP_NODE);
86531d6b
JK
294 if (err)
295 goto put_err;
eb47b800
JK
296 f2fs_put_dnode(&dn);
297
6bacf52f 298 if (unlikely(dn.data_blkaddr == NULL_ADDR)) {
86531d6b
JK
299 err = -ENOENT;
300 goto put_err;
650495de 301 }
cb3bc9ee 302got_it:
43f3eae1
JK
303 if (PageUptodate(page)) {
304 unlock_page(page);
eb47b800 305 return page;
43f3eae1 306 }
eb47b800 307
d59ff4df
JK
308 /*
309 * A new dentry page is allocated but not able to be written, since its
310 * new inode page couldn't be allocated due to -ENOSPC.
311 * In such the case, its blkaddr can be remained as NEW_ADDR.
312 * see, f2fs_add_link -> get_new_data_page -> init_inode_metadata.
313 */
314 if (dn.data_blkaddr == NEW_ADDR) {
315 zero_user_segment(page, 0, PAGE_CACHE_SIZE);
316 SetPageUptodate(page);
43f3eae1 317 unlock_page(page);
d59ff4df
JK
318 return page;
319 }
eb47b800 320
cf04e8eb 321 fio.blk_addr = dn.data_blkaddr;
05ca3632
JK
322 fio.page = page;
323 err = f2fs_submit_page_bio(&fio);
393ff91f 324 if (err)
86531d6b 325 goto put_err;
43f3eae1 326 return page;
86531d6b
JK
327
328put_err:
329 f2fs_put_page(page, 1);
330 return ERR_PTR(err);
43f3eae1
JK
331}
332
333struct page *find_data_page(struct inode *inode, pgoff_t index)
334{
335 struct address_space *mapping = inode->i_mapping;
336 struct page *page;
337
338 page = find_get_page(mapping, index);
339 if (page && PageUptodate(page))
340 return page;
341 f2fs_put_page(page, 0);
342
343 page = get_read_data_page(inode, index, READ_SYNC);
344 if (IS_ERR(page))
345 return page;
346
347 if (PageUptodate(page))
348 return page;
349
350 wait_on_page_locked(page);
351 if (unlikely(!PageUptodate(page))) {
352 f2fs_put_page(page, 0);
353 return ERR_PTR(-EIO);
354 }
355 return page;
356}
357
358/*
359 * If it tries to access a hole, return an error.
360 * Because, the callers, functions in dir.c and GC, should be able to know
361 * whether this page exists or not.
362 */
363struct page *get_lock_data_page(struct inode *inode, pgoff_t index)
364{
365 struct address_space *mapping = inode->i_mapping;
366 struct page *page;
367repeat:
368 page = get_read_data_page(inode, index, READ_SYNC);
369 if (IS_ERR(page))
370 return page;
393ff91f 371
43f3eae1 372 /* wait for read completion */
393ff91f 373 lock_page(page);
6bacf52f 374 if (unlikely(!PageUptodate(page))) {
393ff91f
JK
375 f2fs_put_page(page, 1);
376 return ERR_PTR(-EIO);
eb47b800 377 }
6bacf52f 378 if (unlikely(page->mapping != mapping)) {
afcb7ca0
JK
379 f2fs_put_page(page, 1);
380 goto repeat;
eb47b800
JK
381 }
382 return page;
383}
384
0a8165d7 385/*
eb47b800
JK
386 * Caller ensures that this data page is never allocated.
387 * A new zero-filled data page is allocated in the page cache.
39936837 388 *
4f4124d0
CY
389 * Also, caller should grab and release a rwsem by calling f2fs_lock_op() and
390 * f2fs_unlock_op().
470f00e9
CY
391 * Note that, ipage is set only by make_empty_dir, and if any error occur,
392 * ipage should be released by this function.
eb47b800 393 */
64aa7ed9 394struct page *get_new_data_page(struct inode *inode,
a8865372 395 struct page *ipage, pgoff_t index, bool new_i_size)
eb47b800 396{
eb47b800
JK
397 struct address_space *mapping = inode->i_mapping;
398 struct page *page;
399 struct dnode_of_data dn;
400 int err;
01f28610
JK
401repeat:
402 page = grab_cache_page(mapping, index);
470f00e9
CY
403 if (!page) {
404 /*
405 * before exiting, we should make sure ipage will be released
406 * if any error occur.
407 */
408 f2fs_put_page(ipage, 1);
01f28610 409 return ERR_PTR(-ENOMEM);
470f00e9 410 }
eb47b800 411
a8865372 412 set_new_dnode(&dn, inode, ipage, NULL, 0);
b600965c 413 err = f2fs_reserve_block(&dn, index);
01f28610
JK
414 if (err) {
415 f2fs_put_page(page, 1);
eb47b800 416 return ERR_PTR(err);
a8865372 417 }
01f28610
JK
418 if (!ipage)
419 f2fs_put_dnode(&dn);
eb47b800
JK
420
421 if (PageUptodate(page))
01f28610 422 goto got_it;
eb47b800
JK
423
424 if (dn.data_blkaddr == NEW_ADDR) {
425 zero_user_segment(page, 0, PAGE_CACHE_SIZE);
393ff91f 426 SetPageUptodate(page);
eb47b800 427 } else {
4375a336 428 f2fs_put_page(page, 1);
a8865372 429
4375a336
JK
430 page = get_read_data_page(inode, index, READ_SYNC);
431 if (IS_ERR(page))
afcb7ca0 432 goto repeat;
4375a336
JK
433
434 /* wait for read completion */
435 lock_page(page);
eb47b800 436 }
01f28610 437got_it:
eb47b800
JK
438 if (new_i_size &&
439 i_size_read(inode) < ((index + 1) << PAGE_CACHE_SHIFT)) {
440 i_size_write(inode, ((index + 1) << PAGE_CACHE_SHIFT));
699489bb
JK
441 /* Only the directory inode sets new_i_size */
442 set_inode_flag(F2FS_I(inode), FI_UPDATE_DIR);
eb47b800
JK
443 }
444 return page;
445}
446
bfad7c2d
JK
447static int __allocate_data_block(struct dnode_of_data *dn)
448{
4081363f 449 struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode);
976e4c50 450 struct f2fs_inode_info *fi = F2FS_I(dn->inode);
bfad7c2d 451 struct f2fs_summary sum;
bfad7c2d 452 struct node_info ni;
38aa0889 453 int seg = CURSEG_WARM_DATA;
976e4c50 454 pgoff_t fofs;
bfad7c2d
JK
455
456 if (unlikely(is_inode_flag_set(F2FS_I(dn->inode), FI_NO_ALLOC)))
457 return -EPERM;
df6136ef
CY
458
459 dn->data_blkaddr = datablock_addr(dn->node_page, dn->ofs_in_node);
460 if (dn->data_blkaddr == NEW_ADDR)
461 goto alloc;
462
bfad7c2d
JK
463 if (unlikely(!inc_valid_block_count(sbi, dn->inode, 1)))
464 return -ENOSPC;
465
df6136ef 466alloc:
bfad7c2d
JK
467 get_node_info(sbi, dn->nid, &ni);
468 set_summary(&sum, dn->nid, dn->ofs_in_node, ni.version);
469
38aa0889
JK
470 if (dn->ofs_in_node == 0 && dn->inode_page == dn->node_page)
471 seg = CURSEG_DIRECT_IO;
472
df6136ef
CY
473 allocate_data_block(sbi, NULL, dn->data_blkaddr, &dn->data_blkaddr,
474 &sum, seg);
216a620a 475 set_data_blkaddr(dn);
bfad7c2d 476
976e4c50
JK
477 /* update i_size */
478 fofs = start_bidx_of_node(ofs_of_node(dn->node_page), fi) +
479 dn->ofs_in_node;
480 if (i_size_read(dn->inode) < ((fofs + 1) << PAGE_CACHE_SHIFT))
481 i_size_write(dn->inode, ((fofs + 1) << PAGE_CACHE_SHIFT));
482
3e72f721 483 /* direct IO doesn't use extent cache to maximize the performance */
a28ef1f5 484 f2fs_drop_largest_extent(dn->inode, fofs);
3e72f721 485
bfad7c2d
JK
486 return 0;
487}
488
59b802e5
JK
489static void __allocate_data_blocks(struct inode *inode, loff_t offset,
490 size_t count)
491{
492 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
493 struct dnode_of_data dn;
494 u64 start = F2FS_BYTES_TO_BLK(offset);
495 u64 len = F2FS_BYTES_TO_BLK(count);
496 bool allocated;
497 u64 end_offset;
498
499 while (len) {
500 f2fs_balance_fs(sbi);
501 f2fs_lock_op(sbi);
502
503 /* When reading holes, we need its node page */
504 set_new_dnode(&dn, inode, NULL, NULL, 0);
505 if (get_dnode_of_data(&dn, start, ALLOC_NODE))
506 goto out;
507
508 allocated = false;
509 end_offset = ADDRS_PER_PAGE(dn.node_page, F2FS_I(inode));
510
511 while (dn.ofs_in_node < end_offset && len) {
d6d4f1cb
CY
512 block_t blkaddr;
513
514 blkaddr = datablock_addr(dn.node_page, dn.ofs_in_node);
df6136ef 515 if (blkaddr == NULL_ADDR || blkaddr == NEW_ADDR) {
59b802e5
JK
516 if (__allocate_data_block(&dn))
517 goto sync_out;
518 allocated = true;
519 }
520 len--;
521 start++;
522 dn.ofs_in_node++;
523 }
524
525 if (allocated)
526 sync_inode_page(&dn);
527
528 f2fs_put_dnode(&dn);
529 f2fs_unlock_op(sbi);
530 }
531 return;
532
533sync_out:
534 if (allocated)
535 sync_inode_page(&dn);
536 f2fs_put_dnode(&dn);
537out:
538 f2fs_unlock_op(sbi);
539 return;
540}
541
0a8165d7 542/*
003a3e1d
JK
543 * f2fs_map_blocks() now supported readahead/bmap/rw direct_IO with
544 * f2fs_map_blocks structure.
4f4124d0
CY
545 * If original data blocks are allocated, then give them to blockdev.
546 * Otherwise,
547 * a. preallocate requested block addresses
548 * b. do not use extent cache for better performance
549 * c. give the block addresses to blockdev
eb47b800 550 */
003a3e1d
JK
551static int f2fs_map_blocks(struct inode *inode, struct f2fs_map_blocks *map,
552 int create, bool fiemap)
eb47b800 553{
003a3e1d 554 unsigned int maxblocks = map->m_len;
eb47b800 555 struct dnode_of_data dn;
bfad7c2d
JK
556 int mode = create ? ALLOC_NODE : LOOKUP_NODE_RA;
557 pgoff_t pgofs, end_offset;
558 int err = 0, ofs = 1;
a2e7d1bf 559 struct extent_info ei;
bfad7c2d 560 bool allocated = false;
eb47b800 561
003a3e1d
JK
562 map->m_len = 0;
563 map->m_flags = 0;
564
565 /* it only supports block size == page size */
566 pgofs = (pgoff_t)map->m_lblk;
eb47b800 567
7e4dde79 568 if (f2fs_lookup_extent_cache(inode, pgofs, &ei)) {
003a3e1d
JK
569 map->m_pblk = ei.blk + pgofs - ei.fofs;
570 map->m_len = min((pgoff_t)maxblocks, ei.fofs + ei.len - pgofs);
571 map->m_flags = F2FS_MAP_MAPPED;
bfad7c2d 572 goto out;
a2e7d1bf 573 }
bfad7c2d 574
59b802e5 575 if (create)
4081363f 576 f2fs_lock_op(F2FS_I_SB(inode));
eb47b800
JK
577
578 /* When reading holes, we need its node page */
579 set_new_dnode(&dn, inode, NULL, NULL, 0);
bfad7c2d 580 err = get_dnode_of_data(&dn, pgofs, mode);
1ec79083 581 if (err) {
bfad7c2d
JK
582 if (err == -ENOENT)
583 err = 0;
584 goto unlock_out;
848753aa 585 }
ccfb3000 586 if (dn.data_blkaddr == NEW_ADDR && !fiemap)
1ec79083 587 goto put_out;
eb47b800 588
bfad7c2d 589 if (dn.data_blkaddr != NULL_ADDR) {
003a3e1d
JK
590 map->m_flags = F2FS_MAP_MAPPED;
591 map->m_pblk = dn.data_blkaddr;
7f63eb77
JK
592 if (dn.data_blkaddr == NEW_ADDR)
593 map->m_flags |= F2FS_MAP_UNWRITTEN;
bfad7c2d
JK
594 } else if (create) {
595 err = __allocate_data_block(&dn);
596 if (err)
597 goto put_out;
598 allocated = true;
003a3e1d
JK
599 map->m_flags = F2FS_MAP_NEW | F2FS_MAP_MAPPED;
600 map->m_pblk = dn.data_blkaddr;
bfad7c2d
JK
601 } else {
602 goto put_out;
603 }
604
6403eb1f 605 end_offset = ADDRS_PER_PAGE(dn.node_page, F2FS_I(inode));
003a3e1d 606 map->m_len = 1;
bfad7c2d
JK
607 dn.ofs_in_node++;
608 pgofs++;
609
610get_next:
611 if (dn.ofs_in_node >= end_offset) {
612 if (allocated)
613 sync_inode_page(&dn);
614 allocated = false;
615 f2fs_put_dnode(&dn);
616
617 set_new_dnode(&dn, inode, NULL, NULL, 0);
618 err = get_dnode_of_data(&dn, pgofs, mode);
1ec79083 619 if (err) {
bfad7c2d
JK
620 if (err == -ENOENT)
621 err = 0;
622 goto unlock_out;
623 }
ccfb3000 624 if (dn.data_blkaddr == NEW_ADDR && !fiemap)
1ec79083
JK
625 goto put_out;
626
6403eb1f 627 end_offset = ADDRS_PER_PAGE(dn.node_page, F2FS_I(inode));
bfad7c2d 628 }
eb47b800 629
003a3e1d 630 if (maxblocks > map->m_len) {
bfad7c2d
JK
631 block_t blkaddr = datablock_addr(dn.node_page, dn.ofs_in_node);
632 if (blkaddr == NULL_ADDR && create) {
633 err = __allocate_data_block(&dn);
634 if (err)
635 goto sync_out;
636 allocated = true;
003a3e1d 637 map->m_flags |= F2FS_MAP_NEW;
bfad7c2d
JK
638 blkaddr = dn.data_blkaddr;
639 }
e1c42045 640 /* Give more consecutive addresses for the readahead */
7f63eb77
JK
641 if ((map->m_pblk != NEW_ADDR &&
642 blkaddr == (map->m_pblk + ofs)) ||
643 (map->m_pblk == NEW_ADDR &&
644 blkaddr == NEW_ADDR)) {
bfad7c2d
JK
645 ofs++;
646 dn.ofs_in_node++;
647 pgofs++;
003a3e1d 648 map->m_len++;
bfad7c2d
JK
649 goto get_next;
650 }
eb47b800 651 }
bfad7c2d
JK
652sync_out:
653 if (allocated)
654 sync_inode_page(&dn);
655put_out:
eb47b800 656 f2fs_put_dnode(&dn);
bfad7c2d
JK
657unlock_out:
658 if (create)
4081363f 659 f2fs_unlock_op(F2FS_I_SB(inode));
bfad7c2d 660out:
003a3e1d 661 trace_f2fs_map_blocks(inode, map, err);
bfad7c2d 662 return err;
eb47b800
JK
663}
664
003a3e1d
JK
665static int __get_data_block(struct inode *inode, sector_t iblock,
666 struct buffer_head *bh, int create, bool fiemap)
667{
668 struct f2fs_map_blocks map;
669 int ret;
670
671 map.m_lblk = iblock;
672 map.m_len = bh->b_size >> inode->i_blkbits;
673
674 ret = f2fs_map_blocks(inode, &map, create, fiemap);
675 if (!ret) {
676 map_bh(bh, inode->i_sb, map.m_pblk);
677 bh->b_state = (bh->b_state & ~F2FS_MAP_FLAGS) | map.m_flags;
678 bh->b_size = map.m_len << inode->i_blkbits;
679 }
680 return ret;
681}
682
ccfb3000
JK
683static int get_data_block(struct inode *inode, sector_t iblock,
684 struct buffer_head *bh_result, int create)
685{
686 return __get_data_block(inode, iblock, bh_result, create, false);
687}
688
689static int get_data_block_fiemap(struct inode *inode, sector_t iblock,
690 struct buffer_head *bh_result, int create)
691{
692 return __get_data_block(inode, iblock, bh_result, create, true);
693}
694
7f63eb77
JK
695static inline sector_t logical_to_blk(struct inode *inode, loff_t offset)
696{
697 return (offset >> inode->i_blkbits);
698}
699
700static inline loff_t blk_to_logical(struct inode *inode, sector_t blk)
701{
702 return (blk << inode->i_blkbits);
703}
704
9ab70134
JK
705int f2fs_fiemap(struct inode *inode, struct fiemap_extent_info *fieinfo,
706 u64 start, u64 len)
707{
7f63eb77
JK
708 struct buffer_head map_bh;
709 sector_t start_blk, last_blk;
710 loff_t isize = i_size_read(inode);
711 u64 logical = 0, phys = 0, size = 0;
712 u32 flags = 0;
713 bool past_eof = false, whole_file = false;
714 int ret = 0;
715
716 ret = fiemap_check_flags(fieinfo, FIEMAP_FLAG_SYNC);
717 if (ret)
718 return ret;
719
720 mutex_lock(&inode->i_mutex);
721
722 if (len >= isize) {
723 whole_file = true;
724 len = isize;
725 }
726
727 if (logical_to_blk(inode, len) == 0)
728 len = blk_to_logical(inode, 1);
729
730 start_blk = logical_to_blk(inode, start);
731 last_blk = logical_to_blk(inode, start + len - 1);
732next:
733 memset(&map_bh, 0, sizeof(struct buffer_head));
734 map_bh.b_size = len;
735
736 ret = get_data_block_fiemap(inode, start_blk, &map_bh, 0);
737 if (ret)
738 goto out;
739
740 /* HOLE */
741 if (!buffer_mapped(&map_bh)) {
742 start_blk++;
743
744 if (!past_eof && blk_to_logical(inode, start_blk) >= isize)
745 past_eof = 1;
746
747 if (past_eof && size) {
748 flags |= FIEMAP_EXTENT_LAST;
749 ret = fiemap_fill_next_extent(fieinfo, logical,
750 phys, size, flags);
751 } else if (size) {
752 ret = fiemap_fill_next_extent(fieinfo, logical,
753 phys, size, flags);
754 size = 0;
755 }
756
757 /* if we have holes up to/past EOF then we're done */
758 if (start_blk > last_blk || past_eof || ret)
759 goto out;
760 } else {
761 if (start_blk > last_blk && !whole_file) {
762 ret = fiemap_fill_next_extent(fieinfo, logical,
763 phys, size, flags);
764 goto out;
765 }
766
767 /*
768 * if size != 0 then we know we already have an extent
769 * to add, so add it.
770 */
771 if (size) {
772 ret = fiemap_fill_next_extent(fieinfo, logical,
773 phys, size, flags);
774 if (ret)
775 goto out;
776 }
777
778 logical = blk_to_logical(inode, start_blk);
779 phys = blk_to_logical(inode, map_bh.b_blocknr);
780 size = map_bh.b_size;
781 flags = 0;
782 if (buffer_unwritten(&map_bh))
783 flags = FIEMAP_EXTENT_UNWRITTEN;
784
785 start_blk += logical_to_blk(inode, size);
786
787 /*
788 * If we are past the EOF, then we need to make sure as
789 * soon as we find a hole that the last extent we found
790 * is marked with FIEMAP_EXTENT_LAST
791 */
792 if (!past_eof && logical + size >= isize)
793 past_eof = true;
794 }
795 cond_resched();
796 if (fatal_signal_pending(current))
797 ret = -EINTR;
798 else
799 goto next;
800out:
801 if (ret == 1)
802 ret = 0;
803
804 mutex_unlock(&inode->i_mutex);
805 return ret;
9ab70134
JK
806}
807
f1e88660
JK
808/*
809 * This function was originally taken from fs/mpage.c, and customized for f2fs.
810 * Major change was from block_size == page_size in f2fs by default.
811 */
812static int f2fs_mpage_readpages(struct address_space *mapping,
813 struct list_head *pages, struct page *page,
814 unsigned nr_pages)
815{
816 struct bio *bio = NULL;
817 unsigned page_idx;
818 sector_t last_block_in_bio = 0;
819 struct inode *inode = mapping->host;
820 const unsigned blkbits = inode->i_blkbits;
821 const unsigned blocksize = 1 << blkbits;
822 sector_t block_in_file;
823 sector_t last_block;
824 sector_t last_block_in_file;
825 sector_t block_nr;
826 struct block_device *bdev = inode->i_sb->s_bdev;
827 struct f2fs_map_blocks map;
828
829 map.m_pblk = 0;
830 map.m_lblk = 0;
831 map.m_len = 0;
832 map.m_flags = 0;
833
834 for (page_idx = 0; nr_pages; page_idx++, nr_pages--) {
835
836 prefetchw(&page->flags);
837 if (pages) {
838 page = list_entry(pages->prev, struct page, lru);
839 list_del(&page->lru);
840 if (add_to_page_cache_lru(page, mapping,
841 page->index, GFP_KERNEL))
842 goto next_page;
843 }
844
845 block_in_file = (sector_t)page->index;
846 last_block = block_in_file + nr_pages;
847 last_block_in_file = (i_size_read(inode) + blocksize - 1) >>
848 blkbits;
849 if (last_block > last_block_in_file)
850 last_block = last_block_in_file;
851
852 /*
853 * Map blocks using the previous result first.
854 */
855 if ((map.m_flags & F2FS_MAP_MAPPED) &&
856 block_in_file > map.m_lblk &&
857 block_in_file < (map.m_lblk + map.m_len))
858 goto got_it;
859
860 /*
861 * Then do more f2fs_map_blocks() calls until we are
862 * done with this page.
863 */
864 map.m_flags = 0;
865
866 if (block_in_file < last_block) {
867 map.m_lblk = block_in_file;
868 map.m_len = last_block - block_in_file;
869
870 if (f2fs_map_blocks(inode, &map, 0, false))
871 goto set_error_page;
872 }
873got_it:
874 if ((map.m_flags & F2FS_MAP_MAPPED)) {
875 block_nr = map.m_pblk + block_in_file - map.m_lblk;
876 SetPageMappedToDisk(page);
877
878 if (!PageUptodate(page) && !cleancache_get_page(page)) {
879 SetPageUptodate(page);
880 goto confused;
881 }
882 } else {
883 zero_user_segment(page, 0, PAGE_CACHE_SIZE);
884 SetPageUptodate(page);
885 unlock_page(page);
886 goto next_page;
887 }
888
889 /*
890 * This page will go to BIO. Do we need to send this
891 * BIO off first?
892 */
893 if (bio && (last_block_in_bio != block_nr - 1)) {
894submit_and_realloc:
895 submit_bio(READ, bio);
896 bio = NULL;
897 }
898 if (bio == NULL) {
4375a336
JK
899 struct f2fs_crypto_ctx *ctx = NULL;
900
901 if (f2fs_encrypted_inode(inode) &&
902 S_ISREG(inode->i_mode)) {
903 struct page *cpage;
904
905 ctx = f2fs_get_crypto_ctx(inode);
906 if (IS_ERR(ctx))
907 goto set_error_page;
908
909 /* wait the page to be moved by cleaning */
910 cpage = find_lock_page(
911 META_MAPPING(F2FS_I_SB(inode)),
912 block_nr);
913 if (cpage) {
914 f2fs_wait_on_page_writeback(cpage,
915 DATA);
916 f2fs_put_page(cpage, 1);
917 }
918 }
919
f1e88660
JK
920 bio = bio_alloc(GFP_KERNEL,
921 min_t(int, nr_pages, bio_get_nr_vecs(bdev)));
4375a336
JK
922 if (!bio) {
923 if (ctx)
924 f2fs_release_crypto_ctx(ctx);
f1e88660 925 goto set_error_page;
4375a336 926 }
f1e88660
JK
927 bio->bi_bdev = bdev;
928 bio->bi_iter.bi_sector = SECTOR_FROM_BLOCK(block_nr);
12377024 929 bio->bi_end_io = f2fs_read_end_io;
4375a336 930 bio->bi_private = ctx;
f1e88660
JK
931 }
932
933 if (bio_add_page(bio, page, blocksize, 0) < blocksize)
934 goto submit_and_realloc;
935
936 last_block_in_bio = block_nr;
937 goto next_page;
938set_error_page:
939 SetPageError(page);
940 zero_user_segment(page, 0, PAGE_CACHE_SIZE);
941 unlock_page(page);
942 goto next_page;
943confused:
944 if (bio) {
945 submit_bio(READ, bio);
946 bio = NULL;
947 }
948 unlock_page(page);
949next_page:
950 if (pages)
951 page_cache_release(page);
952 }
953 BUG_ON(pages && !list_empty(pages));
954 if (bio)
955 submit_bio(READ, bio);
956 return 0;
957}
958
eb47b800
JK
959static int f2fs_read_data_page(struct file *file, struct page *page)
960{
9ffe0fb5 961 struct inode *inode = page->mapping->host;
b3d208f9 962 int ret = -EAGAIN;
9ffe0fb5 963
c20e89cd
CY
964 trace_f2fs_readpage(page, DATA);
965
e1c42045 966 /* If the file has inline data, try to read it directly */
9ffe0fb5
HL
967 if (f2fs_has_inline_data(inode))
968 ret = f2fs_read_inline_data(inode, page);
b3d208f9 969 if (ret == -EAGAIN)
f1e88660 970 ret = f2fs_mpage_readpages(page->mapping, NULL, page, 1);
9ffe0fb5 971 return ret;
eb47b800
JK
972}
973
974static int f2fs_read_data_pages(struct file *file,
975 struct address_space *mapping,
976 struct list_head *pages, unsigned nr_pages)
977{
9ffe0fb5
HL
978 struct inode *inode = file->f_mapping->host;
979
980 /* If the file has inline data, skip readpages */
981 if (f2fs_has_inline_data(inode))
982 return 0;
983
f1e88660 984 return f2fs_mpage_readpages(mapping, pages, NULL, nr_pages);
eb47b800
JK
985}
986
05ca3632 987int do_write_data_page(struct f2fs_io_info *fio)
eb47b800 988{
05ca3632 989 struct page *page = fio->page;
eb47b800 990 struct inode *inode = page->mapping->host;
eb47b800
JK
991 struct dnode_of_data dn;
992 int err = 0;
993
994 set_new_dnode(&dn, inode, NULL, NULL, 0);
266e97a8 995 err = get_dnode_of_data(&dn, page->index, LOOKUP_NODE);
eb47b800
JK
996 if (err)
997 return err;
998
cf04e8eb 999 fio->blk_addr = dn.data_blkaddr;
eb47b800
JK
1000
1001 /* This page is already truncated */
2bca1e23
JK
1002 if (fio->blk_addr == NULL_ADDR) {
1003 ClearPageUptodate(page);
eb47b800 1004 goto out_writepage;
2bca1e23 1005 }
eb47b800 1006
4375a336
JK
1007 if (f2fs_encrypted_inode(inode) && S_ISREG(inode->i_mode)) {
1008 fio->encrypted_page = f2fs_encrypt(inode, fio->page);
1009 if (IS_ERR(fio->encrypted_page)) {
1010 err = PTR_ERR(fio->encrypted_page);
1011 goto out_writepage;
1012 }
1013 }
1014
eb47b800
JK
1015 set_page_writeback(page);
1016
1017 /*
1018 * If current allocation needs SSR,
1019 * it had better in-place writes for updated data.
1020 */
cf04e8eb 1021 if (unlikely(fio->blk_addr != NEW_ADDR &&
b25958b6
HL
1022 !is_cold_data(page) &&
1023 need_inplace_update(inode))) {
05ca3632 1024 rewrite_data_page(fio);
fff04f90 1025 set_inode_flag(F2FS_I(inode), FI_UPDATE_WRITE);
8ce67cb0 1026 trace_f2fs_do_write_data_page(page, IPU);
eb47b800 1027 } else {
05ca3632 1028 write_data_page(&dn, fio);
216a620a 1029 set_data_blkaddr(&dn);
7e4dde79 1030 f2fs_update_extent_cache(&dn);
8ce67cb0 1031 trace_f2fs_do_write_data_page(page, OPU);
fff04f90 1032 set_inode_flag(F2FS_I(inode), FI_APPEND_WRITE);
3c6c2beb
JK
1033 if (page->index == 0)
1034 set_inode_flag(F2FS_I(inode), FI_FIRST_BLOCK_WRITTEN);
eb47b800
JK
1035 }
1036out_writepage:
1037 f2fs_put_dnode(&dn);
1038 return err;
1039}
1040
1041static int f2fs_write_data_page(struct page *page,
1042 struct writeback_control *wbc)
1043{
1044 struct inode *inode = page->mapping->host;
4081363f 1045 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
eb47b800
JK
1046 loff_t i_size = i_size_read(inode);
1047 const pgoff_t end_index = ((unsigned long long) i_size)
1048 >> PAGE_CACHE_SHIFT;
9ffe0fb5 1049 unsigned offset = 0;
39936837 1050 bool need_balance_fs = false;
eb47b800 1051 int err = 0;
458e6197 1052 struct f2fs_io_info fio = {
05ca3632 1053 .sbi = sbi,
458e6197 1054 .type = DATA,
6c311ec6 1055 .rw = (wbc->sync_mode == WB_SYNC_ALL) ? WRITE_SYNC : WRITE,
05ca3632 1056 .page = page,
4375a336 1057 .encrypted_page = NULL,
458e6197 1058 };
eb47b800 1059
ecda0de3
CY
1060 trace_f2fs_writepage(page, DATA);
1061
eb47b800 1062 if (page->index < end_index)
39936837 1063 goto write;
eb47b800
JK
1064
1065 /*
1066 * If the offset is out-of-range of file size,
1067 * this page does not have to be written to disk.
1068 */
1069 offset = i_size & (PAGE_CACHE_SIZE - 1);
76f60268 1070 if ((page->index >= end_index + 1) || !offset)
39936837 1071 goto out;
eb47b800
JK
1072
1073 zero_user_segment(page, offset, PAGE_CACHE_SIZE);
39936837 1074write:
caf0047e 1075 if (unlikely(is_sbi_flag_set(sbi, SBI_POR_DOING)))
eb47b800 1076 goto redirty_out;
1e84371f
JK
1077 if (f2fs_is_drop_cache(inode))
1078 goto out;
1079 if (f2fs_is_volatile_file(inode) && !wbc->for_reclaim &&
1080 available_free_memory(sbi, BASE_CHECK))
1081 goto redirty_out;
eb47b800 1082
39936837 1083 /* Dentry blocks are controlled by checkpoint */
eb47b800 1084 if (S_ISDIR(inode->i_mode)) {
cf779cab
JK
1085 if (unlikely(f2fs_cp_error(sbi)))
1086 goto redirty_out;
05ca3632 1087 err = do_write_data_page(&fio);
8618b881
JK
1088 goto done;
1089 }
9ffe0fb5 1090
cf779cab
JK
1091 /* we should bypass data pages to proceed the kworkder jobs */
1092 if (unlikely(f2fs_cp_error(sbi))) {
1093 SetPageError(page);
a7ffdbe2 1094 goto out;
cf779cab
JK
1095 }
1096
8618b881 1097 if (!wbc->for_reclaim)
39936837 1098 need_balance_fs = true;
8618b881 1099 else if (has_not_enough_free_secs(sbi, 0))
39936837 1100 goto redirty_out;
eb47b800 1101
b3d208f9 1102 err = -EAGAIN;
8618b881 1103 f2fs_lock_op(sbi);
b3d208f9
JK
1104 if (f2fs_has_inline_data(inode))
1105 err = f2fs_write_inline_data(inode, page);
1106 if (err == -EAGAIN)
05ca3632 1107 err = do_write_data_page(&fio);
8618b881
JK
1108 f2fs_unlock_op(sbi);
1109done:
1110 if (err && err != -ENOENT)
1111 goto redirty_out;
eb47b800 1112
eb47b800 1113 clear_cold_data(page);
39936837 1114out:
a7ffdbe2 1115 inode_dec_dirty_pages(inode);
2bca1e23
JK
1116 if (err)
1117 ClearPageUptodate(page);
eb47b800 1118 unlock_page(page);
39936837 1119 if (need_balance_fs)
eb47b800 1120 f2fs_balance_fs(sbi);
2aea39ec
JK
1121 if (wbc->for_reclaim)
1122 f2fs_submit_merged_bio(sbi, DATA, WRITE);
eb47b800
JK
1123 return 0;
1124
eb47b800 1125redirty_out:
76f60268 1126 redirty_page_for_writepage(wbc, page);
8618b881 1127 return AOP_WRITEPAGE_ACTIVATE;
eb47b800
JK
1128}
1129
fa9150a8
NJ
1130static int __f2fs_writepage(struct page *page, struct writeback_control *wbc,
1131 void *data)
1132{
1133 struct address_space *mapping = data;
1134 int ret = mapping->a_ops->writepage(page, wbc);
1135 mapping_set_error(mapping, ret);
1136 return ret;
1137}
1138
8f46dcae
CY
1139/*
1140 * This function was copied from write_cche_pages from mm/page-writeback.c.
1141 * The major change is making write step of cold data page separately from
1142 * warm/hot data page.
1143 */
1144static int f2fs_write_cache_pages(struct address_space *mapping,
1145 struct writeback_control *wbc, writepage_t writepage,
1146 void *data)
1147{
1148 int ret = 0;
1149 int done = 0;
1150 struct pagevec pvec;
1151 int nr_pages;
1152 pgoff_t uninitialized_var(writeback_index);
1153 pgoff_t index;
1154 pgoff_t end; /* Inclusive */
1155 pgoff_t done_index;
1156 int cycled;
1157 int range_whole = 0;
1158 int tag;
1159 int step = 0;
1160
1161 pagevec_init(&pvec, 0);
1162next:
1163 if (wbc->range_cyclic) {
1164 writeback_index = mapping->writeback_index; /* prev offset */
1165 index = writeback_index;
1166 if (index == 0)
1167 cycled = 1;
1168 else
1169 cycled = 0;
1170 end = -1;
1171 } else {
1172 index = wbc->range_start >> PAGE_CACHE_SHIFT;
1173 end = wbc->range_end >> PAGE_CACHE_SHIFT;
1174 if (wbc->range_start == 0 && wbc->range_end == LLONG_MAX)
1175 range_whole = 1;
1176 cycled = 1; /* ignore range_cyclic tests */
1177 }
1178 if (wbc->sync_mode == WB_SYNC_ALL || wbc->tagged_writepages)
1179 tag = PAGECACHE_TAG_TOWRITE;
1180 else
1181 tag = PAGECACHE_TAG_DIRTY;
1182retry:
1183 if (wbc->sync_mode == WB_SYNC_ALL || wbc->tagged_writepages)
1184 tag_pages_for_writeback(mapping, index, end);
1185 done_index = index;
1186 while (!done && (index <= end)) {
1187 int i;
1188
1189 nr_pages = pagevec_lookup_tag(&pvec, mapping, &index, tag,
1190 min(end - index, (pgoff_t)PAGEVEC_SIZE - 1) + 1);
1191 if (nr_pages == 0)
1192 break;
1193
1194 for (i = 0; i < nr_pages; i++) {
1195 struct page *page = pvec.pages[i];
1196
1197 if (page->index > end) {
1198 done = 1;
1199 break;
1200 }
1201
1202 done_index = page->index;
1203
1204 lock_page(page);
1205
1206 if (unlikely(page->mapping != mapping)) {
1207continue_unlock:
1208 unlock_page(page);
1209 continue;
1210 }
1211
1212 if (!PageDirty(page)) {
1213 /* someone wrote it for us */
1214 goto continue_unlock;
1215 }
1216
737f1899 1217 if (step == is_cold_data(page))
8f46dcae
CY
1218 goto continue_unlock;
1219
1220 if (PageWriteback(page)) {
1221 if (wbc->sync_mode != WB_SYNC_NONE)
1222 f2fs_wait_on_page_writeback(page, DATA);
1223 else
1224 goto continue_unlock;
1225 }
1226
1227 BUG_ON(PageWriteback(page));
1228 if (!clear_page_dirty_for_io(page))
1229 goto continue_unlock;
1230
1231 ret = (*writepage)(page, wbc, data);
1232 if (unlikely(ret)) {
1233 if (ret == AOP_WRITEPAGE_ACTIVATE) {
1234 unlock_page(page);
1235 ret = 0;
1236 } else {
1237 done_index = page->index + 1;
1238 done = 1;
1239 break;
1240 }
1241 }
1242
1243 if (--wbc->nr_to_write <= 0 &&
1244 wbc->sync_mode == WB_SYNC_NONE) {
1245 done = 1;
1246 break;
1247 }
1248 }
1249 pagevec_release(&pvec);
1250 cond_resched();
1251 }
1252
1253 if (step < 1) {
1254 step++;
1255 goto next;
1256 }
1257
1258 if (!cycled && !done) {
1259 cycled = 1;
1260 index = 0;
1261 end = writeback_index - 1;
1262 goto retry;
1263 }
1264 if (wbc->range_cyclic || (range_whole && wbc->nr_to_write > 0))
1265 mapping->writeback_index = done_index;
1266
1267 return ret;
1268}
1269
25ca923b 1270static int f2fs_write_data_pages(struct address_space *mapping,
eb47b800
JK
1271 struct writeback_control *wbc)
1272{
1273 struct inode *inode = mapping->host;
4081363f 1274 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
5463e7c1 1275 bool locked = false;
eb47b800 1276 int ret;
50c8cdb3 1277 long diff;
eb47b800 1278
e5748434
CY
1279 trace_f2fs_writepages(mapping->host, wbc, DATA);
1280
cfb185a1 1281 /* deal with chardevs and other special file */
1282 if (!mapping->a_ops->writepage)
1283 return 0;
1284
6a290544
CY
1285 /* skip writing if there is no dirty page in this inode */
1286 if (!get_dirty_pages(inode) && wbc->sync_mode == WB_SYNC_NONE)
1287 return 0;
1288
87d6f890 1289 if (S_ISDIR(inode->i_mode) && wbc->sync_mode == WB_SYNC_NONE &&
a7ffdbe2 1290 get_dirty_pages(inode) < nr_pages_to_skip(sbi, DATA) &&
6fb03f3a 1291 available_free_memory(sbi, DIRTY_DENTS))
d3baf95d 1292 goto skip_write;
87d6f890 1293
d5669f7b
JK
1294 /* during POR, we don't need to trigger writepage at all. */
1295 if (unlikely(is_sbi_flag_set(sbi, SBI_POR_DOING)))
1296 goto skip_write;
1297
50c8cdb3 1298 diff = nr_pages_to_write(sbi, DATA, wbc);
eb47b800 1299
5463e7c1
JK
1300 if (!S_ISDIR(inode->i_mode)) {
1301 mutex_lock(&sbi->writepages);
1302 locked = true;
1303 }
8f46dcae 1304 ret = f2fs_write_cache_pages(mapping, wbc, __f2fs_writepage, mapping);
bb96a8d5 1305 f2fs_submit_merged_bio(sbi, DATA, WRITE);
5463e7c1
JK
1306 if (locked)
1307 mutex_unlock(&sbi->writepages);
458e6197 1308
eb47b800
JK
1309 remove_dirty_dir_inode(inode);
1310
50c8cdb3 1311 wbc->nr_to_write = max((long)0, wbc->nr_to_write - diff);
eb47b800 1312 return ret;
d3baf95d
JK
1313
1314skip_write:
a7ffdbe2 1315 wbc->pages_skipped += get_dirty_pages(inode);
d3baf95d 1316 return 0;
eb47b800
JK
1317}
1318
3aab8f82
CY
1319static void f2fs_write_failed(struct address_space *mapping, loff_t to)
1320{
1321 struct inode *inode = mapping->host;
1322
1323 if (to > inode->i_size) {
1324 truncate_pagecache(inode, inode->i_size);
764aa3e9 1325 truncate_blocks(inode, inode->i_size, true);
3aab8f82
CY
1326 }
1327}
1328
eb47b800
JK
1329static int f2fs_write_begin(struct file *file, struct address_space *mapping,
1330 loff_t pos, unsigned len, unsigned flags,
1331 struct page **pagep, void **fsdata)
1332{
1333 struct inode *inode = mapping->host;
4081363f 1334 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
86531d6b
JK
1335 struct page *page = NULL;
1336 struct page *ipage;
eb47b800
JK
1337 pgoff_t index = ((unsigned long long) pos) >> PAGE_CACHE_SHIFT;
1338 struct dnode_of_data dn;
1339 int err = 0;
1340
62aed044
CY
1341 trace_f2fs_write_begin(inode, pos, len, flags);
1342
eb47b800 1343 f2fs_balance_fs(sbi);
5f727395
JK
1344
1345 /*
1346 * We should check this at this moment to avoid deadlock on inode page
1347 * and #0 page. The locking rule for inline_data conversion should be:
1348 * lock_page(page #0) -> lock_page(inode_page)
1349 */
1350 if (index != 0) {
1351 err = f2fs_convert_inline_inode(inode);
1352 if (err)
1353 goto fail;
1354 }
afcb7ca0 1355repeat:
eb47b800 1356 page = grab_cache_page_write_begin(mapping, index, flags);
3aab8f82
CY
1357 if (!page) {
1358 err = -ENOMEM;
1359 goto fail;
1360 }
d5f66990 1361
eb47b800
JK
1362 *pagep = page;
1363
e479556b 1364 f2fs_lock_op(sbi);
9ba69cf9
JK
1365
1366 /* check inline_data */
1367 ipage = get_node_page(sbi, inode->i_ino);
cd34e296
CY
1368 if (IS_ERR(ipage)) {
1369 err = PTR_ERR(ipage);
9ba69cf9 1370 goto unlock_fail;
cd34e296 1371 }
9ba69cf9 1372
b3d208f9
JK
1373 set_new_dnode(&dn, inode, ipage, ipage, 0);
1374
9ba69cf9 1375 if (f2fs_has_inline_data(inode)) {
b3d208f9
JK
1376 if (pos + len <= MAX_INLINE_DATA) {
1377 read_inline_data(page, ipage);
1378 set_inode_flag(F2FS_I(inode), FI_DATA_EXIST);
1379 sync_inode_page(&dn);
1380 goto put_next;
b3d208f9 1381 }
5f727395
JK
1382 err = f2fs_convert_inline_page(&dn, page);
1383 if (err)
1384 goto put_fail;
b600965c 1385 }
9ba69cf9
JK
1386 err = f2fs_reserve_block(&dn, index);
1387 if (err)
8cdcb713 1388 goto put_fail;
b3d208f9 1389put_next:
9ba69cf9
JK
1390 f2fs_put_dnode(&dn);
1391 f2fs_unlock_op(sbi);
1392
5768dcdd
FL
1393 f2fs_wait_on_page_writeback(page, DATA);
1394
90d4388a
CY
1395 if (len == PAGE_CACHE_SIZE)
1396 goto out_update;
1397 if (PageUptodate(page))
1398 goto out_clear;
eb47b800
JK
1399
1400 if ((pos & PAGE_CACHE_MASK) >= i_size_read(inode)) {
1401 unsigned start = pos & (PAGE_CACHE_SIZE - 1);
1402 unsigned end = start + len;
1403
1404 /* Reading beyond i_size is simple: memset to zero */
1405 zero_user_segments(page, 0, start, end, PAGE_CACHE_SIZE);
90d4388a 1406 goto out_update;
eb47b800
JK
1407 }
1408
b3d208f9 1409 if (dn.data_blkaddr == NEW_ADDR) {
eb47b800
JK
1410 zero_user_segment(page, 0, PAGE_CACHE_SIZE);
1411 } else {
cf04e8eb 1412 struct f2fs_io_info fio = {
05ca3632 1413 .sbi = sbi,
cf04e8eb
JK
1414 .type = DATA,
1415 .rw = READ_SYNC,
1416 .blk_addr = dn.data_blkaddr,
05ca3632 1417 .page = page,
4375a336 1418 .encrypted_page = NULL,
cf04e8eb 1419 };
05ca3632 1420 err = f2fs_submit_page_bio(&fio);
9234f319
JK
1421 if (err)
1422 goto fail;
d54c795b 1423
393ff91f 1424 lock_page(page);
6bacf52f 1425 if (unlikely(!PageUptodate(page))) {
3aab8f82
CY
1426 err = -EIO;
1427 goto fail;
eb47b800 1428 }
6bacf52f 1429 if (unlikely(page->mapping != mapping)) {
afcb7ca0
JK
1430 f2fs_put_page(page, 1);
1431 goto repeat;
eb47b800 1432 }
4375a336
JK
1433
1434 /* avoid symlink page */
1435 if (f2fs_encrypted_inode(inode) && S_ISREG(inode->i_mode)) {
1436 err = f2fs_decrypt_one(inode, page);
86531d6b 1437 if (err)
4375a336 1438 goto fail;
4375a336 1439 }
eb47b800 1440 }
90d4388a 1441out_update:
eb47b800 1442 SetPageUptodate(page);
90d4388a 1443out_clear:
eb47b800
JK
1444 clear_cold_data(page);
1445 return 0;
9ba69cf9 1446
8cdcb713
JK
1447put_fail:
1448 f2fs_put_dnode(&dn);
9ba69cf9
JK
1449unlock_fail:
1450 f2fs_unlock_op(sbi);
3aab8f82 1451fail:
86531d6b 1452 f2fs_put_page(page, 1);
3aab8f82
CY
1453 f2fs_write_failed(mapping, pos + len);
1454 return err;
eb47b800
JK
1455}
1456
a1dd3c13
JK
1457static int f2fs_write_end(struct file *file,
1458 struct address_space *mapping,
1459 loff_t pos, unsigned len, unsigned copied,
1460 struct page *page, void *fsdata)
1461{
1462 struct inode *inode = page->mapping->host;
1463
dfb2bf38
CY
1464 trace_f2fs_write_end(inode, pos, len, copied);
1465
34ba94ba 1466 set_page_dirty(page);
a1dd3c13
JK
1467
1468 if (pos + copied > i_size_read(inode)) {
1469 i_size_write(inode, pos + copied);
1470 mark_inode_dirty(inode);
1471 update_inode_page(inode);
1472 }
1473
75c3c8bc 1474 f2fs_put_page(page, 1);
a1dd3c13
JK
1475 return copied;
1476}
1477
6f673763
OS
1478static int check_direct_IO(struct inode *inode, struct iov_iter *iter,
1479 loff_t offset)
944fcfc1
JK
1480{
1481 unsigned blocksize_mask = inode->i_sb->s_blocksize - 1;
944fcfc1 1482
6f673763 1483 if (iov_iter_rw(iter) == READ)
944fcfc1
JK
1484 return 0;
1485
1486 if (offset & blocksize_mask)
1487 return -EINVAL;
1488
5b46f25d
AV
1489 if (iov_iter_alignment(iter) & blocksize_mask)
1490 return -EINVAL;
1491
944fcfc1
JK
1492 return 0;
1493}
1494
22c6186e
OS
1495static ssize_t f2fs_direct_IO(struct kiocb *iocb, struct iov_iter *iter,
1496 loff_t offset)
eb47b800
JK
1497{
1498 struct file *file = iocb->ki_filp;
3aab8f82
CY
1499 struct address_space *mapping = file->f_mapping;
1500 struct inode *inode = mapping->host;
1501 size_t count = iov_iter_count(iter);
1502 int err;
944fcfc1 1503
b3d208f9
JK
1504 /* we don't need to use inline_data strictly */
1505 if (f2fs_has_inline_data(inode)) {
1506 err = f2fs_convert_inline_inode(inode);
1507 if (err)
1508 return err;
1509 }
9ffe0fb5 1510
fcc85a4d
JK
1511 if (f2fs_encrypted_inode(inode) && S_ISREG(inode->i_mode))
1512 return 0;
1513
6f673763 1514 if (check_direct_IO(inode, iter, offset))
944fcfc1
JK
1515 return 0;
1516
6f673763 1517 trace_f2fs_direct_IO_enter(inode, offset, count, iov_iter_rw(iter));
70407fad 1518
6f673763 1519 if (iov_iter_rw(iter) == WRITE)
59b802e5
JK
1520 __allocate_data_blocks(inode, offset, count);
1521
17f8c842 1522 err = blockdev_direct_IO(iocb, inode, iter, offset, get_data_block);
6f673763 1523 if (err < 0 && iov_iter_rw(iter) == WRITE)
3aab8f82 1524 f2fs_write_failed(mapping, offset + count);
70407fad 1525
6f673763 1526 trace_f2fs_direct_IO_exit(inode, offset, count, iov_iter_rw(iter), err);
70407fad 1527
3aab8f82 1528 return err;
eb47b800
JK
1529}
1530
487261f3
CY
1531void f2fs_invalidate_page(struct page *page, unsigned int offset,
1532 unsigned int length)
eb47b800
JK
1533{
1534 struct inode *inode = page->mapping->host;
487261f3 1535 struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
a7ffdbe2 1536
487261f3
CY
1537 if (inode->i_ino >= F2FS_ROOT_INO(sbi) &&
1538 (offset % PAGE_CACHE_SIZE || length != PAGE_CACHE_SIZE))
a7ffdbe2
JK
1539 return;
1540
487261f3
CY
1541 if (PageDirty(page)) {
1542 if (inode->i_ino == F2FS_META_INO(sbi))
1543 dec_page_count(sbi, F2FS_DIRTY_META);
1544 else if (inode->i_ino == F2FS_NODE_INO(sbi))
1545 dec_page_count(sbi, F2FS_DIRTY_NODES);
1546 else
1547 inode_dec_dirty_pages(inode);
1548 }
eb47b800
JK
1549 ClearPagePrivate(page);
1550}
1551
487261f3 1552int f2fs_release_page(struct page *page, gfp_t wait)
eb47b800 1553{
f68daeeb
JK
1554 /* If this is dirty page, keep PagePrivate */
1555 if (PageDirty(page))
1556 return 0;
1557
eb47b800 1558 ClearPagePrivate(page);
c3850aa1 1559 return 1;
eb47b800
JK
1560}
1561
1562static int f2fs_set_data_page_dirty(struct page *page)
1563{
1564 struct address_space *mapping = page->mapping;
1565 struct inode *inode = mapping->host;
1566
26c6b887
JK
1567 trace_f2fs_set_page_dirty(page, DATA);
1568
eb47b800 1569 SetPageUptodate(page);
34ba94ba 1570
1e84371f 1571 if (f2fs_is_atomic_file(inode)) {
34ba94ba
JK
1572 register_inmem_page(inode, page);
1573 return 1;
1574 }
1575
eb47b800
JK
1576 if (!PageDirty(page)) {
1577 __set_page_dirty_nobuffers(page);
a7ffdbe2 1578 update_dirty_page(inode, page);
eb47b800
JK
1579 return 1;
1580 }
1581 return 0;
1582}
1583
c01e54b7
JK
1584static sector_t f2fs_bmap(struct address_space *mapping, sector_t block)
1585{
454ae7e5
CY
1586 struct inode *inode = mapping->host;
1587
b3d208f9
JK
1588 /* we don't need to use inline_data strictly */
1589 if (f2fs_has_inline_data(inode)) {
1590 int err = f2fs_convert_inline_inode(inode);
1591 if (err)
1592 return err;
1593 }
bfad7c2d 1594 return generic_block_bmap(mapping, block, get_data_block);
c01e54b7
JK
1595}
1596
eb47b800
JK
1597const struct address_space_operations f2fs_dblock_aops = {
1598 .readpage = f2fs_read_data_page,
1599 .readpages = f2fs_read_data_pages,
1600 .writepage = f2fs_write_data_page,
1601 .writepages = f2fs_write_data_pages,
1602 .write_begin = f2fs_write_begin,
a1dd3c13 1603 .write_end = f2fs_write_end,
eb47b800 1604 .set_page_dirty = f2fs_set_data_page_dirty,
487261f3
CY
1605 .invalidatepage = f2fs_invalidate_page,
1606 .releasepage = f2fs_release_page,
eb47b800 1607 .direct_IO = f2fs_direct_IO,
c01e54b7 1608 .bmap = f2fs_bmap,
eb47b800 1609};