// SPDX-License-Identifier: GPL-2.0
/*
 * fs/f2fs/data.c
 *
 * Copyright (c) 2012 Samsung Electronics Co., Ltd.
 *             http://www.samsung.com/
 */
#include <linux/fs.h>
#include <linux/f2fs_fs.h>
#include <linux/buffer_head.h>
#include <linux/sched/mm.h>
#include <linux/mpage.h>
#include <linux/writeback.h>
#include <linux/pagevec.h>
#include <linux/blkdev.h>
#include <linux/bio.h>
#include <linux/blk-crypto.h>
#include <linux/swap.h>
#include <linux/prefetch.h>
#include <linux/uio.h>
#include <linux/sched/signal.h>
#include <linux/fiemap.h>
#include <linux/iomap.h>

#include "f2fs.h"
#include "node.h"
#include "segment.h"
#include "iostat.h"
#include <trace/events/f2fs.h>

#define NUM_PREALLOC_POST_READ_CTXS	128

static struct kmem_cache *bio_post_read_ctx_cache;
static struct kmem_cache *bio_entry_slab;
static mempool_t *bio_post_read_ctx_pool;
static struct bio_set f2fs_bioset;

#define	F2FS_BIO_POOL_SIZE	NR_CURSEG_TYPE

int __init f2fs_init_bioset(void)
{
	if (bioset_init(&f2fs_bioset, F2FS_BIO_POOL_SIZE,
					0, BIOSET_NEED_BVECS))
		return -ENOMEM;
	return 0;
}
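
/*
 * Note: a private bio_set gives f2fs mempool-backed bio allocation, so bio
 * submission can keep making forward progress under memory pressure instead
 * of competing with every other filesystem for the global fs_bio_set.
 */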

void f2fs_destroy_bioset(void)
{
	bioset_exit(&f2fs_bioset);
}

static bool __is_cp_guaranteed(struct page *page)
{
	struct address_space *mapping = page->mapping;
	struct inode *inode;
	struct f2fs_sb_info *sbi;

	if (!mapping)
		return false;

	inode = mapping->host;
	sbi = F2FS_I_SB(inode);

	if (inode->i_ino == F2FS_META_INO(sbi) ||
			inode->i_ino == F2FS_NODE_INO(sbi) ||
			S_ISDIR(inode->i_mode))
		return true;

	if (f2fs_is_compressed_page(page))
		return false;
	if ((S_ISREG(inode->i_mode) &&
			(f2fs_is_atomic_file(inode) || IS_NOQUOTA(inode))) ||
			page_private_gcing(page))
		return true;
	return false;
}

static enum count_type __read_io_type(struct page *page)
{
	struct address_space *mapping = page_file_mapping(page);

	if (mapping) {
		struct inode *inode = mapping->host;
		struct f2fs_sb_info *sbi = F2FS_I_SB(inode);

		if (inode->i_ino == F2FS_META_INO(sbi))
			return F2FS_RD_META;

		if (inode->i_ino == F2FS_NODE_INO(sbi))
			return F2FS_RD_NODE;
	}
	return F2FS_RD_DATA;
}

/* postprocessing steps for read bios */
enum bio_post_read_step {
#ifdef CONFIG_FS_ENCRYPTION
	STEP_DECRYPT	= 1 << 0,
#else
	STEP_DECRYPT	= 0,	/* compile out the decryption-related code */
#endif
#ifdef CONFIG_F2FS_FS_COMPRESSION
	STEP_DECOMPRESS	= 1 << 1,
#else
	STEP_DECOMPRESS	= 0,	/* compile out the decompression-related code */
#endif
#ifdef CONFIG_FS_VERITY
	STEP_VERITY	= 1 << 2,
#else
	STEP_VERITY	= 0,	/* compile out the verity-related code */
#endif
};
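
/*
 * The steps above are OR-ed into bio_post_read_ctx->enabled_steps; e.g. an
 * encrypted verity file ends up with STEP_DECRYPT | STEP_VERITY.  A step
 * compiled out is defined as 0, so it drops out of the bitmask (and of any
 * "enabled_steps & STEP_*" test) automatically.
 */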

struct bio_post_read_ctx {
	struct bio *bio;
	struct f2fs_sb_info *sbi;
	struct work_struct work;
	unsigned int enabled_steps;
	block_t fs_blkaddr;
};

static void f2fs_finish_read_bio(struct bio *bio)
{
	struct bio_vec *bv;
	struct bvec_iter_all iter_all;

	/*
	 * Update and unlock the bio's pagecache pages, and put the
	 * decompression context for any compressed pages.
	 */
	bio_for_each_segment_all(bv, bio, iter_all) {
		struct page *page = bv->bv_page;

		if (f2fs_is_compressed_page(page)) {
			if (bio->bi_status)
				f2fs_end_read_compressed_page(page, true, 0);
			f2fs_put_page_dic(page);
			continue;
		}

		/* PG_error was set if decryption or verity failed. */
		if (bio->bi_status || PageError(page)) {
			ClearPageUptodate(page);
			/* will re-read again later */
			ClearPageError(page);
		} else {
			SetPageUptodate(page);
		}
		dec_page_count(F2FS_P_SB(page), __read_io_type(page));
		unlock_page(page);
	}

	if (bio->bi_private)
		mempool_free(bio->bi_private, bio_post_read_ctx_pool);
	bio_put(bio);
}

static void f2fs_verify_bio(struct work_struct *work)
{
	struct bio_post_read_ctx *ctx =
		container_of(work, struct bio_post_read_ctx, work);
	struct bio *bio = ctx->bio;
	bool may_have_compressed_pages = (ctx->enabled_steps & STEP_DECOMPRESS);

	/*
	 * fsverity_verify_bio() may call readpages() again, and while verity
	 * will be disabled for this, decryption and/or decompression may still
	 * be needed, resulting in another bio_post_read_ctx being allocated.
	 * So to prevent deadlocks we need to release the current ctx to the
	 * mempool first.  This assumes that verity is the last post-read step.
	 */
	mempool_free(ctx, bio_post_read_ctx_pool);
	bio->bi_private = NULL;

	/*
	 * Verify the bio's pages with fs-verity.  Exclude compressed pages,
	 * as those were handled separately by f2fs_end_read_compressed_page().
	 */
	if (may_have_compressed_pages) {
		struct bio_vec *bv;
		struct bvec_iter_all iter_all;

		bio_for_each_segment_all(bv, bio, iter_all) {
			struct page *page = bv->bv_page;

			if (!f2fs_is_compressed_page(page) &&
			    !PageError(page) && !fsverity_verify_page(page))
				SetPageError(page);
		}
	} else {
		fsverity_verify_bio(bio);
	}

	f2fs_finish_read_bio(bio);
}

/*
 * If the bio's data needs to be verified with fs-verity, then enqueue the
 * verity work for the bio.  Otherwise finish the bio now.
 *
 * Note that to avoid deadlocks, the verity work can't be done on the
 * decryption/decompression workqueue.  This is because verifying the data pages
 * can involve reading verity metadata pages from the file, and these verity
 * metadata pages may be encrypted and/or compressed.
 */
static void f2fs_verify_and_finish_bio(struct bio *bio)
{
	struct bio_post_read_ctx *ctx = bio->bi_private;

	if (ctx && (ctx->enabled_steps & STEP_VERITY)) {
		INIT_WORK(&ctx->work, f2fs_verify_bio);
		fsverity_enqueue_verify_work(&ctx->work);
	} else {
		f2fs_finish_read_bio(bio);
	}
}

/*
 * Handle STEP_DECOMPRESS by decompressing any compressed clusters whose last
 * remaining page was read by @ctx->bio.
 *
 * Note that a bio may span clusters (even a mix of compressed and uncompressed
 * clusters) or be for just part of a cluster.  STEP_DECOMPRESS just indicates
 * that the bio includes at least one compressed page.  The actual decompression
 * is done on a per-cluster basis, not a per-bio basis.
 */
static void f2fs_handle_step_decompress(struct bio_post_read_ctx *ctx)
{
	struct bio_vec *bv;
	struct bvec_iter_all iter_all;
	bool all_compressed = true;
	block_t blkaddr = ctx->fs_blkaddr;

	bio_for_each_segment_all(bv, ctx->bio, iter_all) {
		struct page *page = bv->bv_page;

		/* PG_error was set if decryption failed. */
		if (f2fs_is_compressed_page(page))
			f2fs_end_read_compressed_page(page, PageError(page),
						blkaddr);
		else
			all_compressed = false;

		blkaddr++;
	}

	/*
	 * Optimization: if all the bio's pages are compressed, then scheduling
	 * the per-bio verity work is unnecessary, as verity will be fully
	 * handled at the compression cluster level.
	 */
	if (all_compressed)
		ctx->enabled_steps &= ~STEP_VERITY;
}

static void f2fs_post_read_work(struct work_struct *work)
{
	struct bio_post_read_ctx *ctx =
		container_of(work, struct bio_post_read_ctx, work);

	if (ctx->enabled_steps & STEP_DECRYPT)
		fscrypt_decrypt_bio(ctx->bio);

	if (ctx->enabled_steps & STEP_DECOMPRESS)
		f2fs_handle_step_decompress(ctx);

	f2fs_verify_and_finish_bio(ctx->bio);
}
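
/*
 * To summarize the completion path built from the helpers above:
 * f2fs_read_end_io() queues f2fs_post_read_work() when decryption or
 * decompression is pending; that work decrypts, then decompresses, and
 * f2fs_verify_and_finish_bio() defers verity to yet another workqueue
 * before f2fs_finish_read_bio() finally updates and unlocks the pages.
 */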

static void f2fs_read_end_io(struct bio *bio)
{
	struct f2fs_sb_info *sbi = F2FS_P_SB(bio_first_page_all(bio));
	struct bio_post_read_ctx *ctx;

	iostat_update_and_unbind_ctx(bio, 0);
	ctx = bio->bi_private;

	if (time_to_inject(sbi, FAULT_READ_IO)) {
		f2fs_show_injection_info(sbi, FAULT_READ_IO);
		bio->bi_status = BLK_STS_IOERR;
	}

	if (bio->bi_status) {
		f2fs_finish_read_bio(bio);
		return;
	}

	if (ctx && (ctx->enabled_steps & (STEP_DECRYPT | STEP_DECOMPRESS))) {
		INIT_WORK(&ctx->work, f2fs_post_read_work);
		queue_work(ctx->sbi->post_read_wq, &ctx->work);
	} else {
		f2fs_verify_and_finish_bio(bio);
	}
}

static void f2fs_write_end_io(struct bio *bio)
{
	struct f2fs_sb_info *sbi;
	struct bio_vec *bvec;
	struct bvec_iter_all iter_all;

	iostat_update_and_unbind_ctx(bio, 1);
	sbi = bio->bi_private;

	if (time_to_inject(sbi, FAULT_WRITE_IO)) {
		f2fs_show_injection_info(sbi, FAULT_WRITE_IO);
		bio->bi_status = BLK_STS_IOERR;
	}

	bio_for_each_segment_all(bvec, bio, iter_all) {
		struct page *page = bvec->bv_page;
		enum count_type type = WB_DATA_TYPE(page);

		if (page_private_dummy(page)) {
			clear_page_private_dummy(page);
			unlock_page(page);
			mempool_free(page, sbi->write_io_dummy);

			if (unlikely(bio->bi_status))
				f2fs_stop_checkpoint(sbi, true);
			continue;
		}

		fscrypt_finalize_bounce_page(&page);

#ifdef CONFIG_F2FS_FS_COMPRESSION
		if (f2fs_is_compressed_page(page)) {
			f2fs_compress_write_end_io(bio, page);
			continue;
		}
#endif

		if (unlikely(bio->bi_status)) {
			mapping_set_error(page->mapping, -EIO);
			if (type == F2FS_WB_CP_DATA)
				f2fs_stop_checkpoint(sbi, true);
		}

		f2fs_bug_on(sbi, page->mapping == NODE_MAPPING(sbi) &&
					page->index != nid_of_node(page));

		dec_page_count(sbi, type);
		if (f2fs_in_warm_node_list(sbi, page))
			f2fs_del_fsync_node_entry(sbi, page);
		clear_page_private_gcing(page);
		end_page_writeback(page);
	}
	if (!get_pages(sbi, F2FS_WB_CP_DATA) &&
				wq_has_sleeper(&sbi->cp_wait))
		wake_up(&sbi->cp_wait);

	bio_put(bio);
}
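
/*
 * Recap of the write-completion duties above: alignment-only dummy pages
 * are returned to their mempool, fscrypt bounce pages are swapped back for
 * the original pagecache pages, compressed pages take their own path, and
 * a failed write of checkpoint-guaranteed data stops checkpointing.
 */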

struct block_device *f2fs_target_device(struct f2fs_sb_info *sbi,
		block_t blk_addr, sector_t *sector)
{
	struct block_device *bdev = sbi->sb->s_bdev;
	int i;

	if (f2fs_is_multi_device(sbi)) {
		for (i = 0; i < sbi->s_ndevs; i++) {
			if (FDEV(i).start_blk <= blk_addr &&
			    FDEV(i).end_blk >= blk_addr) {
				blk_addr -= FDEV(i).start_blk;
				bdev = FDEV(i).bdev;
				break;
			}
		}
	}

	if (sector)
		*sector = SECTOR_FROM_BLOCK(blk_addr);
	return bdev;
}

int f2fs_target_device_index(struct f2fs_sb_info *sbi, block_t blkaddr)
{
	int i;

	if (!f2fs_is_multi_device(sbi))
		return 0;

	for (i = 0; i < sbi->s_ndevs; i++)
		if (FDEV(i).start_blk <= blkaddr && FDEV(i).end_blk >= blkaddr)
			return i;
	return 0;
}

static void __attach_io_flag(struct f2fs_io_info *fio, unsigned int io_flag)
{
	unsigned int temp_mask = (1 << NR_TEMP_TYPE) - 1;
	unsigned int fua_flag = io_flag & temp_mask;
	unsigned int meta_flag = (io_flag >> NR_TEMP_TYPE) & temp_mask;

	/*
	 * data/node io flag bits per temp:
	 *      REQ_META     |      REQ_FUA      |
	 *    5 |    4 |   3 |    2 |    1 |   0 |
	 * Cold | Warm | Hot | Cold | Warm | Hot |
	 */
	if ((1 << fio->temp) & meta_flag)
		fio->op_flags |= REQ_META;
	if ((1 << fio->temp) & fua_flag)
		fio->op_flags |= REQ_FUA;
}
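
/*
 * Worked example for the layout above: with NR_TEMP_TYPE == 3, io_flag ==
 * 0x09 (0b001001) sets bit 0 of both fua_flag and meta_flag, so HOT data/node
 * I/O gets REQ_FUA and REQ_META while WARM and COLD I/O is left untouched.
 */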

static struct bio *__bio_alloc(struct f2fs_io_info *fio, int npages)
{
	struct f2fs_sb_info *sbi = fio->sbi;
	struct block_device *bdev;
	sector_t sector;
	struct bio *bio;

	if (fio->type == DATA)
		__attach_io_flag(fio, sbi->data_io_flag);
	else if (fio->type == NODE)
		__attach_io_flag(fio, sbi->node_io_flag);

	bdev = f2fs_target_device(sbi, fio->new_blkaddr, &sector);
	bio = bio_alloc_bioset(bdev, npages, fio->op | fio->op_flags, GFP_NOIO,
			       &f2fs_bioset);
	bio->bi_iter.bi_sector = sector;
	if (is_read_io(fio->op)) {
		bio->bi_end_io = f2fs_read_end_io;
		bio->bi_private = NULL;
	} else {
		bio->bi_end_io = f2fs_write_end_io;
		bio->bi_private = sbi;
431 432
		bio->bi_write_hint = f2fs_io_type_to_rw_hint(sbi,
						fio->type, fio->temp);
433
	}
434 435
	iostat_alloc_and_bind_ctx(sbi, bio, NULL);

436 437
	if (fio->io_wbc)
		wbc_init_bio(fio->io_wbc, bio);
438 439 440 441

	return bio;
}

static void f2fs_set_bio_crypt_ctx(struct bio *bio, const struct inode *inode,
				  pgoff_t first_idx,
				  const struct f2fs_io_info *fio,
				  gfp_t gfp_mask)
{
	/*
	 * The f2fs garbage collector sets ->encrypted_page when it wants to
	 * read/write raw data without encryption.
	 */
	if (!fio || !fio->encrypted_page)
		fscrypt_set_bio_crypt_ctx(bio, inode, first_idx, gfp_mask);
}

static bool f2fs_crypt_mergeable_bio(struct bio *bio, const struct inode *inode,
				     pgoff_t next_idx,
				     const struct f2fs_io_info *fio)
{
	/*
	 * The f2fs garbage collector sets ->encrypted_page when it wants to
	 * read/write raw data without encryption.
	 */
	if (fio && fio->encrypted_page)
		return !bio_has_crypt_ctx(bio);

	return fscrypt_mergeable_bio(bio, inode, next_idx);
}

static inline void __submit_bio(struct f2fs_sb_info *sbi,
				struct bio *bio, enum page_type type)
{
	if (!is_read_io(bio_op(bio))) {
		unsigned int start;

		if (type != DATA && type != NODE)
			goto submit_io;

		if (f2fs_lfs_mode(sbi) && current->plug)
			blk_finish_plug(current->plug);

		if (!F2FS_IO_ALIGNED(sbi))
			goto submit_io;

		start = bio->bi_iter.bi_size >> F2FS_BLKSIZE_BITS;
		start %= F2FS_IO_SIZE(sbi);

		if (start == 0)
			goto submit_io;

		/* fill dummy pages */
		for (; start < F2FS_IO_SIZE(sbi); start++) {
			struct page *page =
				mempool_alloc(sbi->write_io_dummy,
					      GFP_NOIO | __GFP_NOFAIL);
			f2fs_bug_on(sbi, !page);

			lock_page(page);

			zero_user_segment(page, 0, PAGE_SIZE);
			set_page_private_dummy(page);

			if (bio_add_page(bio, page, PAGE_SIZE, 0) < PAGE_SIZE)
				f2fs_bug_on(sbi, 1);
		}
		/*
		 * In the NODE case, we lose the next block address chain, so we
		 * need to do a checkpoint in f2fs_sync_file.
		 */
		if (type == NODE)
			set_sbi_flag(sbi, SBI_NEED_CP);
	}
submit_io:
	if (is_read_io(bio_op(bio)))
		trace_f2fs_submit_read_bio(sbi->sb, type, bio);
	else
		trace_f2fs_submit_write_bio(sbi->sb, type, bio);

	iostat_update_submit_ctx(bio, type);
	submit_bio(bio);
}
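
/*
 * Worked example for the alignment padding above (hypothetical geometry):
 * if F2FS_IO_SIZE() is 8 blocks and a write bio currently holds 13 blocks,
 * start becomes 13 % 8 = 5, so three dummy pages pad the bio out to the
 * next 16-block boundary before it is submitted.
 */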

void f2fs_submit_bio(struct f2fs_sb_info *sbi,
				struct bio *bio, enum page_type type)
{
	__submit_bio(sbi, bio, type);
}

static void __submit_merged_bio(struct f2fs_bio_info *io)
{
	struct f2fs_io_info *fio = &io->fio;

	if (!io->bio)
		return;

	if (is_read_io(fio->op))
		trace_f2fs_prepare_read_bio(io->sbi->sb, fio->type, io->bio);
	else
		trace_f2fs_prepare_write_bio(io->sbi->sb, fio->type, io->bio);

	__submit_bio(io->sbi, io->bio, fio->type);
	io->bio = NULL;
}

static bool __has_merged_page(struct bio *bio, struct inode *inode,
						struct page *page, nid_t ino)
{
	struct bio_vec *bvec;
	struct bvec_iter_all iter_all;

	if (!bio)
		return false;

	if (!inode && !page && !ino)
		return true;

	bio_for_each_segment_all(bvec, bio, iter_all) {
		struct page *target = bvec->bv_page;

		if (fscrypt_is_bounce_page(target)) {
			target = fscrypt_pagecache_page(target);
			if (IS_ERR(target))
				continue;
		}
		if (f2fs_is_compressed_page(target)) {
			target = f2fs_compress_control_page(target);
			if (IS_ERR(target))
				continue;
		}

		if (inode && inode == target->mapping->host)
			return true;
		if (page && page == target)
			return true;
		if (ino && ino == ino_of_node(target))
			return true;
	}

	return false;
}

static void __f2fs_submit_merged_write(struct f2fs_sb_info *sbi,
				enum page_type type, enum temp_type temp)
{
	enum page_type btype = PAGE_TYPE_OF_BIO(type);
	struct f2fs_bio_info *io = sbi->write_io[btype] + temp;

	f2fs_down_write(&io->io_rwsem);

	/* change META to META_FLUSH in the checkpoint procedure */
	if (type >= META_FLUSH) {
		io->fio.type = META_FLUSH;
		io->bio->bi_opf |= REQ_META | REQ_PRIO | REQ_SYNC;
		if (!test_opt(sbi, NOBARRIER))
			io->bio->bi_opf |= REQ_PREFLUSH | REQ_FUA;
	}
	__submit_merged_bio(io);
	f2fs_up_write(&io->io_rwsem);
}

static void __submit_merged_write_cond(struct f2fs_sb_info *sbi,
				struct inode *inode, struct page *page,
				nid_t ino, enum page_type type, bool force)
{
	enum temp_type temp;
	bool ret = true;

	for (temp = HOT; temp < NR_TEMP_TYPE; temp++) {
		if (!force)	{
			enum page_type btype = PAGE_TYPE_OF_BIO(type);
			struct f2fs_bio_info *io = sbi->write_io[btype] + temp;

			f2fs_down_read(&io->io_rwsem);
			ret = __has_merged_page(io->bio, inode, page, ino);
			f2fs_up_read(&io->io_rwsem);
		}
		if (ret)
			__f2fs_submit_merged_write(sbi, type, temp);

		/* TODO: use HOT temp only for meta pages now. */
		if (type >= META)
			break;
	}
}

void f2fs_submit_merged_write(struct f2fs_sb_info *sbi, enum page_type type)
{
	__submit_merged_write_cond(sbi, NULL, NULL, 0, type, true);
}

void f2fs_submit_merged_write_cond(struct f2fs_sb_info *sbi,
				struct inode *inode, struct page *page,
				nid_t ino, enum page_type type)
{
	__submit_merged_write_cond(sbi, inode, page, ino, type, false);
}

void f2fs_flush_merged_writes(struct f2fs_sb_info *sbi)
{
	f2fs_submit_merged_write(sbi, DATA);
	f2fs_submit_merged_write(sbi, NODE);
	f2fs_submit_merged_write(sbi, META);
}

/*
 * Fill the locked page with data located at the block address.
 * A caller needs to unlock the page on failure.
 */
int f2fs_submit_page_bio(struct f2fs_io_info *fio)
{
	struct bio *bio;
	struct page *page = fio->encrypted_page ?
			fio->encrypted_page : fio->page;

	if (!f2fs_is_valid_blkaddr(fio->sbi, fio->new_blkaddr,
			fio->is_por ? META_POR : (__is_meta_io(fio) ?
			META_GENERIC : DATA_GENERIC_ENHANCE)))
		return -EFSCORRUPTED;

	trace_f2fs_submit_page_bio(page, fio);

	/* Allocate a new bio */
	bio = __bio_alloc(fio, 1);

	f2fs_set_bio_crypt_ctx(bio, fio->page->mapping->host,
			       fio->page->index, fio, GFP_NOIO);

	if (bio_add_page(bio, page, PAGE_SIZE, 0) < PAGE_SIZE) {
		bio_put(bio);
		return -EFAULT;
	}

	if (fio->io_wbc && !is_read_io(fio->op))
		wbc_account_cgroup_owner(fio->io_wbc, page, PAGE_SIZE);

	inc_page_count(fio->sbi, is_read_io(fio->op) ?
			__read_io_type(page): WB_DATA_TYPE(fio->page));

	__submit_bio(fio->sbi, bio, fio->type);
	return 0;
}

static bool page_is_mergeable(struct f2fs_sb_info *sbi, struct bio *bio,
				block_t last_blkaddr, block_t cur_blkaddr)
{
	if (unlikely(sbi->max_io_bytes &&
			bio->bi_iter.bi_size >= sbi->max_io_bytes))
		return false;
	if (last_blkaddr + 1 != cur_blkaddr)
		return false;
	return bio->bi_bdev == f2fs_target_device(sbi, cur_blkaddr, NULL);
}

static bool io_type_is_mergeable(struct f2fs_bio_info *io,
						struct f2fs_io_info *fio)
{
	if (io->fio.op != fio->op)
		return false;
	return io->fio.op_flags == fio->op_flags;
}

static bool io_is_mergeable(struct f2fs_sb_info *sbi, struct bio *bio,
					struct f2fs_bio_info *io,
					struct f2fs_io_info *fio,
					block_t last_blkaddr,
					block_t cur_blkaddr)
{
	if (F2FS_IO_ALIGNED(sbi) && (fio->type == DATA || fio->type == NODE)) {
		unsigned int filled_blocks =
				F2FS_BYTES_TO_BLK(bio->bi_iter.bi_size);
		unsigned int io_size = F2FS_IO_SIZE(sbi);
		unsigned int left_vecs = bio->bi_max_vecs - bio->bi_vcnt;

		/* IOs in the bio are aligned and the space left for vectors is not enough */
		if (!(filled_blocks % io_size) && left_vecs < io_size)
			return false;
	}
	if (!page_is_mergeable(sbi, bio, last_blkaddr, cur_blkaddr))
		return false;
	return io_type_is_mergeable(io, fio);
}
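
/*
 * Taken together: a page may ride an existing bio only when the bio stays
 * under sbi->max_io_bytes, the new block is physically contiguous on the
 * same target device, op and op_flags match, and (in aligned-I/O mode)
 * enough bio vecs remain to complete the current F2FS_IO_SIZE() window.
 */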

static void add_bio_entry(struct f2fs_sb_info *sbi, struct bio *bio,
				struct page *page, enum temp_type temp)
{
	struct f2fs_bio_info *io = sbi->write_io[DATA] + temp;
	struct bio_entry *be;

	be = f2fs_kmem_cache_alloc(bio_entry_slab, GFP_NOFS, true, NULL);
	be->bio = bio;
	bio_get(bio);

	if (bio_add_page(bio, page, PAGE_SIZE, 0) != PAGE_SIZE)
		f2fs_bug_on(sbi, 1);

	f2fs_down_write(&io->bio_list_lock);
	list_add_tail(&be->list, &io->bio_list);
	f2fs_up_write(&io->bio_list_lock);
}

static void del_bio_entry(struct bio_entry *be)
{
	list_del(&be->list);
	kmem_cache_free(bio_entry_slab, be);
}

static int add_ipu_page(struct f2fs_io_info *fio, struct bio **bio,
							struct page *page)
{
	struct f2fs_sb_info *sbi = fio->sbi;
	enum temp_type temp;
	bool found = false;
	int ret = -EAGAIN;

	for (temp = HOT; temp < NR_TEMP_TYPE && !found; temp++) {
		struct f2fs_bio_info *io = sbi->write_io[DATA] + temp;
		struct list_head *head = &io->bio_list;
		struct bio_entry *be;

		f2fs_down_write(&io->bio_list_lock);
		list_for_each_entry(be, head, list) {
			if (be->bio != *bio)
				continue;

			found = true;

			f2fs_bug_on(sbi, !page_is_mergeable(sbi, *bio,
							    *fio->last_block,
							    fio->new_blkaddr));
			if (f2fs_crypt_mergeable_bio(*bio,
					fio->page->mapping->host,
					fio->page->index, fio) &&
			    bio_add_page(*bio, page, PAGE_SIZE, 0) ==
					PAGE_SIZE) {
				ret = 0;
				break;
			}

			/* page can't be merged into bio; submit the bio */
			del_bio_entry(be);
			__submit_bio(sbi, *bio, DATA);
			break;
		}
		f2fs_up_write(&io->bio_list_lock);
	}

	if (ret) {
		bio_put(*bio);
		*bio = NULL;
	}

	return ret;
}

void f2fs_submit_merged_ipu_write(struct f2fs_sb_info *sbi,
					struct bio **bio, struct page *page)
{
	enum temp_type temp;
	bool found = false;
	struct bio *target = bio ? *bio : NULL;

	for (temp = HOT; temp < NR_TEMP_TYPE && !found; temp++) {
		struct f2fs_bio_info *io = sbi->write_io[DATA] + temp;
		struct list_head *head = &io->bio_list;
		struct bio_entry *be;

		if (list_empty(head))
			continue;

		f2fs_down_read(&io->bio_list_lock);
		list_for_each_entry(be, head, list) {
			if (target)
				found = (target == be->bio);
			else
				found = __has_merged_page(be->bio, NULL,
								page, 0);
			if (found)
				break;
		}
		f2fs_up_read(&io->bio_list_lock);

		if (!found)
			continue;

		found = false;

		f2fs_down_write(&io->bio_list_lock);
		list_for_each_entry(be, head, list) {
			if (target)
				found = (target == be->bio);
			else
				found = __has_merged_page(be->bio, NULL,
								page, 0);
			if (found) {
				target = be->bio;
				del_bio_entry(be);
				break;
			}
		}
		f2fs_up_write(&io->bio_list_lock);
	}

	if (found)
		__submit_bio(sbi, target, DATA);
	if (bio && *bio) {
		bio_put(*bio);
		*bio = NULL;
	}
}

int f2fs_merge_page_bio(struct f2fs_io_info *fio)
{
	struct bio *bio = *fio->bio;
	struct page *page = fio->encrypted_page ?
			fio->encrypted_page : fio->page;

	if (!f2fs_is_valid_blkaddr(fio->sbi, fio->new_blkaddr,
			__is_meta_io(fio) ? META_GENERIC : DATA_GENERIC))
		return -EFSCORRUPTED;

	trace_f2fs_submit_page_bio(page, fio);

	if (bio && !page_is_mergeable(fio->sbi, bio, *fio->last_block,
						fio->new_blkaddr))
		f2fs_submit_merged_ipu_write(fio->sbi, &bio, NULL);
alloc_new:
	if (!bio) {
		bio = __bio_alloc(fio, BIO_MAX_VECS);
		f2fs_set_bio_crypt_ctx(bio, fio->page->mapping->host,
				       fio->page->index, fio, GFP_NOIO);

		add_bio_entry(fio->sbi, bio, page, fio->temp);
	} else {
		if (add_ipu_page(fio, &bio, page))
			goto alloc_new;
	}

	if (fio->io_wbc)
		wbc_account_cgroup_owner(fio->io_wbc, page, PAGE_SIZE);

	inc_page_count(fio->sbi, WB_DATA_TYPE(page));

	*fio->last_block = fio->new_blkaddr;
	*fio->bio = bio;

	return 0;
}

void f2fs_submit_page_write(struct f2fs_io_info *fio)
{
	struct f2fs_sb_info *sbi = fio->sbi;
	enum page_type btype = PAGE_TYPE_OF_BIO(fio->type);
	struct f2fs_bio_info *io = sbi->write_io[btype] + fio->temp;
	struct page *bio_page;

	f2fs_bug_on(sbi, is_read_io(fio->op));

	f2fs_down_write(&io->io_rwsem);
next:
	if (fio->in_list) {
		spin_lock(&io->io_lock);
		if (list_empty(&io->io_list)) {
			spin_unlock(&io->io_lock);
			goto out;
		}
		fio = list_first_entry(&io->io_list,
						struct f2fs_io_info, list);
		list_del(&fio->list);
		spin_unlock(&io->io_lock);
	}

	verify_fio_blkaddr(fio);

	if (fio->encrypted_page)
		bio_page = fio->encrypted_page;
	else if (fio->compressed_page)
		bio_page = fio->compressed_page;
	else
		bio_page = fio->page;

	/* set submitted = true as a return value */
	fio->submitted = true;

	inc_page_count(sbi, WB_DATA_TYPE(bio_page));

	if (io->bio &&
	    (!io_is_mergeable(sbi, io->bio, io, fio, io->last_block_in_bio,
			      fio->new_blkaddr) ||
	     !f2fs_crypt_mergeable_bio(io->bio, fio->page->mapping->host,
				       bio_page->index, fio)))
		__submit_merged_bio(io);
alloc_new:
	if (io->bio == NULL) {
		if (F2FS_IO_ALIGNED(sbi) &&
				(fio->type == DATA || fio->type == NODE) &&
				fio->new_blkaddr & F2FS_IO_SIZE_MASK(sbi)) {
			dec_page_count(sbi, WB_DATA_TYPE(bio_page));
			fio->retry = true;
			goto skip;
		}
		io->bio = __bio_alloc(fio, BIO_MAX_VECS);
		f2fs_set_bio_crypt_ctx(io->bio, fio->page->mapping->host,
				       bio_page->index, fio, GFP_NOIO);
		io->fio = *fio;
	}

	if (bio_add_page(io->bio, bio_page, PAGE_SIZE, 0) < PAGE_SIZE) {
		__submit_merged_bio(io);
		goto alloc_new;
	}

	if (fio->io_wbc)
		wbc_account_cgroup_owner(fio->io_wbc, bio_page, PAGE_SIZE);

	io->last_block_in_bio = fio->new_blkaddr;

	trace_f2fs_submit_page_write(fio->page, fio);
skip:
	if (fio->in_list)
		goto next;
out:
	if (is_sbi_flag_set(sbi, SBI_IS_SHUTDOWN) ||
				!f2fs_is_checkpoint_ready(sbi))
		__submit_merged_bio(io);
	f2fs_up_write(&io->io_rwsem);
}

static struct bio *f2fs_grab_read_bio(struct inode *inode, block_t blkaddr,
				      unsigned nr_pages, unsigned op_flag,
				      pgoff_t first_idx, bool for_write)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct bio *bio;
	struct bio_post_read_ctx *ctx = NULL;
	unsigned int post_read_steps = 0;
	sector_t sector;
	struct block_device *bdev = f2fs_target_device(sbi, blkaddr, &sector);

	bio = bio_alloc_bioset(bdev, bio_max_segs(nr_pages),
			       REQ_OP_READ | op_flag,
			       for_write ? GFP_NOIO : GFP_KERNEL, &f2fs_bioset);
	if (!bio)
		return ERR_PTR(-ENOMEM);
	bio->bi_iter.bi_sector = sector;
	f2fs_set_bio_crypt_ctx(bio, inode, first_idx, NULL, GFP_NOFS);
	bio->bi_end_io = f2fs_read_end_io;

	if (fscrypt_inode_uses_fs_layer_crypto(inode))
		post_read_steps |= STEP_DECRYPT;

	if (f2fs_need_verity(inode, first_idx))
		post_read_steps |= STEP_VERITY;

	/*
	 * STEP_DECOMPRESS is handled specially, since a compressed file might
	 * contain both compressed and uncompressed clusters.  We'll allocate a
	 * bio_post_read_ctx if the file is compressed, but the caller is
	 * responsible for enabling STEP_DECOMPRESS if it's actually needed.
	 */

	if (post_read_steps || f2fs_compressed_file(inode)) {
		/* Due to the mempool, this never fails. */
		ctx = mempool_alloc(bio_post_read_ctx_pool, GFP_NOFS);
		ctx->bio = bio;
		ctx->sbi = sbi;
		ctx->enabled_steps = post_read_steps;
		ctx->fs_blkaddr = blkaddr;
		bio->bi_private = ctx;
	}
	iostat_alloc_and_bind_ctx(sbi, bio, ctx);

	return bio;
}

/* This can handle encryption stuff */
static int f2fs_submit_page_read(struct inode *inode, struct page *page,
				 block_t blkaddr, int op_flags, bool for_write)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct bio *bio;

	bio = f2fs_grab_read_bio(inode, blkaddr, 1, op_flags,
					page->index, for_write);
	if (IS_ERR(bio))
		return PTR_ERR(bio);

	/* wait for GCed page writeback via META_MAPPING */
	f2fs_wait_on_block_writeback(inode, blkaddr);

	if (bio_add_page(bio, page, PAGE_SIZE, 0) < PAGE_SIZE) {
		bio_put(bio);
		return -EFAULT;
	}
	ClearPageError(page);
	inc_page_count(sbi, F2FS_RD_DATA);
	f2fs_update_iostat(sbi, FS_DATA_READ_IO, F2FS_BLKSIZE);
	__submit_bio(sbi, bio, DATA);
	return 0;
}

static void __set_data_blkaddr(struct dnode_of_data *dn)
{
	struct f2fs_node *rn = F2FS_NODE(dn->node_page);
	__le32 *addr_array;
	int base = 0;

	if (IS_INODE(dn->node_page) && f2fs_has_extra_attr(dn->inode))
		base = get_extra_isize(dn->inode);

	/* Get physical address of data block */
	addr_array = blkaddr_in_node(rn);
	addr_array[base + dn->ofs_in_node] = cpu_to_le32(dn->data_blkaddr);
}

/*
 * Lock ordering for the change of data block address:
 * ->data_page
 *  ->node_page
 *    update block addresses in the node page
 */
void f2fs_set_data_blkaddr(struct dnode_of_data *dn)
{
	f2fs_wait_on_page_writeback(dn->node_page, NODE, true, true);
	__set_data_blkaddr(dn);
	if (set_page_dirty(dn->node_page))
		dn->node_changed = true;
}

void f2fs_update_data_blkaddr(struct dnode_of_data *dn, block_t blkaddr)
{
	dn->data_blkaddr = blkaddr;
	f2fs_set_data_blkaddr(dn);
	f2fs_update_extent_cache(dn);
}

/* dn->ofs_in_node will be returned with up-to-date last block pointer */
int f2fs_reserve_new_blocks(struct dnode_of_data *dn, blkcnt_t count)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode);
	int err;

	if (!count)
		return 0;

	if (unlikely(is_inode_flag_set(dn->inode, FI_NO_ALLOC)))
		return -EPERM;
	if (unlikely((err = inc_valid_block_count(sbi, dn->inode, &count))))
		return err;

	trace_f2fs_reserve_new_blocks(dn->inode, dn->nid,
						dn->ofs_in_node, count);

	f2fs_wait_on_page_writeback(dn->node_page, NODE, true, true);

	for (; count > 0; dn->ofs_in_node++) {
		block_t blkaddr = f2fs_data_blkaddr(dn);

		if (blkaddr == NULL_ADDR) {
			dn->data_blkaddr = NEW_ADDR;
			__set_data_blkaddr(dn);
			count--;
		}
	}

	if (set_page_dirty(dn->node_page))
		dn->node_changed = true;
	return 0;
}

/* Should keep dn->ofs_in_node unchanged */
int f2fs_reserve_new_block(struct dnode_of_data *dn)
{
	unsigned int ofs_in_node = dn->ofs_in_node;
	int ret;

	ret = f2fs_reserve_new_blocks(dn, 1);
	dn->ofs_in_node = ofs_in_node;
	return ret;
}

int f2fs_reserve_block(struct dnode_of_data *dn, pgoff_t index)
{
	bool need_put = dn->inode_page ? false : true;
	int err;

	err = f2fs_get_dnode_of_data(dn, index, ALLOC_NODE);
	if (err)
		return err;

	if (dn->data_blkaddr == NULL_ADDR)
		err = f2fs_reserve_new_block(dn);
	if (err || need_put)
		f2fs_put_dnode(dn);
	return err;
}

int f2fs_get_block(struct dnode_of_data *dn, pgoff_t index)
{
	struct extent_info ei = {0, };
	struct inode *inode = dn->inode;

	if (f2fs_lookup_extent_cache(inode, index, &ei)) {
		dn->data_blkaddr = ei.blk + index - ei.fofs;
		return 0;
	}

	return f2fs_reserve_block(dn, index);
}

struct page *f2fs_get_read_data_page(struct inode *inode, pgoff_t index,
						int op_flags, bool for_write)
{
	struct address_space *mapping = inode->i_mapping;
	struct dnode_of_data dn;
	struct page *page;
	struct extent_info ei = {0, };
	int err;

	page = f2fs_grab_cache_page(mapping, index, for_write);
	if (!page)
		return ERR_PTR(-ENOMEM);

	if (f2fs_lookup_extent_cache(inode, index, &ei)) {
		dn.data_blkaddr = ei.blk + index - ei.fofs;
		if (!f2fs_is_valid_blkaddr(F2FS_I_SB(inode), dn.data_blkaddr,
						DATA_GENERIC_ENHANCE_READ)) {
			err = -EFSCORRUPTED;
			goto put_err;
		}
		goto got_it;
	}

	set_new_dnode(&dn, inode, NULL, NULL, 0);
	err = f2fs_get_dnode_of_data(&dn, index, LOOKUP_NODE);
	if (err)
		goto put_err;
	f2fs_put_dnode(&dn);

	if (unlikely(dn.data_blkaddr == NULL_ADDR)) {
		err = -ENOENT;
		goto put_err;
	}
	if (dn.data_blkaddr != NEW_ADDR &&
			!f2fs_is_valid_blkaddr(F2FS_I_SB(inode),
						dn.data_blkaddr,
						DATA_GENERIC_ENHANCE)) {
		err = -EFSCORRUPTED;
		goto put_err;
	}
got_it:
	if (PageUptodate(page)) {
		unlock_page(page);
		return page;
	}

	/*
	 * A new dentry page is allocated but not able to be written, since its
	 * new inode page couldn't be allocated due to -ENOSPC.
	 * In such a case, its blkaddr remains NEW_ADDR.
	 * see, f2fs_add_link -> f2fs_get_new_data_page ->
	 * f2fs_init_inode_metadata.
	 */
	if (dn.data_blkaddr == NEW_ADDR) {
		zero_user_segment(page, 0, PAGE_SIZE);
		if (!PageUptodate(page))
			SetPageUptodate(page);
		unlock_page(page);
		return page;
	}

	err = f2fs_submit_page_read(inode, page, dn.data_blkaddr,
						op_flags, for_write);
	if (err)
		goto put_err;
	return page;

put_err:
	f2fs_put_page(page, 1);
	return ERR_PTR(err);
}

struct page *f2fs_find_data_page(struct inode *inode, pgoff_t index)
{
	struct address_space *mapping = inode->i_mapping;
	struct page *page;

	page = find_get_page(mapping, index);
	if (page && PageUptodate(page))
		return page;
	f2fs_put_page(page, 0);

	page = f2fs_get_read_data_page(inode, index, 0, false);
	if (IS_ERR(page))
		return page;

	if (PageUptodate(page))
		return page;

	wait_on_page_locked(page);
	if (unlikely(!PageUptodate(page))) {
		f2fs_put_page(page, 0);
		return ERR_PTR(-EIO);
	}
	return page;
}

/*
 * If it tries to access a hole, return an error.
 * Because, the callers, functions in dir.c and GC, should be able to know
 * whether this page exists or not.
 */
struct page *f2fs_get_lock_data_page(struct inode *inode, pgoff_t index,
							bool for_write)
{
	struct address_space *mapping = inode->i_mapping;
	struct page *page;
repeat:
	page = f2fs_get_read_data_page(inode, index, 0, for_write);
	if (IS_ERR(page))
		return page;

	/* wait for read completion */
	lock_page(page);
	if (unlikely(page->mapping != mapping)) {
		f2fs_put_page(page, 1);
		goto repeat;
	}
	if (unlikely(!PageUptodate(page))) {
		f2fs_put_page(page, 1);
		return ERR_PTR(-EIO);
	}
	return page;
}

/*
 * Caller ensures that this data page is never allocated.
 * A new zero-filled data page is allocated in the page cache.
 *
 * Also, caller should grab and release a rwsem by calling f2fs_lock_op() and
 * f2fs_unlock_op().
 * Note that ipage is set only by make_empty_dir, and if any error occurs,
 * ipage should be released by this function.
 */
struct page *f2fs_get_new_data_page(struct inode *inode,
		struct page *ipage, pgoff_t index, bool new_i_size)
{
	struct address_space *mapping = inode->i_mapping;
	struct page *page;
	struct dnode_of_data dn;
	int err;

	page = f2fs_grab_cache_page(mapping, index, true);
	if (!page) {
		/*
		 * before exiting, we should make sure ipage will be released
		 * if any error occur.
		 */
		f2fs_put_page(ipage, 1);
		return ERR_PTR(-ENOMEM);
	}

	set_new_dnode(&dn, inode, ipage, NULL, 0);
	err = f2fs_reserve_block(&dn, index);
	if (err) {
		f2fs_put_page(page, 1);
		return ERR_PTR(err);
	}
	if (!ipage)
		f2fs_put_dnode(&dn);

	if (PageUptodate(page))
		goto got_it;

	if (dn.data_blkaddr == NEW_ADDR) {
		zero_user_segment(page, 0, PAGE_SIZE);
		if (!PageUptodate(page))
			SetPageUptodate(page);
	} else {
		f2fs_put_page(page, 1);

		/* if ipage exists, blkaddr should be NEW_ADDR */
		f2fs_bug_on(F2FS_I_SB(inode), ipage);
		page = f2fs_get_lock_data_page(inode, index, true);
		if (IS_ERR(page))
			return page;
	}
got_it:
	if (new_i_size && i_size_read(inode) <
				((loff_t)(index + 1) << PAGE_SHIFT))
		f2fs_i_size_write(inode, ((loff_t)(index + 1) << PAGE_SHIFT));
	return page;
}

static int __allocate_data_block(struct dnode_of_data *dn, int seg_type)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode);
	struct f2fs_summary sum;
	struct node_info ni;
	block_t old_blkaddr;
	blkcnt_t count = 1;
	int err;

	if (unlikely(is_inode_flag_set(dn->inode, FI_NO_ALLOC)))
		return -EPERM;

	err = f2fs_get_node_info(sbi, dn->nid, &ni, false);
	if (err)
		return err;

	dn->data_blkaddr = f2fs_data_blkaddr(dn);
	if (dn->data_blkaddr != NULL_ADDR)
		goto alloc;

	if (unlikely((err = inc_valid_block_count(sbi, dn->inode, &count))))
		return err;

alloc:
	set_summary(&sum, dn->nid, dn->ofs_in_node, ni.version);
	old_blkaddr = dn->data_blkaddr;
	f2fs_allocate_data_block(sbi, NULL, old_blkaddr, &dn->data_blkaddr,
				&sum, seg_type, NULL);
	if (GET_SEGNO(sbi, old_blkaddr) != NULL_SEGNO) {
		invalidate_mapping_pages(META_MAPPING(sbi),
					old_blkaddr, old_blkaddr);
		f2fs_invalidate_compress_page(sbi, old_blkaddr);
	}
	f2fs_update_data_blkaddr(dn, dn->data_blkaddr);
	return 0;
}

void f2fs_do_map_lock(struct f2fs_sb_info *sbi, int flag, bool lock)
{
	if (flag == F2FS_GET_BLOCK_PRE_AIO) {
		if (lock)
			f2fs_down_read(&sbi->node_change);
		else
			f2fs_up_read(&sbi->node_change);
	} else {
		if (lock)
			f2fs_lock_op(sbi);
		else
			f2fs_unlock_op(sbi);
	}
}

/*
 * f2fs_map_blocks() tries to find or build a mapping relationship which
 * maps continuous logical blocks to physical blocks, and returns such
 * info via the f2fs_map_blocks structure.
 */
int f2fs_map_blocks(struct inode *inode, struct f2fs_map_blocks *map,
						int create, int flag)
{
	unsigned int maxblocks = map->m_len;
	struct dnode_of_data dn;
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	int mode = map->m_may_create ? ALLOC_NODE : LOOKUP_NODE;
	pgoff_t pgofs, end_offset, end;
	int err = 0, ofs = 1;
	unsigned int ofs_in_node, last_ofs_in_node;
	blkcnt_t prealloc;
	struct extent_info ei = {0, };
	block_t blkaddr;
	unsigned int start_pgofs;
	int bidx = 0;

	if (!maxblocks)
		return 0;

	map->m_bdev = inode->i_sb->s_bdev;
	map->m_multidev_dio =
		f2fs_allow_multi_device_dio(F2FS_I_SB(inode), flag);

	map->m_len = 0;
	map->m_flags = 0;

	/* it only supports block size == page size */
	pgofs =	(pgoff_t)map->m_lblk;
	end = pgofs + maxblocks;

	if (!create && f2fs_lookup_extent_cache(inode, pgofs, &ei)) {
		if (f2fs_lfs_mode(sbi) && flag == F2FS_GET_BLOCK_DIO &&
							map->m_may_create)
			goto next_dnode;

		map->m_pblk = ei.blk + pgofs - ei.fofs;
		map->m_len = min((pgoff_t)maxblocks, ei.fofs + ei.len - pgofs);
		map->m_flags = F2FS_MAP_MAPPED;
		if (map->m_next_extent)
			*map->m_next_extent = pgofs + map->m_len;

		/* for hardware encryption, but to avoid potential issue in future */
		if (flag == F2FS_GET_BLOCK_DIO)
			f2fs_wait_on_block_writeback_range(inode,
						map->m_pblk, map->m_len);

		if (map->m_multidev_dio) {
			block_t blk_addr = map->m_pblk;

			bidx = f2fs_target_device_index(sbi, map->m_pblk);

			map->m_bdev = FDEV(bidx).bdev;
			map->m_pblk -= FDEV(bidx).start_blk;
			map->m_len = min(map->m_len,
				FDEV(bidx).end_blk + 1 - map->m_pblk);

			if (map->m_may_create)
				f2fs_update_device_state(sbi, inode->i_ino,
							blk_addr, map->m_len);
		}
		goto out;
	}

next_dnode:
	if (map->m_may_create)
		f2fs_do_map_lock(sbi, flag, true);

	/* When reading holes, we need its node page */
	set_new_dnode(&dn, inode, NULL, NULL, 0);
	err = f2fs_get_dnode_of_data(&dn, pgofs, mode);
	if (err) {
		if (flag == F2FS_GET_BLOCK_BMAP)
			map->m_pblk = 0;

		if (err == -ENOENT) {
			/*
			 * There is one exceptional case: read_node_page()
			 * may return -ENOENT because the filesystem has been
			 * shut down or hit cp_error, so force the error
			 * number to EIO in such a case.
			 */
			if (map->m_may_create &&
				(is_sbi_flag_set(sbi, SBI_IS_SHUTDOWN) ||
				f2fs_cp_error(sbi))) {
				err = -EIO;
				goto unlock_out;
			}

			err = 0;
			if (map->m_next_pgofs)
				*map->m_next_pgofs =
					f2fs_get_next_page_offset(&dn, pgofs);
			if (map->m_next_extent)
				*map->m_next_extent =
					f2fs_get_next_page_offset(&dn, pgofs);
		}
		goto unlock_out;
	}

	start_pgofs = pgofs;
	prealloc = 0;
	last_ofs_in_node = ofs_in_node = dn.ofs_in_node;
	end_offset = ADDRS_PER_PAGE(dn.node_page, inode);

next_block:
	blkaddr = f2fs_data_blkaddr(&dn);

	if (__is_valid_data_blkaddr(blkaddr) &&
		!f2fs_is_valid_blkaddr(sbi, blkaddr, DATA_GENERIC_ENHANCE)) {
		err = -EFSCORRUPTED;
		goto sync_out;
	}

	if (__is_valid_data_blkaddr(blkaddr)) {
		/* use out-of-place update for direct IO under LFS mode */
		if (f2fs_lfs_mode(sbi) && flag == F2FS_GET_BLOCK_DIO &&
							map->m_may_create) {
			err = __allocate_data_block(&dn, map->m_seg_type);
			if (err)
				goto sync_out;
			blkaddr = dn.data_blkaddr;
			set_inode_flag(inode, FI_APPEND_WRITE);
		}
	} else {
		if (create) {
			if (unlikely(f2fs_cp_error(sbi))) {
				err = -EIO;
				goto sync_out;
			}
			if (flag == F2FS_GET_BLOCK_PRE_AIO) {
				if (blkaddr == NULL_ADDR) {
					prealloc++;
					last_ofs_in_node = dn.ofs_in_node;
				}
			} else {
				WARN_ON(flag != F2FS_GET_BLOCK_PRE_DIO &&
					flag != F2FS_GET_BLOCK_DIO);
				err = __allocate_data_block(&dn,
							map->m_seg_type);
				if (!err) {
					if (flag == F2FS_GET_BLOCK_PRE_DIO)
						file_need_truncate(inode);
					set_inode_flag(inode, FI_APPEND_WRITE);
				}
			}
			if (err)
				goto sync_out;
			map->m_flags |= F2FS_MAP_NEW;
			blkaddr = dn.data_blkaddr;
		} else {
			if (f2fs_compressed_file(inode) &&
					f2fs_sanity_check_cluster(&dn) &&
					(flag != F2FS_GET_BLOCK_FIEMAP ||
					IS_ENABLED(CONFIG_F2FS_CHECK_FS))) {
				err = -EFSCORRUPTED;
				goto sync_out;
			}
			if (flag == F2FS_GET_BLOCK_BMAP) {
				map->m_pblk = 0;
				goto sync_out;
			}
			if (flag == F2FS_GET_BLOCK_PRECACHE)
				goto sync_out;
			if (flag == F2FS_GET_BLOCK_FIEMAP &&
						blkaddr == NULL_ADDR) {
				if (map->m_next_pgofs)
					*map->m_next_pgofs = pgofs + 1;
				goto sync_out;
			}
			if (flag != F2FS_GET_BLOCK_FIEMAP) {
				/* for defragment case */
				if (map->m_next_pgofs)
					*map->m_next_pgofs = pgofs + 1;
				goto sync_out;
			}
		}
	}

	if (flag == F2FS_GET_BLOCK_PRE_AIO)
		goto skip;

	if (map->m_multidev_dio)
		bidx = f2fs_target_device_index(sbi, blkaddr);

	if (map->m_len == 0) {
		/* preallocated unwritten block should be mapped for fiemap. */
		if (blkaddr == NEW_ADDR)
			map->m_flags |= F2FS_MAP_UNWRITTEN;
		map->m_flags |= F2FS_MAP_MAPPED;

		map->m_pblk = blkaddr;
		map->m_len = 1;

		if (map->m_multidev_dio)
			map->m_bdev = FDEV(bidx).bdev;
	} else if ((map->m_pblk != NEW_ADDR &&
			blkaddr == (map->m_pblk + ofs)) ||
			(map->m_pblk == NEW_ADDR && blkaddr == NEW_ADDR) ||
			flag == F2FS_GET_BLOCK_PRE_DIO) {
		if (map->m_multidev_dio && map->m_bdev != FDEV(bidx).bdev)
			goto sync_out;
		ofs++;
		map->m_len++;
	} else {
		goto sync_out;
	}

skip:
	dn.ofs_in_node++;
	pgofs++;

	/* preallocate blocks in batch for one dnode page */
	if (flag == F2FS_GET_BLOCK_PRE_AIO &&
			(pgofs == end || dn.ofs_in_node == end_offset)) {

		dn.ofs_in_node = ofs_in_node;
		err = f2fs_reserve_new_blocks(&dn, prealloc);
		if (err)
			goto sync_out;

		map->m_len += dn.ofs_in_node - ofs_in_node;
		if (prealloc && dn.ofs_in_node != last_ofs_in_node + 1) {
			err = -ENOSPC;
			goto sync_out;
		}
		dn.ofs_in_node = end_offset;
	}

	if (pgofs >= end)
		goto sync_out;
	else if (dn.ofs_in_node < end_offset)
		goto next_block;

	if (flag == F2FS_GET_BLOCK_PRECACHE) {
		if (map->m_flags & F2FS_MAP_MAPPED) {
			unsigned int ofs = start_pgofs - map->m_lblk;

			f2fs_update_extent_cache_range(&dn,
				start_pgofs, map->m_pblk + ofs,
				map->m_len - ofs);
		}
	}

	f2fs_put_dnode(&dn);

	if (map->m_may_create) {
		f2fs_do_map_lock(sbi, flag, false);
		f2fs_balance_fs(sbi, dn.node_changed);
	}
	goto next_dnode;

sync_out:

	if (flag == F2FS_GET_BLOCK_DIO && map->m_flags & F2FS_MAP_MAPPED) {
		/*
		 * for hardware encryption, but to avoid potential issue
		 * in future
		 */
		f2fs_wait_on_block_writeback_range(inode,
						map->m_pblk, map->m_len);
		invalidate_mapping_pages(META_MAPPING(sbi),
						map->m_pblk, map->m_pblk);

		if (map->m_multidev_dio) {
			block_t blk_addr = map->m_pblk;

			bidx = f2fs_target_device_index(sbi, map->m_pblk);

			map->m_bdev = FDEV(bidx).bdev;
			map->m_pblk -= FDEV(bidx).start_blk;

			if (map->m_may_create)
				f2fs_update_device_state(sbi, inode->i_ino,
							blk_addr, map->m_len);

			f2fs_bug_on(sbi, blk_addr + map->m_len >
						FDEV(bidx).end_blk + 1);
		}
	}

	if (flag == F2FS_GET_BLOCK_PRECACHE) {
		if (map->m_flags & F2FS_MAP_MAPPED) {
			unsigned int ofs = start_pgofs - map->m_lblk;

			f2fs_update_extent_cache_range(&dn,
				start_pgofs, map->m_pblk + ofs,
				map->m_len - ofs);
		}
		if (map->m_next_extent)
			*map->m_next_extent = pgofs + 1;
	}
	f2fs_put_dnode(&dn);
unlock_out:
	if (map->m_may_create) {
		f2fs_do_map_lock(sbi, flag, false);
		f2fs_balance_fs(sbi, dn.node_changed);
	}
out:
	trace_f2fs_map_blocks(inode, map, create, flag, err);
	return err;
}
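
/*
 * Minimal caller sketch: fill in m_lblk/m_len, pick a F2FS_GET_BLOCK_*
 * flag, and loop while advancing m_lblk by the returned m_len, exactly as
 * f2fs_overwrite_io() below does for its mapped-range check.
 */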

bool f2fs_overwrite_io(struct inode *inode, loff_t pos, size_t len)
{
	struct f2fs_map_blocks map;
	block_t last_lblk;
	int err;

	if (pos + len > i_size_read(inode))
		return false;

	map.m_lblk = F2FS_BYTES_TO_BLK(pos);
	map.m_next_pgofs = NULL;
	map.m_next_extent = NULL;
	map.m_seg_type = NO_CHECK_TYPE;
	map.m_may_create = false;
	last_lblk = F2FS_BLK_ALIGN(pos + len);

	while (map.m_lblk < last_lblk) {
		map.m_len = last_lblk - map.m_lblk;
		err = f2fs_map_blocks(inode, &map, 0, F2FS_GET_BLOCK_DEFAULT);
		if (err || map.m_len == 0)
			return false;
		map.m_lblk += map.m_len;
	}
	return true;
}

static inline u64 bytes_to_blks(struct inode *inode, u64 bytes)
{
	return (bytes >> inode->i_blkbits);
}

static inline u64 blks_to_bytes(struct inode *inode, u64 blks)
{
	return (blks << inode->i_blkbits);
}

static int f2fs_xattr_fiemap(struct inode *inode,
				struct fiemap_extent_info *fieinfo)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct page *page;
	struct node_info ni;
	__u64 phys = 0, len;
	__u32 flags;
	nid_t xnid = F2FS_I(inode)->i_xattr_nid;
	int err = 0;

	if (f2fs_has_inline_xattr(inode)) {
		int offset;

		page = f2fs_grab_cache_page(NODE_MAPPING(sbi),
						inode->i_ino, false);
		if (!page)
			return -ENOMEM;

		err = f2fs_get_node_info(sbi, inode->i_ino, &ni, false);
		if (err) {
			f2fs_put_page(page, 1);
			return err;
		}

		phys = blks_to_bytes(inode, ni.blk_addr);
		offset = offsetof(struct f2fs_inode, i_addr) +
					sizeof(__le32) * (DEF_ADDRS_PER_INODE -
					get_inline_xattr_addrs(inode));

		phys += offset;
		len = inline_xattr_size(inode);

		f2fs_put_page(page, 1);

		flags = FIEMAP_EXTENT_DATA_INLINE | FIEMAP_EXTENT_NOT_ALIGNED;

		if (!xnid)
			flags |= FIEMAP_EXTENT_LAST;

		err = fiemap_fill_next_extent(fieinfo, 0, phys, len, flags);
		trace_f2fs_fiemap(inode, 0, phys, len, flags, err);
		if (err || err == 1)
			return err;
	}

	if (xnid) {
		page = f2fs_grab_cache_page(NODE_MAPPING(sbi), xnid, false);
		if (!page)
			return -ENOMEM;

		err = f2fs_get_node_info(sbi, xnid, &ni, false);
		if (err) {
			f2fs_put_page(page, 1);
			return err;
		}

		phys = blks_to_bytes(inode, ni.blk_addr);
		len = inode->i_sb->s_blocksize;

		f2fs_put_page(page, 1);

		flags = FIEMAP_EXTENT_LAST;
	}

	if (phys) {
		err = fiemap_fill_next_extent(fieinfo, 0, phys, len, flags);
		trace_f2fs_fiemap(inode, 0, phys, len, flags, err);
	}

	return (err < 0 ? err : 0);
}

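/*
 * Upper bound on the data blocks addressable from one inode: the direct
 * pointers in the inode itself, plus two direct node blocks, two indirect
 * node blocks and one double-indirect node block.
 */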
static loff_t max_inode_blocks(struct inode *inode)
{
	loff_t result = ADDRS_PER_INODE(inode);
	loff_t leaf_count = ADDRS_PER_BLOCK(inode);

	/* two direct node blocks */
	result += (leaf_count * 2);

	/* two indirect node blocks */
	leaf_count *= NIDS_PER_BLOCK;
	result += (leaf_count * 2);

	/* one double indirect node block */
	leaf_count *= NIDS_PER_BLOCK;
	result += leaf_count;

	return result;
}

int f2fs_fiemap(struct inode *inode, struct fiemap_extent_info *fieinfo,
		u64 start, u64 len)
{
	struct f2fs_map_blocks map;
	sector_t start_blk, last_blk;
	pgoff_t next_pgofs;
	u64 logical = 0, phys = 0, size = 0;
	u32 flags = 0;
	int ret = 0;
	bool compr_cluster = false, compr_appended;
	unsigned int cluster_size = F2FS_I(inode)->i_cluster_size;
	unsigned int count_in_cluster = 0;
	loff_t maxbytes;

	if (fieinfo->fi_flags & FIEMAP_FLAG_CACHE) {
		ret = f2fs_precache_extents(inode);
		if (ret)
			return ret;
	}

	ret = fiemap_prep(inode, fieinfo, start, &len, FIEMAP_FLAG_XATTR);
	if (ret)
		return ret;

	inode_lock(inode);

	maxbytes = max_file_blocks(inode) << F2FS_BLKSIZE_BITS;
	if (start > maxbytes) {
		ret = -EFBIG;
		goto out;
	}

	if (len > maxbytes || (maxbytes - len) < start)
		len = maxbytes - start;

	if (fieinfo->fi_flags & FIEMAP_FLAG_XATTR) {
		ret = f2fs_xattr_fiemap(inode, fieinfo);
		goto out;
	}

	if (f2fs_has_inline_data(inode) || f2fs_has_inline_dentry(inode)) {
		ret = f2fs_inline_data_fiemap(inode, fieinfo, start, len);
		if (ret != -EAGAIN)
			goto out;
	}

	if (bytes_to_blks(inode, len) == 0)
		len = blks_to_bytes(inode, 1);

	start_blk = bytes_to_blks(inode, start);
	last_blk = bytes_to_blks(inode, start + len - 1);

next:
	memset(&map, 0, sizeof(map));
	map.m_lblk = start_blk;
	map.m_len = bytes_to_blks(inode, len);
	map.m_next_pgofs = &next_pgofs;
	map.m_seg_type = NO_CHECK_TYPE;

	if (compr_cluster) {
		map.m_lblk += 1;
		map.m_len = cluster_size - count_in_cluster;
	}

	ret = f2fs_map_blocks(inode, &map, 0, F2FS_GET_BLOCK_FIEMAP);
	if (ret)
		goto out;

	/* HOLE */
	if (!compr_cluster && !(map.m_flags & F2FS_MAP_FLAGS)) {
		start_blk = next_pgofs;

		if (blks_to_bytes(inode, start_blk) < blks_to_bytes(inode,
						max_inode_blocks(inode)))
			goto prep_next;

		flags |= FIEMAP_EXTENT_LAST;
	}

	compr_appended = false;
	/* In the case of a compressed cluster, append this to the last extent */
	if (compr_cluster && ((map.m_flags & F2FS_MAP_UNWRITTEN) ||
			!(map.m_flags & F2FS_MAP_FLAGS))) {
		compr_appended = true;
		goto skip_fill;
	}

	if (size) {
		flags |= FIEMAP_EXTENT_MERGED;
		if (IS_ENCRYPTED(inode))
			flags |= FIEMAP_EXTENT_DATA_ENCRYPTED;

		ret = fiemap_fill_next_extent(fieinfo, logical,
				phys, size, flags);
		trace_f2fs_fiemap(inode, logical, phys, size, flags, ret);
		if (ret)
			goto out;
		size = 0;
	}

	if (start_blk > last_blk)
		goto out;

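	/*
	 * A COMPRESS_ADDR in m_pblk marks the metadata slot of a compressed
	 * cluster: start counting its blocks and keep merging mappings until
	 * cluster_size blocks have been seen before emitting a single extent.
	 */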
skip_fill:
	if (map.m_pblk == COMPRESS_ADDR) {
		compr_cluster = true;
		count_in_cluster = 1;
	} else if (compr_appended) {
		unsigned int appended_blks = cluster_size -
						count_in_cluster + 1;
		size += blks_to_bytes(inode, appended_blks);
		start_blk += appended_blks;
		compr_cluster = false;
	} else {
		logical = blks_to_bytes(inode, start_blk);
		phys = __is_valid_data_blkaddr(map.m_pblk) ?
			blks_to_bytes(inode, map.m_pblk) : 0;
		size = blks_to_bytes(inode, map.m_len);
		flags = 0;

		if (compr_cluster) {
			flags = FIEMAP_EXTENT_ENCODED;
			count_in_cluster += map.m_len;
			if (count_in_cluster == cluster_size) {
				compr_cluster = false;
				size += blks_to_bytes(inode, 1);
			}
		} else if (map.m_flags & F2FS_MAP_UNWRITTEN) {
			flags = FIEMAP_EXTENT_UNWRITTEN;
		}

		start_blk += bytes_to_blks(inode, size);
	}

prep_next:
	cond_resched();
	if (fatal_signal_pending(current))
		ret = -EINTR;
	else
		goto next;
out:
	if (ret == 1)
		ret = 0;

	inode_unlock(inode);
	return ret;
}

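/*
 * fs-verity keeps its Merkle tree past i_size, so while verity is enabled
 * or being built the read limit is s_maxbytes rather than i_size.
 */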
static inline loff_t f2fs_readpage_limit(struct inode *inode)
{
	if (IS_ENABLED(CONFIG_FS_VERITY) &&
	    (IS_VERITY(inode) || f2fs_verity_in_progress(inode)))
		return inode->i_sb->s_maxbytes;

	return i_size_read(inode);
}

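/*
 * Read one page, reusing the caller's f2fs_map_blocks() result across calls
 * so a readahead window typically needs only one block-map lookup; the bio
 * is grown until the next block is not contiguous or not crypto-mergeable,
 * and only then submitted.
 */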
static int f2fs_read_single_page(struct inode *inode, struct page *page,
					unsigned nr_pages,
					struct f2fs_map_blocks *map,
					struct bio **bio_ret,
					sector_t *last_block_in_bio,
					bool is_readahead)
{
	struct bio *bio = *bio_ret;
	const unsigned blocksize = blks_to_bytes(inode, 1);
	sector_t block_in_file;
	sector_t last_block;
	sector_t last_block_in_file;
	sector_t block_nr;
	int ret = 0;

	block_in_file = (sector_t)page_index(page);
	last_block = block_in_file + nr_pages;
	last_block_in_file = bytes_to_blks(inode,
			f2fs_readpage_limit(inode) + blocksize - 1);
	if (last_block > last_block_in_file)
		last_block = last_block_in_file;

	/* just zeroing out page which is beyond EOF */
	if (block_in_file >= last_block)
		goto zero_out;
	/*
	 * Map blocks using the previous result first.
	 */
	if ((map->m_flags & F2FS_MAP_MAPPED) &&
			block_in_file > map->m_lblk &&
			block_in_file < (map->m_lblk + map->m_len))
		goto got_it;

	/*
	 * Then do more f2fs_map_blocks() calls until we are
	 * done with this page.
	 */
	map->m_lblk = block_in_file;
	map->m_len = last_block - block_in_file;

	ret = f2fs_map_blocks(inode, map, 0, F2FS_GET_BLOCK_DEFAULT);
	if (ret)
		goto out;
got_it:
	if ((map->m_flags & F2FS_MAP_MAPPED)) {
		block_nr = map->m_pblk + block_in_file - map->m_lblk;
		SetPageMappedToDisk(page);

		if (!f2fs_is_valid_blkaddr(F2FS_I_SB(inode), block_nr,
						DATA_GENERIC_ENHANCE_READ)) {
			ret = -EFSCORRUPTED;
			goto out;
		}
	} else {
zero_out:
		zero_user_segment(page, 0, PAGE_SIZE);
		if (f2fs_need_verity(inode, page->index) &&
		    !fsverity_verify_page(page)) {
			ret = -EIO;
			goto out;
		}
		if (!PageUptodate(page))
			SetPageUptodate(page);
		unlock_page(page);
		goto out;
	}

	/*
	 * This page will go to BIO.  Do we need to send this
	 * BIO off first?
	 */
	if (bio && (!page_is_mergeable(F2FS_I_SB(inode), bio,
				       *last_block_in_bio, block_nr) ||
		    !f2fs_crypt_mergeable_bio(bio, inode, page->index, NULL))) {
submit_and_realloc:
		__submit_bio(F2FS_I_SB(inode), bio, DATA);
		bio = NULL;
	}
	if (bio == NULL) {
		bio = f2fs_grab_read_bio(inode, block_nr, nr_pages,
				is_readahead ? REQ_RAHEAD : 0, page->index,
				false);
		if (IS_ERR(bio)) {
			ret = PTR_ERR(bio);
			bio = NULL;
			goto out;
		}
	}

	/*
	 * If the page is under writeback, we need to wait for
	 * its completion to see the correct decrypted data.
	 */
	f2fs_wait_on_block_writeback(inode, block_nr);

	if (bio_add_page(bio, page, blocksize, 0) < blocksize)
		goto submit_and_realloc;

	inc_page_count(F2FS_I_SB(inode), F2FS_RD_DATA);
	f2fs_update_iostat(F2FS_I_SB(inode), FS_DATA_READ_IO, F2FS_BLKSIZE);
	ClearPageError(page);
	*last_block_in_bio = block_nr;
	goto out;
out:
	*bio_ret = bio;
	return ret;
}

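/*
 * Read one compressed cluster: pages beyond EOF are zeroed and dropped, the
 * remaining compressed pages are read through the post-read machinery with
 * STEP_DECOMPRESS set, and decompression is kicked once the last compressed
 * page of the cluster completes (tracked by dic->remaining_pages).
 */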
#ifdef CONFIG_F2FS_FS_COMPRESSION
int f2fs_read_multi_pages(struct compress_ctx *cc, struct bio **bio_ret,
				unsigned nr_pages, sector_t *last_block_in_bio,
				bool is_readahead, bool for_write)
{
	struct dnode_of_data dn;
	struct inode *inode = cc->inode;
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct bio *bio = *bio_ret;
	unsigned int start_idx = cc->cluster_idx << cc->log_cluster_size;
	sector_t last_block_in_file;
	const unsigned blocksize = blks_to_bytes(inode, 1);
	struct decompress_io_ctx *dic = NULL;
	struct extent_info ei = {0, };
	bool from_dnode = true;
	int i;
	int ret = 0;

	f2fs_bug_on(sbi, f2fs_cluster_is_empty(cc));

	last_block_in_file = bytes_to_blks(inode,
			f2fs_readpage_limit(inode) + blocksize - 1);

	/* get rid of pages beyond EOF */
	for (i = 0; i < cc->cluster_size; i++) {
		struct page *page = cc->rpages[i];

		if (!page)
			continue;
		if ((sector_t)page->index >= last_block_in_file) {
			zero_user_segment(page, 0, PAGE_SIZE);
			if (!PageUptodate(page))
				SetPageUptodate(page);
		} else if (!PageUptodate(page)) {
			continue;
		}
		unlock_page(page);
		if (for_write)
			put_page(page);
		cc->rpages[i] = NULL;
		cc->nr_rpages--;
	}

	/* we are done since all pages are beyond EOF */
	if (f2fs_cluster_is_empty(cc))
		goto out;

	if (f2fs_lookup_extent_cache(inode, start_idx, &ei))
		from_dnode = false;

	if (!from_dnode)
		goto skip_reading_dnode;

	set_new_dnode(&dn, inode, NULL, NULL, 0);
	ret = f2fs_get_dnode_of_data(&dn, start_idx, LOOKUP_NODE);
	if (ret)
		goto out;

	f2fs_bug_on(sbi, dn.data_blkaddr != COMPRESS_ADDR);

skip_reading_dnode:
	for (i = 1; i < cc->cluster_size; i++) {
		block_t blkaddr;

		blkaddr = from_dnode ? data_blkaddr(dn.inode, dn.node_page,
					dn.ofs_in_node + i) :
					ei.blk + i - 1;

		if (!__is_valid_data_blkaddr(blkaddr))
			break;

		if (!f2fs_is_valid_blkaddr(sbi, blkaddr, DATA_GENERIC)) {
			ret = -EFAULT;
			goto out_put_dnode;
		}
		cc->nr_cpages++;

		if (!from_dnode && i >= ei.c_len)
			break;
	}

	/* nothing to decompress */
	if (cc->nr_cpages == 0) {
		ret = 0;
		goto out_put_dnode;
	}

	dic = f2fs_alloc_dic(cc);
	if (IS_ERR(dic)) {
		ret = PTR_ERR(dic);
		goto out_put_dnode;
	}

	for (i = 0; i < cc->nr_cpages; i++) {
		struct page *page = dic->cpages[i];
		block_t blkaddr;
		struct bio_post_read_ctx *ctx;

		blkaddr = from_dnode ? data_blkaddr(dn.inode, dn.node_page,
					dn.ofs_in_node + i + 1) :
					ei.blk + i;

		f2fs_wait_on_block_writeback(inode, blkaddr);

		if (f2fs_load_compressed_page(sbi, page, blkaddr)) {
			if (atomic_dec_and_test(&dic->remaining_pages))
				f2fs_decompress_cluster(dic);
			continue;
		}

		if (bio && (!page_is_mergeable(sbi, bio,
					*last_block_in_bio, blkaddr) ||
		    !f2fs_crypt_mergeable_bio(bio, inode, page->index, NULL))) {
submit_and_realloc:
			__submit_bio(sbi, bio, DATA);
			bio = NULL;
		}

		if (!bio) {
			bio = f2fs_grab_read_bio(inode, blkaddr, nr_pages,
					is_readahead ? REQ_RAHEAD : 0,
					page->index, for_write);
			if (IS_ERR(bio)) {
				ret = PTR_ERR(bio);
				f2fs_decompress_end_io(dic, ret);
				f2fs_put_dnode(&dn);
				*bio_ret = NULL;
				return ret;
			}
		}

		if (bio_add_page(bio, page, blocksize, 0) < blocksize)
			goto submit_and_realloc;

		ctx = get_post_read_ctx(bio);
		ctx->enabled_steps |= STEP_DECOMPRESS;
		refcount_inc(&dic->refcnt);

		inc_page_count(sbi, F2FS_RD_DATA);
		f2fs_update_iostat(sbi, FS_DATA_READ_IO, F2FS_BLKSIZE);
		f2fs_update_iostat(sbi, FS_CDATA_READ_IO, F2FS_BLKSIZE);
		ClearPageError(page);
		*last_block_in_bio = blkaddr;
	}

	if (from_dnode)
		f2fs_put_dnode(&dn);

	*bio_ret = bio;
	return 0;

out_put_dnode:
	if (from_dnode)
		f2fs_put_dnode(&dn);
out:
	for (i = 0; i < cc->cluster_size; i++) {
		if (cc->rpages[i]) {
			ClearPageUptodate(cc->rpages[i]);
			ClearPageError(cc->rpages[i]);
			unlock_page(cc->rpages[i]);
		}
	}
	*bio_ret = bio;
	return ret;
}
#endif

/*
 * This function was originally taken from fs/mpage.c, and customized for f2fs.
 * The major change is that block_size == page_size in f2fs by default.
 */
static int f2fs_mpage_readpages(struct inode *inode,
		struct readahead_control *rac, struct page *page)
{
	struct bio *bio = NULL;
	sector_t last_block_in_bio = 0;
	struct f2fs_map_blocks map;
#ifdef CONFIG_F2FS_FS_COMPRESSION
	struct compress_ctx cc = {
		.inode = inode,
		.log_cluster_size = F2FS_I(inode)->i_log_cluster_size,
		.cluster_size = F2FS_I(inode)->i_cluster_size,
		.cluster_idx = NULL_CLUSTER,
		.rpages = NULL,
		.cpages = NULL,
		.nr_rpages = 0,
		.nr_cpages = 0,
	};
	pgoff_t nc_cluster_idx = NULL_CLUSTER;
#endif
	unsigned nr_pages = rac ? readahead_count(rac) : 1;
	unsigned max_nr_pages = nr_pages;
	int ret = 0;

	map.m_pblk = 0;
	map.m_lblk = 0;
	map.m_len = 0;
	map.m_flags = 0;
	map.m_next_pgofs = NULL;
	map.m_next_extent = NULL;
	map.m_seg_type = NO_CHECK_TYPE;
	map.m_may_create = false;

	for (; nr_pages; nr_pages--) {
		if (rac) {
			page = readahead_page(rac);
			prefetchw(&page->flags);
		}

#ifdef CONFIG_F2FS_FS_COMPRESSION
		if (f2fs_compressed_file(inode)) {
			/* there are remaining compressed pages, submit them */
			if (!f2fs_cluster_can_merge_page(&cc, page->index)) {
				ret = f2fs_read_multi_pages(&cc, &bio,
							max_nr_pages,
							&last_block_in_bio,
							rac != NULL, false);
				f2fs_destroy_compress_ctx(&cc, false);
				if (ret)
					goto set_error_page;
			}
			if (cc.cluster_idx == NULL_CLUSTER) {
				if (nc_cluster_idx ==
					page->index >> cc.log_cluster_size) {
					goto read_single_page;
				}

				ret = f2fs_is_compressed_cluster(inode, page->index);
				if (ret < 0)
					goto set_error_page;
				else if (!ret) {
					nc_cluster_idx =
						page->index >> cc.log_cluster_size;
					goto read_single_page;
				}

				nc_cluster_idx = NULL_CLUSTER;
			}
			ret = f2fs_init_compress_ctx(&cc);
			if (ret)
				goto set_error_page;

			f2fs_compress_ctx_add_page(&cc, page);

			goto next_page;
		}
read_single_page:
#endif

		ret = f2fs_read_single_page(inode, page, max_nr_pages, &map,
					&bio, &last_block_in_bio, rac);
		if (ret) {
#ifdef CONFIG_F2FS_FS_COMPRESSION
set_error_page:
#endif
			SetPageError(page);
			zero_user_segment(page, 0, PAGE_SIZE);
			unlock_page(page);
		}
#ifdef CONFIG_F2FS_FS_COMPRESSION
next_page:
#endif
		if (rac)
			put_page(page);

#ifdef CONFIG_F2FS_FS_COMPRESSION
		if (f2fs_compressed_file(inode)) {
			/* last page */
			if (nr_pages == 1 && !f2fs_cluster_is_empty(&cc)) {
				ret = f2fs_read_multi_pages(&cc, &bio,
							max_nr_pages,
							&last_block_in_bio,
							rac != NULL, false);
				f2fs_destroy_compress_ctx(&cc, false);
			}
		}
#endif
	}
	if (bio)
		__submit_bio(F2FS_I_SB(inode), bio, DATA);
	return ret;
}

static int f2fs_read_data_page(struct file *file, struct page *page)
{
	struct inode *inode = page_file_mapping(page)->host;
	int ret = -EAGAIN;

	trace_f2fs_readpage(page, DATA);

	if (!f2fs_is_compress_backend_ready(inode)) {
		unlock_page(page);
		return -EOPNOTSUPP;
	}

	/* If the file has inline data, try to read it directly */
	if (f2fs_has_inline_data(inode))
		ret = f2fs_read_inline_data(inode, page);
	if (ret == -EAGAIN)
		ret = f2fs_mpage_readpages(inode, NULL, page);
	return ret;
}

static void f2fs_readahead(struct readahead_control *rac)
{
	struct inode *inode = rac->mapping->host;

	trace_f2fs_readpages(inode, readahead_index(rac), readahead_count(rac));

	if (!f2fs_is_compress_backend_ready(inode))
		return;

	/* If the file has inline data, skip readpages */
	if (f2fs_has_inline_data(inode))
		return;

	f2fs_mpage_readpages(inode, rac, NULL);
}

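/*
 * Encrypt one page before write-out.  Inline-crypto inodes need no bounce
 * page; otherwise one is allocated (retrying with __GFP_NOFAIL after
 * flushing merged writes on ENOMEM), and any copy of the old block cached
 * in META_MAPPING is refreshed so GC reads see the new ciphertext.
 */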
int f2fs_encrypt_one_page(struct f2fs_io_info *fio)
{
	struct inode *inode = fio->page->mapping->host;
	struct page *mpage, *page;
	gfp_t gfp_flags = GFP_NOFS;

	if (!f2fs_encrypted_file(inode))
		return 0;

	page = fio->compressed_page ? fio->compressed_page : fio->page;

	/* wait for GCed page writeback via META_MAPPING */
	f2fs_wait_on_block_writeback(inode, fio->old_blkaddr);

	if (fscrypt_inode_uses_inline_crypto(inode))
		return 0;

retry_encrypt:
	fio->encrypted_page = fscrypt_encrypt_pagecache_blocks(page,
					PAGE_SIZE, 0, gfp_flags);
	if (IS_ERR(fio->encrypted_page)) {
		/* flush pending IOs and wait for a while in the ENOMEM case */
		if (PTR_ERR(fio->encrypted_page) == -ENOMEM) {
			f2fs_flush_merged_writes(fio->sbi);
			memalloc_retry_wait(GFP_NOFS);
			gfp_flags |= __GFP_NOFAIL;
			goto retry_encrypt;
		}
		return PTR_ERR(fio->encrypted_page);
	}

	mpage = find_lock_page(META_MAPPING(fio->sbi), fio->old_blkaddr);
	if (mpage) {
		if (PageUptodate(mpage))
			memcpy(page_address(mpage),
				page_address(fio->encrypted_page), PAGE_SIZE);
		f2fs_put_page(mpage, 1);
	}
	return 0;
}

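/*
 * SM_I(sbi)->ipu_policy is a bitmask, so several in-place-update triggers
 * (force, SSR, utilization thresholds, async rewrite, fsync) can be armed
 * at once; the first rule that matches wins.
 */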
static inline bool check_inplace_update_policy(struct inode *inode,
				struct f2fs_io_info *fio)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	unsigned int policy = SM_I(sbi)->ipu_policy;

	if (policy & (0x1 << F2FS_IPU_HONOR_OPU_WRITE) &&
			is_inode_flag_set(inode, FI_OPU_WRITE))
		return false;
	if (policy & (0x1 << F2FS_IPU_FORCE))
		return true;
	if (policy & (0x1 << F2FS_IPU_SSR) && f2fs_need_SSR(sbi))
		return true;
	if (policy & (0x1 << F2FS_IPU_UTIL) &&
			utilization(sbi) > SM_I(sbi)->min_ipu_util)
		return true;
	if (policy & (0x1 << F2FS_IPU_SSR_UTIL) && f2fs_need_SSR(sbi) &&
			utilization(sbi) > SM_I(sbi)->min_ipu_util)
		return true;

	/*
	 * IPU for rewrite async pages
	 */
	if (policy & (0x1 << F2FS_IPU_ASYNC) &&
			fio && fio->op == REQ_OP_WRITE &&
			!(fio->op_flags & REQ_SYNC) &&
			!IS_ENCRYPTED(inode))
		return true;

	/* this is only set during fdatasync */
	if (policy & (0x1 << F2FS_IPU_FSYNC) &&
			is_inode_flag_set(inode, FI_NEED_IPU))
		return true;

	if (unlikely(fio && is_sbi_flag_set(sbi, SBI_CP_DISABLED) &&
			!f2fs_is_checkpointed_data(sbi, fio->old_blkaddr)))
		return true;

	return false;
}

bool f2fs_should_update_inplace(struct inode *inode, struct f2fs_io_info *fio)
{
	/* swap file is migrating in aligned write mode */
	if (is_inode_flag_set(inode, FI_ALIGNED_WRITE))
		return false;

	if (f2fs_is_pinned_file(inode))
		return true;

	/* if this is cold file, we should overwrite to avoid fragmentation */
	if (file_is_cold(inode))
		return true;

	return check_inplace_update_policy(inode, fio);
}

bool f2fs_should_update_outplace(struct inode *inode, struct f2fs_io_info *fio)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);

	/* The below cases were checked when setting it. */
	if (f2fs_is_pinned_file(inode))
		return false;
	if (fio && is_sbi_flag_set(sbi, SBI_NEED_FSCK))
		return true;
	if (f2fs_lfs_mode(sbi))
		return true;
	if (S_ISDIR(inode->i_mode))
		return true;
	if (IS_NOQUOTA(inode))
		return true;
	if (f2fs_is_atomic_file(inode))
		return true;

	/* swap file is migrating in aligned write mode */
	if (is_inode_flag_set(inode, FI_ALIGNED_WRITE))
		return true;

	if (is_inode_flag_set(inode, FI_OPU_WRITE))
		return true;

	if (fio) {
		if (page_private_gcing(fio->page))
			return true;
		if (page_private_dummy(fio->page))
			return true;
		if (unlikely(is_sbi_flag_set(sbi, SBI_CP_DISABLED) &&
			f2fs_is_checkpointed_data(sbi, fio->old_blkaddr)))
			return true;
	}
	return false;
}

static inline bool need_inplace_update(struct f2fs_io_info *fio)
{
	struct inode *inode = fio->page->mapping->host;

	if (f2fs_should_update_outplace(inode, fio))
		return false;

	return f2fs_should_update_inplace(inode, fio);
}

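/*
 * Write one data page either in place (IPU: reuse fio->old_blkaddr) or out
 * of place (OPU: allocate a new block in log-structured fashion).  A hit in
 * the extent cache can prove an in-place write is safe without reading the
 * dnode at all.
 */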
int f2fs_do_write_data_page(struct f2fs_io_info *fio)
{
	struct page *page = fio->page;
	struct inode *inode = page->mapping->host;
	struct dnode_of_data dn;
	struct extent_info ei = {0, };
	struct node_info ni;
	bool ipu_force = false;
	int err = 0;

	set_new_dnode(&dn, inode, NULL, NULL, 0);
	if (need_inplace_update(fio) &&
			f2fs_lookup_extent_cache(inode, page->index, &ei)) {
		fio->old_blkaddr = ei.blk + page->index - ei.fofs;

		if (!f2fs_is_valid_blkaddr(fio->sbi, fio->old_blkaddr,
						DATA_GENERIC_ENHANCE))
			return -EFSCORRUPTED;

		ipu_force = true;
		fio->need_lock = LOCK_DONE;
		goto got_it;
	}

	/* Deadlock due to between page->lock and f2fs_lock_op */
	if (fio->need_lock == LOCK_REQ && !f2fs_trylock_op(fio->sbi))
		return -EAGAIN;

	err = f2fs_get_dnode_of_data(&dn, page->index, LOOKUP_NODE);
	if (err)
		goto out;

	fio->old_blkaddr = dn.data_blkaddr;

	/* This page is already truncated */
	if (fio->old_blkaddr == NULL_ADDR) {
		ClearPageUptodate(page);
		clear_page_private_gcing(page);
		goto out_writepage;
	}
got_it:
	if (__is_valid_data_blkaddr(fio->old_blkaddr) &&
		!f2fs_is_valid_blkaddr(fio->sbi, fio->old_blkaddr,
						DATA_GENERIC_ENHANCE)) {
		err = -EFSCORRUPTED;
		goto out_writepage;
	}
	/*
	 * If current allocation needs SSR,
	 * it had better do in-place writes for updated data.
	 */
	if (ipu_force ||
		(__is_valid_data_blkaddr(fio->old_blkaddr) &&
					need_inplace_update(fio))) {
		err = f2fs_encrypt_one_page(fio);
		if (err)
			goto out_writepage;

		set_page_writeback(page);
		ClearPageError(page);
		f2fs_put_dnode(&dn);
		if (fio->need_lock == LOCK_REQ)
			f2fs_unlock_op(fio->sbi);
		err = f2fs_inplace_write_data(fio);
		if (err) {
			if (fscrypt_inode_uses_fs_layer_crypto(inode))
				fscrypt_finalize_bounce_page(&fio->encrypted_page);
			if (PageWriteback(page))
				end_page_writeback(page);
		} else {
			set_inode_flag(inode, FI_UPDATE_WRITE);
		}
		trace_f2fs_do_write_data_page(fio->page, IPU);
		return err;
	}

	if (fio->need_lock == LOCK_RETRY) {
		if (!f2fs_trylock_op(fio->sbi)) {
			err = -EAGAIN;
			goto out_writepage;
		}
		fio->need_lock = LOCK_REQ;
	}

	err = f2fs_get_node_info(fio->sbi, dn.nid, &ni, false);
	if (err)
		goto out_writepage;

	fio->version = ni.version;

	err = f2fs_encrypt_one_page(fio);
	if (err)
		goto out_writepage;

	set_page_writeback(page);
	ClearPageError(page);

	if (fio->compr_blocks && fio->old_blkaddr == COMPRESS_ADDR)
		f2fs_i_compr_blocks_update(inode, fio->compr_blocks - 1, false);

	/* LFS mode write path */
	f2fs_outplace_write_data(&dn, fio);
	trace_f2fs_do_write_data_page(page, OPU);
	set_inode_flag(inode, FI_APPEND_WRITE);
	if (page->index == 0)
		set_inode_flag(inode, FI_FIRST_BLOCK_WRITTEN);
out_writepage:
	f2fs_put_dnode(&dn);
out:
	if (fio->need_lock == LOCK_REQ)
		f2fs_unlock_op(fio->sbi);
	return err;
}

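/*
 * Write out a single page for ->writepage or writeback.  Pages wholly
 * beyond i_size are dropped, the last partial page is zero-padded past EOF,
 * and AOP_WRITEPAGE_ACTIVATE is returned when the page was redirtied and
 * should stay on the LRU (the caller unlocks it).
 */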
int f2fs_write_single_data_page(struct page *page, int *submitted,
				struct bio **bio,
				sector_t *last_block,
				struct writeback_control *wbc,
				enum iostat_type io_type,
				int compr_blocks,
				bool allow_balance)
{
	struct inode *inode = page->mapping->host;
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	loff_t i_size = i_size_read(inode);
	const pgoff_t end_index = ((unsigned long long)i_size)
							>> PAGE_SHIFT;
	loff_t psize = (loff_t)(page->index + 1) << PAGE_SHIFT;
	unsigned offset = 0;
	bool need_balance_fs = false;
	int err = 0;
	struct f2fs_io_info fio = {
		.sbi = sbi,
		.ino = inode->i_ino,
		.type = DATA,
		.op = REQ_OP_WRITE,
		.op_flags = wbc_to_write_flags(wbc),
		.old_blkaddr = NULL_ADDR,
		.page = page,
		.encrypted_page = NULL,
		.submitted = false,
		.compr_blocks = compr_blocks,
		.need_lock = LOCK_RETRY,
		.io_type = io_type,
		.io_wbc = wbc,
		.bio = bio,
		.last_block = last_block,
	};

	trace_f2fs_writepage(page, DATA);

	/* we should bypass data pages to let the kworker jobs proceed */
	if (unlikely(f2fs_cp_error(sbi))) {
		mapping_set_error(page->mapping, -EIO);
		/*
		 * don't drop any dirty dentry pages, to keep the latest
		 * directory structure.
		 */
		if (S_ISDIR(inode->i_mode))
			goto redirty_out;
		goto out;
	}

	if (unlikely(is_sbi_flag_set(sbi, SBI_POR_DOING)))
		goto redirty_out;

	if (page->index < end_index ||
			f2fs_verity_in_progress(inode) ||
			compr_blocks)
		goto write;

	/*
	 * If the offset is out-of-range of file size,
	 * this page does not have to be written to disk.
	 */
	offset = i_size & (PAGE_SIZE - 1);
	if ((page->index >= end_index + 1) || !offset)
		goto out;

	zero_user_segment(page, offset, PAGE_SIZE);
write:
	if (f2fs_is_drop_cache(inode))
		goto out;
	/* we should not write 0'th page having journal header */
	if (f2fs_is_volatile_file(inode) && (!page->index ||
			(!wbc->for_reclaim &&
			f2fs_available_free_memory(sbi, BASE_CHECK))))
		goto redirty_out;

	/* Dentry/quota blocks are controlled by checkpoint */
	if (S_ISDIR(inode->i_mode) || IS_NOQUOTA(inode)) {
		/*
		 * We need to wait for node_write to avoid block allocation during
		 * checkpoint. This can only happen to quota writes which can cause
		 * the below discard race condition.
		 */
		if (IS_NOQUOTA(inode))
			f2fs_down_read(&sbi->node_write);

		fio.need_lock = LOCK_DONE;
		err = f2fs_do_write_data_page(&fio);

		if (IS_NOQUOTA(inode))
			f2fs_up_read(&sbi->node_write);

		goto done;
	}

	if (!wbc->for_reclaim)
		need_balance_fs = true;
	else if (has_not_enough_free_secs(sbi, 0, 0))
		goto redirty_out;
	else
		set_inode_flag(inode, FI_HOT_DATA);

	err = -EAGAIN;
	if (f2fs_has_inline_data(inode)) {
		err = f2fs_write_inline_data(inode, page);
		if (!err)
			goto out;
	}

	if (err == -EAGAIN) {
		err = f2fs_do_write_data_page(&fio);
		if (err == -EAGAIN) {
			fio.need_lock = LOCK_REQ;
			err = f2fs_do_write_data_page(&fio);
		}
	}

	if (err) {
		file_set_keep_isize(inode);
	} else {
		spin_lock(&F2FS_I(inode)->i_size_lock);
		if (F2FS_I(inode)->last_disk_size < psize)
			F2FS_I(inode)->last_disk_size = psize;
		spin_unlock(&F2FS_I(inode)->i_size_lock);
	}

done:
	if (err && err != -ENOENT)
		goto redirty_out;

out:
	inode_dec_dirty_pages(inode);
	if (err) {
		ClearPageUptodate(page);
		clear_page_private_gcing(page);
	}

	if (wbc->for_reclaim) {
		f2fs_submit_merged_write_cond(sbi, NULL, page, 0, DATA);
		clear_inode_flag(inode, FI_HOT_DATA);
		f2fs_remove_dirty_inode(inode);
		submitted = NULL;
	}
	unlock_page(page);
	if (!S_ISDIR(inode->i_mode) && !IS_NOQUOTA(inode) &&
			!F2FS_I(inode)->cp_task && allow_balance)
		f2fs_balance_fs(sbi, need_balance_fs);

	if (unlikely(f2fs_cp_error(sbi))) {
		f2fs_submit_merged_write(sbi, DATA);
		f2fs_submit_merged_ipu_write(sbi, bio, NULL);
		submitted = NULL;
	}

	if (submitted)
		*submitted = fio.submitted ? 1 : 0;

	return 0;

redirty_out:
	redirty_page_for_writepage(wbc, page);
	/*
	 * pageout() in MM translates EAGAIN, so it calls handle_write_error()
	 * -> mapping_set_error() -> set_bit(AS_EIO, ...).
	 * file_write_and_wait_range() will see EIO error, which is critical
	 * to return value of fsync() followed by atomic_write failure to user.
	 */
	if (!err || wbc->for_reclaim)
		return AOP_WRITEPAGE_ACTIVATE;
	unlock_page(page);
	return err;
}

static int f2fs_write_data_page(struct page *page,
					struct writeback_control *wbc)
{
#ifdef CONFIG_F2FS_FS_COMPRESSION
	struct inode *inode = page->mapping->host;

	if (unlikely(f2fs_cp_error(F2FS_I_SB(inode))))
		goto out;

	if (f2fs_compressed_file(inode)) {
		if (f2fs_is_compressed_cluster(inode, page->index)) {
			redirty_page_for_writepage(wbc, page);
			return AOP_WRITEPAGE_ACTIVATE;
		}
	}
out:
#endif

	return f2fs_write_single_data_page(page, NULL, NULL, NULL,
						wbc, FS_DATA_IO, 0, true);
}

/*
 * This function was copied from write_cache_pages in mm/page-writeback.c.
 * The major change is making write step of cold data page separately from
 * warm/hot data page.
 */
static int f2fs_write_cache_pages(struct address_space *mapping,
					struct writeback_control *wbc,
					enum iostat_type io_type)
{
	int ret = 0;
	int done = 0, retry = 0;
	struct pagevec pvec;
	struct f2fs_sb_info *sbi = F2FS_M_SB(mapping);
	struct bio *bio = NULL;
	sector_t last_block;
#ifdef CONFIG_F2FS_FS_COMPRESSION
	struct inode *inode = mapping->host;
	struct compress_ctx cc = {
		.inode = inode,
		.log_cluster_size = F2FS_I(inode)->i_log_cluster_size,
		.cluster_size = F2FS_I(inode)->i_cluster_size,
		.cluster_idx = NULL_CLUSTER,
		.rpages = NULL,
		.nr_rpages = 0,
		.cpages = NULL,
		.valid_nr_cpages = 0,
		.rbuf = NULL,
		.cbuf = NULL,
		.rlen = PAGE_SIZE * F2FS_I(inode)->i_cluster_size,
		.private = NULL,
	};
#endif
	int nr_pages;
	pgoff_t index;
	pgoff_t end;		/* Inclusive */
	pgoff_t done_index;
	int range_whole = 0;
	xa_mark_t tag;
	int nwritten = 0;
	int submitted = 0;
	int i;

	pagevec_init(&pvec);

	if (get_dirty_pages(mapping->host) <=
				SM_I(F2FS_M_SB(mapping))->min_hot_blocks)
		set_inode_flag(mapping->host, FI_HOT_DATA);
	else
		clear_inode_flag(mapping->host, FI_HOT_DATA);

	if (wbc->range_cyclic) {
		index = mapping->writeback_index; /* prev offset */
		end = -1;
	} else {
		index = wbc->range_start >> PAGE_SHIFT;
		end = wbc->range_end >> PAGE_SHIFT;
		if (wbc->range_start == 0 && wbc->range_end == LLONG_MAX)
			range_whole = 1;
	}
	if (wbc->sync_mode == WB_SYNC_ALL || wbc->tagged_writepages)
		tag = PAGECACHE_TAG_TOWRITE;
	else
		tag = PAGECACHE_TAG_DIRTY;
retry:
	retry = 0;
	if (wbc->sync_mode == WB_SYNC_ALL || wbc->tagged_writepages)
		tag_pages_for_writeback(mapping, index, end);
	done_index = index;
	while (!done && !retry && (index <= end)) {
		nr_pages = pagevec_lookup_range_tag(&pvec, mapping, &index, end,
				tag);
		if (nr_pages == 0)
			break;

		for (i = 0; i < nr_pages; i++) {
			struct page *page = pvec.pages[i];
			bool need_readd;
readd:
			need_readd = false;
#ifdef CONFIG_F2FS_FS_COMPRESSION
			if (f2fs_compressed_file(inode)) {
				void *fsdata = NULL;
				struct page *pagep;
				int ret2;

				ret = f2fs_init_compress_ctx(&cc);
				if (ret) {
					done = 1;
					break;
				}

				if (!f2fs_cluster_can_merge_page(&cc,
								page->index)) {
					ret = f2fs_write_multi_pages(&cc,
						&submitted, wbc, io_type);
					if (!ret)
						need_readd = true;
					goto result;
				}

				if (unlikely(f2fs_cp_error(sbi)))
					goto lock_page;

				if (!f2fs_cluster_is_empty(&cc))
					goto lock_page;

				ret2 = f2fs_prepare_compress_overwrite(
							inode, &pagep,
							page->index, &fsdata);
				if (ret2 < 0) {
					ret = ret2;
					done = 1;
					break;
				} else if (ret2 &&
					(!f2fs_compress_write_end(inode,
						fsdata, page->index, 1) ||
					 !f2fs_all_cluster_page_loaded(&cc,
						&pvec, i, nr_pages))) {
					retry = 1;
					break;
				}
			}
#endif
			/* give priority to WB_SYNC threads */
			if (atomic_read(&sbi->wb_sync_req[DATA]) &&
					wbc->sync_mode == WB_SYNC_NONE) {
				done = 1;
				break;
			}
#ifdef CONFIG_F2FS_FS_COMPRESSION
lock_page:
#endif
			done_index = page->index;
retry_write:
			lock_page(page);

			if (unlikely(page->mapping != mapping)) {
continue_unlock:
				unlock_page(page);
				continue;
			}

			if (!PageDirty(page)) {
				/* someone wrote it for us */
				goto continue_unlock;
			}

			if (PageWriteback(page)) {
				if (wbc->sync_mode != WB_SYNC_NONE)
					f2fs_wait_on_page_writeback(page,
							DATA, true, true);
				else
					goto continue_unlock;
			}

			if (!clear_page_dirty_for_io(page))
				goto continue_unlock;

#ifdef CONFIG_F2FS_FS_COMPRESSION
			if (f2fs_compressed_file(inode)) {
				get_page(page);
				f2fs_compress_ctx_add_page(&cc, page);
				continue;
			}
#endif
			ret = f2fs_write_single_data_page(page, &submitted,
					&bio, &last_block, wbc, io_type,
					0, true);
			if (ret == AOP_WRITEPAGE_ACTIVATE)
				unlock_page(page);
#ifdef CONFIG_F2FS_FS_COMPRESSION
result:
#endif
			nwritten += submitted;
			wbc->nr_to_write -= submitted;

			if (unlikely(ret)) {
				/*
				 * keep nr_to_write, since vfs uses this to
				 * get # of written pages.
				 */
				if (ret == AOP_WRITEPAGE_ACTIVATE) {
					ret = 0;
					goto next;
				} else if (ret == -EAGAIN) {
					ret = 0;
					if (wbc->sync_mode == WB_SYNC_ALL) {
						cond_resched();
						congestion_wait(BLK_RW_ASYNC,
							DEFAULT_IO_TIMEOUT);
						goto retry_write;
					}
					goto next;
				}
				done_index = page->index + 1;
				done = 1;
				break;
			}

			if (wbc->nr_to_write <= 0 &&
					wbc->sync_mode == WB_SYNC_NONE) {
				done = 1;
				break;
			}
next:
			if (need_readd)
				goto readd;
		}
		pagevec_release(&pvec);
		cond_resched();
	}
#ifdef CONFIG_F2FS_FS_COMPRESSION
	/* flush remaining pages in the compress cluster */
	if (f2fs_compressed_file(inode) && !f2fs_cluster_is_empty(&cc)) {
		ret = f2fs_write_multi_pages(&cc, &submitted, wbc, io_type);
		nwritten += submitted;
		wbc->nr_to_write -= submitted;
		if (ret) {
			done = 1;
			retry = 0;
		}
	}
	if (f2fs_compressed_file(inode))
		f2fs_destroy_compress_ctx(&cc, false);
#endif
	if (retry) {
		index = 0;
		end = -1;
		goto retry;
	}
	if (wbc->range_cyclic && !done)
		done_index = 0;
	if (wbc->range_cyclic || (range_whole && wbc->nr_to_write > 0))
		mapping->writeback_index = done_index;

	if (nwritten)
		f2fs_submit_merged_write_cond(F2FS_M_SB(mapping), mapping->host,
								NULL, 0, DATA);
	/* submit cached bio of IPU write */
	if (bio)
		f2fs_submit_merged_ipu_write(sbi, &bio, NULL);

	return ret;
}

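/*
 * Serializing writebacks under sbi->writepages trades parallelism for
 * larger, better-merged IO: compressed inodes and inodes with many dirty
 * pages go through one writer at a time, while the checkpoint flusher is
 * exempted to avoid deadlock in the data-flush path.
 */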
static inline bool __should_serialize_io(struct inode *inode,
					struct writeback_control *wbc)
{
	/* to avoid deadlock in path of data flush */
	if (F2FS_I(inode)->cp_task)
		return false;

	if (!S_ISREG(inode->i_mode))
		return false;
	if (IS_NOQUOTA(inode))
		return false;

	if (f2fs_need_compress_data(inode))
		return true;
	if (wbc->sync_mode != WB_SYNC_ALL)
		return true;
	if (get_dirty_pages(inode) >= SM_I(F2FS_I_SB(inode))->min_seq_blocks)
		return true;
	return false;
}

static int __f2fs_write_data_pages(struct address_space *mapping,
						struct writeback_control *wbc,
						enum iostat_type io_type)
{
	struct inode *inode = mapping->host;
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct blk_plug plug;
	int ret;
	bool locked = false;

	/* deal with chardevs and other special file */
	if (!mapping->a_ops->writepage)
		return 0;

	/* skip writing if there is no dirty page in this inode */
	if (!get_dirty_pages(inode) && wbc->sync_mode == WB_SYNC_NONE)
		return 0;

	/* during POR, we don't need to trigger writepage at all. */
	if (unlikely(is_sbi_flag_set(sbi, SBI_POR_DOING)))
		goto skip_write;

	if ((S_ISDIR(inode->i_mode) || IS_NOQUOTA(inode)) &&
			wbc->sync_mode == WB_SYNC_NONE &&
			get_dirty_pages(inode) < nr_pages_to_skip(sbi, DATA) &&
			f2fs_available_free_memory(sbi, DIRTY_DENTS))
		goto skip_write;

	/* skip writing during the file defragment preparation stage */
	if (is_inode_flag_set(inode, FI_SKIP_WRITES))
		goto skip_write;

	trace_f2fs_writepages(mapping->host, wbc, DATA);

	/* to avoid splitting IOs due to mixed WB_SYNC_ALL and WB_SYNC_NONE */
	if (wbc->sync_mode == WB_SYNC_ALL)
		atomic_inc(&sbi->wb_sync_req[DATA]);
	else if (atomic_read(&sbi->wb_sync_req[DATA])) {
		/* to avoid potential deadlock */
		if (current->plug)
			blk_finish_plug(current->plug);
		goto skip_write;
	}

	if (__should_serialize_io(inode, wbc)) {
		mutex_lock(&sbi->writepages);
		locked = true;
	}

	blk_start_plug(&plug);
	ret = f2fs_write_cache_pages(mapping, wbc, io_type);
	blk_finish_plug(&plug);

	if (locked)
		mutex_unlock(&sbi->writepages);

	if (wbc->sync_mode == WB_SYNC_ALL)
		atomic_dec(&sbi->wb_sync_req[DATA]);
	/*
	 * if some pages were truncated, we cannot rely on mapping->host
	 * to detect pending bios.
	 */

	f2fs_remove_dirty_inode(inode);
	return ret;

skip_write:
	wbc->pages_skipped += get_dirty_pages(inode);
	trace_f2fs_writepages(mapping->host, wbc, DATA);
	return 0;
}

static int f2fs_write_data_pages(struct address_space *mapping,
			    struct writeback_control *wbc)
{
	struct inode *inode = mapping->host;

	return __f2fs_write_data_pages(mapping, wbc,
			F2FS_I(inode)->cp_task == current ?
			FS_CP_DATA_IO : FS_DATA_IO);
}

void f2fs_write_failed(struct inode *inode, loff_t to)
{
	loff_t i_size = i_size_read(inode);

	if (IS_NOQUOTA(inode))
		return;

	/* In the fs-verity case, f2fs_end_enable_verity() does the truncate */
	if (to > i_size && !f2fs_verity_in_progress(inode)) {
		f2fs_down_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
		filemap_invalidate_lock(inode->i_mapping);

		truncate_pagecache(inode, i_size);
		f2fs_truncate_blocks(inode, i_size, true);

		filemap_invalidate_unlock(inode->i_mapping);
		f2fs_up_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
	}
}

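/*
 * Resolve the block address backing the page about to be written.  A
 * whole-page write over fully preallocated blocks skips the lookup
 * entirely; otherwise the extent cache is tried first, and a dnode walk
 * (under f2fs_do_map_lock() for inline conversion or appends) fills holes.
 */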
static int prepare_write_begin(struct f2fs_sb_info *sbi,
			struct page *page, loff_t pos, unsigned len,
			block_t *blk_addr, bool *node_changed)
{
	struct inode *inode = page->mapping->host;
	pgoff_t index = page->index;
	struct dnode_of_data dn;
	struct page *ipage;
	bool locked = false;
	struct extent_info ei = {0, };
	int err = 0;
	int flag;

	/*
	 * If a whole page is being written and we already preallocated all the
	 * blocks, then there is no need to get a block address now.
	 */
	if (len == PAGE_SIZE && is_inode_flag_set(inode, FI_PREALLOCATED_ALL))
		return 0;

	/* f2fs_lock_op avoids race between write CP and convert_inline_page */
	if (f2fs_has_inline_data(inode) && pos + len > MAX_INLINE_DATA(inode))
		flag = F2FS_GET_BLOCK_DEFAULT;
	else
		flag = F2FS_GET_BLOCK_PRE_AIO;

	if (f2fs_has_inline_data(inode) ||
			(pos & PAGE_MASK) >= i_size_read(inode)) {
		f2fs_do_map_lock(sbi, flag, true);
		locked = true;
	}

restart:
	/* check inline_data */
	ipage = f2fs_get_node_page(sbi, inode->i_ino);
	if (IS_ERR(ipage)) {
		err = PTR_ERR(ipage);
		goto unlock_out;
	}

	set_new_dnode(&dn, inode, ipage, ipage, 0);

	if (f2fs_has_inline_data(inode)) {
		if (pos + len <= MAX_INLINE_DATA(inode)) {
			f2fs_do_read_inline_data(page, ipage);
			set_inode_flag(inode, FI_DATA_EXIST);
			if (inode->i_nlink)
				set_page_private_inline(ipage);
		} else {
			err = f2fs_convert_inline_page(&dn, page);
			if (err)
				goto out;
			if (dn.data_blkaddr == NULL_ADDR)
				err = f2fs_get_block(&dn, index);
		}
	} else if (locked) {
		err = f2fs_get_block(&dn, index);
	} else {
		if (f2fs_lookup_extent_cache(inode, index, &ei)) {
			dn.data_blkaddr = ei.blk + index - ei.fofs;
		} else {
			/* hole case */
			err = f2fs_get_dnode_of_data(&dn, index, LOOKUP_NODE);
			if (err || dn.data_blkaddr == NULL_ADDR) {
				f2fs_put_dnode(&dn);
				f2fs_do_map_lock(sbi, F2FS_GET_BLOCK_PRE_AIO,
								true);
				WARN_ON(flag != F2FS_GET_BLOCK_PRE_AIO);
				locked = true;
				goto restart;
			}
		}
	}

	/* convert_inline_page can make node_changed */
	*blk_addr = dn.data_blkaddr;
	*node_changed = dn.node_changed;
out:
	f2fs_put_dnode(&dn);
unlock_out:
	if (locked)
		f2fs_do_map_lock(sbi, flag, false);
	return err;
}

static int f2fs_write_begin(struct file *file, struct address_space *mapping,
		loff_t pos, unsigned len, unsigned flags,
		struct page **pagep, void **fsdata)
{
	struct inode *inode = mapping->host;
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct page *page = NULL;
	pgoff_t index = ((unsigned long long) pos) >> PAGE_SHIFT;
	bool need_balance = false, drop_atomic = false;
	block_t blkaddr = NULL_ADDR;
	int err = 0;

	trace_f2fs_write_begin(inode, pos, len, flags);

	if (!f2fs_is_checkpoint_ready(sbi)) {
		err = -ENOSPC;
		goto fail;
	}

	if ((f2fs_is_atomic_file(inode) &&
			!f2fs_available_free_memory(sbi, INMEM_PAGES)) ||
			is_inode_flag_set(inode, FI_ATOMIC_REVOKE_REQUEST)) {
		err = -ENOMEM;
		drop_atomic = true;
		goto fail;
	}

	/*
	 * We should check this at this moment to avoid deadlock on inode page
	 * and #0 page. The locking rule for inline_data conversion should be:
	 * lock_page(page #0) -> lock_page(inode_page)
	 */
	if (index != 0) {
		err = f2fs_convert_inline_inode(inode);
		if (err)
			goto fail;
	}

#ifdef CONFIG_F2FS_FS_COMPRESSION
	if (f2fs_compressed_file(inode)) {
		int ret;

		*fsdata = NULL;

		if (len == PAGE_SIZE && !(f2fs_is_atomic_file(inode)))
			goto repeat;

		ret = f2fs_prepare_compress_overwrite(inode, pagep,
							index, fsdata);
		if (ret < 0) {
			err = ret;
			goto fail;
		} else if (ret) {
			return 0;
		}
	}
#endif

repeat:
	/*
	 * Do not use grab_cache_page_write_begin() to avoid deadlock due to
	 * wait_for_stable_page. We do that wait below, under our own IO control.
	 */
	page = f2fs_pagecache_get_page(mapping, index,
				FGP_LOCK | FGP_WRITE | FGP_CREAT, GFP_NOFS);
	if (!page) {
		err = -ENOMEM;
		goto fail;
	}

	/* TODO: cluster can be compressed due to race with .writepage */

	*pagep = page;

	err = prepare_write_begin(sbi, page, pos, len,
					&blkaddr, &need_balance);
	if (err)
		goto fail;

	if (need_balance && !IS_NOQUOTA(inode) &&
			has_not_enough_free_secs(sbi, 0, 0)) {
		unlock_page(page);
		f2fs_balance_fs(sbi, true);
		lock_page(page);
		if (page->mapping != mapping) {
			/* The page got truncated from under us */
			f2fs_put_page(page, 1);
			goto repeat;
		}
	}

	f2fs_wait_on_page_writeback(page, DATA, false, true);

	if (len == PAGE_SIZE || PageUptodate(page))
		return 0;

	if (!(pos & (PAGE_SIZE - 1)) && (pos + len) >= i_size_read(inode) &&
	    !f2fs_verity_in_progress(inode)) {
		zero_user_segment(page, len, PAGE_SIZE);
		return 0;
	}

	if (blkaddr == NEW_ADDR) {
		zero_user_segment(page, 0, PAGE_SIZE);
		SetPageUptodate(page);
	} else {
		if (!f2fs_is_valid_blkaddr(sbi, blkaddr,
				DATA_GENERIC_ENHANCE_READ)) {
			err = -EFSCORRUPTED;
			goto fail;
		}
		err = f2fs_submit_page_read(inode, page, blkaddr, 0, true);
		if (err)
			goto fail;

		lock_page(page);
		if (unlikely(page->mapping != mapping)) {
			f2fs_put_page(page, 1);
			goto repeat;
		}
		if (unlikely(!PageUptodate(page))) {
			err = -EIO;
			goto fail;
		}
	}
	return 0;

fail:
	f2fs_put_page(page, 1);
3439
	f2fs_write_failed(inode, pos + len);
3440
	if (drop_atomic)
Chao Yu's avatar
Chao Yu committed
3441
		f2fs_drop_inmem_pages_all(sbi, false);
3442
	return err;
3443 3444
}

3445 3446 3447 3448 3449 3450 3451
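/*
 * Finish a write started by f2fs_write_begin(): check how much was
 * actually copied, dirty the page, extend i_size for appending writes,
 * and drop the page reference taken in f2fs_write_begin().
 */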
static int f2fs_write_end(struct file *file,
			struct address_space *mapping,
			loff_t pos, unsigned len, unsigned copied,
			struct page *page, void *fsdata)
{
	struct inode *inode = page->mapping->host;

	trace_f2fs_write_end(inode, pos, len, copied);

	/*
	 * A non-uptodate page here must come from a write with
	 * len == PAGE_SIZE, so copied is expected to be PAGE_SIZE as well.
	 * Otherwise, report zero bytes copied and let
	 * generic_perform_write() retry the copy with copied = 0.
	 */
	if (!PageUptodate(page)) {
		if (unlikely(copied != len))
			copied = 0;
		else
			SetPageUptodate(page);
	}

#ifdef CONFIG_F2FS_FS_COMPRESSION
	/* overwrite compressed file */
	if (f2fs_compressed_file(inode) && fsdata) {
		f2fs_compress_write_end(inode, fsdata, page->index, copied);
		f2fs_update_time(F2FS_I_SB(inode), REQ_TIME);

		if (pos + copied > i_size_read(inode) &&
				!f2fs_verity_in_progress(inode))
			f2fs_i_size_write(inode, pos + copied);
		return copied;
	}
#endif

	if (!copied)
		goto unlock_out;

	set_page_dirty(page);

	if (pos + copied > i_size_read(inode) &&
	    !f2fs_verity_in_progress(inode))
		f2fs_i_size_write(inode, pos + copied);
unlock_out:
	f2fs_put_page(page, 1);
	f2fs_update_time(F2FS_I_SB(inode), REQ_TIME);
	return copied;
}

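/*
 * ->invalidatepage: called when @page is being removed from the page
 * cache; fix up dirty page accounting and drop any private state
 * (atomic-write registration, GC mark, compress cache data) once the
 * whole page becomes invalid.
 */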
void f2fs_invalidate_page(struct page *page, unsigned int offset,
							unsigned int length)
{
	struct inode *inode = page->mapping->host;
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);

	if (inode->i_ino >= F2FS_ROOT_INO(sbi) &&
		(offset % PAGE_SIZE || length != PAGE_SIZE))
		return;

	if (PageDirty(page)) {
		if (inode->i_ino == F2FS_META_INO(sbi)) {
			dec_page_count(sbi, F2FS_DIRTY_META);
		} else if (inode->i_ino == F2FS_NODE_INO(sbi)) {
			dec_page_count(sbi, F2FS_DIRTY_NODES);
		} else {
			inode_dec_dirty_pages(inode);
			f2fs_remove_dirty_inode(inode);
		}
	}

	clear_page_private_gcing(page);

	if (test_opt(sbi, COMPRESS_CACHE) &&
			inode->i_ino == F2FS_COMPRESS_INO(sbi))
		clear_page_private_data(page);

	if (page_private_atomic(page))
		return f2fs_drop_inmem_page(inode, page);

	detach_page_private(page);
	set_page_private(page, 0);
}

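/*
 * ->releasepage: give up the private state attached to a clean page so
 * the VM can free it; returns 0 when the page must be kept because it
 * is dirty or registered as an atomic-write page.
 */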
int f2fs_release_page(struct page *page, gfp_t wait)
{
	/* If this is a dirty page, keep PagePrivate */
	if (PageDirty(page))
		return 0;

	/* This is an atomic-written page; keep it Private */
	if (page_private_atomic(page))
		return 0;

	if (test_opt(F2FS_P_SB(page), COMPRESS_CACHE)) {
		struct inode *inode = page->mapping->host;

		if (inode->i_ino == F2FS_COMPRESS_INO(F2FS_I_SB(inode)))
			clear_page_private_data(page);
	}

	clear_page_private_gcing(page);

	detach_page_private(page);
	set_page_private(page, 0);
	return 1;
}

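/*
 * ->set_page_dirty for data pages: pages of an in-progress atomic write
 * are registered in the inmem list instead of being dirtied directly;
 * all other pages go through __set_page_dirty_nobuffers() plus f2fs's
 * own dirty page accounting.
 */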
static int f2fs_set_data_page_dirty(struct page *page)
{
	struct inode *inode = page_file_mapping(page)->host;

	trace_f2fs_set_page_dirty(page, DATA);

	if (!PageUptodate(page))
		SetPageUptodate(page);
	if (PageSwapCache(page))
		return __set_page_dirty_nobuffers(page);

	if (f2fs_is_atomic_file(inode) && !f2fs_is_commit_atomic_write(inode)) {
		if (!page_private_atomic(page)) {
			f2fs_register_inmem_page(inode, page);
			return 1;
		}
		/*
		 * This page has already been registered, so just
		 * return here.
		 */
		return 0;
	}

	if (!PageDirty(page)) {
		__set_page_dirty_nobuffers(page);
		f2fs_update_dirty_page(inode, page);
		return 1;
	}
	return 0;
}

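/*
 * Resolve the physical block number of one block inside a compressed
 * file by looking up the dnode of its cluster; returns 0 when the
 * cluster is actually compressed (no 1:1 physical block) or the
 * address is not a valid data blkaddr.
 */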
static sector_t f2fs_bmap_compress(struct inode *inode, sector_t block)
{
#ifdef CONFIG_F2FS_FS_COMPRESSION
	struct dnode_of_data dn;
	sector_t start_idx, blknr = 0;
	int ret;

	start_idx = round_down(block, F2FS_I(inode)->i_cluster_size);

	set_new_dnode(&dn, inode, NULL, NULL, 0);
	ret = f2fs_get_dnode_of_data(&dn, start_idx, LOOKUP_NODE);
	if (ret)
		return 0;

	if (dn.data_blkaddr != COMPRESS_ADDR) {
		dn.ofs_in_node += block - start_idx;
		blknr = f2fs_data_blkaddr(&dn);
		if (!__is_valid_data_blkaddr(blknr))
			blknr = 0;
	}

	f2fs_put_dnode(&dn);
	return blknr;
#else
	return 0;
#endif
}

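/*
 * ->bmap: translate a file-relative block number into a physical block
 * number. Dirty pages are flushed first so the mapping is stable;
 * inline-data inodes and out-of-range blocks report 0.
 */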
static sector_t f2fs_bmap(struct address_space *mapping, sector_t block)
{
	struct inode *inode = mapping->host;
	sector_t blknr = 0;

	if (f2fs_has_inline_data(inode))
		goto out;

	/* flush dirty pages so that all blocks have been allocated */
	if (mapping_tagged(mapping, PAGECACHE_TAG_DIRTY))
		filemap_write_and_wait(mapping);

	/* the block number must be less than the file's maximum */
	if (unlikely(block >= max_file_blocks(inode)))
		goto out;

	if (f2fs_compressed_file(inode)) {
		blknr = f2fs_bmap_compress(inode, block);
	} else {
		struct f2fs_map_blocks map;

		memset(&map, 0, sizeof(map));
		map.m_lblk = block;
		map.m_len = 1;
		map.m_next_pgofs = NULL;
		map.m_seg_type = NO_CHECK_TYPE;

		if (!f2fs_map_blocks(inode, &map, 0, F2FS_GET_BLOCK_BMAP))
			blknr = map.m_pblk;
	}
out:
	trace_f2fs_bmap(inode, block, blknr);
	return blknr;
}

#ifdef CONFIG_MIGRATION
#include <linux/migrate.h>

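/*
 * ->migratepage: move a data page to a new page frame, transferring the
 * private flags/data and, for atomic-written pages, updating the inmem
 * list entry and its extra page reference under fi->inmem_lock.
 */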
int f2fs_migrate_page(struct address_space *mapping,
		struct page *newpage, struct page *page, enum migrate_mode mode)
{
	int rc, extra_count;
	struct f2fs_inode_info *fi = F2FS_I(mapping->host);
	bool atomic_written = page_private_atomic(page);

	BUG_ON(PageWriteback(page));

	/* migrating an atomic-written page is only safe with inmem_lock held */
	if (atomic_written) {
		if (mode != MIGRATE_SYNC)
			return -EBUSY;
		if (!mutex_trylock(&fi->inmem_lock))
			return -EAGAIN;
	}

	/* one extra reference was held for atomic_write page */
	extra_count = atomic_written ? 1 : 0;
	rc = migrate_page_move_mapping(mapping, newpage,
				page, extra_count);
	if (rc != MIGRATEPAGE_SUCCESS) {
		if (atomic_written)
			mutex_unlock(&fi->inmem_lock);
		return rc;
	}

	if (atomic_written) {
		struct inmem_pages *cur;

		list_for_each_entry(cur, &fi->inmem_pages, list)
			if (cur->page == page) {
				cur->page = newpage;
				break;
			}
		mutex_unlock(&fi->inmem_lock);
		put_page(page);
		get_page(newpage);
	}

	/* guarantee to start from no stale private field */
	set_page_private(newpage, 0);
	if (PagePrivate(page)) {
		set_page_private(newpage, page_private(page));
		SetPagePrivate(newpage);
		get_page(newpage);

		set_page_private(page, 0);
		ClearPagePrivate(page);
		put_page(page);
	}

	if (mode != MIGRATE_SYNC_NO_COPY)
		migrate_page_copy(newpage, page);
	else
		migrate_page_states(newpage, page);

	return MIGRATEPAGE_SUCCESS;
}
#endif

#ifdef CONFIG_SWAP
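/*
 * Rewrite @blkcnt blocks starting at @start_blk into newly allocated,
 * section-aligned space (pinned cold data): each section's pages are
 * dirtied and written back in turn. Used below to realign swapfile
 * extents that do not sit on section boundaries.
 */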
static int f2fs_migrate_blocks(struct inode *inode, block_t start_blk,
							unsigned int blkcnt)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	unsigned int blkofs;
	unsigned int blk_per_sec = BLKS_PER_SEC(sbi);
	unsigned int secidx = start_blk / blk_per_sec;
	unsigned int end_sec = secidx + blkcnt / blk_per_sec;
	int ret = 0;

	f2fs_down_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);
	filemap_invalidate_lock(inode->i_mapping);

	set_inode_flag(inode, FI_ALIGNED_WRITE);
	set_inode_flag(inode, FI_OPU_WRITE);

	for (; secidx < end_sec; secidx++) {
		f2fs_down_write(&sbi->pin_sem);

		f2fs_lock_op(sbi);
		f2fs_allocate_new_section(sbi, CURSEG_COLD_DATA_PINNED, false);
		f2fs_unlock_op(sbi);

		set_inode_flag(inode, FI_SKIP_WRITES);

		for (blkofs = 0; blkofs < blk_per_sec; blkofs++) {
			struct page *page;
			unsigned int blkidx = secidx * blk_per_sec + blkofs;

			page = f2fs_get_lock_data_page(inode, blkidx, true);
			if (IS_ERR(page)) {
				f2fs_up_write(&sbi->pin_sem);
				ret = PTR_ERR(page);
				goto done;
			}

			set_page_dirty(page);
			f2fs_put_page(page, 1);
		}

		clear_inode_flag(inode, FI_SKIP_WRITES);

		ret = filemap_fdatawrite(inode->i_mapping);

		f2fs_up_write(&sbi->pin_sem);

		if (ret)
			break;
	}

done:
	clear_inode_flag(inode, FI_SKIP_WRITES);
	clear_inode_flag(inode, FI_OPU_WRITE);
	clear_inode_flag(inode, FI_ALIGNED_WRITE);

	filemap_invalidate_unlock(inode->i_mapping);
	f2fs_up_write(&F2FS_I(inode)->i_gc_rwsem[WRITE]);

	return ret;
}

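/*
 * Build the swap extent list for @swap_file: every physically
 * contiguous, section-aligned run of blocks is registered with
 * add_swap_extent(); unaligned runs are first rewritten via
 * f2fs_migrate_blocks(). Returns the number of extents, or a negative
 * error, e.g. when the file has holes.
 */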
static int check_swap_activate(struct swap_info_struct *sis,
				struct file *swap_file, sector_t *span)
{
	struct address_space *mapping = swap_file->f_mapping;
	struct inode *inode = mapping->host;
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	sector_t cur_lblock;
	sector_t last_lblock;
	sector_t pblock;
	sector_t lowest_pblock = -1;
	sector_t highest_pblock = 0;
	int nr_extents = 0;
	unsigned long nr_pblocks;
	unsigned int blks_per_sec = BLKS_PER_SEC(sbi);
	unsigned int sec_blks_mask = BLKS_PER_SEC(sbi) - 1;
	unsigned int not_aligned = 0;
	int ret = 0;

	/*
	 * Map all the blocks into the extent list.  This code doesn't try
	 * to be very smart.
	 */
	cur_lblock = 0;
	last_lblock = bytes_to_blks(inode, i_size_read(inode));

	while (cur_lblock < last_lblock && cur_lblock < sis->max) {
		struct f2fs_map_blocks map;
retry:
		cond_resched();

		memset(&map, 0, sizeof(map));
		map.m_lblk = cur_lblock;
		map.m_len = last_lblock - cur_lblock;
		map.m_next_pgofs = NULL;
		map.m_next_extent = NULL;
		map.m_seg_type = NO_CHECK_TYPE;
		map.m_may_create = false;

		ret = f2fs_map_blocks(inode, &map, 0, F2FS_GET_BLOCK_FIEMAP);
		if (ret)
			goto out;

		/* hole */
		if (!(map.m_flags & F2FS_MAP_FLAGS)) {
			f2fs_err(sbi, "Swapfile has holes");
			ret = -EINVAL;
			goto out;
		}

		pblock = map.m_pblk;
		nr_pblocks = map.m_len;

		if ((pblock - SM_I(sbi)->main_blkaddr) & sec_blks_mask ||
				nr_pblocks & sec_blks_mask) {
			not_aligned++;

			nr_pblocks = roundup(nr_pblocks, blks_per_sec);
			if (cur_lblock + nr_pblocks > sis->max)
				nr_pblocks -= blks_per_sec;

			if (!nr_pblocks) {
				/* this extent is last one */
				nr_pblocks = map.m_len;
				f2fs_warn(sbi, "Swapfile: last extent is not aligned to section");
				goto next;
			}

			ret = f2fs_migrate_blocks(inode, cur_lblock,
							nr_pblocks);
			if (ret)
				goto out;
			goto retry;
		}
next:
		if (cur_lblock + nr_pblocks >= sis->max)
			nr_pblocks = sis->max - cur_lblock;

		if (cur_lblock) {	/* exclude the header page */
			if (pblock < lowest_pblock)
				lowest_pblock = pblock;
			if (pblock + nr_pblocks - 1 > highest_pblock)
				highest_pblock = pblock + nr_pblocks - 1;
		}

		/*
		 * We found a contiguous run of blocks; add it as a swap extent.
		 */
		ret = add_swap_extent(sis, cur_lblock, nr_pblocks, pblock);
		if (ret < 0)
			goto out;
		nr_extents += ret;
		cur_lblock += nr_pblocks;
	}
	ret = nr_extents;
	*span = 1 + highest_pblock - lowest_pblock;
	if (cur_lblock == 0)
		cur_lblock = 1;	/* force Empty message */
	sis->max = cur_lblock;
	sis->pages = cur_lblock - 1;
	sis->highest_bit = cur_lblock - 1;
out:
	if (not_aligned)
		f2fs_warn(sbi, "Swapfile (%u) is not aligned to section: 1) creat(), 2) ioctl(F2FS_IOC_SET_PIN_FILE), 3) fallocate(%u * N)",
			  not_aligned, blks_per_sec * F2FS_BLKSIZE);
	return ret;
}

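/*
 * ->swap_activate: check that the file is usable as a swapfile (regular
 * file, not in LFS mode, no inline data, not compressed), build its
 * extent list, and pin it so its blocks won't be relocated.
 */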
static int f2fs_swap_activate(struct swap_info_struct *sis, struct file *file,
				sector_t *span)
{
	struct inode *inode = file_inode(file);
	int ret;

	if (!S_ISREG(inode->i_mode))
		return -EINVAL;

	if (f2fs_readonly(F2FS_I_SB(inode)->sb))
		return -EROFS;

	if (f2fs_lfs_mode(F2FS_I_SB(inode))) {
		f2fs_err(F2FS_I_SB(inode),
			"Swapfile not supported in LFS mode");
		return -EINVAL;
	}

	ret = f2fs_convert_inline_inode(inode);
	if (ret)
		return ret;

	if (!f2fs_disable_compressed_file(inode))
		return -EINVAL;

	f2fs_precache_extents(inode);

	ret = check_swap_activate(sis, file, span);
	if (ret < 0)
		return ret;

	set_inode_flag(inode, FI_PIN_FILE);
	f2fs_update_time(F2FS_I_SB(inode), REQ_TIME);
	return ret;
}

static void f2fs_swap_deactivate(struct file *file)
{
	struct inode *inode = file_inode(file);

	clear_inode_flag(inode, FI_PIN_FILE);
}
#else
static int f2fs_swap_activate(struct swap_info_struct *sis, struct file *file,
				sector_t *span)
{
	return -EOPNOTSUPP;
}

static void f2fs_swap_deactivate(struct file *file)
{
}
#endif

const struct address_space_operations f2fs_dblock_aops = {
	.readpage	= f2fs_read_data_page,
	.readahead	= f2fs_readahead,
	.writepage	= f2fs_write_data_page,
	.writepages	= f2fs_write_data_pages,
	.write_begin	= f2fs_write_begin,
	.write_end	= f2fs_write_end,
	.set_page_dirty	= f2fs_set_data_page_dirty,
	.invalidatepage	= f2fs_invalidate_page,
	.releasepage	= f2fs_release_page,
	.direct_IO	= noop_direct_IO,
	.bmap		= f2fs_bmap,
	.swap_activate  = f2fs_swap_activate,
	.swap_deactivate = f2fs_swap_deactivate,
#ifdef CONFIG_MIGRATION
	.migratepage    = f2fs_migrate_page,
#endif
};

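/*
 * Clear the PAGECACHE_TAG_DIRTY tag of @page in its mapping's xarray
 * without touching the page's own dirty bit.
 */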
void f2fs_clear_page_cache_dirty_tag(struct page *page)
{
	struct address_space *mapping = page_mapping(page);
	unsigned long flags;

	xa_lock_irqsave(&mapping->i_pages, flags);
	__xa_clear_mark(&mapping->i_pages, page_index(page),
						PAGECACHE_TAG_DIRTY);
	xa_unlock_irqrestore(&mapping->i_pages, flags);
}

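/*
 * Set up the slab cache and mempool used to allocate bio_post_read_ctx
 * objects for read bios that need post-processing (decryption,
 * decompression and/or verity verification).
 */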
int __init f2fs_init_post_read_processing(void)
{
	bio_post_read_ctx_cache =
		kmem_cache_create("f2fs_bio_post_read_ctx",
				  sizeof(struct bio_post_read_ctx), 0, 0, NULL);
	if (!bio_post_read_ctx_cache)
		goto fail;
	bio_post_read_ctx_pool =
		mempool_create_slab_pool(NUM_PREALLOC_POST_READ_CTXS,
					 bio_post_read_ctx_cache);
	if (!bio_post_read_ctx_pool)
		goto fail_free_cache;
	return 0;

fail_free_cache:
	kmem_cache_destroy(bio_post_read_ctx_cache);
fail:
	return -ENOMEM;
}

void f2fs_destroy_post_read_processing(void)
{
	mempool_destroy(bio_post_read_ctx_pool);
	kmem_cache_destroy(bio_post_read_ctx_cache);
}

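/*
 * The per-superblock workqueue for post-read processing is only needed
 * when encryption, verity or compression may be used on this filesystem.
 */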
int f2fs_init_post_read_wq(struct f2fs_sb_info *sbi)
{
	if (!f2fs_sb_has_encrypt(sbi) &&
		!f2fs_sb_has_verity(sbi) &&
		!f2fs_sb_has_compression(sbi))
		return 0;

	sbi->post_read_wq = alloc_workqueue("f2fs_post_read_wq",
						 WQ_UNBOUND | WQ_HIGHPRI,
						 num_online_cpus());
	if (!sbi->post_read_wq)
		return -ENOMEM;
	return 0;
}

void f2fs_destroy_post_read_wq(struct f2fs_sb_info *sbi)
{
	if (sbi->post_read_wq)
		destroy_workqueue(sbi->post_read_wq);
}

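/* slab cache backing struct bio_entry allocations */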
int __init f2fs_init_bio_entry_cache(void)
{
	bio_entry_slab = f2fs_kmem_cache_create("f2fs_bio_entry_slab",
			sizeof(struct bio_entry));
	if (!bio_entry_slab)
		return -ENOMEM;
	return 0;
}

void f2fs_destroy_bio_entry_cache(void)
{
	kmem_cache_destroy(bio_entry_slab);
}
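/*
 * iomap_begin for iomap-based direct I/O: map up to @length bytes at
 * @offset with f2fs_map_blocks() and translate the result into a
 * mapped, unwritten or hole iomap, honoring inline-crypto DUN
 * contiguity limits on the mapping length.
 */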
static int f2fs_iomap_begin(struct inode *inode, loff_t offset, loff_t length,
			    unsigned int flags, struct iomap *iomap,
			    struct iomap *srcmap)
{
	struct f2fs_map_blocks map = {};
	pgoff_t next_pgofs = 0;
	int err;

	map.m_lblk = bytes_to_blks(inode, offset);
	map.m_len = bytes_to_blks(inode, offset + length - 1) - map.m_lblk + 1;
	map.m_next_pgofs = &next_pgofs;
	map.m_seg_type = f2fs_rw_hint_to_seg_type(inode->i_write_hint);
	if (flags & IOMAP_WRITE)
		map.m_may_create = true;

	err = f2fs_map_blocks(inode, &map, flags & IOMAP_WRITE,
			      F2FS_GET_BLOCK_DIO);
	if (err)
		return err;

	iomap->offset = blks_to_bytes(inode, map.m_lblk);

	/*
	 * When inline encryption is enabled, sometimes I/O to an encrypted file
	 * has to be broken up to guarantee DUN contiguity.  Handle this by
	 * limiting the length of the mapping returned.
	 */
	map.m_len = fscrypt_limit_io_blocks(inode, map.m_lblk, map.m_len);

	if (map.m_flags & (F2FS_MAP_MAPPED | F2FS_MAP_UNWRITTEN)) {
		iomap->length = blks_to_bytes(inode, map.m_len);
		if (map.m_flags & F2FS_MAP_MAPPED) {
			iomap->type = IOMAP_MAPPED;
			iomap->flags |= IOMAP_F_MERGED;
		} else {
			iomap->type = IOMAP_UNWRITTEN;
		}
		if (WARN_ON_ONCE(!__is_valid_data_blkaddr(map.m_pblk)))
			return -EINVAL;

		iomap->bdev = map.m_bdev;
		iomap->addr = blks_to_bytes(inode, map.m_pblk);
	} else {
		iomap->length = blks_to_bytes(inode, next_pgofs) -
				iomap->offset;
		iomap->type = IOMAP_HOLE;
		iomap->addr = IOMAP_NULL_ADDR;
	}

	if (map.m_flags & F2FS_MAP_NEW)
		iomap->flags |= IOMAP_F_NEW;
	if ((inode->i_state & I_DIRTY_DATASYNC) ||
	    offset + length > i_size_read(inode))
		iomap->flags |= IOMAP_F_DIRTY;

	return 0;
}

const struct iomap_ops f2fs_iomap_ops = {
	.iomap_begin	= f2fs_iomap_begin,
};