/*
 * fs/f2fs/data.c
 *
 * Copyright (c) 2012 Samsung Electronics Co., Ltd.
 * http://www.samsung.com/
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation.
 */
#include <linux/fs.h>
#include <linux/f2fs_fs.h>
#include <linux/buffer_head.h>
#include <linux/mpage.h>
#include <linux/writeback.h>
#include <linux/backing-dev.h>
#include <linux/pagevec.h>
#include <linux/blkdev.h>
#include <linux/bio.h>
#include <linux/prefetch.h>
#include <linux/uio.h>
#include <linux/cleancache.h>
#include <linux/sched/signal.h>

#include "f2fs.h"
#include "node.h"
#include "segment.h"
#include "trace.h"
#include <trace/events/f2fs.h>
#include <trace/events/android_fs.h>

#define NUM_PREALLOC_POST_READ_CTXS	128

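/*
 * Post-read contexts are drawn from the mempool below (set up elsewhere
 * in this file, presumably backed by the slab cache); keeping
 * NUM_PREALLOC_POST_READ_CTXS entries preallocated lets reads make
 * progress under memory pressure.
 */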
static struct kmem_cache *bio_post_read_ctx_cache;
static mempool_t *bio_post_read_ctx_pool;

static bool __is_cp_guaranteed(struct page *page)
{
	struct address_space *mapping = page->mapping;
	struct inode *inode;
	struct f2fs_sb_info *sbi;

	if (!mapping)
		return false;

	inode = mapping->host;
	sbi = F2FS_I_SB(inode);

	if (inode->i_ino == F2FS_META_INO(sbi) ||
			inode->i_ino == F2FS_NODE_INO(sbi) ||
			S_ISDIR(inode->i_mode) ||
			is_cold_data(page))
		return true;
	return false;
}

/* postprocessing steps for read bios */
enum bio_post_read_step {
	STEP_INITIAL = 0,
	STEP_DECRYPT,
};

struct bio_post_read_ctx {
	struct bio *bio;
	struct work_struct work;
	unsigned int cur_step;
	unsigned int enabled_steps;
};
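
/*
 * A read bio that needs postprocessing carries one of these contexts in
 * bio->bi_private: f2fs_read_end_io() resets cur_step to STEP_INITIAL,
 * bio_post_read_processing() then walks the steps set in enabled_steps
 * (bouncing decryption to the fscrypt workqueue), and __read_end_io()
 * finally unlocks the pages and returns the context to the mempool.
 */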

static void __read_end_io(struct bio *bio)
{
	struct page *page;
	struct bio_vec *bv;
	int i;

	bio_for_each_segment_all(bv, bio, i) {
		page = bv->bv_page;

		/* PG_error was set if any post_read step failed */
		if (bio->bi_status || PageError(page)) {
			ClearPageUptodate(page);
			SetPageError(page);
		} else {
			SetPageUptodate(page);
		}
		unlock_page(page);
	}
	if (bio->bi_private)
		mempool_free(bio->bi_private, bio_post_read_ctx_pool);
	bio_put(bio);
}

static void bio_post_read_processing(struct bio_post_read_ctx *ctx);

static void decrypt_work(struct work_struct *work)
{
	struct bio_post_read_ctx *ctx =
		container_of(work, struct bio_post_read_ctx, work);

	fscrypt_decrypt_bio(ctx->bio);

	bio_post_read_processing(ctx);
}

static void bio_post_read_processing(struct bio_post_read_ctx *ctx)
{
	switch (++ctx->cur_step) {
	case STEP_DECRYPT:
		if (ctx->enabled_steps & (1 << STEP_DECRYPT)) {
			INIT_WORK(&ctx->work, decrypt_work);
			fscrypt_enqueue_decrypt_work(&ctx->work);
			return;
		}
		ctx->cur_step++;
		/* fall-through */
	default:
		__read_end_io(ctx->bio);
	}
}

static bool f2fs_bio_post_read_required(struct bio *bio)
{
	return bio->bi_private && !bio->bi_status;
}

static void f2fs_read_end_io(struct bio *bio)
{
#ifdef CONFIG_F2FS_FAULT_INJECTION
	if (time_to_inject(F2FS_P_SB(bio->bi_io_vec->bv_page), FAULT_IO)) {
		f2fs_show_injection_info(FAULT_IO);
		bio->bi_status = BLK_STS_IOERR;
	}
#endif

	if (f2fs_bio_post_read_required(bio)) {
		struct bio_post_read_ctx *ctx = bio->bi_private;

		ctx->cur_step = STEP_INITIAL;
		bio_post_read_processing(ctx);
		return;
	}

	__read_end_io(bio);
}

static void f2fs_write_end_io(struct bio *bio)
{
	struct f2fs_sb_info *sbi = bio->bi_private;
	struct bio_vec *bvec;
	int i;

	bio_for_each_segment_all(bvec, bio, i) {
		struct page *page = bvec->bv_page;
		enum count_type type = WB_DATA_TYPE(page);

		if (IS_DUMMY_WRITTEN_PAGE(page)) {
			set_page_private(page, (unsigned long)NULL);
			ClearPagePrivate(page);
			unlock_page(page);
			mempool_free(page, sbi->write_io_dummy);

			if (unlikely(bio->bi_status))
				f2fs_stop_checkpoint(sbi, true);
			continue;
		}

		fscrypt_pullback_bio_page(&page, true);

		if (unlikely(bio->bi_status)) {
			mapping_set_error(page->mapping, -EIO);
			if (type == F2FS_WB_CP_DATA)
				f2fs_stop_checkpoint(sbi, true);
		}

		f2fs_bug_on(sbi, page->mapping == NODE_MAPPING(sbi) &&
					page->index != nid_of_node(page));

		dec_page_count(sbi, type);
		clear_cold_data(page);
		end_page_writeback(page);
	}
	if (!get_pages(sbi, F2FS_WB_CP_DATA) &&
				wq_has_sleeper(&sbi->cp_wait))
		wake_up(&sbi->cp_wait);

	bio_put(bio);
}

/*
 * Return the block device that @blk_addr resides on; if @bio is given,
 * also point it at that device and the corresponding start sector.
 */
struct block_device *f2fs_target_device(struct f2fs_sb_info *sbi,
				block_t blk_addr, struct bio *bio)
{
	struct block_device *bdev = sbi->sb->s_bdev;
	int i;

	if (f2fs_is_multi_device(sbi)) {
		for (i = 0; i < sbi->s_ndevs; i++) {
			if (FDEV(i).start_blk <= blk_addr &&
					FDEV(i).end_blk >= blk_addr) {
				blk_addr -= FDEV(i).start_blk;
				bdev = FDEV(i).bdev;
				break;
			}
		}
	}
	if (bio) {
		bio_set_dev(bio, bdev);
		bio->bi_iter.bi_sector = SECTOR_FROM_BLOCK(blk_addr);
	}
	return bdev;
}

int f2fs_target_device_index(struct f2fs_sb_info *sbi, block_t blkaddr)
{
	int i;

	if (!f2fs_is_multi_device(sbi))
		return 0;

	for (i = 0; i < sbi->s_ndevs; i++)
		if (FDEV(i).start_blk <= blkaddr && FDEV(i).end_blk >= blkaddr)
			return i;
	return 0;
}

static bool __same_bdev(struct f2fs_sb_info *sbi,
				block_t blk_addr, struct bio *bio)
{
	struct block_device *b = f2fs_target_device(sbi, blk_addr, NULL);
	return bio->bi_disk == b->bd_disk && bio->bi_partno == b->bd_partno;
}

/*
 * Low-level block read/write IO operations.
 */
static struct bio *__bio_alloc(struct f2fs_sb_info *sbi, block_t blk_addr,
				struct writeback_control *wbc,
				int npages, bool is_read,
				enum page_type type, enum temp_type temp)
{
	struct bio *bio;

	bio = f2fs_bio_alloc(sbi, npages, true);

	f2fs_target_device(sbi, blk_addr, bio);
	if (is_read) {
		bio->bi_end_io = f2fs_read_end_io;
		bio->bi_private = NULL;
	} else {
		bio->bi_end_io = f2fs_write_end_io;
		bio->bi_private = sbi;
		bio->bi_write_hint = io_type_to_rw_hint(sbi, type, temp);
	}
	if (wbc)
		wbc_init_bio(wbc, bio);

	return bio;
}
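
/*
 * Writes to DATA/NODE areas are padded below with locked dummy pages
 * from sbi->write_io_dummy up to the F2FS_IO_SIZE boundary, so that the
 * device only sees aligned IO; f2fs_write_end_io() recognizes the
 * padding via IS_DUMMY_WRITTEN_PAGE() and frees it back to the mempool.
 */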
static inline void __submit_bio(struct f2fs_sb_info *sbi,
				struct bio *bio, enum page_type type)
{
	if (!is_read_io(bio_op(bio))) {
		unsigned int start;

		if (type != DATA && type != NODE)
			goto submit_io;

		if (f2fs_sb_has_blkzoned(sbi->sb) && current->plug)
			blk_finish_plug(current->plug);

		start = bio->bi_iter.bi_size >> F2FS_BLKSIZE_BITS;
		start %= F2FS_IO_SIZE(sbi);

		if (start == 0)
			goto submit_io;

		/* fill dummy pages */
		for (; start < F2FS_IO_SIZE(sbi); start++) {
			struct page *page =
				mempool_alloc(sbi->write_io_dummy,
					GFP_NOIO | __GFP_ZERO | __GFP_NOFAIL);
			f2fs_bug_on(sbi, !page);

			SetPagePrivate(page);
			set_page_private(page, (unsigned long)DUMMY_WRITTEN_PAGE);
			lock_page(page);
			if (bio_add_page(bio, page, PAGE_SIZE, 0) < PAGE_SIZE)
				f2fs_bug_on(sbi, 1);
		}
		/*
		 * In the NODE case, we lose the next block address chain.
		 * So, we need to do a checkpoint in f2fs_sync_file.
		 */
		if (type == NODE)
			set_sbi_flag(sbi, SBI_NEED_CP);
	}
submit_io:
	if (is_read_io(bio_op(bio)))
		trace_f2fs_submit_read_bio(sbi->sb, type, bio);
	else
		trace_f2fs_submit_write_bio(sbi->sb, type, bio);
	submit_bio(bio);
}

static void __submit_merged_bio(struct f2fs_bio_info *io)
{
	struct f2fs_io_info *fio = &io->fio;

	if (!io->bio)
		return;

	bio_set_op_attrs(io->bio, fio->op, fio->op_flags);

	if (is_read_io(fio->op))
		trace_f2fs_prepare_read_bio(io->sbi->sb, fio->type, io->bio);
	else
		trace_f2fs_prepare_write_bio(io->sbi->sb, fio->type, io->bio);

	__submit_bio(io->sbi, io->bio, fio->type);
	io->bio = NULL;
}

static bool __has_merged_page(struct f2fs_bio_info *io,
				struct inode *inode, nid_t ino, pgoff_t idx)
{
	struct bio_vec *bvec;
	struct page *target;
	int i;

	if (!io->bio)
		return false;

	if (!inode && !ino)
		return true;

	bio_for_each_segment_all(bvec, io->bio, i) {

		if (bvec->bv_page->mapping)
			target = bvec->bv_page;
		else
			target = fscrypt_control_page(bvec->bv_page);

		if (idx != target->index)
			continue;

		if (inode && inode == target->mapping->host)
			return true;
		if (ino && ino == ino_of_node(target))
			return true;
	}

	return false;
}

static bool has_merged_page(struct f2fs_sb_info *sbi, struct inode *inode,
				nid_t ino, pgoff_t idx, enum page_type type)
{
	enum page_type btype = PAGE_TYPE_OF_BIO(type);
	enum temp_type temp;
	struct f2fs_bio_info *io;
	bool ret = false;

	for (temp = HOT; temp < NR_TEMP_TYPE; temp++) {
		io = sbi->write_io[btype] + temp;

		down_read(&io->io_rwsem);
		ret = __has_merged_page(io, inode, ino, idx);
		up_read(&io->io_rwsem);

		/* TODO: use HOT temp only for meta pages now. */
		if (ret || btype == META)
			break;
	}
	return ret;
}

static void __f2fs_submit_merged_write(struct f2fs_sb_info *sbi,
				enum page_type type, enum temp_type temp)
{
	enum page_type btype = PAGE_TYPE_OF_BIO(type);
	struct f2fs_bio_info *io = sbi->write_io[btype] + temp;

	down_write(&io->io_rwsem);

	/* change META to META_FLUSH in the checkpoint procedure */
	if (type >= META_FLUSH) {
		io->fio.type = META_FLUSH;
		io->fio.op = REQ_OP_WRITE;
		io->fio.op_flags = REQ_META | REQ_PRIO | REQ_SYNC;
		if (!test_opt(sbi, NOBARRIER))
			io->fio.op_flags |= REQ_PREFLUSH | REQ_FUA;
	}
	__submit_merged_bio(io);
	up_write(&io->io_rwsem);
}

static void __submit_merged_write_cond(struct f2fs_sb_info *sbi,
				struct inode *inode, nid_t ino, pgoff_t idx,
				enum page_type type, bool force)
{
	enum temp_type temp;

	if (!force && !has_merged_page(sbi, inode, ino, idx, type))
		return;

	for (temp = HOT; temp < NR_TEMP_TYPE; temp++) {

		__f2fs_submit_merged_write(sbi, type, temp);

		/* TODO: use HOT temp only for meta pages now. */
		if (type >= META)
			break;
	}
}

void f2fs_submit_merged_write(struct f2fs_sb_info *sbi, enum page_type type)
{
	__submit_merged_write_cond(sbi, NULL, 0, 0, type, true);
}

void f2fs_submit_merged_write_cond(struct f2fs_sb_info *sbi,
				struct inode *inode, nid_t ino, pgoff_t idx,
				enum page_type type)
{
	__submit_merged_write_cond(sbi, inode, ino, idx, type, false);
}

void f2fs_flush_merged_writes(struct f2fs_sb_info *sbi)
{
	f2fs_submit_merged_write(sbi, DATA);
	f2fs_submit_merged_write(sbi, NODE);
	f2fs_submit_merged_write(sbi, META);
}

/*
 * Fill the locked page with data located in the block address.
 * A caller needs to unlock the page on failure.
 */
int f2fs_submit_page_bio(struct f2fs_io_info *fio)
{
	struct bio *bio;
	struct page *page = fio->encrypted_page ?
			fio->encrypted_page : fio->page;

	if (!f2fs_is_valid_blkaddr(fio->sbi, fio->new_blkaddr,
			__is_meta_io(fio) ? META_GENERIC : DATA_GENERIC))
		return -EFSCORRUPTED;

	trace_f2fs_submit_page_bio(page, fio);
	f2fs_trace_ios(fio, 0);

	/* Allocate a new bio */
	bio = __bio_alloc(fio->sbi, fio->new_blkaddr, fio->io_wbc,
				1, is_read_io(fio->op), fio->type, fio->temp);

	if (bio_add_page(bio, page, PAGE_SIZE, 0) < PAGE_SIZE) {
		bio_put(bio);
		return -EFAULT;
	}
	bio_set_op_attrs(bio, fio->op, fio->op_flags);

	if (!is_read_io(fio->op))
		inc_page_count(fio->sbi, WB_DATA_TYPE(fio->page));

	__submit_bio(fio->sbi, bio, fio->type);
	return 0;
}
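
/*
 * Pages are merged into the per-(type, temp) write bio as long as they
 * are physically contiguous, share op/op_flags, and target the same
 * block device; otherwise the pending bio is flushed first.
 */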
int f2fs_submit_page_write(struct f2fs_io_info *fio)
{
	struct f2fs_sb_info *sbi = fio->sbi;
	enum page_type btype = PAGE_TYPE_OF_BIO(fio->type);
	struct f2fs_bio_info *io = sbi->write_io[btype] + fio->temp;
	struct page *bio_page;
	int err = 0;

	f2fs_bug_on(sbi, is_read_io(fio->op));

	down_write(&io->io_rwsem);
next:
	if (fio->in_list) {
		spin_lock(&io->io_lock);
		if (list_empty(&io->io_list)) {
			spin_unlock(&io->io_lock);
			goto out_fail;
		}
		fio = list_first_entry(&io->io_list,
						struct f2fs_io_info, list);
		list_del(&fio->list);
		spin_unlock(&io->io_lock);
	}

	if (__is_valid_data_blkaddr(fio->old_blkaddr))
		verify_block_addr(fio, fio->old_blkaddr);
	verify_block_addr(fio, fio->new_blkaddr);

	bio_page = fio->encrypted_page ? fio->encrypted_page : fio->page;

	/* set submitted = true as a return value */
	fio->submitted = true;

	inc_page_count(sbi, WB_DATA_TYPE(bio_page));

	if (io->bio && (io->last_block_in_bio != fio->new_blkaddr - 1 ||
			(io->fio.op != fio->op || io->fio.op_flags != fio->op_flags) ||
			!__same_bdev(sbi, fio->new_blkaddr, io->bio)))
		__submit_merged_bio(io);
alloc_new:
	if (io->bio == NULL) {
		if ((fio->type == DATA || fio->type == NODE) &&
				fio->new_blkaddr & F2FS_IO_SIZE_MASK(sbi)) {
			err = -EAGAIN;
			dec_page_count(sbi, WB_DATA_TYPE(bio_page));
			goto out_fail;
		}
		io->bio = __bio_alloc(sbi, fio->new_blkaddr, fio->io_wbc,
						BIO_MAX_PAGES, false,
						fio->type, fio->temp);
		io->fio = *fio;
	}

	if (bio_add_page(io->bio, bio_page, PAGE_SIZE, 0) < PAGE_SIZE) {
		__submit_merged_bio(io);
		goto alloc_new;
	}

	if (fio->io_wbc)
		wbc_account_io(fio->io_wbc, bio_page, PAGE_SIZE);

	io->last_block_in_bio = fio->new_blkaddr;
	f2fs_trace_ios(fio, 0);

	trace_f2fs_submit_page_write(fio->page, fio);

	if (fio->in_list)
		goto next;
out_fail:
	up_write(&io->io_rwsem);
	return err;
}

static struct bio *f2fs_grab_read_bio(struct inode *inode, block_t blkaddr,
							unsigned nr_pages)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct bio *bio;
	struct bio_post_read_ctx *ctx;
	unsigned int post_read_steps = 0;

	if (!f2fs_is_valid_blkaddr(sbi, blkaddr, DATA_GENERIC))
		return ERR_PTR(-EFAULT);

	bio = f2fs_bio_alloc(sbi, min_t(int, nr_pages, BIO_MAX_PAGES), false);
	if (!bio)
		return ERR_PTR(-ENOMEM);
	f2fs_target_device(sbi, blkaddr, bio);
	bio->bi_end_io = f2fs_read_end_io;
	bio_set_op_attrs(bio, REQ_OP_READ, 0);

	if (f2fs_encrypted_file(inode))
		post_read_steps |= 1 << STEP_DECRYPT;
	if (post_read_steps) {
		ctx = mempool_alloc(bio_post_read_ctx_pool, GFP_NOFS);
		if (!ctx) {
			bio_put(bio);
			return ERR_PTR(-ENOMEM);
		}
		ctx->bio = bio;
		ctx->enabled_steps = post_read_steps;
		bio->bi_private = ctx;

		/* wait for the page to be moved by cleaning */
		f2fs_wait_on_block_writeback(sbi, blkaddr);
	}

	return bio;
}

/* This can handle encryption stuff */
static int f2fs_submit_page_read(struct inode *inode, struct page *page,
							block_t blkaddr)
{
	struct bio *bio = f2fs_grab_read_bio(inode, blkaddr, 1);

	if (IS_ERR(bio))
		return PTR_ERR(bio);

	if (bio_add_page(bio, page, PAGE_SIZE, 0) < PAGE_SIZE) {
		bio_put(bio);
		return -EFAULT;
	}
	__submit_bio(F2FS_I_SB(inode), bio, DATA);
	return 0;
}

static void __set_data_blkaddr(struct dnode_of_data *dn)
{
	struct f2fs_node *rn = F2FS_NODE(dn->node_page);
	__le32 *addr_array;
	int base = 0;

	if (IS_INODE(dn->node_page) && f2fs_has_extra_attr(dn->inode))
		base = get_extra_isize(dn->inode);

	/* Get physical address of data block */
	addr_array = blkaddr_in_node(rn);
	addr_array[base + dn->ofs_in_node] = cpu_to_le32(dn->data_blkaddr);
}

/*
 * Lock ordering for the change of data block address:
 * ->data_page
 *  ->node_page
 *    update block addresses in the node page
 */
void set_data_blkaddr(struct dnode_of_data *dn)
{
	f2fs_wait_on_page_writeback(dn->node_page, NODE, true);
	__set_data_blkaddr(dn);
	if (set_page_dirty(dn->node_page))
		dn->node_changed = true;
}

void f2fs_update_data_blkaddr(struct dnode_of_data *dn, block_t blkaddr)
{
	dn->data_blkaddr = blkaddr;
	set_data_blkaddr(dn);
	f2fs_update_extent_cache(dn);
}

/* dn->ofs_in_node will be returned with up-to-date last block pointer */
int reserve_new_blocks(struct dnode_of_data *dn, blkcnt_t count)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode);
	int err;

	if (!count)
		return 0;

	if (unlikely(is_inode_flag_set(dn->inode, FI_NO_ALLOC)))
		return -EPERM;
	if (unlikely((err = inc_valid_block_count(sbi, dn->inode, &count))))
		return err;

	trace_f2fs_reserve_new_blocks(dn->inode, dn->nid,
						dn->ofs_in_node, count);

	f2fs_wait_on_page_writeback(dn->node_page, NODE, true);

	for (; count > 0; dn->ofs_in_node++) {
		block_t blkaddr = datablock_addr(dn->inode,
					dn->node_page, dn->ofs_in_node);
		if (blkaddr == NULL_ADDR) {
			dn->data_blkaddr = NEW_ADDR;
			__set_data_blkaddr(dn);
			count--;
		}
	}

	if (set_page_dirty(dn->node_page))
		dn->node_changed = true;
	return 0;
}

/* Should keep dn->ofs_in_node unchanged */
int reserve_new_block(struct dnode_of_data *dn)
{
	unsigned int ofs_in_node = dn->ofs_in_node;
	int ret;

	ret = reserve_new_blocks(dn, 1);
	dn->ofs_in_node = ofs_in_node;
	return ret;
}

int f2fs_reserve_block(struct dnode_of_data *dn, pgoff_t index)
{
	bool need_put = dn->inode_page ? false : true;
	int err;

	err = get_dnode_of_data(dn, index, ALLOC_NODE);
	if (err)
		return err;

	if (dn->data_blkaddr == NULL_ADDR)
		err = reserve_new_block(dn);
	if (err || need_put)
		f2fs_put_dnode(dn);
	return err;
}

int f2fs_get_block(struct dnode_of_data *dn, pgoff_t index)
{
	struct extent_info ei = {0, 0, 0};
	struct inode *inode = dn->inode;

	if (f2fs_lookup_extent_cache(inode, index, &ei)) {
		dn->data_blkaddr = ei.blk + index - ei.fofs;
		return 0;
	}

	return f2fs_reserve_block(dn, index);
}

struct page *get_read_data_page(struct inode *inode, pgoff_t index,
						int op_flags, bool for_write)
{
	struct address_space *mapping = inode->i_mapping;
	struct dnode_of_data dn;
	struct page *page;
	struct extent_info ei = {0, 0, 0};
	int err;

	page = f2fs_grab_cache_page(mapping, index, for_write);
	if (!page)
		return ERR_PTR(-ENOMEM);

	if (f2fs_lookup_extent_cache(inode, index, &ei)) {
		dn.data_blkaddr = ei.blk + index - ei.fofs;
		goto got_it;
	}

	set_new_dnode(&dn, inode, NULL, NULL, 0);
	err = get_dnode_of_data(&dn, index, LOOKUP_NODE);
	if (err)
		goto put_err;
	f2fs_put_dnode(&dn);

	if (unlikely(dn.data_blkaddr == NULL_ADDR)) {
		err = -ENOENT;
		goto put_err;
	}
got_it:
	if (PageUptodate(page)) {
		unlock_page(page);
		return page;
	}

	/*
	 * A new dentry page is allocated but not able to be written, since its
	 * new inode page couldn't be allocated due to -ENOSPC.
	 * In such a case, its blkaddr can remain NEW_ADDR.
	 * See f2fs_add_link -> get_new_data_page -> init_inode_metadata.
	 */
	if (dn.data_blkaddr == NEW_ADDR) {
		zero_user_segment(page, 0, PAGE_SIZE);
		if (!PageUptodate(page))
			SetPageUptodate(page);
		unlock_page(page);
		return page;
	}

	err = f2fs_submit_page_read(inode, page, dn.data_blkaddr);
	if (err)
		goto put_err;
	return page;

put_err:
	f2fs_put_page(page, 1);
	return ERR_PTR(err);
}

struct page *find_data_page(struct inode *inode, pgoff_t index)
{
	struct address_space *mapping = inode->i_mapping;
	struct page *page;

	page = find_get_page(mapping, index);
	if (page && PageUptodate(page))
		return page;
	f2fs_put_page(page, 0);

	page = get_read_data_page(inode, index, 0, false);
	if (IS_ERR(page))
		return page;

	if (PageUptodate(page))
		return page;

	wait_on_page_locked(page);
	if (unlikely(!PageUptodate(page))) {
		f2fs_put_page(page, 0);
		return ERR_PTR(-EIO);
	}
	return page;
}

/*
 * If it tries to access a hole, return an error. The callers in dir.c
 * and GC need to be able to tell whether this page exists or not.
 */
struct page *get_lock_data_page(struct inode *inode, pgoff_t index,
							bool for_write)
{
	struct address_space *mapping = inode->i_mapping;
	struct page *page;
repeat:
	page = get_read_data_page(inode, index, 0, for_write);
	if (IS_ERR(page))
		return page;

	/* wait for read completion */
	lock_page(page);
	if (unlikely(page->mapping != mapping)) {
		f2fs_put_page(page, 1);
		goto repeat;
	}
	if (unlikely(!PageUptodate(page))) {
		f2fs_put_page(page, 1);
		return ERR_PTR(-EIO);
	}
	return page;
}

/*
 * Caller ensures that this data page is never allocated.
 * A new zero-filled data page is allocated in the page cache.
 *
 * Also, caller should grab and release a rwsem by calling f2fs_lock_op() and
 * f2fs_unlock_op().
 * Note that ipage is set only by make_empty_dir, and if any error occurs,
 * ipage should be released by this function.
 */
struct page *get_new_data_page(struct inode *inode,
		struct page *ipage, pgoff_t index, bool new_i_size)
{
	struct address_space *mapping = inode->i_mapping;
	struct page *page;
	struct dnode_of_data dn;
	int err;

	page = f2fs_grab_cache_page(mapping, index, true);
	if (!page) {
		/*
		 * before exiting, we should make sure ipage will be released
		 * if any error occurs.
		 */
		f2fs_put_page(ipage, 1);
		return ERR_PTR(-ENOMEM);
	}

	set_new_dnode(&dn, inode, ipage, NULL, 0);
	err = f2fs_reserve_block(&dn, index);
	if (err) {
		f2fs_put_page(page, 1);
		return ERR_PTR(err);
	}
	if (!ipage)
		f2fs_put_dnode(&dn);

	if (PageUptodate(page))
		goto got_it;

	if (dn.data_blkaddr == NEW_ADDR) {
		zero_user_segment(page, 0, PAGE_SIZE);
		if (!PageUptodate(page))
			SetPageUptodate(page);
	} else {
		f2fs_put_page(page, 1);

		/* if ipage exists, blkaddr should be NEW_ADDR */
		f2fs_bug_on(F2FS_I_SB(inode), ipage);
		page = get_lock_data_page(inode, index, true);
		if (IS_ERR(page))
			return page;
	}
got_it:
	if (new_i_size && i_size_read(inode) <
				((loff_t)(index + 1) << PAGE_SHIFT))
		f2fs_i_size_write(inode, ((loff_t)(index + 1) << PAGE_SHIFT));
	return page;
}

static int __allocate_data_block(struct dnode_of_data *dn, int seg_type)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(dn->inode);
	struct f2fs_summary sum;
	struct node_info ni;
	pgoff_t fofs;
	blkcnt_t count = 1;
	int err;

	if (unlikely(is_inode_flag_set(dn->inode, FI_NO_ALLOC)))
		return -EPERM;

	dn->data_blkaddr = datablock_addr(dn->inode,
				dn->node_page, dn->ofs_in_node);
	if (dn->data_blkaddr == NEW_ADDR)
		goto alloc;

	if (unlikely((err = inc_valid_block_count(sbi, dn->inode, &count))))
		return err;

alloc:
	get_node_info(sbi, dn->nid, &ni);
	set_summary(&sum, dn->nid, dn->ofs_in_node, ni.version);

	allocate_data_block(sbi, NULL, dn->data_blkaddr, &dn->data_blkaddr,
					&sum, seg_type, NULL, false);
	set_data_blkaddr(dn);

	/* update i_size */
	fofs = start_bidx_of_node(ofs_of_node(dn->node_page), dn->inode) +
							dn->ofs_in_node;
	if (i_size_read(dn->inode) < ((loff_t)(fofs + 1) << PAGE_SHIFT))
		f2fs_i_size_write(dn->inode,
				((loff_t)(fofs + 1) << PAGE_SHIFT));
	return 0;
}
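
/*
 * Preallocate blocks covering an upcoming write. If preallocation of a
 * buffered write hits -ENOSPC, FI_NO_PREALLOC is set so the write path
 * falls back to allocating blocks one page at a time.
 */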
int f2fs_preallocate_blocks(struct kiocb *iocb, struct iov_iter *from)
{
	struct inode *inode = file_inode(iocb->ki_filp);
	struct f2fs_map_blocks map;
	int flag;
	int err = 0;
	bool direct_io = iocb->ki_flags & IOCB_DIRECT;

	/* convert inline data for Direct I/O */
	if (direct_io) {
		err = f2fs_convert_inline_inode(inode);
		if (err)
			return err;
	}

	if (is_inode_flag_set(inode, FI_NO_PREALLOC))
		return 0;

	map.m_lblk = F2FS_BLK_ALIGN(iocb->ki_pos);
	map.m_len = F2FS_BYTES_TO_BLK(iocb->ki_pos + iov_iter_count(from));
	if (map.m_len > map.m_lblk)
		map.m_len -= map.m_lblk;
	else
		map.m_len = 0;

	map.m_next_pgofs = NULL;
	map.m_next_extent = NULL;
	map.m_seg_type = NO_CHECK_TYPE;

	if (direct_io) {
		map.m_seg_type = rw_hint_to_seg_type(iocb->ki_hint);
		flag = f2fs_force_buffered_io(inode, WRITE) ?
					F2FS_GET_BLOCK_PRE_AIO :
					F2FS_GET_BLOCK_PRE_DIO;
		goto map_blocks;
	}
	if (iocb->ki_pos + iov_iter_count(from) > MAX_INLINE_DATA(inode)) {
		err = f2fs_convert_inline_inode(inode);
		if (err)
			return err;
	}
	if (f2fs_has_inline_data(inode))
		return err;

	flag = F2FS_GET_BLOCK_PRE_AIO;

map_blocks:
	err = f2fs_map_blocks(inode, &map, 1, flag);
	if (map.m_len > 0 && err == -ENOSPC) {
		if (!direct_io)
			set_inode_flag(inode, FI_NO_PREALLOC);
		err = 0;
	}
	return err;
}
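
/*
 * Mapping with F2FS_GET_BLOCK_PRE_AIO serializes against node changes
 * via the shared sbi->node_change lock; every other flag takes the full
 * f2fs_lock_op() / f2fs_unlock_op() pair instead.
 */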
static inline void __do_map_lock(struct f2fs_sb_info *sbi, int flag, bool lock)
{
	if (flag == F2FS_GET_BLOCK_PRE_AIO) {
		if (lock)
			down_read(&sbi->node_change);
		else
			up_read(&sbi->node_change);
	} else {
		if (lock)
			f2fs_lock_op(sbi);
		else
			f2fs_unlock_op(sbi);
	}
}

/*
 * f2fs_map_blocks() now supports readahead/bmap/rw direct IO with the
 * f2fs_map_blocks structure.
 * If original data blocks are allocated, then give them to blockdev.
 * Otherwise,
 *     a. preallocate requested block addresses
 *     b. do not use extent cache for better performance
 *     c. give the block addresses to blockdev
 */
int f2fs_map_blocks(struct inode *inode, struct f2fs_map_blocks *map,
						int create, int flag)
{
	unsigned int maxblocks = map->m_len;
	struct dnode_of_data dn;
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	int mode = create ? ALLOC_NODE : LOOKUP_NODE;
	pgoff_t pgofs, end_offset, end;
	int err = 0, ofs = 1;
	unsigned int ofs_in_node, last_ofs_in_node;
	blkcnt_t prealloc;
	struct extent_info ei = {0, 0, 0};
	block_t blkaddr;
	unsigned int start_pgofs;

	if (!maxblocks)
		return 0;

	map->m_len = 0;
	map->m_flags = 0;

	/* it only supports block size == page size */
	pgofs = (pgoff_t)map->m_lblk;
	end = pgofs + maxblocks;

	if (!create && f2fs_lookup_extent_cache(inode, pgofs, &ei)) {
		map->m_pblk = ei.blk + pgofs - ei.fofs;
		map->m_len = min((pgoff_t)maxblocks, ei.fofs + ei.len - pgofs);
		map->m_flags = F2FS_MAP_MAPPED;
		if (map->m_next_extent)
			*map->m_next_extent = pgofs + map->m_len;
		goto out;
	}

next_dnode:
	if (create)
		__do_map_lock(sbi, flag, true);

	/* When reading holes, we need its node page */
	set_new_dnode(&dn, inode, NULL, NULL, 0);
	err = get_dnode_of_data(&dn, pgofs, mode);
	if (err) {
		if (flag == F2FS_GET_BLOCK_BMAP)
			map->m_pblk = 0;
		if (err == -ENOENT) {
			err = 0;
			if (map->m_next_pgofs)
				*map->m_next_pgofs =
					get_next_page_offset(&dn, pgofs);
			if (map->m_next_extent)
				*map->m_next_extent =
					get_next_page_offset(&dn, pgofs);
		}
		goto unlock_out;
	}

	start_pgofs = pgofs;
	prealloc = 0;
	last_ofs_in_node = ofs_in_node = dn.ofs_in_node;
	end_offset = ADDRS_PER_PAGE(dn.node_page, inode);

next_block:
	blkaddr = datablock_addr(dn.inode, dn.node_page, dn.ofs_in_node);

	if (__is_valid_data_blkaddr(blkaddr) &&
		!f2fs_is_valid_blkaddr(sbi, blkaddr, DATA_GENERIC)) {
		err = -EFSCORRUPTED;
		goto sync_out;
	}

	if (!is_valid_data_blkaddr(sbi, blkaddr)) {
		if (create) {
			if (unlikely(f2fs_cp_error(sbi))) {
				err = -EIO;
				goto sync_out;
			}
			if (flag == F2FS_GET_BLOCK_PRE_AIO) {
				if (blkaddr == NULL_ADDR) {
					prealloc++;
					last_ofs_in_node = dn.ofs_in_node;
				}
			} else {
				err = __allocate_data_block(&dn,
							map->m_seg_type);
				if (!err)
					set_inode_flag(inode, FI_APPEND_WRITE);
			}
			if (err)
				goto sync_out;
			map->m_flags |= F2FS_MAP_NEW;
			blkaddr = dn.data_blkaddr;
		} else {
			if (flag == F2FS_GET_BLOCK_BMAP) {
				map->m_pblk = 0;
				goto sync_out;
			}
			if (flag == F2FS_GET_BLOCK_PRECACHE)
				goto sync_out;
			if (flag == F2FS_GET_BLOCK_FIEMAP &&
						blkaddr == NULL_ADDR) {
				if (map->m_next_pgofs)
					*map->m_next_pgofs = pgofs + 1;
				goto sync_out;
			}
			if (flag != F2FS_GET_BLOCK_FIEMAP) {
				/* for defragment case */
				if (map->m_next_pgofs)
					*map->m_next_pgofs = pgofs + 1;
				goto sync_out;
			}
		}
	}

	if (flag == F2FS_GET_BLOCK_PRE_AIO)
		goto skip;

	if (map->m_len == 0) {
		/* preallocated unwritten block should be mapped for fiemap. */
		if (blkaddr == NEW_ADDR)
			map->m_flags |= F2FS_MAP_UNWRITTEN;
		map->m_flags |= F2FS_MAP_MAPPED;

		map->m_pblk = blkaddr;
		map->m_len = 1;
	} else if ((map->m_pblk != NEW_ADDR &&
			blkaddr == (map->m_pblk + ofs)) ||
			(map->m_pblk == NEW_ADDR && blkaddr == NEW_ADDR) ||
			flag == F2FS_GET_BLOCK_PRE_DIO) {
		ofs++;
		map->m_len++;
	} else {
		goto sync_out;
	}

skip:
	dn.ofs_in_node++;
	pgofs++;

	/* preallocate blocks in batch for one dnode page */
	if (flag == F2FS_GET_BLOCK_PRE_AIO &&
			(pgofs == end || dn.ofs_in_node == end_offset)) {

		dn.ofs_in_node = ofs_in_node;
		err = reserve_new_blocks(&dn, prealloc);
		if (err)
			goto sync_out;

		map->m_len += dn.ofs_in_node - ofs_in_node;
		if (prealloc && dn.ofs_in_node != last_ofs_in_node + 1) {
			err = -ENOSPC;
			goto sync_out;
		}
		dn.ofs_in_node = end_offset;
	}

	if (pgofs >= end)
		goto sync_out;
	else if (dn.ofs_in_node < end_offset)
		goto next_block;

	if (flag == F2FS_GET_BLOCK_PRECACHE) {
		if (map->m_flags & F2FS_MAP_MAPPED) {
			unsigned int ofs = start_pgofs - map->m_lblk;

			f2fs_update_extent_cache_range(&dn,
				start_pgofs, map->m_pblk + ofs,
				map->m_len - ofs);
		}
	}

	f2fs_put_dnode(&dn);

	if (create) {
		__do_map_lock(sbi, flag, false);
		f2fs_balance_fs(sbi, dn.node_changed);
	}
	goto next_dnode;

sync_out:
	if (flag == F2FS_GET_BLOCK_PRECACHE) {
		if (map->m_flags & F2FS_MAP_MAPPED) {
			unsigned int ofs = start_pgofs - map->m_lblk;

			f2fs_update_extent_cache_range(&dn,
				start_pgofs, map->m_pblk + ofs,
				map->m_len - ofs);
		}
		if (map->m_next_extent)
			*map->m_next_extent = pgofs + 1;
	}
	f2fs_put_dnode(&dn);
unlock_out:
	if (create) {
		__do_map_lock(sbi, flag, false);
		f2fs_balance_fs(sbi, dn.node_changed);
	}
out:
	trace_f2fs_map_blocks(inode, map, err);
	return err;
}
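
/*
 * Return true only when every block in [pos, pos + len) is already
 * mapped, i.e. the range can be overwritten without allocating blocks.
 */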
bool f2fs_overwrite_io(struct inode *inode, loff_t pos, size_t len)
{
	struct f2fs_map_blocks map;
	block_t last_lblk;
	int err;

	if (pos + len > i_size_read(inode))
		return false;

	map.m_lblk = F2FS_BYTES_TO_BLK(pos);
	map.m_next_pgofs = NULL;
	map.m_next_extent = NULL;
	map.m_seg_type = NO_CHECK_TYPE;
	last_lblk = F2FS_BLK_ALIGN(pos + len);

	while (map.m_lblk < last_lblk) {
		map.m_len = last_lblk - map.m_lblk;
		err = f2fs_map_blocks(inode, &map, 0, F2FS_GET_BLOCK_DEFAULT);
		if (err || map.m_len == 0)
			return false;
		map.m_lblk += map.m_len;
	}
	return true;
}

static int __get_data_block(struct inode *inode, sector_t iblock,
			struct buffer_head *bh, int create, int flag,
			pgoff_t *next_pgofs, int seg_type)
{
	struct f2fs_map_blocks map;
	int err;

	map.m_lblk = iblock;
	map.m_len = bh->b_size >> inode->i_blkbits;
	map.m_next_pgofs = next_pgofs;
	map.m_next_extent = NULL;
	map.m_seg_type = seg_type;

	err = f2fs_map_blocks(inode, &map, create, flag);
	if (!err) {
		map_bh(bh, inode->i_sb, map.m_pblk);
		bh->b_state = (bh->b_state & ~F2FS_MAP_FLAGS) | map.m_flags;
		bh->b_size = (u64)map.m_len << inode->i_blkbits;
	}
	return err;
}

static int get_data_block(struct inode *inode, sector_t iblock,
			struct buffer_head *bh_result, int create, int flag,
			pgoff_t *next_pgofs)
{
	return __get_data_block(inode, iblock, bh_result, create,
							flag, next_pgofs,
							NO_CHECK_TYPE);
}

static int get_data_block_dio(struct inode *inode, sector_t iblock,
			struct buffer_head *bh_result, int create)
{
	return __get_data_block(inode, iblock, bh_result, create,
						F2FS_GET_BLOCK_DEFAULT, NULL,
						rw_hint_to_seg_type(
							inode->i_write_hint));
}

static int get_data_block_bmap(struct inode *inode, sector_t iblock,
			struct buffer_head *bh_result, int create)
{
	/* Block number less than F2FS MAX BLOCKS */
	if (unlikely(iblock >= F2FS_I_SB(inode)->max_file_blocks))
		return -EFBIG;

	return __get_data_block(inode, iblock, bh_result, create,
						F2FS_GET_BLOCK_BMAP, NULL,
						NO_CHECK_TYPE);
}

static inline sector_t logical_to_blk(struct inode *inode, loff_t offset)
{
	return (offset >> inode->i_blkbits);
}

static inline loff_t blk_to_logical(struct inode *inode, sector_t blk)
{
	return (blk << inode->i_blkbits);
}

static int f2fs_xattr_fiemap(struct inode *inode,
				struct fiemap_extent_info *fieinfo)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct page *page;
	struct node_info ni;
	__u64 phys = 0, len;
	__u32 flags;
	nid_t xnid = F2FS_I(inode)->i_xattr_nid;
	int err = 0;

	if (f2fs_has_inline_xattr(inode)) {
		int offset;

		page = f2fs_grab_cache_page(NODE_MAPPING(sbi),
						inode->i_ino, false);
		if (!page)
			return -ENOMEM;

		get_node_info(sbi, inode->i_ino, &ni);

		phys = (__u64)blk_to_logical(inode, ni.blk_addr);
		offset = offsetof(struct f2fs_inode, i_addr) +
					sizeof(__le32) * (DEF_ADDRS_PER_INODE -
					get_inline_xattr_addrs(inode));

		phys += offset;
		len = inline_xattr_size(inode);

		f2fs_put_page(page, 1);

		flags = FIEMAP_EXTENT_DATA_INLINE | FIEMAP_EXTENT_NOT_ALIGNED;

		if (!xnid)
			flags |= FIEMAP_EXTENT_LAST;

		err = fiemap_fill_next_extent(fieinfo, 0, phys, len, flags);
		if (err || err == 1)
			return err;
	}

	if (xnid) {
		page = f2fs_grab_cache_page(NODE_MAPPING(sbi), xnid, false);
		if (!page)
			return -ENOMEM;

		get_node_info(sbi, xnid, &ni);

		phys = (__u64)blk_to_logical(inode, ni.blk_addr);
		len = inode->i_sb->s_blocksize;

		f2fs_put_page(page, 1);

		flags = FIEMAP_EXTENT_LAST;
	}

	if (phys)
		err = fiemap_fill_next_extent(fieinfo, 0, phys, len, flags);

	return (err < 0 ? err : 0);
}

int f2fs_fiemap(struct inode *inode, struct fiemap_extent_info *fieinfo,
		u64 start, u64 len)
{
	struct buffer_head map_bh;
	sector_t start_blk, last_blk;
	pgoff_t next_pgofs;
	u64 logical = 0, phys = 0, size = 0;
	u32 flags = 0;
	int ret = 0;

	if (fieinfo->fi_flags & FIEMAP_FLAG_CACHE) {
		ret = f2fs_precache_extents(inode);
		if (ret)
			return ret;
	}

	ret = fiemap_check_flags(fieinfo, FIEMAP_FLAG_SYNC | FIEMAP_FLAG_XATTR);
	if (ret)
		return ret;

	inode_lock(inode);

	if (fieinfo->fi_flags & FIEMAP_FLAG_XATTR) {
		ret = f2fs_xattr_fiemap(inode, fieinfo);
		goto out;
	}

	if (f2fs_has_inline_data(inode)) {
		ret = f2fs_inline_data_fiemap(inode, fieinfo, start, len);
		if (ret != -EAGAIN)
			goto out;
	}

	if (logical_to_blk(inode, len) == 0)
		len = blk_to_logical(inode, 1);

	start_blk = logical_to_blk(inode, start);
	last_blk = logical_to_blk(inode, start + len - 1);

next:
	memset(&map_bh, 0, sizeof(struct buffer_head));
	map_bh.b_size = len;

	ret = get_data_block(inode, start_blk, &map_bh, 0,
					F2FS_GET_BLOCK_FIEMAP, &next_pgofs);
	if (ret)
		goto out;

	/* HOLE */
	if (!buffer_mapped(&map_bh)) {
		start_blk = next_pgofs;

		if (blk_to_logical(inode, start_blk) < blk_to_logical(inode,
					F2FS_I_SB(inode)->max_file_blocks))
			goto prep_next;

		flags |= FIEMAP_EXTENT_LAST;
	}

	if (size) {
		if (f2fs_encrypted_inode(inode))
			flags |= FIEMAP_EXTENT_DATA_ENCRYPTED;

		ret = fiemap_fill_next_extent(fieinfo, logical,
				phys, size, flags);
	}

	if (start_blk > last_blk || ret)
		goto out;

	logical = blk_to_logical(inode, start_blk);
	phys = blk_to_logical(inode, map_bh.b_blocknr);
	size = map_bh.b_size;
	flags = 0;
	if (buffer_unwritten(&map_bh))
		flags = FIEMAP_EXTENT_UNWRITTEN;

	start_blk += logical_to_blk(inode, size);

prep_next:
	cond_resched();
	if (fatal_signal_pending(current))
		ret = -EINTR;
	else
		goto next;
out:
	if (ret == 1)
		ret = 0;

	inode_unlock(inode);
	return ret;
}

/*
 * This function was originally taken from fs/mpage.c, and customized for f2fs.
 * The major change is that it relies on block_size == page_size, which is
 * the f2fs default.
 */
static int f2fs_mpage_readpages(struct address_space *mapping,
			struct list_head *pages, struct page *page,
			unsigned nr_pages)
{
	struct bio *bio = NULL;
	sector_t last_block_in_bio = 0;
	struct inode *inode = mapping->host;
	const unsigned blkbits = inode->i_blkbits;
	const unsigned blocksize = 1 << blkbits;
	sector_t block_in_file;
	sector_t last_block;
	sector_t last_block_in_file;
	sector_t block_nr;
	struct f2fs_map_blocks map;

	map.m_pblk = 0;
	map.m_lblk = 0;
	map.m_len = 0;
	map.m_flags = 0;
	map.m_next_pgofs = NULL;
	map.m_next_extent = NULL;
	map.m_seg_type = NO_CHECK_TYPE;

	for (; nr_pages; nr_pages--) {
		if (pages) {
			page = list_last_entry(pages, struct page, lru);

			prefetchw(&page->flags);
			list_del(&page->lru);
			if (add_to_page_cache_lru(page, mapping,
						page->index,
						readahead_gfp_mask(mapping)))
				goto next_page;
		}

		block_in_file = (sector_t)page->index;
		last_block = block_in_file + nr_pages;
		last_block_in_file = (i_size_read(inode) + blocksize - 1) >>
								blkbits;
		if (last_block > last_block_in_file)
			last_block = last_block_in_file;

		/*
		 * Map blocks using the previous result first.
		 */
		if ((map.m_flags & F2FS_MAP_MAPPED) &&
				block_in_file > map.m_lblk &&
				block_in_file < (map.m_lblk + map.m_len))
			goto got_it;

		/*
		 * Then do more f2fs_map_blocks() calls until we are
		 * done with this page.
		 */
		map.m_flags = 0;

		if (block_in_file < last_block) {
			map.m_lblk = block_in_file;
			map.m_len = last_block - block_in_file;

			if (f2fs_map_blocks(inode, &map, 0,
						F2FS_GET_BLOCK_DEFAULT))
				goto set_error_page;
		}
got_it:
		if ((map.m_flags & F2FS_MAP_MAPPED)) {
			block_nr = map.m_pblk + block_in_file - map.m_lblk;
			SetPageMappedToDisk(page);

			if (!PageUptodate(page) && !cleancache_get_page(page)) {
				SetPageUptodate(page);
				goto confused;
			}

			if (!f2fs_is_valid_blkaddr(F2FS_I_SB(inode), block_nr,
								DATA_GENERIC))
				goto set_error_page;
		} else {
			zero_user_segment(page, 0, PAGE_SIZE);
			if (!PageUptodate(page))
				SetPageUptodate(page);
			unlock_page(page);
			goto next_page;
		}

		/*
		 * This page will go to BIO. Do we need to send this
		 * BIO off first?
		 */
		if (bio && (last_block_in_bio != block_nr - 1 ||
			!__same_bdev(F2FS_I_SB(inode), block_nr, bio))) {
submit_and_realloc:
			__submit_bio(F2FS_I_SB(inode), bio, DATA);
			bio = NULL;
		}
		if (bio == NULL) {
			bio = f2fs_grab_read_bio(inode, block_nr, nr_pages);
			if (IS_ERR(bio)) {
				bio = NULL;
				goto set_error_page;
			}
		}

		if (bio_add_page(bio, page, blocksize, 0) < blocksize)
			goto submit_and_realloc;

		last_block_in_bio = block_nr;
		goto next_page;
set_error_page:
		SetPageError(page);
		zero_user_segment(page, 0, PAGE_SIZE);
		unlock_page(page);
		goto next_page;
confused:
		if (bio) {
			__submit_bio(F2FS_I_SB(inode), bio, DATA);
			bio = NULL;
		}
		unlock_page(page);
next_page:
		if (pages)
			put_page(page);
	}
	BUG_ON(pages && !list_empty(pages));
	if (bio)
		__submit_bio(F2FS_I_SB(inode), bio, DATA);
	return 0;
}

static int f2fs_read_data_page(struct file *file, struct page *page)
{
	struct inode *inode = page->mapping->host;
	int ret = -EAGAIN;

	trace_f2fs_readpage(page, DATA);

	/* If the file has inline data, try to read it directly */
	if (f2fs_has_inline_data(inode))
		ret = f2fs_read_inline_data(inode, page);
	if (ret == -EAGAIN)
		ret = f2fs_mpage_readpages(page->mapping, NULL, page, 1);
	return ret;
}

static int f2fs_read_data_pages(struct file *file,
			struct address_space *mapping,
			struct list_head *pages, unsigned nr_pages)
{
	struct inode *inode = mapping->host;
	struct page *page = list_last_entry(pages, struct page, lru);

	trace_f2fs_readpages(inode, page, nr_pages);

	/* If the file has inline data, skip readpages */
	if (f2fs_has_inline_data(inode))
		return 0;

	return f2fs_mpage_readpages(mapping, pages, NULL, nr_pages);
}

static int encrypt_one_page(struct f2fs_io_info *fio)
{
	struct inode *inode = fio->page->mapping->host;
	gfp_t gfp_flags = GFP_NOFS;

	if (!f2fs_encrypted_file(inode))
		return 0;

	/* wait for GCed page writeback via META_MAPPING */
	f2fs_wait_on_block_writeback(fio->sbi, fio->old_blkaddr);

retry_encrypt:
	fio->encrypted_page = fscrypt_encrypt_page(inode, fio->page,
			PAGE_SIZE, 0, fio->page->index, gfp_flags);
	if (!IS_ERR(fio->encrypted_page))
		return 0;

	/* flush pending IOs and wait for a while in the ENOMEM case */
	if (PTR_ERR(fio->encrypted_page) == -ENOMEM) {
		f2fs_flush_merged_writes(fio->sbi);
		congestion_wait(BLK_RW_ASYNC, HZ/50);
		gfp_flags |= __GFP_NOFAIL;
		goto retry_encrypt;
	}
	return PTR_ERR(fio->encrypted_page);
}

static inline bool check_inplace_update_policy(struct inode *inode,
				struct f2fs_io_info *fio)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	unsigned int policy = SM_I(sbi)->ipu_policy;

	if (policy & (0x1 << F2FS_IPU_FORCE))
		return true;
	if (policy & (0x1 << F2FS_IPU_SSR) && need_SSR(sbi))
		return true;
	if (policy & (0x1 << F2FS_IPU_UTIL) &&
			utilization(sbi) > SM_I(sbi)->min_ipu_util)
		return true;
	if (policy & (0x1 << F2FS_IPU_SSR_UTIL) && need_SSR(sbi) &&
			utilization(sbi) > SM_I(sbi)->min_ipu_util)
		return true;

	/*
	 * IPU for rewrite async pages
	 */
	if (policy & (0x1 << F2FS_IPU_ASYNC) &&
			fio && fio->op == REQ_OP_WRITE &&
			!(fio->op_flags & REQ_SYNC) &&
			!f2fs_encrypted_inode(inode))
		return true;

	/* this is only set during fdatasync */
	if (policy & (0x1 << F2FS_IPU_FSYNC) &&
			is_inode_flag_set(inode, FI_NEED_IPU))
		return true;

	return false;
}

bool should_update_inplace(struct inode *inode, struct f2fs_io_info *fio)
{
	if (f2fs_is_pinned_file(inode))
		return true;

	/* if this is cold file, we should overwrite to avoid fragmentation */
	if (file_is_cold(inode))
		return true;

	return check_inplace_update_policy(inode, fio);
}

bool should_update_outplace(struct inode *inode, struct f2fs_io_info *fio)
{
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);

	if (test_opt(sbi, LFS))
		return true;
	if (S_ISDIR(inode->i_mode))
		return true;
	if (f2fs_is_atomic_file(inode))
		return true;
	if (fio) {
		if (is_cold_data(fio->page))
			return true;
		if (IS_ATOMIC_WRITTEN_PAGE(fio->page))
			return true;
	}
	return false;
}
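
/*
 * The out-of-place conditions above (LFS mode, directories, atomic
 * files, cold or atomic-written pages) take precedence over the
 * in-place-update policy checked in check_inplace_update_policy().
 */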
static inline bool need_inplace_update(struct f2fs_io_info *fio)
{
	struct inode *inode = fio->page->mapping->host;

	if (should_update_outplace(inode, fio))
		return false;

	return should_update_inplace(inode, fio);
}

int do_write_data_page(struct f2fs_io_info *fio)
{
	struct page *page = fio->page;
	struct inode *inode = page->mapping->host;
	struct dnode_of_data dn;
	struct extent_info ei = {0, 0, 0};
	bool ipu_force = false;
	int err = 0;

	set_new_dnode(&dn, inode, NULL, NULL, 0);
	if (need_inplace_update(fio) &&
			f2fs_lookup_extent_cache(inode, page->index, &ei)) {
		fio->old_blkaddr = ei.blk + page->index - ei.fofs;

		if (!f2fs_is_valid_blkaddr(fio->sbi, fio->old_blkaddr,
							DATA_GENERIC))
			return -EFSCORRUPTED;

		ipu_force = true;
		fio->need_lock = LOCK_DONE;
		goto got_it;
	}

	/* trylock to avoid a deadlock between page->lock and f2fs_lock_op */
	if (fio->need_lock == LOCK_REQ && !f2fs_trylock_op(fio->sbi))
		return -EAGAIN;

	err = get_dnode_of_data(&dn, page->index, LOOKUP_NODE);
	if (err)
		goto out;

	fio->old_blkaddr = dn.data_blkaddr;

	/* This page is already truncated */
	if (fio->old_blkaddr == NULL_ADDR) {
		ClearPageUptodate(page);
		clear_cold_data(page);
		goto out_writepage;
	}
got_it:
	if (__is_valid_data_blkaddr(fio->old_blkaddr) &&
		!f2fs_is_valid_blkaddr(fio->sbi, fio->old_blkaddr,
							DATA_GENERIC)) {
		err = -EFSCORRUPTED;
		goto out_writepage;
	}
	/*
	 * If the current allocation needs SSR, it is better to write the
	 * updated data in place.
	 */
	if (ipu_force || (is_valid_data_blkaddr(fio->sbi, fio->old_blkaddr) &&
					need_inplace_update(fio))) {
		err = encrypt_one_page(fio);
		if (err)
			goto out_writepage;

		set_page_writeback(page);
		ClearPageError(page);
		f2fs_put_dnode(&dn);
		if (fio->need_lock == LOCK_REQ)
			f2fs_unlock_op(fio->sbi);
		err = rewrite_data_page(fio);
		trace_f2fs_do_write_data_page(fio->page, IPU);
		set_inode_flag(inode, FI_UPDATE_WRITE);
		return err;
	}

	if (fio->need_lock == LOCK_RETRY) {
		if (!f2fs_trylock_op(fio->sbi)) {
			err = -EAGAIN;
			goto out_writepage;
		}
		fio->need_lock = LOCK_REQ;
	}

	err = encrypt_one_page(fio);
	if (err)
		goto out_writepage;

	set_page_writeback(page);
	ClearPageError(page);

	/* LFS mode write path */
	write_data_page(&dn, fio);
	trace_f2fs_do_write_data_page(page, OPU);
	set_inode_flag(inode, FI_APPEND_WRITE);
	if (page->index == 0)
		set_inode_flag(inode, FI_FIRST_BLOCK_WRITTEN);
out_writepage:
	f2fs_put_dnode(&dn);
out:
	if (fio->need_lock == LOCK_REQ)
		f2fs_unlock_op(fio->sbi);
	return err;
}
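
/*
 * Write one dirty data page. On success *submitted reports whether a
 * bio was actually queued; when the page is redirtied this returns
 * AOP_WRITEPAGE_ACTIVATE so pageout() keeps the page instead of
 * treating the redirty as a write error.
 */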
static int __write_data_page(struct page *page, bool *submitted,
				struct writeback_control *wbc,
				enum iostat_type io_type)
{
	struct inode *inode = page->mapping->host;
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	loff_t i_size = i_size_read(inode);
	const pgoff_t end_index = ((unsigned long long) i_size)
							>> PAGE_SHIFT;
	loff_t psize = (loff_t)(page->index + 1) << PAGE_SHIFT;
	unsigned offset = 0;
	bool need_balance_fs = false;
	int err = 0;
	struct f2fs_io_info fio = {
		.sbi = sbi,
		.ino = inode->i_ino,
		.type = DATA,
		.op = REQ_OP_WRITE,
		.op_flags = wbc_to_write_flags(wbc),
		.old_blkaddr = NULL_ADDR,
		.page = page,
		.encrypted_page = NULL,
		.submitted = false,
		.need_lock = LOCK_RETRY,
		.io_type = io_type,
		.io_wbc = wbc,
	};

	trace_f2fs_writepage(page, DATA);

	/* we should bypass data pages to let the kworker jobs proceed */
	if (unlikely(f2fs_cp_error(sbi))) {
		mapping_set_error(page->mapping, -EIO);
		goto out;
	}

	if (unlikely(is_sbi_flag_set(sbi, SBI_POR_DOING)))
		goto redirty_out;

	if (page->index < end_index)
		goto write;

	/*
	 * If the offset is out-of-range of file size,
	 * this page does not have to be written to disk.
	 */
	offset = i_size & (PAGE_SIZE - 1);
	if ((page->index >= end_index + 1) || !offset)
		goto out;

	zero_user_segment(page, offset, PAGE_SIZE);
write:
	if (f2fs_is_drop_cache(inode))
		goto out;
	/* we should not write 0'th page having journal header */
	if (f2fs_is_volatile_file(inode) && (!page->index ||
			(!wbc->for_reclaim &&
			available_free_memory(sbi, BASE_CHECK))))
		goto redirty_out;

	/* Dentry blocks are controlled by checkpoint */
	if (S_ISDIR(inode->i_mode)) {
		fio.need_lock = LOCK_DONE;
		err = do_write_data_page(&fio);
		goto done;
	}

	if (!wbc->for_reclaim)
		need_balance_fs = true;
	else if (has_not_enough_free_secs(sbi, 0, 0))
		goto redirty_out;
	else
		set_inode_flag(inode, FI_HOT_DATA);

	err = -EAGAIN;
	if (f2fs_has_inline_data(inode)) {
		err = f2fs_write_inline_data(inode, page);
		if (!err)
			goto out;
	}

	if (err == -EAGAIN) {
		err = do_write_data_page(&fio);
		if (err == -EAGAIN) {
			fio.need_lock = LOCK_REQ;
			err = do_write_data_page(&fio);
		}
	}

	if (err) {
		file_set_keep_isize(inode);
	} else {
		down_write(&F2FS_I(inode)->i_sem);
		if (F2FS_I(inode)->last_disk_size < psize)
			F2FS_I(inode)->last_disk_size = psize;
		up_write(&F2FS_I(inode)->i_sem);
	}

done:
	if (err && err != -ENOENT)
		goto redirty_out;

out:
	inode_dec_dirty_pages(inode);
	if (err) {
		ClearPageUptodate(page);
		clear_cold_data(page);
	}

	if (wbc->for_reclaim) {
		f2fs_submit_merged_write_cond(sbi, inode, 0, page->index, DATA);
		clear_inode_flag(inode, FI_HOT_DATA);
		remove_dirty_inode(inode);
		submitted = NULL;
	}

	unlock_page(page);
	if (!S_ISDIR(inode->i_mode))
		f2fs_balance_fs(sbi, need_balance_fs);

	if (unlikely(f2fs_cp_error(sbi))) {
		f2fs_submit_merged_write(sbi, DATA);
		submitted = NULL;
	}

	if (submitted)
		*submitted = fio.submitted;

	return 0;

redirty_out:
	redirty_page_for_writepage(wbc, page);
	/*
	 * pageout() in MM translates EAGAIN, so calls handle_write_error()
	 * -> mapping_set_error() -> set_bit(AS_EIO, ...).
	 * file_write_and_wait_range() will see EIO error, which is critical
	 * to return value of fsync() followed by atomic_write failure to user.
	 */
	if (!err || wbc->for_reclaim)
		return AOP_WRITEPAGE_ACTIVATE;
	unlock_page(page);
	return err;
}

static int f2fs_write_data_page(struct page *page,
				struct writeback_control *wbc)
{
	return __write_data_page(page, NULL, wbc, FS_DATA_IO);
}

/*
 * This function was copied from write_cache_pages in mm/page-writeback.c.
 * The major change is making the write step for cold data pages separate
 * from warm/hot data pages.
 */
static int f2fs_write_cache_pages(struct address_space *mapping,
					struct writeback_control *wbc,
					enum iostat_type io_type)
{
	int ret = 0;
	int done = 0;
	struct pagevec pvec;
	int nr_pages;
	pgoff_t uninitialized_var(writeback_index);
	pgoff_t index;
	pgoff_t end;		/* Inclusive */
	pgoff_t done_index;
	pgoff_t last_idx = ULONG_MAX;
	int cycled;
	int range_whole = 0;
	int tag;

	pagevec_init(&pvec, 0);

	if (get_dirty_pages(mapping->host) <=
				SM_I(F2FS_M_SB(mapping))->min_hot_blocks)
		set_inode_flag(mapping->host, FI_HOT_DATA);
	else
		clear_inode_flag(mapping->host, FI_HOT_DATA);

	if (wbc->range_cyclic) {
		writeback_index = mapping->writeback_index; /* prev offset */
		index = writeback_index;
		if (index == 0)
			cycled = 1;
		else
			cycled = 0;
		end = -1;
	} else {
		index = wbc->range_start >> PAGE_SHIFT;
		end = wbc->range_end >> PAGE_SHIFT;
		if (wbc->range_start == 0 && wbc->range_end == LLONG_MAX)
			range_whole = 1;
		cycled = 1; /* ignore range_cyclic tests */
	}
	if (wbc->sync_mode == WB_SYNC_ALL || wbc->tagged_writepages)
		tag = PAGECACHE_TAG_TOWRITE;
	else
		tag = PAGECACHE_TAG_DIRTY;
retry:
	if (wbc->sync_mode == WB_SYNC_ALL || wbc->tagged_writepages)
		tag_pages_for_writeback(mapping, index, end);
	done_index = index;
	while (!done && (index <= end)) {
		int i;

		nr_pages = pagevec_lookup_tag(&pvec, mapping, &index, tag,
			min(end - index, (pgoff_t)PAGEVEC_SIZE - 1) + 1);
		if (nr_pages == 0)
			break;

		for (i = 0; i < nr_pages; i++) {
			struct page *page = pvec.pages[i];
			bool submitted = false;

			if (page->index > end) {
				done = 1;
				break;
			}

			done_index = page->index;
retry_write:
			lock_page(page);

			if (unlikely(page->mapping != mapping)) {
continue_unlock:
				unlock_page(page);
				continue;
			}

			if (!PageDirty(page)) {
				/* someone wrote it for us */
				goto continue_unlock;
			}

			if (PageWriteback(page)) {
				if (wbc->sync_mode != WB_SYNC_NONE)
					f2fs_wait_on_page_writeback(page,
								DATA, true);
				else
					goto continue_unlock;
			}

			BUG_ON(PageWriteback(page));
			if (!clear_page_dirty_for_io(page))
				goto continue_unlock;

			ret = __write_data_page(page, &submitted, wbc, io_type);
			if (unlikely(ret)) {
				/*
				 * keep nr_to_write, since vfs uses this to
				 * get # of written pages.
				 */
				if (ret == AOP_WRITEPAGE_ACTIVATE) {
					unlock_page(page);
					ret = 0;
					continue;
				} else if (ret == -EAGAIN) {
					ret = 0;
					if (wbc->sync_mode == WB_SYNC_ALL) {
						cond_resched();
						congestion_wait(BLK_RW_ASYNC,
									HZ/50);
						goto retry_write;
					}
					continue;
				}
				done_index = page->index + 1;
				done = 1;
				break;
			} else if (submitted) {
				last_idx = page->index;
			}

			/* give a priority to WB_SYNC threads */
			if ((atomic_read(&F2FS_M_SB(mapping)->wb_sync_req) ||
					--wbc->nr_to_write <= 0) &&
					wbc->sync_mode == WB_SYNC_NONE) {
				done = 1;
				break;
			}
		}
		pagevec_release(&pvec);
		cond_resched();
	}

	if (!cycled && !done) {
		cycled = 1;
		index = 0;
		end = writeback_index - 1;
		goto retry;
	}
	if (wbc->range_cyclic || (range_whole && wbc->nr_to_write > 0))
		mapping->writeback_index = done_index;

	if (last_idx != ULONG_MAX)
		f2fs_submit_merged_write_cond(F2FS_M_SB(mapping), mapping->host,
						0, last_idx, DATA);

	return ret;
}

int __f2fs_write_data_pages(struct address_space *mapping,
				struct writeback_control *wbc,
				enum iostat_type io_type)
{
	struct inode *inode = mapping->host;
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct blk_plug plug;
	int ret;

	/* deal with chardevs and other special files */
	if (!mapping->a_ops->writepage)
		return 0;

	/* skip writing if there is no dirty page in this inode */
	if (!get_dirty_pages(inode) && wbc->sync_mode == WB_SYNC_NONE)
		return 0;

	/* during POR, we don't need to trigger writepage at all. */
	if (unlikely(is_sbi_flag_set(sbi, SBI_POR_DOING)))
		goto skip_write;

	if (S_ISDIR(inode->i_mode) && wbc->sync_mode == WB_SYNC_NONE &&
			get_dirty_pages(inode) < nr_pages_to_skip(sbi, DATA) &&
			available_free_memory(sbi, DIRTY_DENTS))
		goto skip_write;

	/* skip writing during file defragment */
	if (is_inode_flag_set(inode, FI_DO_DEFRAG))
		goto skip_write;

	trace_f2fs_writepages(mapping->host, wbc, DATA);

	/* to avoid splitting IOs due to mixed WB_SYNC_ALL and WB_SYNC_NONE */
	if (wbc->sync_mode == WB_SYNC_ALL)
		atomic_inc(&sbi->wb_sync_req);
	else if (atomic_read(&sbi->wb_sync_req))
		goto skip_write;

	blk_start_plug(&plug);
	ret = f2fs_write_cache_pages(mapping, wbc, io_type);
	blk_finish_plug(&plug);

	if (wbc->sync_mode == WB_SYNC_ALL)
		atomic_dec(&sbi->wb_sync_req);
	/*
	 * if some pages were truncated, we cannot guarantee that their
	 * mapping->host can detect pending bios.
	 */

	remove_dirty_inode(inode);
	return ret;

skip_write:
	wbc->pages_skipped += get_dirty_pages(inode);
	trace_f2fs_writepages(mapping->host, wbc, DATA);
	return 0;
}
2159
static int f2fs_write_data_pages(struct address_space *mapping,
			    struct writeback_control *wbc)
{
	struct inode *inode = mapping->host;

	return __f2fs_write_data_pages(mapping, wbc,
			F2FS_I(inode)->cp_task == current ?
			FS_CP_DATA_IO : FS_DATA_IO);
}

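/*
 * Undo the page-cache side effects of a failed or short write: anything
 * instantiated beyond the on-disk i_size is dropped from the page cache
 * and the preallocated blocks behind it are truncated away.
 */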
static void f2fs_write_failed(struct address_space *mapping, loff_t to)
{
	struct inode *inode = mapping->host;
	loff_t i_size = i_size_read(inode);

	if (to > i_size) {
		down_write(&F2FS_I(inode)->i_mmap_sem);
		truncate_pagecache(inode, i_size);
		truncate_blocks(inode, i_size, true);
		up_write(&F2FS_I(inode)->i_mmap_sem);
	}
}

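/*
 * Resolve the block address backing the page about to be written.
 * Roughly: fully-overwritten, preallocated pages need no lookup at all;
 * inline-data inodes either keep the write inline or get converted to a
 * regular block; everything else is resolved through the extent cache
 * or the dnode, taking the map lock only when a hole may need to be
 * filled.
 */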
static int prepare_write_begin(struct f2fs_sb_info *sbi,
			struct page *page, loff_t pos, unsigned len,
			block_t *blk_addr, bool *node_changed)
{
	struct inode *inode = page->mapping->host;
	pgoff_t index = page->index;
	struct dnode_of_data dn;
	struct page *ipage;
	bool locked = false;
	struct extent_info ei = {0, 0, 0};
	int err = 0;
	int flag;

	/*
	 * We have already allocated all the blocks, so we don't need to
	 * look up the block addresses when there is no need to fill the
	 * page.
	 */
	if (!f2fs_has_inline_data(inode) && len == PAGE_SIZE &&
			!is_inode_flag_set(inode, FI_NO_PREALLOC))
		return 0;

	/* f2fs_lock_op avoids race between write CP and convert_inline_page */
	if (f2fs_has_inline_data(inode) && pos + len > MAX_INLINE_DATA(inode))
		flag = F2FS_GET_BLOCK_DEFAULT;
	else
		flag = F2FS_GET_BLOCK_PRE_AIO;

	if (f2fs_has_inline_data(inode) ||
			(pos & PAGE_MASK) >= i_size_read(inode)) {
		__do_map_lock(sbi, flag, true);
		locked = true;
	}
restart:
	/* check inline_data */
	ipage = get_node_page(sbi, inode->i_ino);
	if (IS_ERR(ipage)) {
		err = PTR_ERR(ipage);
		goto unlock_out;
	}

	set_new_dnode(&dn, inode, ipage, ipage, 0);

	if (f2fs_has_inline_data(inode)) {
		if (pos + len <= MAX_INLINE_DATA(inode)) {
			read_inline_data(page, ipage);
			set_inode_flag(inode, FI_DATA_EXIST);
			if (inode->i_nlink)
				set_inline_node(ipage);
		} else {
			err = f2fs_convert_inline_page(&dn, page);
			if (err)
				goto out;
			if (dn.data_blkaddr == NULL_ADDR)
				err = f2fs_get_block(&dn, index);
		}
	} else if (locked) {
		err = f2fs_get_block(&dn, index);
	} else {
		if (f2fs_lookup_extent_cache(inode, index, &ei)) {
			dn.data_blkaddr = ei.blk + index - ei.fofs;
		} else {
			/* hole case */
			err = get_dnode_of_data(&dn, index, LOOKUP_NODE);
			if (err || dn.data_blkaddr == NULL_ADDR) {
				f2fs_put_dnode(&dn);
				__do_map_lock(sbi, F2FS_GET_BLOCK_PRE_AIO,
								true);
				WARN_ON(flag != F2FS_GET_BLOCK_PRE_AIO);
				locked = true;
				goto restart;
			}
		}
	}

	/* convert_inline_page can make node_changed */
	*blk_addr = dn.data_blkaddr;
	*node_changed = dn.node_changed;
out:
	f2fs_put_dnode(&dn);
unlock_out:
	if (locked)
		__do_map_lock(sbi, flag, false);
	return err;
}

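/*
 * ->write_begin() for data pages. The broad flow: convert inline data
 * when writing anywhere but page #0 (to honor the page-lock ordering
 * described below), grab and map the target page, rebalance free
 * segments if the node tree changed, and finally bring the page
 * uptodate, either by zeroing a freshly allocated block or by reading
 * the old one in.
 */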
static int f2fs_write_begin(struct file *file, struct address_space *mapping,
		loff_t pos, unsigned len, unsigned flags,
		struct page **pagep, void **fsdata)
{
	struct inode *inode = mapping->host;
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	struct page *page = NULL;
	pgoff_t index = ((unsigned long long) pos) >> PAGE_SHIFT;
	bool need_balance = false, drop_atomic = false;
	block_t blkaddr = NULL_ADDR;
	int err = 0;

	if (trace_android_fs_datawrite_start_enabled()) {
		char *path, pathbuf[MAX_TRACE_PATHBUF_LEN];

		path = android_fstrace_get_pathname(pathbuf,
						    MAX_TRACE_PATHBUF_LEN,
						    inode);
		trace_android_fs_datawrite_start(inode, pos, len,
						 current->pid, path,
						 current->comm);
	}
	trace_f2fs_write_begin(inode, pos, len, flags);

	if (f2fs_is_atomic_file(inode) &&
			!available_free_memory(sbi, INMEM_PAGES)) {
		err = -ENOMEM;
		drop_atomic = true;
		goto fail;
	}

	/*
	 * We must check this here to avoid a deadlock between the inode
	 * page and page #0. The locking rule for inline_data conversion
	 * is: lock_page(page #0) -> lock_page(inode_page)
	 */
	if (index != 0) {
		err = f2fs_convert_inline_inode(inode);
		if (err)
			goto fail;
	}
repeat:
	/*
	 * Do not use grab_cache_page_write_begin(), to avoid a deadlock
	 * due to wait_for_stable_page. We will wait on that below, under
	 * our own IO control.
	 */
	page = f2fs_pagecache_get_page(mapping, index,
				FGP_LOCK | FGP_WRITE | FGP_CREAT, GFP_NOFS);
	if (!page) {
		err = -ENOMEM;
		goto fail;
	}

	*pagep = page;

	err = prepare_write_begin(sbi, page, pos, len,
					&blkaddr, &need_balance);
	if (err)
		goto fail;

	if (need_balance && has_not_enough_free_secs(sbi, 0, 0)) {
		unlock_page(page);
		f2fs_balance_fs(sbi, true);
		lock_page(page);
		if (page->mapping != mapping) {
			/* the page got truncated from under us */
			f2fs_put_page(page, 1);
			goto repeat;
		}
	}

	f2fs_wait_on_page_writeback(page, DATA, false);

	/* wait for GCed page writeback via META_MAPPING */
	if (f2fs_post_read_required(inode))
		f2fs_wait_on_block_writeback(sbi, blkaddr);

	if (len == PAGE_SIZE || PageUptodate(page))
		return 0;

	if (!(pos & (PAGE_SIZE - 1)) && (pos + len) >= i_size_read(inode)) {
		zero_user_segment(page, len, PAGE_SIZE);
		return 0;
	}

	if (blkaddr == NEW_ADDR) {
		zero_user_segment(page, 0, PAGE_SIZE);
		SetPageUptodate(page);
	} else {
		err = f2fs_submit_page_read(inode, page, blkaddr);
		if (err)
			goto fail;

		lock_page(page);
		if (unlikely(page->mapping != mapping)) {
			f2fs_put_page(page, 1);
			goto repeat;
		}
		if (unlikely(!PageUptodate(page))) {
			err = -EIO;
			goto fail;
		}
	}
	return 0;

fail:
	f2fs_put_page(page, 1);
	f2fs_write_failed(mapping, pos + len);
	if (drop_atomic)
		drop_inmem_pages_all(sbi);
	return err;
}

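/*
 * ->write_end() counterpart: commit whatever generic_perform_write()
 * managed to copy by dirtying the page and, when the write extended the
 * file, pushing i_size forward.
 */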
static int f2fs_write_end(struct file *file,
			struct address_space *mapping,
			loff_t pos, unsigned len, unsigned copied,
			struct page *page, void *fsdata)
{
	struct inode *inode = page->mapping->host;

	trace_android_fs_datawrite_end(inode, pos, len);
	trace_f2fs_write_end(inode, pos, len, copied);

	/*
	 * This should come from len == PAGE_SIZE, so copied is expected to
	 * be PAGE_SIZE as well. Otherwise, treat it as nothing copied and
	 * let generic_perform_write() retry the copy with copied = 0.
	 */
	if (!PageUptodate(page)) {
		if (unlikely(copied != len))
			copied = 0;
		else
			SetPageUptodate(page);
	}
	if (!copied)
		goto unlock_out;

	set_page_dirty(page);

	if (pos + copied > i_size_read(inode))
		f2fs_i_size_write(inode, pos + copied);
unlock_out:
	f2fs_put_page(page, 1);
	f2fs_update_time(F2FS_I_SB(inode), REQ_TIME);
	return copied;
}

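/*
 * Direct I/O requires both the file offset and every iovec segment to
 * be aligned to the filesystem block size. For example, with a 4 KiB
 * block size, a direct read at offset 512, or into a buffer that is not
 * 4 KiB aligned, fails these mask tests and is rejected with -EINVAL.
 */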
static int check_direct_IO(struct inode *inode, struct iov_iter *iter,
			   loff_t offset)
{
	unsigned blocksize_mask = inode->i_sb->s_blocksize - 1;

	if (offset & blocksize_mask)
		return -EINVAL;

	if (iov_iter_alignment(iter) & blocksize_mask)
		return -EINVAL;

	return 0;
}

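/*
 * ->direct_IO() path. Points worth noting: buffered I/O is forced for
 * inodes that need post-read processing; the per-direction dio_rwsem is
 * only trylocked for IOCB_NOWAIT callers, which get -EAGAIN instead of
 * blocking; and the write-lifetime hint is temporarily cleared while
 * whint_mode is off, then restored once the I/O completes.
 */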
static ssize_t f2fs_direct_IO(struct kiocb *iocb, struct iov_iter *iter)
{
	struct address_space *mapping = iocb->ki_filp->f_mapping;
	struct inode *inode = mapping->host;
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
	size_t count = iov_iter_count(iter);
	loff_t offset = iocb->ki_pos;
	int rw = iov_iter_rw(iter);
	int err;
	enum rw_hint hint = iocb->ki_hint;
	int whint_mode = F2FS_OPTION(sbi).whint_mode;

	err = check_direct_IO(inode, iter, offset);
	if (err)
		return err;

	if (f2fs_force_buffered_io(inode, rw))
		return 0;

	trace_f2fs_direct_IO_enter(inode, offset, count, rw);

	if (trace_android_fs_dataread_start_enabled() &&
	    (rw == READ)) {
		char *path, pathbuf[MAX_TRACE_PATHBUF_LEN];

		path = android_fstrace_get_pathname(pathbuf,
						    MAX_TRACE_PATHBUF_LEN,
						    inode);
		trace_android_fs_dataread_start(inode, offset,
						count, current->pid, path,
						current->comm);
	}
	if (trace_android_fs_datawrite_start_enabled() &&
	    (rw == WRITE)) {
		char *path, pathbuf[MAX_TRACE_PATHBUF_LEN];

		path = android_fstrace_get_pathname(pathbuf,
						    MAX_TRACE_PATHBUF_LEN,
						    inode);
		trace_android_fs_datawrite_start(inode, offset, count,
						 current->pid, path,
						 current->comm);
	}
	if (rw == WRITE && whint_mode == WHINT_MODE_OFF)
		iocb->ki_hint = WRITE_LIFE_NOT_SET;

	if (!down_read_trylock(&F2FS_I(inode)->dio_rwsem[rw])) {
		if (iocb->ki_flags & IOCB_NOWAIT) {
			iocb->ki_hint = hint;
			err = -EAGAIN;
			goto out;
		}
		down_read(&F2FS_I(inode)->dio_rwsem[rw]);
	}

	err = blockdev_direct_IO(iocb, inode, iter, get_data_block_dio);
	up_read(&F2FS_I(inode)->dio_rwsem[rw]);

	if (rw == WRITE) {
		if (whint_mode == WHINT_MODE_OFF)
			iocb->ki_hint = hint;
		if (err > 0) {
			f2fs_update_iostat(F2FS_I_SB(inode), APP_DIRECT_IO,
									err);
			set_inode_flag(inode, FI_UPDATE_WRITE);
		} else if (err < 0) {
			f2fs_write_failed(mapping, offset + count);
		}
	}
out:
	if (trace_android_fs_dataread_start_enabled() &&
	    (rw == READ))
		trace_android_fs_dataread_end(inode, offset, count);
	if (trace_android_fs_datawrite_start_enabled() &&
	    (rw == WRITE))
		trace_android_fs_datawrite_end(inode, offset, count);

	trace_f2fs_direct_IO_exit(inode, offset, count, rw, err);

	return err;
}

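/*
 * ->invalidatepage(): for regular inodes, partial-page invalidation is
 * ignored; a full-page invalidation drops the corresponding dirty-page
 * accounting (meta, node, or data) before clearing the page's private
 * state. Atomically written pages keep their Private flag here and are
 * dropped from the in-memory page list instead.
 */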
void f2fs_invalidate_page(struct page *page, unsigned int offset,
							unsigned int length)
{
	struct inode *inode = page->mapping->host;
	struct f2fs_sb_info *sbi = F2FS_I_SB(inode);

	if (inode->i_ino >= F2FS_ROOT_INO(sbi) &&
		(offset % PAGE_SIZE || length != PAGE_SIZE))
		return;

	if (PageDirty(page)) {
		if (inode->i_ino == F2FS_META_INO(sbi)) {
			dec_page_count(sbi, F2FS_DIRTY_META);
		} else if (inode->i_ino == F2FS_NODE_INO(sbi)) {
			dec_page_count(sbi, F2FS_DIRTY_NODES);
		} else {
			inode_dec_dirty_pages(inode);
			remove_dirty_inode(inode);
		}
	}

	clear_cold_data(page);

	/* this is an atomically written page, keep it Private */
	if (IS_ATOMIC_WRITTEN_PAGE(page))
		return drop_inmem_page(inode, page);

	set_page_private(page, 0);
	ClearPagePrivate(page);
}

int f2fs_release_page(struct page *page, gfp_t wait)
{
	/* if this is a dirty page, keep its PagePrivate */
	if (PageDirty(page))
		return 0;

	/* this is an atomically written page, keep it Private */
	if (IS_ATOMIC_WRITTEN_PAGE(page))
		return 0;

	clear_cold_data(page);
	set_page_private(page, 0);
	ClearPagePrivate(page);
	return 1;
}

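/*
 * ->set_page_dirty() for data pages. For atomic files whose commit has
 * not started yet, a dirtied page is registered on the in-memory page
 * list rather than marked dirty in the page cache, so the whole batch
 * can later be committed or dropped as one unit.
 */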
static int f2fs_set_data_page_dirty(struct page *page)
{
	struct address_space *mapping = page->mapping;
	struct inode *inode = mapping->host;

	trace_f2fs_set_page_dirty(page, DATA);

	if (!PageUptodate(page))
		SetPageUptodate(page);

	if (f2fs_is_atomic_file(inode) && !f2fs_is_commit_atomic_write(inode)) {
		if (!IS_ATOMIC_WRITTEN_PAGE(page)) {
			register_inmem_page(inode, page);
			return 1;
		}
		/*
		 * This page has already been registered, so just return
		 * here.
		 */
		return 0;
	}

	if (!PageDirty(page)) {
		__set_page_dirty_nobuffers(page);
		update_dirty_page(inode, page);
		return 1;
	}
	return 0;
}

static sector_t f2fs_bmap(struct address_space *mapping, sector_t block)
{
	struct inode *inode = mapping->host;

	if (f2fs_has_inline_data(inode))
		return 0;

	/* make sure whole blocks are allocated before mapping them */
	if (mapping_tagged(mapping, PAGECACHE_TAG_DIRTY))
		filemap_write_and_wait(mapping);

	return generic_block_bmap(mapping, block, get_data_block_bmap);
}

#ifdef CONFIG_MIGRATION
#include <linux/migrate.h>

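/*
 * Page migration support. The subtle part is the reference accounting:
 * F2FS keeps PagePrivate set without holding the extra reference the
 * migration core normally expects, so extra_count compensates for that,
 * and an atomically written page must additionally have its inmem list
 * entry repointed at the new page while inmem_lock is held.
 */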
int f2fs_migrate_page(struct address_space *mapping,
		struct page *newpage, struct page *page, enum migrate_mode mode)
{
	int rc, extra_count;
	struct f2fs_inode_info *fi = F2FS_I(mapping->host);
	bool atomic_written = IS_ATOMIC_WRITTEN_PAGE(page);

	BUG_ON(PageWriteback(page));

	/* migrating an atomically written page is only safe with inmem_lock held */
	if (atomic_written) {
		if (mode != MIGRATE_SYNC)
			return -EBUSY;
		if (!mutex_trylock(&fi->inmem_lock))
			return -EAGAIN;
	}

	/*
	 * A reference is expected if PagePrivate is set when the mapping
	 * is moved; however, F2FS breaks this rule so that it can maintain
	 * dirty page counts when truncating pages. Adjusting 'extra_count'
	 * here makes it work.
	 */
	extra_count = (atomic_written ? 1 : 0) - page_has_private(page);
	rc = migrate_page_move_mapping(mapping, newpage,
				page, NULL, mode, extra_count);
	if (rc != MIGRATEPAGE_SUCCESS) {
		if (atomic_written)
			mutex_unlock(&fi->inmem_lock);
		return rc;
	}

	if (atomic_written) {
		struct inmem_pages *cur;
		list_for_each_entry(cur, &fi->inmem_pages, list)
			if (cur->page == page) {
				cur->page = newpage;
				break;
			}
		mutex_unlock(&fi->inmem_lock);
		put_page(page);
		get_page(newpage);
	}

	if (PagePrivate(page))
		SetPagePrivate(newpage);
	set_page_private(newpage, page_private(page));

	if (mode != MIGRATE_SYNC_NO_COPY)
		migrate_page_copy(newpage, page);
	else
		migrate_page_states(newpage, page);

	return MIGRATEPAGE_SUCCESS;
}
#endif

const struct address_space_operations f2fs_dblock_aops = {
	.readpage	= f2fs_read_data_page,
	.readpages	= f2fs_read_data_pages,
	.writepage	= f2fs_write_data_page,
	.writepages	= f2fs_write_data_pages,
	.write_begin	= f2fs_write_begin,
	.write_end	= f2fs_write_end,
	.set_page_dirty	= f2fs_set_data_page_dirty,
	.invalidatepage	= f2fs_invalidate_page,
	.releasepage	= f2fs_release_page,
	.direct_IO	= f2fs_direct_IO,
	.bmap		= f2fs_bmap,
#ifdef CONFIG_MIGRATION
	.migratepage	= f2fs_migrate_page,
#endif
};

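/*
 * The mempool guarantees a reserve of NUM_PREALLOC_POST_READ_CTXS
 * post-read contexts on top of the backing slab cache, so that read
 * completions can still obtain a decryption context even under memory
 * pressure.
 */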
int __init f2fs_init_post_read_processing(void)
{
	bio_post_read_ctx_cache = KMEM_CACHE(bio_post_read_ctx, 0);
	if (!bio_post_read_ctx_cache)
		goto fail;
	bio_post_read_ctx_pool =
		mempool_create_slab_pool(NUM_PREALLOC_POST_READ_CTXS,
					 bio_post_read_ctx_cache);
	if (!bio_post_read_ctx_pool)
		goto fail_free_cache;
	return 0;

fail_free_cache:
	kmem_cache_destroy(bio_post_read_ctx_cache);
fail:
	return -ENOMEM;
}

void __exit f2fs_destroy_post_read_processing(void)
{
	mempool_destroy(bio_post_read_ctx_pool);
	kmem_cache_destroy(bio_post_read_ctx_cache);
}