Blame - fs/xfs/xfs_aops.c - SHIFTPHONES/mainline/linux

blob: 5c5d8c832dcc2a43b6c14c50cfbb7c697eb045b3 [file] [log] [blame]

Dave Chinner	0b61f8a	2018-06-05 19:42:14 -0700	[diff] [blame]	1	// SPDX-License-Identifier: GPL-2.0
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	2	/*
Nathan Scott	7b71876	2005-11-02 14:58:39 +1100	[diff] [blame]	3	* Copyright (c) 2000-2005 Silicon Graphics, Inc.
				4	* All Rights Reserved.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	5	*/
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	6	#include "xfs.h"
Dave Chinner	70a9883	2013-10-23 10:36:05 +1100	[diff] [blame]	7	#include "xfs_shared.h"
Dave Chinner	239880e	2013-10-23 10:50:10 +1100	[diff] [blame]	8	#include "xfs_format.h"
				9	#include "xfs_log_format.h"
				10	#include "xfs_trans_resv.h"
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	11	#include "xfs_mount.h"
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	12	#include "xfs_inode.h"
Dave Chinner	239880e	2013-10-23 10:50:10 +1100	[diff] [blame]	13	#include "xfs_trans.h"
Christoph Hellwig	281627d	2012-03-13 08:41:05 +0000	[diff] [blame]	14	#include "xfs_inode_item.h"
Nathan Scott	a844f45	2005-11-02 14:38:42 +1100	[diff] [blame]	15	#include "xfs_alloc.h"
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	16	#include "xfs_error.h"
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	17	#include "xfs_iomap.h"
Christoph Hellwig	0b1b213	2009-12-14 23:14:59 +0000	[diff] [blame]	18	#include "xfs_trace.h"
Dave Chinner	3ed3a43	2010-03-05 02:00:42 +0000	[diff] [blame]	19	#include "xfs_bmap.h"
Dave Chinner	6898811	2013-08-12 20:49:42 +1000	[diff] [blame]	20	#include "xfs_bmap_util.h"
Dave Chinner	a4fbe6a	2013-10-23 10:51:50 +1100	[diff] [blame]	21	#include "xfs_bmap_btree.h"
Darrick J. Wong	ef47366	2016-10-03 09:11:34 -0700	[diff] [blame]	22	#include "xfs_reflink.h"
Tejun Heo	5a0e3ad	2010-03-24 17:04:11 +0900	[diff] [blame]	23	#include <linux/gfp.h>
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	24	#include <linux/mpage.h>
Christoph Hellwig	10ce444	2006-01-11 20:48:14 +1100	[diff] [blame]	25	#include <linux/pagevec.h>
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	26	#include <linux/writeback.h>
				27
Dave Chinner	fbcc025	2016-02-15 17:21:19 +1100	[diff] [blame]	28	/*
				29	* structure owned by writepages passed to individual writepage calls
				30	*/
				31	struct xfs_writepage_ctx {
				32	struct xfs_bmbt_irec imap;
				33	bool imap_valid;
				34	unsigned int io_type;
Dave Chinner	fbcc025	2016-02-15 17:21:19 +1100	[diff] [blame]	35	struct xfs_ioend *ioend;
				36	sector_t last_block;
				37	};
				38
Christoph Hellwig	0b1b213	2009-12-14 23:14:59 +0000	[diff] [blame]	39	void
Nathan Scott	f51623b	2006-03-14 13:26:27 +1100	[diff] [blame]	40	xfs_count_page_state(
				41	struct page *page,
				42	int *delalloc,
Nathan Scott	f51623b	2006-03-14 13:26:27 +1100	[diff] [blame]	43	int *unwritten)
				44	{
				45	struct buffer_head bh, head;
				46
Christoph Hellwig	20cb52e	2010-06-24 09:46:01 +1000	[diff] [blame]	47	delalloc = unwritten = 0;
Nathan Scott	f51623b	2006-03-14 13:26:27 +1100	[diff] [blame]	48
				49	bh = head = page_buffers(page);
				50	do {
Christoph Hellwig	20cb52e	2010-06-24 09:46:01 +1000	[diff] [blame]	51	if (buffer_unwritten(bh))
Nathan Scott	f51623b	2006-03-14 13:26:27 +1100	[diff] [blame]	52	(*unwritten) = 1;
				53	else if (buffer_delay(bh))
				54	(*delalloc) = 1;
				55	} while ((bh = bh->b_this_page) != head);
				56	}
				57
Ross Zwisler	20a90f5	2016-02-26 15:19:52 -0800	[diff] [blame]	58	struct block_device *
Christoph Hellwig	6214ed4	2007-09-14 15:23:17 +1000	[diff] [blame]	59	xfs_find_bdev_for_inode(
Christoph Hellwig	046f168	2010-04-28 12:28:52 +0000	[diff] [blame]	60	struct inode *inode)
Christoph Hellwig	6214ed4	2007-09-14 15:23:17 +1000	[diff] [blame]	61	{
Christoph Hellwig	046f168	2010-04-28 12:28:52 +0000	[diff] [blame]	62	struct xfs_inode *ip = XFS_I(inode);
Christoph Hellwig	6214ed4	2007-09-14 15:23:17 +1000	[diff] [blame]	63	struct xfs_mount *mp = ip->i_mount;
				64
Eric Sandeen	71ddabb	2007-11-23 16:29:42 +1100	[diff] [blame]	65	if (XFS_IS_REALTIME_INODE(ip))
Christoph Hellwig	6214ed4	2007-09-14 15:23:17 +1000	[diff] [blame]	66	return mp->m_rtdev_targp->bt_bdev;
				67	else
				68	return mp->m_ddev_targp->bt_bdev;
				69	}
				70
Dan Williams	486aff5	2017-08-24 15:12:50 -0700	[diff] [blame]	71	struct dax_device *
				72	xfs_find_daxdev_for_inode(
				73	struct inode *inode)
				74	{
				75	struct xfs_inode *ip = XFS_I(inode);
				76	struct xfs_mount *mp = ip->i_mount;
				77
				78	if (XFS_IS_REALTIME_INODE(ip))
				79	return mp->m_rtdev_targp->bt_daxdev;
				80	else
				81	return mp->m_ddev_targp->bt_daxdev;
				82	}
				83
Christoph Hellwig	0829c36	2005-09-02 16:58:49 +1000	[diff] [blame]	84	/*
Dave Chinner	37992c1	2016-04-06 08:12:28 +1000	[diff] [blame]	85	* We're now finished for good with this page. Update the page state via the
				86	* associated buffer_heads, paying attention to the start and end offsets that
				87	* we need to process on the page.
Dave Chinner	28b783e	2016-07-22 09:56:38 +1000	[diff] [blame]	88	*
Christoph Hellwig	8353a81	2017-09-02 09:53:41 -0700	[diff] [blame]	89	* Note that we open code the action in end_buffer_async_write here so that we
				90	* only have to iterate over the buffers attached to the page once. This is not
				91	* only more efficient, but also ensures that we only calls end_page_writeback
				92	* at the end of the iteration, and thus avoids the pitfall of having the page
				93	* and buffers potentially freed after every call to end_buffer_async_write.
Dave Chinner	37992c1	2016-04-06 08:12:28 +1000	[diff] [blame]	94	*/
				95	static void
				96	xfs_finish_page_writeback(
				97	struct inode *inode,
				98	struct bio_vec *bvec,
				99	int error)
				100	{
Christoph Hellwig	8353a81	2017-09-02 09:53:41 -0700	[diff] [blame]	101	struct buffer_head head = page_buffers(bvec->bv_page), bh = head;
				102	bool busy = false;
Dave Chinner	37992c1	2016-04-06 08:12:28 +1000	[diff] [blame]	103	unsigned int off = 0;
Christoph Hellwig	8353a81	2017-09-02 09:53:41 -0700	[diff] [blame]	104	unsigned long flags;
Dave Chinner	37992c1	2016-04-06 08:12:28 +1000	[diff] [blame]	105
				106	ASSERT(bvec->bv_offset < PAGE_SIZE);
Fabian Frederick	9340747	2017-02-27 14:28:32 -0800	[diff] [blame]	107	ASSERT((bvec->bv_offset & (i_blocksize(inode) - 1)) == 0);
Christoph Hellwig	8353a81	2017-09-02 09:53:41 -0700	[diff] [blame]	108	ASSERT(bvec->bv_offset + bvec->bv_len <= PAGE_SIZE);
Fabian Frederick	9340747	2017-02-27 14:28:32 -0800	[diff] [blame]	109	ASSERT((bvec->bv_len & (i_blocksize(inode) - 1)) == 0);
Dave Chinner	37992c1	2016-04-06 08:12:28 +1000	[diff] [blame]	110
Christoph Hellwig	8353a81	2017-09-02 09:53:41 -0700	[diff] [blame]	111	local_irq_save(flags);
				112	bit_spin_lock(BH_Uptodate_Lock, &head->b_state);
Dave Chinner	37992c1	2016-04-06 08:12:28 +1000	[diff] [blame]	113	do {
Christoph Hellwig	8353a81	2017-09-02 09:53:41 -0700	[diff] [blame]	114	if (off >= bvec->bv_offset &&
				115	off < bvec->bv_offset + bvec->bv_len) {
				116	ASSERT(buffer_async_write(bh));
				117	ASSERT(bh->b_end_io == NULL);
				118
				119	if (error) {
				120	mark_buffer_write_io_error(bh);
				121	clear_buffer_uptodate(bh);
				122	SetPageError(bvec->bv_page);
				123	} else {
				124	set_buffer_uptodate(bh);
				125	}
				126	clear_buffer_async_write(bh);
				127	unlock_buffer(bh);
				128	} else if (buffer_async_write(bh)) {
				129	ASSERT(buffer_locked(bh));
				130	busy = true;
				131	}
				132	off += bh->b_size;
				133	} while ((bh = bh->b_this_page) != head);
				134	bit_spin_unlock(BH_Uptodate_Lock, &head->b_state);
				135	local_irq_restore(flags);
				136
				137	if (!busy)
				138	end_page_writeback(bvec->bv_page);
Dave Chinner	37992c1	2016-04-06 08:12:28 +1000	[diff] [blame]	139	}
				140
				141	/*
				142	* We're now finished for good with this ioend structure. Update the page
				143	* state, release holds on bios, and finally free up memory. Do not use the
				144	* ioend after this.
Christoph Hellwig	f6d6d4f	2006-01-11 15:40:13 +1100	[diff] [blame]	145	*/
Christoph Hellwig	0829c36	2005-09-02 16:58:49 +1000	[diff] [blame]	146	STATIC void
				147	xfs_destroy_ioend(
Christoph Hellwig	0e51a8e	2016-04-06 08:34:30 +1000	[diff] [blame]	148	struct xfs_ioend *ioend,
				149	int error)
Christoph Hellwig	0829c36	2005-09-02 16:58:49 +1000	[diff] [blame]	150	{
Dave Chinner	37992c1	2016-04-06 08:12:28 +1000	[diff] [blame]	151	struct inode *inode = ioend->io_inode;
Christoph Hellwig	8353a81	2017-09-02 09:53:41 -0700	[diff] [blame]	152	struct bio *bio = &ioend->io_inline_bio;
				153	struct bio last = ioend->io_bio, next;
				154	u64 start = bio->bi_iter.bi_sector;
				155	bool quiet = bio_flagged(bio, BIO_QUIET);
Christoph Hellwig	f6d6d4f	2006-01-11 15:40:13 +1100	[diff] [blame]	156
Christoph Hellwig	0e51a8e	2016-04-06 08:34:30 +1000	[diff] [blame]	157	for (bio = &ioend->io_inline_bio; bio; bio = next) {
Dave Chinner	37992c1	2016-04-06 08:12:28 +1000	[diff] [blame]	158	struct bio_vec *bvec;
				159	int i;
				160
Christoph Hellwig	0e51a8e	2016-04-06 08:34:30 +1000	[diff] [blame]	161	/*
				162	* For the last bio, bi_private points to the ioend, so we
				163	* need to explicitly end the iteration here.
				164	*/
				165	if (bio == last)
				166	next = NULL;
				167	else
				168	next = bio->bi_private;
Dave Chinner	37992c1	2016-04-06 08:12:28 +1000	[diff] [blame]	169
				170	/* walk each page on bio, ending page IO on them */
				171	bio_for_each_segment_all(bvec, bio, i)
				172	xfs_finish_page_writeback(inode, bvec, error);
				173
				174	bio_put(bio);
Christoph Hellwig	f6d6d4f	2006-01-11 15:40:13 +1100	[diff] [blame]	175	}
Christoph Hellwig	8353a81	2017-09-02 09:53:41 -0700	[diff] [blame]	176
				177	if (unlikely(error && !quiet)) {
				178	xfs_err_ratelimited(XFS_I(inode)->i_mount,
				179	"writeback error on sector %llu", start);
				180	}
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	181	}
				182
				183	/*
Christoph Hellwig	fc0063c	2011-08-23 08:28:11 +0000	[diff] [blame]	184	* Fast and loose check if this write could update the on-disk inode size.
				185	*/
				186	static inline bool xfs_ioend_is_append(struct xfs_ioend *ioend)
				187	{
				188	return ioend->io_offset + ioend->io_size >
				189	XFS_I(ioend->io_inode)->i_d.di_size;
				190	}
				191
Christoph Hellwig	281627d	2012-03-13 08:41:05 +0000	[diff] [blame]	192	STATIC int
				193	xfs_setfilesize_trans_alloc(
				194	struct xfs_ioend *ioend)
				195	{
				196	struct xfs_mount *mp = XFS_I(ioend->io_inode)->i_mount;
				197	struct xfs_trans *tp;
				198	int error;
				199
Dave Chinner	4df0f7f	2018-03-06 17:07:22 -0800	[diff] [blame]	200	error = xfs_trans_alloc(mp, &M_RES(mp)->tr_fsyncts, 0, 0,
				201	XFS_TRANS_NOFS, &tp);
Christoph Hellwig	253f491	2016-04-06 09:19:55 +1000	[diff] [blame]	202	if (error)
Christoph Hellwig	281627d	2012-03-13 08:41:05 +0000	[diff] [blame]	203	return error;
Christoph Hellwig	281627d	2012-03-13 08:41:05 +0000	[diff] [blame]	204
				205	ioend->io_append_trans = tp;
				206
				207	/*
Dave Chinner	437a255	2012-11-28 13:01:00 +1100	[diff] [blame]	208	* We may pass freeze protection with a transaction. So tell lockdep
Jan Kara	d9457dc	2012-06-12 16:20:39 +0200	[diff] [blame]	209	* we released it.
				210	*/
Oleg Nesterov	bee9182	2015-07-19 23:48:20 +0200	[diff] [blame]	211	__sb_writers_release(ioend->io_inode->i_sb, SB_FREEZE_FS);
Jan Kara	d9457dc	2012-06-12 16:20:39 +0200	[diff] [blame]	212	/*
Christoph Hellwig	281627d	2012-03-13 08:41:05 +0000	[diff] [blame]	213	* We hand off the transaction to the completion thread now, so
				214	* clear the flag here.
				215	*/
Michal Hocko	9070733	2017-05-03 14:53:12 -0700	[diff] [blame]	216	current_restore_flags_nested(&tp->t_pflags, PF_MEMALLOC_NOFS);
Christoph Hellwig	281627d	2012-03-13 08:41:05 +0000	[diff] [blame]	217	return 0;
				218	}
				219
Christoph Hellwig	fc0063c	2011-08-23 08:28:11 +0000	[diff] [blame]	220	/*
Christoph Hellwig	2813d68	2011-12-18 20:00:12 +0000	[diff] [blame]	221	* Update on-disk file size now that data has been written to disk.
Lachlan McIlroy	ba87ea6	2007-05-08 13:49:46 +1000	[diff] [blame]	222	*/
Christoph Hellwig	281627d	2012-03-13 08:41:05 +0000	[diff] [blame]	223	STATIC int
Christoph Hellwig	e372843	2016-09-19 11:26:41 +1000	[diff] [blame]	224	__xfs_setfilesize(
Christoph Hellwig	2ba6623	2015-02-02 10:02:09 +1100	[diff] [blame]	225	struct xfs_inode *ip,
				226	struct xfs_trans *tp,
				227	xfs_off_t offset,
				228	size_t size)
Lachlan McIlroy	ba87ea6	2007-05-08 13:49:46 +1000	[diff] [blame]	229	{
Lachlan McIlroy	ba87ea6	2007-05-08 13:49:46 +1000	[diff] [blame]	230	xfs_fsize_t isize;
Lachlan McIlroy	ba87ea6	2007-05-08 13:49:46 +1000	[diff] [blame]	231
Christoph Hellwig	aa6bf01	2012-02-29 09:53:48 +0000	[diff] [blame]	232	xfs_ilock(ip, XFS_ILOCK_EXCL);
Christoph Hellwig	2ba6623	2015-02-02 10:02:09 +1100	[diff] [blame]	233	isize = xfs_new_eof(ip, offset + size);
Christoph Hellwig	281627d	2012-03-13 08:41:05 +0000	[diff] [blame]	234	if (!isize) {
				235	xfs_iunlock(ip, XFS_ILOCK_EXCL);
Christoph Hellwig	4906e21	2015-06-04 13:47:56 +1000	[diff] [blame]	236	xfs_trans_cancel(tp);
Christoph Hellwig	281627d	2012-03-13 08:41:05 +0000	[diff] [blame]	237	return 0;
Lachlan McIlroy	ba87ea6	2007-05-08 13:49:46 +1000	[diff] [blame]	238	}
				239
Christoph Hellwig	2ba6623	2015-02-02 10:02:09 +1100	[diff] [blame]	240	trace_xfs_setfilesize(ip, offset, size);
Christoph Hellwig	281627d	2012-03-13 08:41:05 +0000	[diff] [blame]	241
				242	ip->i_d.di_size = isize;
				243	xfs_trans_ijoin(tp, ip, XFS_ILOCK_EXCL);
				244	xfs_trans_log_inode(tp, ip, XFS_ILOG_CORE);
				245
Christoph Hellwig	7039331	2015-06-04 13:48:08 +1000	[diff] [blame]	246	return xfs_trans_commit(tp);
Christoph Hellwig	0829c36	2005-09-02 16:58:49 +1000	[diff] [blame]	247	}
				248
Christoph Hellwig	e372843	2016-09-19 11:26:41 +1000	[diff] [blame]	249	int
				250	xfs_setfilesize(
				251	struct xfs_inode *ip,
				252	xfs_off_t offset,
				253	size_t size)
				254	{
				255	struct xfs_mount *mp = ip->i_mount;
				256	struct xfs_trans *tp;
				257	int error;
				258
				259	error = xfs_trans_alloc(mp, &M_RES(mp)->tr_fsyncts, 0, 0, 0, &tp);
				260	if (error)
				261	return error;
				262
				263	return __xfs_setfilesize(ip, tp, offset, size);
				264	}
				265
Christoph Hellwig	2ba6623	2015-02-02 10:02:09 +1100	[diff] [blame]	266	STATIC int
				267	xfs_setfilesize_ioend(
Christoph Hellwig	0e51a8e	2016-04-06 08:34:30 +1000	[diff] [blame]	268	struct xfs_ioend *ioend,
				269	int error)
Christoph Hellwig	2ba6623	2015-02-02 10:02:09 +1100	[diff] [blame]	270	{
				271	struct xfs_inode *ip = XFS_I(ioend->io_inode);
				272	struct xfs_trans *tp = ioend->io_append_trans;
				273
				274	/*
				275	* The transaction may have been allocated in the I/O submission thread,
				276	* thus we need to mark ourselves as being in a transaction manually.
				277	* Similarly for freeze protection.
				278	*/
Michal Hocko	9070733	2017-05-03 14:53:12 -0700	[diff] [blame]	279	current_set_flags_nested(&tp->t_pflags, PF_MEMALLOC_NOFS);
Oleg Nesterov	bee9182	2015-07-19 23:48:20 +0200	[diff] [blame]	280	__sb_writers_acquired(VFS_I(ip)->i_sb, SB_FREEZE_FS);
Christoph Hellwig	2ba6623	2015-02-02 10:02:09 +1100	[diff] [blame]	281
Zhaohongjiang	5cb13dc	2015-10-12 15:28:39 +1100	[diff] [blame]	282	/* we abort the update if there was an IO error */
Christoph Hellwig	0e51a8e	2016-04-06 08:34:30 +1000	[diff] [blame]	283	if (error) {
Zhaohongjiang	5cb13dc	2015-10-12 15:28:39 +1100	[diff] [blame]	284	xfs_trans_cancel(tp);
Christoph Hellwig	0e51a8e	2016-04-06 08:34:30 +1000	[diff] [blame]	285	return error;
Zhaohongjiang	5cb13dc	2015-10-12 15:28:39 +1100	[diff] [blame]	286	}
				287
Christoph Hellwig	e372843	2016-09-19 11:26:41 +1000	[diff] [blame]	288	return __xfs_setfilesize(ip, tp, ioend->io_offset, ioend->io_size);
Christoph Hellwig	2ba6623	2015-02-02 10:02:09 +1100	[diff] [blame]	289	}
				290
Christoph Hellwig	0829c36	2005-09-02 16:58:49 +1000	[diff] [blame]	291	/*
Dave Chinner	77d7a0c	2010-02-17 05:36:29 +0000	[diff] [blame]	292	* IO write completion.
				293	*/
				294	STATIC void
				295	xfs_end_io(
				296	struct work_struct *work)
				297	{
Christoph Hellwig	0e51a8e	2016-04-06 08:34:30 +1000	[diff] [blame]	298	struct xfs_ioend *ioend =
				299	container_of(work, struct xfs_ioend, io_work);
				300	struct xfs_inode *ip = XFS_I(ioend->io_inode);
Christoph Hellwig	787eb48	2017-03-02 15:02:51 -0800	[diff] [blame]	301	xfs_off_t offset = ioend->io_offset;
				302	size_t size = ioend->io_size;
Christoph Hellwig	4e4cbee	2017-06-03 09:38:06 +0200	[diff] [blame]	303	int error;
Dave Chinner	77d7a0c	2010-02-17 05:36:29 +0000	[diff] [blame]	304
Brian Foster	af055e3	2016-02-08 15:00:02 +1100	[diff] [blame]	305	/*
Christoph Hellwig	787eb48	2017-03-02 15:02:51 -0800	[diff] [blame]	306	* Just clean up the in-memory strutures if the fs has been shut down.
Brian Foster	af055e3	2016-02-08 15:00:02 +1100	[diff] [blame]	307	*/
Christoph Hellwig	787eb48	2017-03-02 15:02:51 -0800	[diff] [blame]	308	if (XFS_FORCED_SHUTDOWN(ip->i_mount)) {
Christoph Hellwig	0e51a8e	2016-04-06 08:34:30 +1000	[diff] [blame]	309	error = -EIO;
Christoph Hellwig	787eb48	2017-03-02 15:02:51 -0800	[diff] [blame]	310	goto done;
Darrick J. Wong	43caeb1	2016-10-03 09:11:35 -0700	[diff] [blame]	311	}
				312
				313	/*
Christoph Hellwig	787eb48	2017-03-02 15:02:51 -0800	[diff] [blame]	314	* Clean up any COW blocks on an I/O error.
Dave Chinner	77d7a0c	2010-02-17 05:36:29 +0000	[diff] [blame]	315	*/
Christoph Hellwig	4e4cbee	2017-06-03 09:38:06 +0200	[diff] [blame]	316	error = blk_status_to_errno(ioend->io_bio->bi_status);
Christoph Hellwig	787eb48	2017-03-02 15:02:51 -0800	[diff] [blame]	317	if (unlikely(error)) {
				318	switch (ioend->io_type) {
				319	case XFS_IO_COW:
				320	xfs_reflink_cancel_cow_range(ip, offset, size, true);
				321	break;
				322	}
				323
				324	goto done;
				325	}
				326
				327	/*
				328	* Success: commit the COW or unwritten blocks if needed.
				329	*/
				330	switch (ioend->io_type) {
				331	case XFS_IO_COW:
				332	error = xfs_reflink_end_cow(ip, offset, size);
				333	break;
				334	case XFS_IO_UNWRITTEN:
Eryu Guan	ee70daa	2017-09-21 11:26:18 -0700	[diff] [blame]	335	/* writeback should never update isize */
				336	error = xfs_iomap_write_unwritten(ip, offset, size, false);
Christoph Hellwig	787eb48	2017-03-02 15:02:51 -0800	[diff] [blame]	337	break;
				338	default:
				339	ASSERT(!xfs_ioend_is_append(ioend) \|\| ioend->io_append_trans);
				340	break;
Dave Chinner	77d7a0c	2010-02-17 05:36:29 +0000	[diff] [blame]	341	}
				342
Christoph Hellwig	04f658e	2011-08-24 05:59:25 +0000	[diff] [blame]	343	done:
Christoph Hellwig	787eb48	2017-03-02 15:02:51 -0800	[diff] [blame]	344	if (ioend->io_append_trans)
				345	error = xfs_setfilesize_ioend(ioend, error);
Christoph Hellwig	0e51a8e	2016-04-06 08:34:30 +1000	[diff] [blame]	346	xfs_destroy_ioend(ioend, error);
Dave Chinner	77d7a0c	2010-02-17 05:36:29 +0000	[diff] [blame]	347	}
				348
Christoph Hellwig	0e51a8e	2016-04-06 08:34:30 +1000	[diff] [blame]	349	STATIC void
				350	xfs_end_bio(
				351	struct bio *bio)
Christoph Hellwig	0829c36	2005-09-02 16:58:49 +1000	[diff] [blame]	352	{
Christoph Hellwig	0e51a8e	2016-04-06 08:34:30 +1000	[diff] [blame]	353	struct xfs_ioend *ioend = bio->bi_private;
				354	struct xfs_mount *mp = XFS_I(ioend->io_inode)->i_mount;
Christoph Hellwig	0829c36	2005-09-02 16:58:49 +1000	[diff] [blame]	355
Darrick J. Wong	43caeb1	2016-10-03 09:11:35 -0700	[diff] [blame]	356	if (ioend->io_type == XFS_IO_UNWRITTEN \|\| ioend->io_type == XFS_IO_COW)
Christoph Hellwig	0e51a8e	2016-04-06 08:34:30 +1000	[diff] [blame]	357	queue_work(mp->m_unwritten_workqueue, &ioend->io_work);
				358	else if (ioend->io_append_trans)
				359	queue_work(mp->m_data_workqueue, &ioend->io_work);
				360	else
Christoph Hellwig	4e4cbee	2017-06-03 09:38:06 +0200	[diff] [blame]	361	xfs_destroy_ioend(ioend, blk_status_to_errno(bio->bi_status));
Christoph Hellwig	0829c36	2005-09-02 16:58:49 +1000	[diff] [blame]	362	}
				363
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	364	STATIC int
				365	xfs_map_blocks(
Christoph Hellwig	5c665e5	2018-07-11 22:25:59 -0700	[diff] [blame]	366	struct xfs_writepage_ctx *wpc,
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	367	struct inode *inode,
Christoph Hellwig	5c665e5	2018-07-11 22:25:59 -0700	[diff] [blame]	368	loff_t offset)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	369	{
Christoph Hellwig	a206c81	2010-12-10 08:42:20 +0000	[diff] [blame]	370	struct xfs_inode *ip = XFS_I(inode);
				371	struct xfs_mount *mp = ip->i_mount;
Fabian Frederick	9340747	2017-02-27 14:28:32 -0800	[diff] [blame]	372	ssize_t count = i_blocksize(inode);
Christoph Hellwig	060d4ea	2018-07-11 22:26:01 -0700	[diff] [blame^]	373	xfs_fileoff_t offset_fsb, end_fsb;
Christoph Hellwig	5c665e5	2018-07-11 22:25:59 -0700	[diff] [blame]	374	struct xfs_bmbt_irec imap;
				375	int whichfork = XFS_DATA_FORK;
Christoph Hellwig	060d4ea	2018-07-11 22:26:01 -0700	[diff] [blame^]	376	struct xfs_iext_cursor icur;
Christoph Hellwig	a206c81	2010-12-10 08:42:20 +0000	[diff] [blame]	377	int error = 0;
Christoph Hellwig	a206c81	2010-12-10 08:42:20 +0000	[diff] [blame]	378	int nimaps = 1;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	379
Christoph Hellwig	a206c81	2010-12-10 08:42:20 +0000	[diff] [blame]	380	if (XFS_FORCED_SHUTDOWN(mp))
Eric Sandeen	b474c7a	2014-06-22 15:04:54 +1000	[diff] [blame]	381	return -EIO;
Christoph Hellwig	a206c81	2010-12-10 08:42:20 +0000	[diff] [blame]	382
Dave Chinner	988ef92	2016-02-15 17:20:50 +1100	[diff] [blame]	383	xfs_ilock(ip, XFS_ILOCK_SHARED);
Christoph Hellwig	8ff2957	2010-12-10 08:42:21 +0000	[diff] [blame]	384	ASSERT(ip->i_d.di_format != XFS_DINODE_FMT_BTREE \|\|
				385	(ip->i_df.if_flags & XFS_IFEXTENTS));
Dave Chinner	d2c2819	2012-06-08 15:44:53 +1000	[diff] [blame]	386	ASSERT(offset <= mp->m_super->s_maxbytes);
Christoph Hellwig	8ff2957	2010-12-10 08:42:21 +0000	[diff] [blame]	387
Christoph Hellwig	060d4ea	2018-07-11 22:26:01 -0700	[diff] [blame^]	388	if (offset > mp->m_super->s_maxbytes - count)
				389	count = mp->m_super->s_maxbytes - offset;
				390	end_fsb = XFS_B_TO_FSB(mp, (xfs_ufsize_t)offset + count);
				391	offset_fsb = XFS_B_TO_FSBT(mp, offset);
				392
				393	/*
				394	* Check if this is offset is covered by a COW extents, and if yes use
				395	* it directly instead of looking up anything in the data fork.
				396	*/
Christoph Hellwig	5c665e5	2018-07-11 22:25:59 -0700	[diff] [blame]	397	if (xfs_is_reflink_inode(ip) &&
Christoph Hellwig	060d4ea	2018-07-11 22:26:01 -0700	[diff] [blame^]	398	xfs_iext_lookup_extent(ip, ip->i_cowfp, offset_fsb, &icur, &imap) &&
				399	imap.br_startoff <= offset_fsb) {
Christoph Hellwig	5c665e5	2018-07-11 22:25:59 -0700	[diff] [blame]	400	xfs_iunlock(ip, XFS_ILOCK_SHARED);
				401	/*
				402	* Truncate can race with writeback since writeback doesn't
				403	* take the iolock and truncate decreases the file size before
				404	* it starts truncating the pages between new_size and old_size.
				405	* Therefore, we can end up in the situation where writeback
				406	* gets a CoW fork mapping but the truncate makes the mapping
				407	* invalid and we end up in here trying to get a new mapping.
				408	* bail out here so that we simply never get a valid mapping
				409	* and so we drop the write altogether. The page truncation
				410	* will kill the contents anyway.
				411	*/
				412	if (offset > i_size_read(inode)) {
				413	wpc->io_type = XFS_IO_HOLE;
				414	return 0;
				415	}
				416	whichfork = XFS_COW_FORK;
				417	wpc->io_type = XFS_IO_COW;
				418	goto allocate_blocks;
				419	}
				420
				421	/*
				422	* Map valid and no COW extent in the way? We're done.
				423	*/
				424	if (wpc->imap_valid) {
				425	xfs_iunlock(ip, XFS_ILOCK_SHARED);
				426	return 0;
				427	}
				428
				429	/*
				430	* If we don't have a valid map, now it's time to get a new one for this
				431	* offset. This will convert delayed allocations (including COW ones)
				432	* into real extents.
				433	*/
Dave Chinner	5c8ed20	2011-09-18 20:40:45 +0000	[diff] [blame]	434	error = xfs_bmapi_read(ip, offset_fsb, end_fsb - offset_fsb,
Christoph Hellwig	5c665e5	2018-07-11 22:25:59 -0700	[diff] [blame]	435	&imap, &nimaps, XFS_BMAPI_ENTIRE);
Christoph Hellwig	8ff2957	2010-12-10 08:42:21 +0000	[diff] [blame]	436	xfs_iunlock(ip, XFS_ILOCK_SHARED);
Christoph Hellwig	a206c81	2010-12-10 08:42:20 +0000	[diff] [blame]	437	if (error)
Dave Chinner	2451337	2014-06-25 14:58:08 +1000	[diff] [blame]	438	return error;
Christoph Hellwig	a206c81	2010-12-10 08:42:20 +0000	[diff] [blame]	439
Christoph Hellwig	5c665e5	2018-07-11 22:25:59 -0700	[diff] [blame]	440	if (!nimaps) {
				441	/*
				442	* Lookup returns no match? Beyond eof? regardless,
				443	* return it as a hole so we don't write it
				444	*/
				445	imap.br_startoff = offset_fsb;
				446	imap.br_blockcount = end_fsb - offset_fsb;
				447	imap.br_startblock = HOLESTARTBLOCK;
				448	wpc->io_type = XFS_IO_HOLE;
				449	} else if (imap.br_startblock == HOLESTARTBLOCK) {
				450	/* landed in a hole */
				451	wpc->io_type = XFS_IO_HOLE;
Dave Chinner	e2f6ad4	2018-07-11 22:26:00 -0700	[diff] [blame]	452	} else {
				453	if (isnullstartblock(imap.br_startblock)) {
				454	/* got a delalloc extent */
				455	wpc->io_type = XFS_IO_DELALLOC;
				456	goto allocate_blocks;
				457	}
				458
				459	if (imap.br_state == XFS_EXT_UNWRITTEN)
				460	wpc->io_type = XFS_IO_UNWRITTEN;
				461	else
				462	wpc->io_type = XFS_IO_OVERWRITE;
Christoph Hellwig	a206c81	2010-12-10 08:42:20 +0000	[diff] [blame]	463	}
				464
Christoph Hellwig	5c665e5	2018-07-11 22:25:59 -0700	[diff] [blame]	465	wpc->imap = imap;
				466	trace_xfs_map_blocks_found(ip, offset, count, wpc->io_type, &imap);
				467	return 0;
				468	allocate_blocks:
				469	error = xfs_iomap_write_allocate(ip, whichfork, offset, &imap);
				470	if (error)
				471	return error;
				472	wpc->imap = imap;
				473	trace_xfs_map_blocks_alloc(ip, offset, count, wpc->io_type, &imap);
Christoph Hellwig	8ff2957	2010-12-10 08:42:21 +0000	[diff] [blame]	474	return 0;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	475	}
				476
Dave Chinner	fbcc025	2016-02-15 17:21:19 +1100	[diff] [blame]	477	STATIC bool
Christoph Hellwig	558e689	2010-04-28 12:28:58 +0000	[diff] [blame]	478	xfs_imap_valid(
Christoph Hellwig	8699bb0	2010-04-28 12:28:54 +0000	[diff] [blame]	479	struct inode *inode,
Christoph Hellwig	207d041	2010-04-28 12:28:56 +0000	[diff] [blame]	480	struct xfs_bmbt_irec *imap,
Christoph Hellwig	558e689	2010-04-28 12:28:58 +0000	[diff] [blame]	481	xfs_off_t offset)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	482	{
Christoph Hellwig	558e689	2010-04-28 12:28:58 +0000	[diff] [blame]	483	offset >>= inode->i_blkbits;
Christoph Hellwig	8699bb0	2010-04-28 12:28:54 +0000	[diff] [blame]	484
Brian Foster	40214d1	2017-10-13 09:47:46 -0700	[diff] [blame]	485	/*
				486	* We have to make sure the cached mapping is within EOF to protect
				487	* against eofblocks trimming on file release leaving us with a stale
				488	* mapping. Otherwise, a page for a subsequent file extending buffered
				489	* write could get picked up by this writeback cycle and written to the
				490	* wrong blocks.
				491	*
				492	* Note that what we really want here is a generic mapping invalidation
				493	* mechanism to protect us from arbitrary extent modifying contexts, not
				494	* just eofblocks.
				495	*/
				496	xfs_trim_extent_eof(imap, XFS_I(inode));
				497
Christoph Hellwig	558e689	2010-04-28 12:28:58 +0000	[diff] [blame]	498	return offset >= imap->br_startoff &&
				499	offset < imap->br_startoff + imap->br_blockcount;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	500	}
				501
Christoph Hellwig	f6d6d4f	2006-01-11 15:40:13 +1100	[diff] [blame]	502	STATIC void
				503	xfs_start_buffer_writeback(
				504	struct buffer_head *bh)
				505	{
				506	ASSERT(buffer_mapped(bh));
				507	ASSERT(buffer_locked(bh));
				508	ASSERT(!buffer_delay(bh));
				509	ASSERT(!buffer_unwritten(bh));
				510
Christoph Hellwig	8353a81	2017-09-02 09:53:41 -0700	[diff] [blame]	511	bh->b_end_io = NULL;
				512	set_buffer_async_write(bh);
Christoph Hellwig	f6d6d4f	2006-01-11 15:40:13 +1100	[diff] [blame]	513	set_buffer_uptodate(bh);
				514	clear_buffer_dirty(bh);
				515	}
				516
				517	STATIC void
				518	xfs_start_page_writeback(
				519	struct page *page,
Dave Chinner	e10de37	2016-02-15 17:23:12 +1100	[diff] [blame]	520	int clear_dirty)
Christoph Hellwig	f6d6d4f	2006-01-11 15:40:13 +1100	[diff] [blame]	521	{
				522	ASSERT(PageLocked(page));
				523	ASSERT(!PageWriteback(page));
Dave Chinner	0d085a5	2014-09-23 15:36:27 +1000	[diff] [blame]	524
				525	/*
				526	* if the page was not fully cleaned, we need to ensure that the higher
				527	* layers come back to it correctly. That means we need to keep the page
				528	* dirty, and for WB_SYNC_ALL writeback we need to ensure the
				529	* PAGECACHE_TAG_TOWRITE index mark is not removed so another attempt to
				530	* write this page in this writeback sweep will be made.
				531	*/
				532	if (clear_dirty) {
David Chinner	9213202	2006-12-21 10:24:01 +1100	[diff] [blame]	533	clear_page_dirty_for_io(page);
Dave Chinner	0d085a5	2014-09-23 15:36:27 +1000	[diff] [blame]	534	set_page_writeback(page);
				535	} else
				536	set_page_writeback_keepwrite(page);
				537
Christoph Hellwig	f6d6d4f	2006-01-11 15:40:13 +1100	[diff] [blame]	538	unlock_page(page);
Christoph Hellwig	f6d6d4f	2006-01-11 15:40:13 +1100	[diff] [blame]	539	}
				540
Zhi Yong Wu	c7c1a7d	2013-08-07 10:11:09 +0000	[diff] [blame]	541	static inline int xfs_bio_add_buffer(struct bio bio, struct buffer_head bh)
Christoph Hellwig	f6d6d4f	2006-01-11 15:40:13 +1100	[diff] [blame]	542	{
				543	return bio_add_page(bio, bh->b_page, bh->b_size, bh_offset(bh));
				544	}
				545
				546	/*
Dave Chinner	bb18782	2016-04-06 08:11:25 +1000	[diff] [blame]	547	* Submit the bio for an ioend. We are passed an ioend with a bio attached to
				548	* it, and we submit that bio. The ioend may be used for multiple bio
				549	* submissions, so we only want to allocate an append transaction for the ioend
				550	* once. In the case of multiple bio submission, each bio will take an IO
				551	* reference to the ioend to ensure that the ioend completion is only done once
				552	* all bios have been submitted and the ioend is really done.
Dave Chinner	7bf7f35	2012-11-12 22:09:45 +1100	[diff] [blame]	553	*
				554	* If @fail is non-zero, it means that we have a situation where some part of
				555	* the submission process has failed after we have marked pages for writeback
Dave Chinner	bb18782	2016-04-06 08:11:25 +1000	[diff] [blame]	556	* and unlocked them. In this situation, we need to fail the bio and ioend
				557	* rather than submit it to IO. This typically only happens on a filesystem
				558	* shutdown.
Christoph Hellwig	f6d6d4f	2006-01-11 15:40:13 +1100	[diff] [blame]	559	*/
Dave Chinner	e10de37	2016-02-15 17:23:12 +1100	[diff] [blame]	560	STATIC int
Christoph Hellwig	f6d6d4f	2006-01-11 15:40:13 +1100	[diff] [blame]	561	xfs_submit_ioend(
Christoph Hellwig	06342cf	2009-10-30 09:09:15 +0000	[diff] [blame]	562	struct writeback_control *wbc,
Christoph Hellwig	0e51a8e	2016-04-06 08:34:30 +1000	[diff] [blame]	563	struct xfs_ioend *ioend,
Dave Chinner	e10de37	2016-02-15 17:23:12 +1100	[diff] [blame]	564	int status)
Christoph Hellwig	f6d6d4f	2006-01-11 15:40:13 +1100	[diff] [blame]	565	{
Darrick J. Wong	5eda430	2017-02-02 15:14:02 -0800	[diff] [blame]	566	/* Convert CoW extents to regular */
				567	if (!status && ioend->io_type == XFS_IO_COW) {
Dave Chinner	4a2d01b	2018-06-07 07:46:42 -0700	[diff] [blame]	568	/*
				569	* Yuk. This can do memory allocation, but is not a
				570	* transactional operation so everything is done in GFP_KERNEL
				571	* context. That can deadlock, because we hold pages in
				572	* writeback state and GFP_KERNEL allocations can block on them.
				573	* Hence we must operate in nofs conditions here.
				574	*/
				575	unsigned nofs_flag;
				576
				577	nofs_flag = memalloc_nofs_save();
Darrick J. Wong	5eda430	2017-02-02 15:14:02 -0800	[diff] [blame]	578	status = xfs_reflink_convert_cow(XFS_I(ioend->io_inode),
				579	ioend->io_offset, ioend->io_size);
Dave Chinner	4a2d01b	2018-06-07 07:46:42 -0700	[diff] [blame]	580	memalloc_nofs_restore(nofs_flag);
Darrick J. Wong	5eda430	2017-02-02 15:14:02 -0800	[diff] [blame]	581	}
				582
Dave Chinner	e10de37	2016-02-15 17:23:12 +1100	[diff] [blame]	583	/* Reserve log space if we might write beyond the on-disk inode size. */
				584	if (!status &&
Christoph Hellwig	0e51a8e	2016-04-06 08:34:30 +1000	[diff] [blame]	585	ioend->io_type != XFS_IO_UNWRITTEN &&
Dave Chinner	bb18782	2016-04-06 08:11:25 +1000	[diff] [blame]	586	xfs_ioend_is_append(ioend) &&
				587	!ioend->io_append_trans)
Dave Chinner	e10de37	2016-02-15 17:23:12 +1100	[diff] [blame]	588	status = xfs_setfilesize_trans_alloc(ioend);
Dave Chinner	bb18782	2016-04-06 08:11:25 +1000	[diff] [blame]	589
Christoph Hellwig	0e51a8e	2016-04-06 08:34:30 +1000	[diff] [blame]	590	ioend->io_bio->bi_private = ioend;
				591	ioend->io_bio->bi_end_io = xfs_end_bio;
Jens Axboe	7637241	2016-11-01 10:00:38 -0600	[diff] [blame]	592	ioend->io_bio->bi_opf = REQ_OP_WRITE \| wbc_to_write_flags(wbc);
Christoph Hellwig	70fd761	2016-11-01 07:40:10 -0600	[diff] [blame]	593
Dave Chinner	e10de37	2016-02-15 17:23:12 +1100	[diff] [blame]	594	/*
				595	* If we are failing the IO now, just mark the ioend with an
				596	* error and finish it. This will run IO completion immediately
				597	* as there is only one reference to the ioend at this point in
				598	* time.
				599	*/
				600	if (status) {
Christoph Hellwig	4e4cbee	2017-06-03 09:38:06 +0200	[diff] [blame]	601	ioend->io_bio->bi_status = errno_to_blk_status(status);
Christoph Hellwig	0e51a8e	2016-04-06 08:34:30 +1000	[diff] [blame]	602	bio_endio(ioend->io_bio);
Dave Chinner	e10de37	2016-02-15 17:23:12 +1100	[diff] [blame]	603	return status;
				604	}
Christoph Hellwig	f6d6d4f	2006-01-11 15:40:13 +1100	[diff] [blame]	605
Jens Axboe	31d7d58	2017-06-27 09:34:01 -0600	[diff] [blame]	606	ioend->io_bio->bi_write_hint = ioend->io_inode->i_write_hint;
Mike Christie	4e49ea4	2016-06-05 14:31:41 -0500	[diff] [blame]	607	submit_bio(ioend->io_bio);
Dave Chinner	e10de37	2016-02-15 17:23:12 +1100	[diff] [blame]	608	return 0;
Christoph Hellwig	f6d6d4f	2006-01-11 15:40:13 +1100	[diff] [blame]	609	}
				610
Christoph Hellwig	0e51a8e	2016-04-06 08:34:30 +1000	[diff] [blame]	611	static void
				612	xfs_init_bio_from_bh(
				613	struct bio *bio,
				614	struct buffer_head *bh)
				615	{
				616	bio->bi_iter.bi_sector = bh->b_blocknr * (bh->b_size >> 9);
Christoph Hellwig	74d4699	2017-08-23 19:10:32 +0200	[diff] [blame]	617	bio_set_dev(bio, bh->b_bdev);
Christoph Hellwig	0e51a8e	2016-04-06 08:34:30 +1000	[diff] [blame]	618	}
				619
				620	static struct xfs_ioend *
				621	xfs_alloc_ioend(
				622	struct inode *inode,
				623	unsigned int type,
				624	xfs_off_t offset,
				625	struct buffer_head *bh)
				626	{
				627	struct xfs_ioend *ioend;
				628	struct bio *bio;
				629
Kent Overstreet	e292d7b	2018-05-20 18:25:57 -0400	[diff] [blame]	630	bio = bio_alloc_bioset(GFP_NOFS, BIO_MAX_PAGES, &xfs_ioend_bioset);
Christoph Hellwig	0e51a8e	2016-04-06 08:34:30 +1000	[diff] [blame]	631	xfs_init_bio_from_bh(bio, bh);
				632
				633	ioend = container_of(bio, struct xfs_ioend, io_inline_bio);
				634	INIT_LIST_HEAD(&ioend->io_list);
				635	ioend->io_type = type;
				636	ioend->io_inode = inode;
				637	ioend->io_size = 0;
				638	ioend->io_offset = offset;
				639	INIT_WORK(&ioend->io_work, xfs_end_io);
				640	ioend->io_append_trans = NULL;
				641	ioend->io_bio = bio;
				642	return ioend;
				643	}
				644
				645	/*
				646	* Allocate a new bio, and chain the old bio to the new one.
				647	*
				648	* Note that we have to do perform the chaining in this unintuitive order
				649	* so that the bi_private linkage is set up in the right direction for the
				650	* traversal in xfs_destroy_ioend().
				651	*/
				652	static void
				653	xfs_chain_bio(
				654	struct xfs_ioend *ioend,
				655	struct writeback_control *wbc,
				656	struct buffer_head *bh)
				657	{
				658	struct bio *new;
				659
				660	new = bio_alloc(GFP_NOFS, BIO_MAX_PAGES);
				661	xfs_init_bio_from_bh(new, bh);
				662
				663	bio_chain(ioend->io_bio, new);
				664	bio_get(ioend->io_bio); /* for xfs_destroy_ioend */
Jens Axboe	7637241	2016-11-01 10:00:38 -0600	[diff] [blame]	665	ioend->io_bio->bi_opf = REQ_OP_WRITE \| wbc_to_write_flags(wbc);
Jens Axboe	31d7d58	2017-06-27 09:34:01 -0600	[diff] [blame]	666	ioend->io_bio->bi_write_hint = ioend->io_inode->i_write_hint;
Mike Christie	4e49ea4	2016-06-05 14:31:41 -0500	[diff] [blame]	667	submit_bio(ioend->io_bio);
Christoph Hellwig	0e51a8e	2016-04-06 08:34:30 +1000	[diff] [blame]	668	ioend->io_bio = new;
				669	}
				670
Christoph Hellwig	f6d6d4f	2006-01-11 15:40:13 +1100	[diff] [blame]	671	/*
				672	* Test to see if we've been building up a completion structure for
				673	* earlier buffers -- if so, we try to append to this ioend if we
				674	* can, otherwise we finish off any current ioend and start another.
Dave Chinner	e10de37	2016-02-15 17:23:12 +1100	[diff] [blame]	675	* Return the ioend we finished off so that the caller can submit it
				676	* once it has finished processing the dirty page.
Christoph Hellwig	f6d6d4f	2006-01-11 15:40:13 +1100	[diff] [blame]	677	*/
				678	STATIC void
				679	xfs_add_to_ioend(
				680	struct inode *inode,
				681	struct buffer_head *bh,
Christoph Hellwig	7336cea	2006-01-11 20:49:16 +1100	[diff] [blame]	682	xfs_off_t offset,
Dave Chinner	e10de37	2016-02-15 17:23:12 +1100	[diff] [blame]	683	struct xfs_writepage_ctx *wpc,
Dave Chinner	bb18782	2016-04-06 08:11:25 +1000	[diff] [blame]	684	struct writeback_control *wbc,
Dave Chinner	e10de37	2016-02-15 17:23:12 +1100	[diff] [blame]	685	struct list_head *iolist)
Christoph Hellwig	f6d6d4f	2006-01-11 15:40:13 +1100	[diff] [blame]	686	{
Dave Chinner	fbcc025	2016-02-15 17:21:19 +1100	[diff] [blame]	687	if (!wpc->ioend \|\| wpc->io_type != wpc->ioend->io_type \|\|
Darrick J. Wong	0df61da	2016-03-07 09:32:14 +1100	[diff] [blame]	688	bh->b_blocknr != wpc->last_block + 1 \|\|
				689	offset != wpc->ioend->io_offset + wpc->ioend->io_size) {
Dave Chinner	e10de37	2016-02-15 17:23:12 +1100	[diff] [blame]	690	if (wpc->ioend)
				691	list_add(&wpc->ioend->io_list, iolist);
Christoph Hellwig	0e51a8e	2016-04-06 08:34:30 +1000	[diff] [blame]	692	wpc->ioend = xfs_alloc_ioend(inode, wpc->io_type, offset, bh);
Christoph Hellwig	f6d6d4f	2006-01-11 15:40:13 +1100	[diff] [blame]	693	}
				694
Christoph Hellwig	0e51a8e	2016-04-06 08:34:30 +1000	[diff] [blame]	695	/*
				696	* If the buffer doesn't fit into the bio we need to allocate a new
				697	* one. This shouldn't happen more than once for a given buffer.
				698	*/
				699	while (xfs_bio_add_buffer(wpc->ioend->io_bio, bh) != bh->b_size)
				700	xfs_chain_bio(wpc->ioend, wbc, bh);
Dave Chinner	bb18782	2016-04-06 08:11:25 +1000	[diff] [blame]	701
Dave Chinner	fbcc025	2016-02-15 17:21:19 +1100	[diff] [blame]	702	wpc->ioend->io_size += bh->b_size;
				703	wpc->last_block = bh->b_blocknr;
Dave Chinner	e10de37	2016-02-15 17:23:12 +1100	[diff] [blame]	704	xfs_start_buffer_writeback(bh);
Christoph Hellwig	f6d6d4f	2006-01-11 15:40:13 +1100	[diff] [blame]	705	}
				706
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	707	STATIC void
Nathan Scott	87cbc49	2006-03-14 13:26:43 +1100	[diff] [blame]	708	xfs_map_buffer(
Christoph Hellwig	046f168	2010-04-28 12:28:52 +0000	[diff] [blame]	709	struct inode *inode,
Nathan Scott	87cbc49	2006-03-14 13:26:43 +1100	[diff] [blame]	710	struct buffer_head *bh,
Christoph Hellwig	207d041	2010-04-28 12:28:56 +0000	[diff] [blame]	711	struct xfs_bmbt_irec *imap,
Christoph Hellwig	046f168	2010-04-28 12:28:52 +0000	[diff] [blame]	712	xfs_off_t offset)
Nathan Scott	87cbc49	2006-03-14 13:26:43 +1100	[diff] [blame]	713	{
				714	sector_t bn;
Christoph Hellwig	8699bb0	2010-04-28 12:28:54 +0000	[diff] [blame]	715	struct xfs_mount *m = XFS_I(inode)->i_mount;
Christoph Hellwig	207d041	2010-04-28 12:28:56 +0000	[diff] [blame]	716	xfs_off_t iomap_offset = XFS_FSB_TO_B(m, imap->br_startoff);
				717	xfs_daddr_t iomap_bn = xfs_fsb_to_db(XFS_I(inode), imap->br_startblock);
Nathan Scott	87cbc49	2006-03-14 13:26:43 +1100	[diff] [blame]	718
Christoph Hellwig	207d041	2010-04-28 12:28:56 +0000	[diff] [blame]	719	ASSERT(imap->br_startblock != HOLESTARTBLOCK);
				720	ASSERT(imap->br_startblock != DELAYSTARTBLOCK);
Nathan Scott	87cbc49	2006-03-14 13:26:43 +1100	[diff] [blame]	721
Christoph Hellwig	e513182	2010-04-28 12:28:55 +0000	[diff] [blame]	722	bn = (iomap_bn >> (inode->i_blkbits - BBSHIFT)) +
Christoph Hellwig	8699bb0	2010-04-28 12:28:54 +0000	[diff] [blame]	723	((offset - iomap_offset) >> inode->i_blkbits);
Nathan Scott	87cbc49	2006-03-14 13:26:43 +1100	[diff] [blame]	724
Christoph Hellwig	046f168	2010-04-28 12:28:52 +0000	[diff] [blame]	725	ASSERT(bn \|\| XFS_IS_REALTIME_INODE(XFS_I(inode)));
Nathan Scott	87cbc49	2006-03-14 13:26:43 +1100	[diff] [blame]	726
				727	bh->b_blocknr = bn;
				728	set_buffer_mapped(bh);
				729	}
				730
				731	STATIC void
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	732	xfs_map_at_offset(
Christoph Hellwig	046f168	2010-04-28 12:28:52 +0000	[diff] [blame]	733	struct inode *inode,
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	734	struct buffer_head *bh,
Christoph Hellwig	207d041	2010-04-28 12:28:56 +0000	[diff] [blame]	735	struct xfs_bmbt_irec *imap,
Christoph Hellwig	046f168	2010-04-28 12:28:52 +0000	[diff] [blame]	736	xfs_off_t offset)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	737	{
Christoph Hellwig	207d041	2010-04-28 12:28:56 +0000	[diff] [blame]	738	ASSERT(imap->br_startblock != HOLESTARTBLOCK);
				739	ASSERT(imap->br_startblock != DELAYSTARTBLOCK);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	740
Christoph Hellwig	207d041	2010-04-28 12:28:56 +0000	[diff] [blame]	741	xfs_map_buffer(inode, bh, imap, offset);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	742	set_buffer_mapped(bh);
				743	clear_buffer_delay(bh);
Christoph Hellwig	f6d6d4f	2006-01-11 15:40:13 +1100	[diff] [blame]	744	clear_buffer_unwritten(bh);
Dave Chinner	e2f6ad4	2018-07-11 22:26:00 -0700	[diff] [blame]	745
				746	/*
				747	* If this is a realtime file, data may be on a different device.
				748	* to that pointed to from the buffer_head b_bdev currently. We can't
				749	* trust that the bufferhead has a already been mapped correctly, so
				750	* set the bdev now.
				751	*/
				752	bh->b_bdev = xfs_find_bdev_for_inode(inode);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	753	}
				754
Dave Chinner	3ed3a43	2010-03-05 02:00:42 +0000	[diff] [blame]	755	STATIC void
				756	xfs_vm_invalidatepage(
				757	struct page *page,
Lukas Czerner	d47992f	2013-05-21 23:17:23 -0400	[diff] [blame]	758	unsigned int offset,
				759	unsigned int length)
Dave Chinner	3ed3a43	2010-03-05 02:00:42 +0000	[diff] [blame]	760	{
Lukas Czerner	34097df	2013-05-21 23:58:01 -0400	[diff] [blame]	761	trace_xfs_invalidatepage(page->mapping->host, page, offset,
				762	length);
Dave Chinner	793d7db	2017-10-13 09:47:45 -0700	[diff] [blame]	763
				764	/*
				765	* If we are invalidating the entire page, clear the dirty state from it
				766	* so that we can check for attempts to release dirty cached pages in
				767	* xfs_vm_releasepage().
				768	*/
				769	if (offset == 0 && length >= PAGE_SIZE)
				770	cancel_dirty_page(page);
Lukas Czerner	34097df	2013-05-21 23:58:01 -0400	[diff] [blame]	771	block_invalidatepage(page, offset, length);
Dave Chinner	3ed3a43	2010-03-05 02:00:42 +0000	[diff] [blame]	772	}
				773
				774	/*
				775	* If the page has delalloc buffers on it, we need to punch them out before we
				776	* invalidate the page. If we don't, we leave a stale delalloc mapping on the
				777	* inode that can trip a BUG() in xfs_get_blocks() later on if a direct IO read
				778	* is done on that same region - the delalloc extent is returned when none is
				779	* supposed to be there.
				780	*
				781	* We prevent this by truncating away the delalloc regions on the page before
				782	* invalidating it. Because they are delalloc, we can do this without needing a
				783	* transaction. Indeed - if we get ENOSPC errors, we have to be able to do this
				784	* truncation without a transaction as there is no space left for block
				785	* reservation (typically why we see a ENOSPC in writeback).
Dave Chinner	3ed3a43	2010-03-05 02:00:42 +0000	[diff] [blame]	786	*/
				787	STATIC void
				788	xfs_aops_discard_page(
				789	struct page *page)
				790	{
				791	struct inode *inode = page->mapping->host;
				792	struct xfs_inode *ip = XFS_I(inode);
Christoph Hellwig	0362572	2018-07-11 22:25:57 -0700	[diff] [blame]	793	struct xfs_mount *mp = ip->i_mount;
Dave Chinner	3ed3a43	2010-03-05 02:00:42 +0000	[diff] [blame]	794	loff_t offset = page_offset(page);
Christoph Hellwig	0362572	2018-07-11 22:25:57 -0700	[diff] [blame]	795	xfs_fileoff_t start_fsb = XFS_B_TO_FSBT(mp, offset);
				796	int error;
Dave Chinner	3ed3a43	2010-03-05 02:00:42 +0000	[diff] [blame]	797
Christoph Hellwig	0362572	2018-07-11 22:25:57 -0700	[diff] [blame]	798	if (XFS_FORCED_SHUTDOWN(mp))
Dave Chinner	3ed3a43	2010-03-05 02:00:42 +0000	[diff] [blame]	799	goto out_invalidate;
				800
Christoph Hellwig	0362572	2018-07-11 22:25:57 -0700	[diff] [blame]	801	xfs_alert(mp,
Darrick J. Wong	c969004	2018-01-09 12:02:55 -0800	[diff] [blame]	802	"page discard on page "PTR_FMT", inode 0x%llx, offset %llu.",
Dave Chinner	3ed3a43	2010-03-05 02:00:42 +0000	[diff] [blame]	803	page, ip->i_ino, offset);
				804
Christoph Hellwig	0362572	2018-07-11 22:25:57 -0700	[diff] [blame]	805	error = xfs_bmap_punch_delalloc_range(ip, start_fsb,
				806	PAGE_SIZE / i_blocksize(inode));
Christoph Hellwig	0362572	2018-07-11 22:25:57 -0700	[diff] [blame]	807	if (error && !XFS_FORCED_SHUTDOWN(mp))
				808	xfs_alert(mp, "page discard unable to remove delalloc mapping.");
Dave Chinner	3ed3a43	2010-03-05 02:00:42 +0000	[diff] [blame]	809	out_invalidate:
Kirill A. Shutemov	09cbfea	2016-04-01 15:29:47 +0300	[diff] [blame]	810	xfs_vm_invalidatepage(page, 0, PAGE_SIZE);
Dave Chinner	3ed3a43	2010-03-05 02:00:42 +0000	[diff] [blame]	811	}
				812
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	813	/*
Dave Chinner	e10de37	2016-02-15 17:23:12 +1100	[diff] [blame]	814	* We implement an immediate ioend submission policy here to avoid needing to
				815	* chain multiple ioends and hence nest mempool allocations which can violate
				816	* forward progress guarantees we need to provide. The current ioend we are
				817	* adding buffers to is cached on the writepage context, and if the new buffer
				818	* does not append to the cached ioend it will create a new ioend and cache that
				819	* instead.
				820	*
				821	* If a new ioend is created and cached, the old ioend is returned and queued
				822	* locally for submission once the entire page is processed or an error has been
				823	* detected. While ioends are submitted immediately after they are completed,
				824	* batching optimisations are provided by higher level block plugging.
				825	*
				826	* At the end of a writeback pass, there will be a cached ioend remaining on the
				827	* writepage context that the caller will need to submit.
				828	*/
Dave Chinner	bfce7d2	2016-02-15 17:21:37 +1100	[diff] [blame]	829	static int
				830	xfs_writepage_map(
				831	struct xfs_writepage_ctx *wpc,
Dave Chinner	e10de37	2016-02-15 17:23:12 +1100	[diff] [blame]	832	struct writeback_control *wbc,
Dave Chinner	bfce7d2	2016-02-15 17:21:37 +1100	[diff] [blame]	833	struct inode *inode,
				834	struct page *page,
Darrick J. Wong	2d5f4b5	2017-11-27 09:50:22 -0800	[diff] [blame]	835	uint64_t end_offset)
Dave Chinner	bfce7d2	2016-02-15 17:21:37 +1100	[diff] [blame]	836	{
Dave Chinner	e10de37	2016-02-15 17:23:12 +1100	[diff] [blame]	837	LIST_HEAD(submit_list);
				838	struct xfs_ioend ioend, next;
Dave Chinner	e2f6ad4	2018-07-11 22:26:00 -0700	[diff] [blame]	839	struct buffer_head *bh;
Fabian Frederick	9340747	2017-02-27 14:28:32 -0800	[diff] [blame]	840	ssize_t len = i_blocksize(inode);
Christoph Hellwig	6a4c950	2018-07-11 22:26:00 -0700	[diff] [blame]	841	uint64_t file_offset; /* file offset of page */
Dave Chinner	e2f6ad4	2018-07-11 22:26:00 -0700	[diff] [blame]	842	unsigned poffset; /* offset into page */
Dave Chinner	bfce7d2	2016-02-15 17:21:37 +1100	[diff] [blame]	843	int error = 0;
Dave Chinner	bfce7d2	2016-02-15 17:21:37 +1100	[diff] [blame]	844	int count = 0;
				845
Dave Chinner	e2f6ad4	2018-07-11 22:26:00 -0700	[diff] [blame]	846	/*
				847	* Walk the blocks on the page, and if we run off the end of the current
				848	* map or find the current map invalid, grab a new one. We only use
				849	* bufferheads here to check per-block state - they no longer control
				850	* the iteration through the page. This allows us to replace the
				851	* bufferhead with some other state tracking mechanism in future.
				852	*/
Christoph Hellwig	6a4c950	2018-07-11 22:26:00 -0700	[diff] [blame]	853	file_offset = page_offset(page);
Dave Chinner	e2f6ad4	2018-07-11 22:26:00 -0700	[diff] [blame]	854	bh = page_buffers(page);
				855	for (poffset = 0;
				856	poffset < PAGE_SIZE;
				857	poffset += len, file_offset += len, bh = bh->b_this_page) {
				858	/* past the range we are writing, so nothing more to write. */
Christoph Hellwig	6a4c950	2018-07-11 22:26:00 -0700	[diff] [blame]	859	if (file_offset >= end_offset)
Dave Chinner	bfce7d2	2016-02-15 17:21:37 +1100	[diff] [blame]	860	break;
Dave Chinner	bfce7d2	2016-02-15 17:21:37 +1100	[diff] [blame]	861
Dave Chinner	e2f6ad4	2018-07-11 22:26:00 -0700	[diff] [blame]	862	if (!buffer_uptodate(bh)) {
Dave Chinner	bfce7d2	2016-02-15 17:21:37 +1100	[diff] [blame]	863	if (PageUptodate(page))
				864	ASSERT(buffer_mapped(bh));
Dave Chinner	bfce7d2	2016-02-15 17:21:37 +1100	[diff] [blame]	865	continue;
				866	}
				867
				868	if (wpc->imap_valid)
				869	wpc->imap_valid = xfs_imap_valid(inode, &wpc->imap,
Christoph Hellwig	6a4c950	2018-07-11 22:26:00 -0700	[diff] [blame]	870	file_offset);
Christoph Hellwig	5c665e5	2018-07-11 22:25:59 -0700	[diff] [blame]	871
				872	/*
				873	* COW fork blocks can overlap data fork blocks even if the
				874	* blocks aren't shared. COW I/O always takes precedent, so we
				875	* must always check for overlap on reflink inodes unless the
				876	* mapping is already a COW one.
				877	*/
				878	if (!wpc->imap_valid \|\|
				879	(xfs_is_reflink_inode(XFS_I(inode)) &&
				880	wpc->io_type != XFS_IO_COW)) {
Christoph Hellwig	6a4c950	2018-07-11 22:26:00 -0700	[diff] [blame]	881	error = xfs_map_blocks(wpc, inode, file_offset);
Dave Chinner	bfce7d2	2016-02-15 17:21:37 +1100	[diff] [blame]	882	if (error)
Dave Chinner	e10de37	2016-02-15 17:23:12 +1100	[diff] [blame]	883	goto out;
Dave Chinner	bfce7d2	2016-02-15 17:21:37 +1100	[diff] [blame]	884	wpc->imap_valid = xfs_imap_valid(inode, &wpc->imap,
Christoph Hellwig	6a4c950	2018-07-11 22:26:00 -0700	[diff] [blame]	885	file_offset);
Dave Chinner	bfce7d2	2016-02-15 17:21:37 +1100	[diff] [blame]	886	}
Dave Chinner	bfce7d2	2016-02-15 17:21:37 +1100	[diff] [blame]	887
Christoph Hellwig	5c665e5	2018-07-11 22:25:59 -0700	[diff] [blame]	888	if (!wpc->imap_valid \|\| wpc->io_type == XFS_IO_HOLE)
				889	continue;
				890
				891	lock_buffer(bh);
Dave Chinner	e2f6ad4	2018-07-11 22:26:00 -0700	[diff] [blame]	892	xfs_map_at_offset(inode, bh, &wpc->imap, file_offset);
Christoph Hellwig	6a4c950	2018-07-11 22:26:00 -0700	[diff] [blame]	893	xfs_add_to_ioend(inode, bh, file_offset, wpc, wbc, &submit_list);
Christoph Hellwig	5c665e5	2018-07-11 22:25:59 -0700	[diff] [blame]	894	count++;
Dave Chinner	e2f6ad4	2018-07-11 22:26:00 -0700	[diff] [blame]	895	}
Dave Chinner	bfce7d2	2016-02-15 17:21:37 +1100	[diff] [blame]	896
Dave Chinner	e10de37	2016-02-15 17:23:12 +1100	[diff] [blame]	897	ASSERT(wpc->ioend \|\| list_empty(&submit_list));
Dave Chinner	bfce7d2	2016-02-15 17:21:37 +1100	[diff] [blame]	898
Dave Chinner	e10de37	2016-02-15 17:23:12 +1100	[diff] [blame]	899	out:
Dave Chinner	bfce7d2	2016-02-15 17:21:37 +1100	[diff] [blame]	900	/*
Dave Chinner	e10de37	2016-02-15 17:23:12 +1100	[diff] [blame]	901	* On error, we have to fail the ioend here because we have locked
				902	* buffers in the ioend. If we don't do this, we'll deadlock
				903	* invalidating the page as that tries to lock the buffers on the page.
				904	* Also, because we may have set pages under writeback, we have to make
				905	* sure we run IO completion to mark the error state of the IO
				906	* appropriately, so we can't cancel the ioend directly here. That means
				907	* we have to mark this page as under writeback if we included any
				908	* buffers from it in the ioend chain so that completion treats it
				909	* correctly.
Dave Chinner	bfce7d2	2016-02-15 17:21:37 +1100	[diff] [blame]	910	*
Dave Chinner	e10de37	2016-02-15 17:23:12 +1100	[diff] [blame]	911	* If we didn't include the page in the ioend, the on error we can
				912	* simply discard and unlock it as there are no other users of the page
				913	* or it's buffers right now. The caller will still need to trigger
				914	* submission of outstanding ioends on the writepage context so they are
				915	* treated correctly on error.
Dave Chinner	bfce7d2	2016-02-15 17:21:37 +1100	[diff] [blame]	916	*/
Dave Chinner	e10de37	2016-02-15 17:23:12 +1100	[diff] [blame]	917	if (count) {
				918	xfs_start_page_writeback(page, !error);
				919
				920	/*
				921	* Preserve the original error if there was one, otherwise catch
				922	* submission errors here and propagate into subsequent ioend
				923	* submissions.
				924	*/
				925	list_for_each_entry_safe(ioend, next, &submit_list, io_list) {
				926	int error2;
				927
				928	list_del_init(&ioend->io_list);
				929	error2 = xfs_submit_ioend(wbc, ioend, error);
				930	if (error2 && !error)
				931	error = error2;
				932	}
				933	} else if (error) {
Dave Chinner	bfce7d2	2016-02-15 17:21:37 +1100	[diff] [blame]	934	xfs_aops_discard_page(page);
				935	ClearPageUptodate(page);
				936	unlock_page(page);
Dave Chinner	e10de37	2016-02-15 17:23:12 +1100	[diff] [blame]	937	} else {
				938	/*
				939	* We can end up here with no error and nothing to write if we
				940	* race with a partial page truncate on a sub-page block sized
				941	* filesystem. In that case we need to mark the page clean.
				942	*/
				943	xfs_start_page_writeback(page, 1);
				944	end_page_writeback(page);
Dave Chinner	bfce7d2	2016-02-15 17:21:37 +1100	[diff] [blame]	945	}
Dave Chinner	e10de37	2016-02-15 17:23:12 +1100	[diff] [blame]	946
Dave Chinner	bfce7d2	2016-02-15 17:21:37 +1100	[diff] [blame]	947	mapping_set_error(page->mapping, error);
				948	return error;
				949	}
				950
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	951	/*
Christoph Hellwig	89f3b363	2010-06-24 09:45:48 +1000	[diff] [blame]	952	* Write out a dirty page.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	953	*
Christoph Hellwig	89f3b363	2010-06-24 09:45:48 +1000	[diff] [blame]	954	* For delalloc space on the page we need to allocate space and flush it.
				955	* For unwritten space on the page we need to start the conversion to
				956	* regular allocated space.
Christoph Hellwig	89f3b363	2010-06-24 09:45:48 +1000	[diff] [blame]	957	* For any other dirty buffer heads on the page we should flush them.
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	958	*/
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	959	STATIC int
Dave Chinner	fbcc025	2016-02-15 17:21:19 +1100	[diff] [blame]	960	xfs_do_writepage(
Christoph Hellwig	89f3b363	2010-06-24 09:45:48 +1000	[diff] [blame]	961	struct page *page,
Dave Chinner	fbcc025	2016-02-15 17:21:19 +1100	[diff] [blame]	962	struct writeback_control *wbc,
				963	void *data)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	964	{
Dave Chinner	fbcc025	2016-02-15 17:21:19 +1100	[diff] [blame]	965	struct xfs_writepage_ctx *wpc = data;
Christoph Hellwig	89f3b363	2010-06-24 09:45:48 +1000	[diff] [blame]	966	struct inode *inode = page->mapping->host;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	967	loff_t offset;
Darrick J. Wong	c8ce540	2017-06-16 11:00:05 -0700	[diff] [blame]	968	uint64_t end_offset;
Dave Chinner	ad68972	2016-02-15 17:21:31 +1100	[diff] [blame]	969	pgoff_t end_index;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	970
Lukas Czerner	34097df	2013-05-21 23:58:01 -0400	[diff] [blame]	971	trace_xfs_writepage(inode, page, 0, 0);
Christoph Hellwig	89f3b363	2010-06-24 09:45:48 +1000	[diff] [blame]	972
Christoph Hellwig	20cb52e	2010-06-24 09:46:01 +1000	[diff] [blame]	973	ASSERT(page_has_buffers(page));
				974
Christoph Hellwig	89f3b363	2010-06-24 09:45:48 +1000	[diff] [blame]	975	/*
				976	* Refuse to write the page out if we are called from reclaim context.
				977	*
Christoph Hellwig	d4f7a5c	2010-06-28 10:34:44 -0400	[diff] [blame]	978	* This avoids stack overflows when called from deeply used stacks in
				979	* random callers for direct reclaim or memcg reclaim. We explicitly
				980	* allow reclaim from kswapd as the stack usage there is relatively low.
Christoph Hellwig	89f3b363	2010-06-24 09:45:48 +1000	[diff] [blame]	981	*
Mel Gorman	94054fa	2011-10-31 17:07:45 -0700	[diff] [blame]	982	* This should never happen except in the case of a VM regression so
				983	* warn about it.
Christoph Hellwig	89f3b363	2010-06-24 09:45:48 +1000	[diff] [blame]	984	*/
Mel Gorman	94054fa	2011-10-31 17:07:45 -0700	[diff] [blame]	985	if (WARN_ON_ONCE((current->flags & (PF_MEMALLOC\|PF_KSWAPD)) ==
				986	PF_MEMALLOC))
Christoph Hellwig	b5420f2	2010-08-24 11:47:51 +1000	[diff] [blame]	987	goto redirty;
Christoph Hellwig	89f3b363	2010-06-24 09:45:48 +1000	[diff] [blame]	988
				989	/*
Christoph Hellwig	680a647	2011-07-08 14:34:05 +0200	[diff] [blame]	990	* Given that we do not allow direct reclaim to call us, we should
				991	* never be called while in a filesystem transaction.
Christoph Hellwig	89f3b363	2010-06-24 09:45:48 +1000	[diff] [blame]	992	*/
Michal Hocko	9070733	2017-05-03 14:53:12 -0700	[diff] [blame]	993	if (WARN_ON_ONCE(current->flags & PF_MEMALLOC_NOFS))
Christoph Hellwig	b5420f2	2010-08-24 11:47:51 +1000	[diff] [blame]	994	goto redirty;
Christoph Hellwig	89f3b363	2010-06-24 09:45:48 +1000	[diff] [blame]	995
Jie Liu	8695d27	2014-05-20 08:24:26 +1000	[diff] [blame]	996	/*
Dave Chinner	ad68972	2016-02-15 17:21:31 +1100	[diff] [blame]	997	* Is this page beyond the end of the file?
				998	*
Jie Liu	8695d27	2014-05-20 08:24:26 +1000	[diff] [blame]	999	* The page index is less than the end_index, adjust the end_offset
				1000	* to the highest offset that this page should represent.
				1001	* -----------------------------------------------------
				1002	* \| file mapping \| <EOF> \|
				1003	* -----------------------------------------------------
				1004	* \| Page ... \| Page N-2 \| Page N-1 \| Page N \| \|
				1005	* ^--------------------------------^----------\|--------
				1006	* \| desired writeback range \| see else \|
				1007	* ---------------------------------^------------------\|
				1008	*/
Dave Chinner	ad68972	2016-02-15 17:21:31 +1100	[diff] [blame]	1009	offset = i_size_read(inode);
Kirill A. Shutemov	09cbfea	2016-04-01 15:29:47 +0300	[diff] [blame]	1010	end_index = offset >> PAGE_SHIFT;
Jie Liu	8695d27	2014-05-20 08:24:26 +1000	[diff] [blame]	1011	if (page->index < end_index)
Kirill A. Shutemov	09cbfea	2016-04-01 15:29:47 +0300	[diff] [blame]	1012	end_offset = (xfs_off_t)(page->index + 1) << PAGE_SHIFT;
Jie Liu	8695d27	2014-05-20 08:24:26 +1000	[diff] [blame]	1013	else {
				1014	/*
				1015	* Check whether the page to write out is beyond or straddles
				1016	* i_size or not.
				1017	* -------------------------------------------------------
				1018	* \| file mapping \| <EOF> \|
				1019	* -------------------------------------------------------
				1020	* \| Page ... \| Page N-2 \| Page N-1 \| Page N \| Beyond \|
				1021	* ^--------------------------------^-----------\|---------
				1022	* \| \| Straddles \|
				1023	* ---------------------------------^-----------\|--------\|
				1024	*/
Kirill A. Shutemov	09cbfea	2016-04-01 15:29:47 +0300	[diff] [blame]	1025	unsigned offset_into_page = offset & (PAGE_SIZE - 1);
Christoph Hellwig	6b7a03f	2012-07-03 12:20:00 -0400	[diff] [blame]	1026
				1027	/*
Jan Kara	ff9a28f	2013-03-14 14:30:54 +0100	[diff] [blame]	1028	* Skip the page if it is fully outside i_size, e.g. due to a
				1029	* truncate operation that is in progress. We must redirty the
				1030	* page so that reclaim stops reclaiming it. Otherwise
				1031	* xfs_vm_releasepage() is called on it and gets confused.
Jie Liu	8695d27	2014-05-20 08:24:26 +1000	[diff] [blame]	1032	*
				1033	* Note that the end_index is unsigned long, it would overflow
				1034	* if the given offset is greater than 16TB on 32-bit system
				1035	* and if we do check the page is fully outside i_size or not
				1036	* via "if (page->index >= end_index + 1)" as "end_index + 1"
				1037	* will be evaluated to 0. Hence this page will be redirtied
				1038	* and be written out repeatedly which would result in an
				1039	* infinite loop, the user program that perform this operation
				1040	* will hang. Instead, we can verify this situation by checking
				1041	* if the page to write is totally beyond the i_size or if it's
				1042	* offset is just equal to the EOF.
Christoph Hellwig	6b7a03f	2012-07-03 12:20:00 -0400	[diff] [blame]	1043	*/
Jie Liu	8695d27	2014-05-20 08:24:26 +1000	[diff] [blame]	1044	if (page->index > end_index \|\|
				1045	(page->index == end_index && offset_into_page == 0))
Jan Kara	ff9a28f	2013-03-14 14:30:54 +0100	[diff] [blame]	1046	goto redirty;
Christoph Hellwig	6b7a03f	2012-07-03 12:20:00 -0400	[diff] [blame]	1047
				1048	/*
				1049	* The page straddles i_size. It must be zeroed out on each
				1050	* and every writepage invocation because it may be mmapped.
				1051	* "A file is mapped in multiples of the page size. For a file
Jie Liu	8695d27	2014-05-20 08:24:26 +1000	[diff] [blame]	1052	* that is not a multiple of the page size, the remaining
Christoph Hellwig	6b7a03f	2012-07-03 12:20:00 -0400	[diff] [blame]	1053	* memory is zeroed when mapped, and writes to that region are
				1054	* not written out to the file."
				1055	*/
Kirill A. Shutemov	09cbfea	2016-04-01 15:29:47 +0300	[diff] [blame]	1056	zero_user_segment(page, offset_into_page, PAGE_SIZE);
Jie Liu	8695d27	2014-05-20 08:24:26 +1000	[diff] [blame]	1057
				1058	/* Adjust the end_offset to the end of file */
				1059	end_offset = offset;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1060	}
				1061
Darrick J. Wong	2d5f4b5	2017-11-27 09:50:22 -0800	[diff] [blame]	1062	return xfs_writepage_map(wpc, wbc, inode, page, end_offset);
Nathan Scott	f51623b	2006-03-14 13:26:27 +1100	[diff] [blame]	1063
Christoph Hellwig	b5420f2	2010-08-24 11:47:51 +1000	[diff] [blame]	1064	redirty:
Nathan Scott	f51623b	2006-03-14 13:26:27 +1100	[diff] [blame]	1065	redirty_page_for_writepage(wbc, page);
				1066	unlock_page(page);
				1067	return 0;
Nathan Scott	f51623b	2006-03-14 13:26:27 +1100	[diff] [blame]	1068	}
				1069
Nathan Scott	7d4fb40	2006-06-09 15:27:16 +1000	[diff] [blame]	1070	STATIC int
Dave Chinner	fbcc025	2016-02-15 17:21:19 +1100	[diff] [blame]	1071	xfs_vm_writepage(
				1072	struct page *page,
				1073	struct writeback_control *wbc)
				1074	{
				1075	struct xfs_writepage_ctx wpc = {
				1076	.io_type = XFS_IO_INVALID,
				1077	};
				1078	int ret;
				1079
				1080	ret = xfs_do_writepage(page, wbc, &wpc);
Dave Chinner	e10de37	2016-02-15 17:23:12 +1100	[diff] [blame]	1081	if (wpc.ioend)
				1082	ret = xfs_submit_ioend(wbc, wpc.ioend, ret);
				1083	return ret;
Dave Chinner	fbcc025	2016-02-15 17:21:19 +1100	[diff] [blame]	1084	}
				1085
				1086	STATIC int
Nathan Scott	7d4fb40	2006-06-09 15:27:16 +1000	[diff] [blame]	1087	xfs_vm_writepages(
				1088	struct address_space *mapping,
				1089	struct writeback_control *wbc)
				1090	{
Dave Chinner	fbcc025	2016-02-15 17:21:19 +1100	[diff] [blame]	1091	struct xfs_writepage_ctx wpc = {
				1092	.io_type = XFS_IO_INVALID,
				1093	};
				1094	int ret;
				1095
Christoph Hellwig	b3aea4e	2007-08-29 11:44:37 +1000	[diff] [blame]	1096	xfs_iflags_clear(XFS_I(mapping->host), XFS_ITRUNCATED);
Dave Chinner	fbcc025	2016-02-15 17:21:19 +1100	[diff] [blame]	1097	ret = write_cache_pages(mapping, wbc, xfs_do_writepage, &wpc);
Dave Chinner	e10de37	2016-02-15 17:23:12 +1100	[diff] [blame]	1098	if (wpc.ioend)
				1099	ret = xfs_submit_ioend(wbc, wpc.ioend, ret);
				1100	return ret;
Nathan Scott	7d4fb40	2006-06-09 15:27:16 +1000	[diff] [blame]	1101	}
				1102
Dan Williams	6e2608d	2018-03-07 15:26:44 -0800	[diff] [blame]	1103	STATIC int
				1104	xfs_dax_writepages(
				1105	struct address_space *mapping,
				1106	struct writeback_control *wbc)
				1107	{
				1108	xfs_iflags_clear(XFS_I(mapping->host), XFS_ITRUNCATED);
				1109	return dax_writeback_mapping_range(mapping,
				1110	xfs_find_bdev_for_inode(mapping->host), wbc);
				1111	}
				1112
Nathan Scott	f51623b	2006-03-14 13:26:27 +1100	[diff] [blame]	1113	/*
				1114	* Called to move a page into cleanable state - and from there
Christoph Hellwig	89f3b363	2010-06-24 09:45:48 +1000	[diff] [blame]	1115	* to be released. The page should already be clean. We always
Nathan Scott	f51623b	2006-03-14 13:26:27 +1100	[diff] [blame]	1116	* have buffer heads in this call.
				1117	*
Christoph Hellwig	89f3b363	2010-06-24 09:45:48 +1000	[diff] [blame]	1118	* Returns 1 if the page is ok to release, 0 otherwise.
Nathan Scott	f51623b	2006-03-14 13:26:27 +1100	[diff] [blame]	1119	*/
				1120	STATIC int
Nathan Scott	238f4c5	2006-03-17 17:26:25 +1100	[diff] [blame]	1121	xfs_vm_releasepage(
Nathan Scott	f51623b	2006-03-14 13:26:27 +1100	[diff] [blame]	1122	struct page *page,
				1123	gfp_t gfp_mask)
				1124	{
Christoph Hellwig	20cb52e	2010-06-24 09:46:01 +1000	[diff] [blame]	1125	int delalloc, unwritten;
Nathan Scott	f51623b	2006-03-14 13:26:27 +1100	[diff] [blame]	1126
Lukas Czerner	34097df	2013-05-21 23:58:01 -0400	[diff] [blame]	1127	trace_xfs_releasepage(page->mapping->host, page, 0, 0);
Nathan Scott	238f4c5	2006-03-17 17:26:25 +1100	[diff] [blame]	1128
Brian Foster	99579cc	2016-07-22 09:50:38 +1000	[diff] [blame]	1129	/*
				1130	* mm accommodates an old ext3 case where clean pages might not have had
				1131	* the dirty bit cleared. Thus, it can send actual dirty pages to
				1132	* ->releasepage() via shrink_active_list(). Conversely,
Dave Chinner	793d7db	2017-10-13 09:47:45 -0700	[diff] [blame]	1133	* block_invalidatepage() can send pages that are still marked dirty but
				1134	* otherwise have invalidated buffers.
Brian Foster	99579cc	2016-07-22 09:50:38 +1000	[diff] [blame]	1135	*
Jan Kara	0a417b8	2017-01-11 10:20:04 -0800	[diff] [blame]	1136	* We want to release the latter to avoid unnecessary buildup of the
Dave Chinner	793d7db	2017-10-13 09:47:45 -0700	[diff] [blame]	1137	* LRU, so xfs_vm_invalidatepage() clears the page dirty flag on pages
				1138	* that are entirely invalidated and need to be released. Hence the
				1139	* only time we should get dirty pages here is through
				1140	* shrink_active_list() and so we can simply skip those now.
				1141	*
				1142	* warn if we've left any lingering delalloc/unwritten buffers on clean
				1143	* or invalidated pages we are about to release.
Brian Foster	99579cc	2016-07-22 09:50:38 +1000	[diff] [blame]	1144	*/
Dave Chinner	793d7db	2017-10-13 09:47:45 -0700	[diff] [blame]	1145	if (PageDirty(page))
				1146	return 0;
				1147
Christoph Hellwig	20cb52e	2010-06-24 09:46:01 +1000	[diff] [blame]	1148	xfs_count_page_state(page, &delalloc, &unwritten);
Nathan Scott	f51623b	2006-03-14 13:26:27 +1100	[diff] [blame]	1149
Dave Chinner	793d7db	2017-10-13 09:47:45 -0700	[diff] [blame]	1150	if (WARN_ON_ONCE(delalloc))
Christoph Hellwig	89f3b363	2010-06-24 09:45:48 +1000	[diff] [blame]	1151	return 0;
Dave Chinner	793d7db	2017-10-13 09:47:45 -0700	[diff] [blame]	1152	if (WARN_ON_ONCE(unwritten))
Nathan Scott	f51623b	2006-03-14 13:26:27 +1100	[diff] [blame]	1153	return 0;
				1154
Nathan Scott	f51623b	2006-03-14 13:26:27 +1100	[diff] [blame]	1155	return try_to_free_buffers(page);
				1156	}
				1157
Dave Chinner	a719370	2015-04-16 21:57:48 +1000	[diff] [blame]	1158	/*
Dave Chinner	1fdca9c	2015-04-16 21:58:21 +1000	[diff] [blame]	1159	* If this is O_DIRECT or the mpage code calling tell them how large the mapping
				1160	* is, so that we can avoid repeated get_blocks calls.
				1161	*
				1162	* If the mapping spans EOF, then we have to break the mapping up as the mapping
				1163	* for blocks beyond EOF must be marked new so that sub block regions can be
				1164	* correctly zeroed. We can't do this for mappings within EOF unless the mapping
				1165	* was just allocated or is unwritten, otherwise the callers would overwrite
				1166	* existing data with zeros. Hence we have to split the mapping into a range up
				1167	* to and including EOF, and a second mapping for beyond EOF.
				1168	*/
				1169	static void
				1170	xfs_map_trim_size(
				1171	struct inode *inode,
				1172	sector_t iblock,
				1173	struct buffer_head *bh_result,
				1174	struct xfs_bmbt_irec *imap,
				1175	xfs_off_t offset,
				1176	ssize_t size)
				1177	{
				1178	xfs_off_t mapping_size;
				1179
				1180	mapping_size = imap->br_startoff + imap->br_blockcount - iblock;
				1181	mapping_size <<= inode->i_blkbits;
				1182
				1183	ASSERT(mapping_size > 0);
				1184	if (mapping_size > size)
				1185	mapping_size = size;
				1186	if (offset < i_size_read(inode) &&
Darrick J. Wong	22a6c83	2017-11-27 09:50:17 -0800	[diff] [blame]	1187	(xfs_ufsize_t)offset + mapping_size >= i_size_read(inode)) {
Dave Chinner	1fdca9c	2015-04-16 21:58:21 +1000	[diff] [blame]	1188	/* limit mapping to block that spans EOF */
				1189	mapping_size = roundup_64(i_size_read(inode) - offset,
Fabian Frederick	9340747	2017-02-27 14:28:32 -0800	[diff] [blame]	1190	i_blocksize(inode));
Dave Chinner	1fdca9c	2015-04-16 21:58:21 +1000	[diff] [blame]	1191	}
				1192	if (mapping_size > LONG_MAX)
				1193	mapping_size = LONG_MAX;
				1194
				1195	bh_result->b_size = mapping_size;
				1196	}
				1197
Darrick J. Wong	0613f16	2016-10-03 09:11:37 -0700	[diff] [blame]	1198	static int
Christoph Hellwig	acdda3a	2016-11-30 14:37:15 +1100	[diff] [blame]	1199	xfs_get_blocks(
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1200	struct inode *inode,
				1201	sector_t iblock,
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1202	struct buffer_head *bh_result,
Christoph Hellwig	acdda3a	2016-11-30 14:37:15 +1100	[diff] [blame]	1203	int create)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1204	{
Christoph Hellwig	a206c81	2010-12-10 08:42:20 +0000	[diff] [blame]	1205	struct xfs_inode *ip = XFS_I(inode);
				1206	struct xfs_mount *mp = ip->i_mount;
				1207	xfs_fileoff_t offset_fsb, end_fsb;
				1208	int error = 0;
				1209	int lockmode = 0;
Christoph Hellwig	207d041	2010-04-28 12:28:56 +0000	[diff] [blame]	1210	struct xfs_bmbt_irec imap;
Christoph Hellwig	a206c81	2010-12-10 08:42:20 +0000	[diff] [blame]	1211	int nimaps = 1;
Nathan Scott	fdc7ed7	2005-11-02 15:13:13 +1100	[diff] [blame]	1212	xfs_off_t offset;
				1213	ssize_t size;
Christoph Hellwig	a206c81	2010-12-10 08:42:20 +0000	[diff] [blame]	1214
Christoph Hellwig	acdda3a	2016-11-30 14:37:15 +1100	[diff] [blame]	1215	BUG_ON(create);
Christoph Hellwig	6e8a27a	2016-06-21 09:53:45 +1000	[diff] [blame]	1216
Christoph Hellwig	a206c81	2010-12-10 08:42:20 +0000	[diff] [blame]	1217	if (XFS_FORCED_SHUTDOWN(mp))
Eric Sandeen	b474c7a	2014-06-22 15:04:54 +1000	[diff] [blame]	1218	return -EIO;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1219
Nathan Scott	fdc7ed7	2005-11-02 15:13:13 +1100	[diff] [blame]	1220	offset = (xfs_off_t)iblock << inode->i_blkbits;
Fabian Frederick	9340747	2017-02-27 14:28:32 -0800	[diff] [blame]	1221	ASSERT(bh_result->b_size >= i_blocksize(inode));
Nathan Scott	c253666	2006-03-29 10:44:40 +1000	[diff] [blame]	1222	size = bh_result->b_size;
Lachlan McIlroy	364f358	2008-09-17 16:50:14 +1000	[diff] [blame]	1223
Christoph Hellwig	acdda3a	2016-11-30 14:37:15 +1100	[diff] [blame]	1224	if (offset >= i_size_read(inode))
Lachlan McIlroy	364f358	2008-09-17 16:50:14 +1000	[diff] [blame]	1225	return 0;
				1226
Dave Chinner	507630b	2012-03-27 10:34:50 -0400	[diff] [blame]	1227	/*
				1228	* Direct I/O is usually done on preallocated files, so try getting
Christoph Hellwig	6e8a27a	2016-06-21 09:53:45 +1000	[diff] [blame]	1229	* a block mapping without an exclusive lock first.
Dave Chinner	507630b	2012-03-27 10:34:50 -0400	[diff] [blame]	1230	*/
Christoph Hellwig	6e8a27a	2016-06-21 09:53:45 +1000	[diff] [blame]	1231	lockmode = xfs_ilock_data_map_shared(ip);
Christoph Hellwig	f2bde9b	2010-06-24 11:44:35 +1000	[diff] [blame]	1232
Dave Chinner	d2c2819	2012-06-08 15:44:53 +1000	[diff] [blame]	1233	ASSERT(offset <= mp->m_super->s_maxbytes);
Darrick J. Wong	b4d8ad7f	2017-12-22 13:14:34 -0800	[diff] [blame]	1234	if (offset > mp->m_super->s_maxbytes - size)
Dave Chinner	d2c2819	2012-06-08 15:44:53 +1000	[diff] [blame]	1235	size = mp->m_super->s_maxbytes - offset;
Christoph Hellwig	a206c81	2010-12-10 08:42:20 +0000	[diff] [blame]	1236	end_fsb = XFS_B_TO_FSB(mp, (xfs_ufsize_t)offset + size);
				1237	offset_fsb = XFS_B_TO_FSBT(mp, offset);
				1238
Christoph Hellwig	7d9df3c	2018-03-13 23:15:31 -0700	[diff] [blame]	1239	error = xfs_bmapi_read(ip, offset_fsb, end_fsb - offset_fsb, &imap,
				1240	&nimaps, 0);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1241	if (error)
Christoph Hellwig	a206c81	2010-12-10 08:42:20 +0000	[diff] [blame]	1242	goto out_unlock;
Christoph Hellwig	1d4352d	2018-03-13 23:15:32 -0700	[diff] [blame]	1243	if (!nimaps) {
Christoph Hellwig	a206c81	2010-12-10 08:42:20 +0000	[diff] [blame]	1244	trace_xfs_get_blocks_notfound(ip, offset, size);
				1245	goto out_unlock;
				1246	}
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1247
Christoph Hellwig	1d4352d	2018-03-13 23:15:32 -0700	[diff] [blame]	1248	trace_xfs_get_blocks_found(ip, offset, size,
				1249	imap.br_state == XFS_EXT_UNWRITTEN ?
				1250	XFS_IO_UNWRITTEN : XFS_IO_OVERWRITE, &imap);
				1251	xfs_iunlock(ip, lockmode);
				1252
Dave Chinner	1fdca9c	2015-04-16 21:58:21 +1000	[diff] [blame]	1253	/* trim mapping down to size requested */
Christoph Hellwig	6e8a27a	2016-06-21 09:53:45 +1000	[diff] [blame]	1254	xfs_map_trim_size(inode, iblock, bh_result, &imap, offset, size);
Dave Chinner	1fdca9c	2015-04-16 21:58:21 +1000	[diff] [blame]	1255
Dave Chinner	a719370	2015-04-16 21:57:48 +1000	[diff] [blame]	1256	/*
				1257	* For unwritten extents do not report a disk address in the buffered
				1258	* read case (treat as if we're reading into a hole).
				1259	*/
Christoph Hellwig	9c4f29d	2017-03-28 14:53:35 -0700	[diff] [blame]	1260	if (xfs_bmap_is_real_extent(&imap))
Dave Chinner	a719370	2015-04-16 21:57:48 +1000	[diff] [blame]	1261	xfs_map_buffer(inode, bh_result, &imap, offset);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1262
Nathan Scott	c253666	2006-03-29 10:44:40 +1000	[diff] [blame]	1263	/*
				1264	* If this is a realtime file, data may be on a different device.
				1265	* to that pointed to from the buffer_head b_bdev currently.
				1266	*/
Christoph Hellwig	046f168	2010-04-28 12:28:52 +0000	[diff] [blame]	1267	bh_result->b_bdev = xfs_find_bdev_for_inode(inode);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1268	return 0;
Christoph Hellwig	a206c81	2010-12-10 08:42:20 +0000	[diff] [blame]	1269
				1270	out_unlock:
				1271	xfs_iunlock(ip, lockmode);
Dave Chinner	2451337	2014-06-25 14:58:08 +1000	[diff] [blame]	1272	return error;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1273	}
				1274
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1275	STATIC sector_t
Nathan Scott	e4c573b	2006-03-14 13:54:26 +1100	[diff] [blame]	1276	xfs_vm_bmap(
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1277	struct address_space *mapping,
				1278	sector_t block)
				1279	{
Christoph Hellwig	b84e772	2018-06-01 09:03:09 -0700	[diff] [blame]	1280	struct xfs_inode *ip = XFS_I(mapping->host);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1281
Christoph Hellwig	b84e772	2018-06-01 09:03:09 -0700	[diff] [blame]	1282	trace_xfs_vm_bmap(ip);
Darrick J. Wong	db1327b	2016-10-03 09:11:36 -0700	[diff] [blame]	1283
				1284	/*
				1285	* The swap code (ab-)uses ->bmap to get a block mapping and then
Ingo Molnar	793057e	2018-02-28 09:39:48 +0100	[diff] [blame]	1286	* bypasses the file system for actual I/O. We really can't allow
Darrick J. Wong	db1327b	2016-10-03 09:11:36 -0700	[diff] [blame]	1287	* that on reflinks inodes, so we have to skip out here. And yes,
Darrick J. Wong	eb5e248	2017-06-21 20:27:35 -0700	[diff] [blame]	1288	* 0 is the magic code for a bmap error.
				1289	*
				1290	* Since we don't pass back blockdev info, we can't return bmap
				1291	* information for rt files either.
Darrick J. Wong	db1327b	2016-10-03 09:11:36 -0700	[diff] [blame]	1292	*/
Darrick J. Wong	eb5e248	2017-06-21 20:27:35 -0700	[diff] [blame]	1293	if (xfs_is_reflink_inode(ip) \|\| XFS_IS_REALTIME_INODE(ip))
Darrick J. Wong	db1327b	2016-10-03 09:11:36 -0700	[diff] [blame]	1294	return 0;
Christoph Hellwig	b84e772	2018-06-01 09:03:09 -0700	[diff] [blame]	1295	return iomap_bmap(mapping, block, &xfs_iomap_ops);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1296	}
				1297
				1298	STATIC int
Nathan Scott	e4c573b	2006-03-14 13:54:26 +1100	[diff] [blame]	1299	xfs_vm_readpage(
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1300	struct file *unused,
				1301	struct page *page)
				1302	{
Dave Chinner	121e213	2016-01-08 11:28:35 +1100	[diff] [blame]	1303	trace_xfs_vm_readpage(page->mapping->host, 1);
Christoph Hellwig	8b2e77c	2018-07-11 22:25:56 -0700	[diff] [blame]	1304	if (i_blocksize(page->mapping->host) == PAGE_SIZE)
				1305	return iomap_readpage(page, &xfs_iomap_ops);
Nathan Scott	c253666	2006-03-29 10:44:40 +1000	[diff] [blame]	1306	return mpage_readpage(page, xfs_get_blocks);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1307	}
				1308
				1309	STATIC int
Nathan Scott	e4c573b	2006-03-14 13:54:26 +1100	[diff] [blame]	1310	xfs_vm_readpages(
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1311	struct file *unused,
				1312	struct address_space *mapping,
				1313	struct list_head *pages,
				1314	unsigned nr_pages)
				1315	{
Dave Chinner	121e213	2016-01-08 11:28:35 +1100	[diff] [blame]	1316	trace_xfs_vm_readpages(mapping->host, nr_pages);
Christoph Hellwig	8b2e77c	2018-07-11 22:25:56 -0700	[diff] [blame]	1317	if (i_blocksize(mapping->host) == PAGE_SIZE)
				1318	return iomap_readpages(mapping, pages, nr_pages, &xfs_iomap_ops);
Nathan Scott	c253666	2006-03-29 10:44:40 +1000	[diff] [blame]	1319	return mpage_readpages(mapping, pages, nr_pages, xfs_get_blocks);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1320	}
				1321
Dave Chinner	22e757a	2014-09-02 12:12:51 +1000	[diff] [blame]	1322	/*
				1323	* This is basically a copy of __set_page_dirty_buffers() with one
				1324	* small tweak: buffers beyond EOF do not get marked dirty. If we mark them
				1325	* dirty, we'll never be able to clean them because we don't write buffers
				1326	* beyond EOF, and that means we can't invalidate pages that span EOF
				1327	* that have been marked dirty. Further, the dirty state can leak into
				1328	* the file interior if the file is extended, resulting in all sorts of
				1329	* bad things happening as the state does not match the underlying data.
				1330	*
				1331	* XXX: this really indicates that bufferheads in XFS need to die. Warts like
				1332	* this only exist because of bufferheads and how the generic code manages them.
				1333	*/
				1334	STATIC int
				1335	xfs_vm_set_page_dirty(
				1336	struct page *page)
				1337	{
				1338	struct address_space *mapping = page->mapping;
				1339	struct inode *inode = mapping->host;
				1340	loff_t end_offset;
				1341	loff_t offset;
				1342	int newly_dirty;
				1343
				1344	if (unlikely(!mapping))
				1345	return !TestSetPageDirty(page);
				1346
				1347	end_offset = i_size_read(inode);
				1348	offset = page_offset(page);
				1349
				1350	spin_lock(&mapping->private_lock);
				1351	if (page_has_buffers(page)) {
				1352	struct buffer_head *head = page_buffers(page);
				1353	struct buffer_head *bh = head;
				1354
				1355	do {
				1356	if (offset < end_offset)
				1357	set_buffer_dirty(bh);
				1358	bh = bh->b_this_page;
Fabian Frederick	9340747	2017-02-27 14:28:32 -0800	[diff] [blame]	1359	offset += i_blocksize(inode);
Dave Chinner	22e757a	2014-09-02 12:12:51 +1000	[diff] [blame]	1360	} while (bh != head);
				1361	}
Greg Thelen	c4843a7	2015-05-22 17:13:16 -0400	[diff] [blame]	1362	/*
Johannes Weiner	81f8c3a	2016-03-15 14:57:04 -0700	[diff] [blame]	1363	* Lock out page->mem_cgroup migration to keep PageDirty
				1364	* synchronized with per-memcg dirty page counters.
Greg Thelen	c4843a7	2015-05-22 17:13:16 -0400	[diff] [blame]	1365	*/
Johannes Weiner	62cccb8	2016-03-15 14:57:22 -0700	[diff] [blame]	1366	lock_page_memcg(page);
Dave Chinner	22e757a	2014-09-02 12:12:51 +1000	[diff] [blame]	1367	newly_dirty = !TestSetPageDirty(page);
				1368	spin_unlock(&mapping->private_lock);
				1369
Matthew Wilcox	f82b376	2018-04-10 16:36:44 -0700	[diff] [blame]	1370	if (newly_dirty)
				1371	__set_page_dirty(page, mapping, 1);
Johannes Weiner	62cccb8	2016-03-15 14:57:22 -0700	[diff] [blame]	1372	unlock_page_memcg(page);
Greg Thelen	c4843a7	2015-05-22 17:13:16 -0400	[diff] [blame]	1373	if (newly_dirty)
				1374	__mark_inode_dirty(mapping->host, I_DIRTY_PAGES);
Dave Chinner	22e757a	2014-09-02 12:12:51 +1000	[diff] [blame]	1375	return newly_dirty;
				1376	}
				1377
Darrick J. Wong	6748212	2018-05-10 08:38:15 -0700	[diff] [blame]	1378	static int
				1379	xfs_iomap_swapfile_activate(
				1380	struct swap_info_struct *sis,
				1381	struct file *swap_file,
				1382	sector_t *span)
				1383	{
				1384	sis->bdev = xfs_find_bdev_for_inode(file_inode(swap_file));
				1385	return iomap_swapfile_activate(sis, swap_file, span, &xfs_iomap_ops);
				1386	}
				1387
Christoph Hellwig	f5e54d6	2006-06-28 04:26:44 -0700	[diff] [blame]	1388	const struct address_space_operations xfs_address_space_operations = {
Nathan Scott	e4c573b	2006-03-14 13:54:26 +1100	[diff] [blame]	1389	.readpage = xfs_vm_readpage,
				1390	.readpages = xfs_vm_readpages,
				1391	.writepage = xfs_vm_writepage,
Nathan Scott	7d4fb40	2006-06-09 15:27:16 +1000	[diff] [blame]	1392	.writepages = xfs_vm_writepages,
Dave Chinner	22e757a	2014-09-02 12:12:51 +1000	[diff] [blame]	1393	.set_page_dirty = xfs_vm_set_page_dirty,
Nathan Scott	238f4c5	2006-03-17 17:26:25 +1100	[diff] [blame]	1394	.releasepage = xfs_vm_releasepage,
				1395	.invalidatepage = xfs_vm_invalidatepage,
Nathan Scott	e4c573b	2006-03-14 13:54:26 +1100	[diff] [blame]	1396	.bmap = xfs_vm_bmap,
Dan Williams	6e2608d	2018-03-07 15:26:44 -0800	[diff] [blame]	1397	.direct_IO = noop_direct_IO,
Christoph Lameter	e965f96	2006-02-01 03:05:41 -0800	[diff] [blame]	1398	.migratepage = buffer_migrate_page,
Hisashi Hifumi	bddaafa	2009-03-29 09:53:38 +0200	[diff] [blame]	1399	.is_partially_uptodate = block_is_partially_uptodate,
Andi Kleen	aa261f5	2009-09-16 11:50:16 +0200	[diff] [blame]	1400	.error_remove_page = generic_error_remove_page,
Darrick J. Wong	6748212	2018-05-10 08:38:15 -0700	[diff] [blame]	1401	.swap_activate = xfs_iomap_swapfile_activate,
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1402	};
Dan Williams	6e2608d	2018-03-07 15:26:44 -0800	[diff] [blame]	1403
				1404	const struct address_space_operations xfs_dax_aops = {
				1405	.writepages = xfs_dax_writepages,
				1406	.direct_IO = noop_direct_IO,
				1407	.set_page_dirty = noop_set_page_dirty,
				1408	.invalidatepage = noop_invalidatepage,
Darrick J. Wong	6748212	2018-05-10 08:38:15 -0700	[diff] [blame]	1409	.swap_activate = xfs_iomap_swapfile_activate,
Dan Williams	6e2608d	2018-03-07 15:26:44 -0800	[diff] [blame]	1410	};