// SPDX-License-Identifier: GPL-2.0
/*
 *  linux/fs/ext4/file.c
 *
 * Copyright (C) 1992, 1993, 1994, 1995
 * Remy Card (card@masi.ibp.fr)
 * Laboratoire MASI - Institut Blaise Pascal
 * Universite Pierre et Marie Curie (Paris VI)
 *
 *  from
 *
 *  linux/fs/minix/file.c
 *
 *  Copyright (C) 1991, 1992  Linus Torvalds
 *
 *  ext4 fs regular file handling primitives
 *
 *  64-bit file support on 64-bit platforms by Jakub Jelinek
 *	(jj@sunsite.ms.mff.cuni.cz)
 */

#include <linux/time.h>
#include <linux/fs.h>
#include <linux/iomap.h>
#include <linux/mount.h>
#include <linux/path.h>
#include <linux/dax.h>
#include <linux/quotaops.h>
#include <linux/pagevec.h>
#include <linux/uio.h>
#include <linux/mman.h>
#include <linux/backing-dev.h>
#include "ext4.h"
#include "ext4_jbd2.h"
#include "xattr.h"
#include "acl.h"
#include "truncate.h"

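/*
 * Direct I/O is not supported on encrypted, verity, data-journalled or
 * inline-data inodes; the read/write paths below fall back to buffered
 * I/O in those cases.
 */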
static bool ext4_dio_supported(struct inode *inode)
{
	if (IS_ENABLED(CONFIG_FS_ENCRYPTION) && IS_ENCRYPTED(inode))
		return false;
	if (fsverity_active(inode))
		return false;
	if (ext4_should_journal_data(inode))
		return false;
	if (ext4_has_inline_data(inode))
		return false;
	return true;
}

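/*
 * Direct read path: take i_rwsem shared (trylock under IOCB_NOWAIT) and
 * hand the request to iomap_dio_rw().
 */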
static ssize_t ext4_dio_read_iter(struct kiocb *iocb, struct iov_iter *to)
{
	ssize_t ret;
	struct inode *inode = file_inode(iocb->ki_filp);

	if (iocb->ki_flags & IOCB_NOWAIT) {
		if (!inode_trylock_shared(inode))
			return -EAGAIN;
	} else {
		inode_lock_shared(inode);
	}

	if (!ext4_dio_supported(inode)) {
		inode_unlock_shared(inode);
		/*
		 * Fall back to buffered I/O if the operation being performed
		 * on the inode is not supported by direct I/O. The IOCB_DIRECT
		 * flag needs to be cleared here in order to ensure that the
		 * direct I/O path within generic_file_read_iter() is not
		 * taken.
		 */
		iocb->ki_flags &= ~IOCB_DIRECT;
		return generic_file_read_iter(iocb, to);
	}

	ret = iomap_dio_rw(iocb, to, &ext4_iomap_ops, NULL,
			   is_sync_kiocb(iocb));
	inode_unlock_shared(inode);

	file_accessed(iocb->ki_filp);
	return ret;
}

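/*
 * DAX read path: bypasses the page cache entirely. IS_DAX() is rechecked
 * under the shared inode lock before dax_iomap_rw() is called.
 */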
#ifdef CONFIG_FS_DAX
static ssize_t ext4_dax_read_iter(struct kiocb *iocb, struct iov_iter *to)
{
	struct inode *inode = file_inode(iocb->ki_filp);
	ssize_t ret;

	if (iocb->ki_flags & IOCB_NOWAIT) {
		if (!inode_trylock_shared(inode))
			return -EAGAIN;
	} else {
		inode_lock_shared(inode);
	}
	/*
	 * Recheck under inode lock - at this point we are sure it cannot
	 * change anymore
	 */
	if (!IS_DAX(inode)) {
		inode_unlock_shared(inode);
		/* Fall back to buffered I/O in case we cannot support DAX */
		return generic_file_read_iter(iocb, to);
	}
	ret = dax_iomap_rw(iocb, to, &ext4_iomap_ops);
	inode_unlock_shared(inode);

	file_accessed(iocb->ki_filp);
	return ret;
}
#endif

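/*
 * Top-level read entry point: dispatch to the DAX, direct or buffered
 * read path depending on the inode and kiocb flags.
 */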
static ssize_t ext4_file_read_iter(struct kiocb *iocb, struct iov_iter *to)
{
	struct inode *inode = file_inode(iocb->ki_filp);

	if (unlikely(ext4_forced_shutdown(EXT4_SB(inode->i_sb))))
		return -EIO;

	if (!iov_iter_count(to))
		return 0; /* skip atime */

#ifdef CONFIG_FS_DAX
	if (IS_DAX(inode))
		return ext4_dax_read_iter(iocb, to);
#endif
	if (iocb->ki_flags & IOCB_DIRECT)
		return ext4_dio_read_iter(iocb, to);

	return generic_file_read_iter(iocb, to);
}

/*
 * Called when an inode is released. Note that this is different
 * from ext4_file_open: open gets called at every open, but release
 * gets called only when /all/ the files are closed.
 */
static int ext4_release_file(struct inode *inode, struct file *filp)
{
	if (ext4_test_inode_state(inode, EXT4_STATE_DA_ALLOC_CLOSE)) {
		ext4_alloc_da_blocks(inode);
		ext4_clear_inode_state(inode, EXT4_STATE_DA_ALLOC_CLOSE);
	}
	/* if we are the last writer on the inode, drop the block reservation */
	if ((filp->f_mode & FMODE_WRITE) &&
	    (atomic_read(&inode->i_writecount) == 1) &&
	    !EXT4_I(inode)->i_reserved_data_blocks) {
		down_write(&EXT4_I(inode)->i_data_sem);
		ext4_discard_preallocations(inode);
		up_write(&EXT4_I(inode)->i_data_sem);
	}
	if (is_dx(inode) && filp->private_data)
		ext4_htree_free_dir_info(filp->private_data);

	return 0;
}

/*
 * This tests whether the IO in question is block-aligned or not.
 * Ext4 utilizes unwritten extents when hole-filling during direct IO, and they
 * are converted to written only after the IO is complete. Until they are
 * mapped, these blocks appear as holes, so dio_zero_block() will assume that
 * it needs to zero out portions of the start and/or end block. If two AIO
 * threads are at work on the same unwritten block, they must be synchronized
 * or one thread will zero the other's data, causing corruption.
 */
static bool
ext4_unaligned_io(struct inode *inode, struct iov_iter *from, loff_t pos)
{
	struct super_block *sb = inode->i_sb;
	unsigned long blockmask = sb->s_blocksize - 1;

	if ((pos | iov_iter_alignment(from)) & blockmask)
		return true;

	return false;
}

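/*
 * Does this IO extend either the in-memory i_size or the on-disk size
 * (i_disksize)? Extending writes must take the exclusive inode lock.
 */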
static bool
ext4_extending_io(struct inode *inode, loff_t offset, size_t len)
{
	if (offset + len > i_size_read(inode) ||
	    offset + len > EXT4_I(inode)->i_disksize)
		return true;
	return false;
}

/* Is IO overwriting allocated and initialized blocks? */
static bool ext4_overwrite_io(struct inode *inode, loff_t pos, loff_t len)
{
	struct ext4_map_blocks map;
	unsigned int blkbits = inode->i_blkbits;
	int err, blklen;

	if (pos + len > i_size_read(inode))
		return false;

	map.m_lblk = pos >> blkbits;
	map.m_len = EXT4_MAX_BLOCKS(len, pos, blkbits);
	blklen = map.m_len;

	err = ext4_map_blocks(NULL, inode, &map, 0);
	/*
	 * 'err == blklen' means that all of the blocks have been preallocated,
	 * regardless of whether they have been initialized or not. To exclude
	 * unwritten extents, we need to check m_flags.
	 */
	return err == blklen && (map.m_flags & EXT4_MAP_MAPPED);
}

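/*
 * Common write-side checks: reject writes to immutable inodes, run the
 * VFS generic_write_checks(), and clamp the iter to s_bitmap_maxbytes
 * for block-mapped (non-extent) files. Returns the byte count to write.
 */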
static ssize_t ext4_generic_write_checks(struct kiocb *iocb,
					 struct iov_iter *from)
{
	struct inode *inode = file_inode(iocb->ki_filp);
	ssize_t ret;

	if (unlikely(IS_IMMUTABLE(inode)))
		return -EPERM;

	ret = generic_write_checks(iocb, from);
	if (ret <= 0)
		return ret;

	/*
	 * If we have encountered a bitmap-format file, the size limit
	 * is smaller than s_maxbytes, which is for extent-mapped files.
	 */
	if (!(ext4_test_inode_flag(inode, EXT4_INODE_EXTENTS))) {
		struct ext4_sb_info *sbi = EXT4_SB(inode->i_sb);

		if (iocb->ki_pos >= sbi->s_bitmap_maxbytes)
			return -EFBIG;
		iov_iter_truncate(from, sbi->s_bitmap_maxbytes - iocb->ki_pos);
	}

	return iov_iter_count(from);
}

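/*
 * Like ext4_generic_write_checks(), but additionally calls
 * file_modified() to strip SUID/SGID bits and update the timestamps.
 */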
static ssize_t ext4_write_checks(struct kiocb *iocb, struct iov_iter *from)
{
	ssize_t ret, count;

	count = ext4_generic_write_checks(iocb, from);
	if (count <= 0)
		return count;

	ret = file_modified(iocb->ki_filp);
	if (ret)
		return ret;
	return count;
}

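/*
 * Buffered write path: runs under the exclusive inode lock via
 * generic_perform_write(). IOCB_NOWAIT is not supported here.
 */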
static ssize_t ext4_buffered_write_iter(struct kiocb *iocb,
					struct iov_iter *from)
{
	ssize_t ret;
	struct inode *inode = file_inode(iocb->ki_filp);

	if (iocb->ki_flags & IOCB_NOWAIT)
		return -EOPNOTSUPP;

	inode_lock(inode);
	ret = ext4_write_checks(iocb, from);
	if (ret <= 0)
		goto out;

	current->backing_dev_info = inode_to_bdi(inode);
	ret = generic_perform_write(iocb->ki_filp, from, iocb->ki_pos);
	current->backing_dev_info = NULL;

out:
	inode_unlock(inode);
	if (likely(ret > 0)) {
		iocb->ki_pos += ret;
		ret = generic_write_sync(iocb, ret);
	}

	return ret;
}

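/*
 * Finish off a size-extending direct or DAX write: update the inode size
 * to cover what was actually written, drop the inode from the orphan
 * list, and truncate away any blocks that were allocated beyond EOF but
 * never written.
 */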
static ssize_t ext4_handle_inode_extension(struct inode *inode, loff_t offset,
					   ssize_t written, size_t count)
{
	handle_t *handle;
	bool truncate = false;
	u8 blkbits = inode->i_blkbits;
	ext4_lblk_t written_blk, end_blk;
	int ret;

	/*
	 * Note that EXT4_I(inode)->i_disksize can get extended up to
	 * inode->i_size while the I/O was running due to writeback of delalloc
	 * blocks. But, the code in ext4_iomap_alloc() is careful to use
	 * zeroed/unwritten extents if this is possible; thus we won't leave
	 * uninitialized blocks in a file even if we didn't succeed in writing
	 * as much as we intended.
	 */
	WARN_ON_ONCE(i_size_read(inode) < EXT4_I(inode)->i_disksize);
	if (offset + count <= EXT4_I(inode)->i_disksize) {
		/*
		 * We need to ensure that the inode is removed from the orphan
		 * list if it has been added prematurely, due to writeback of
		 * delalloc blocks.
		 */
		if (!list_empty(&EXT4_I(inode)->i_orphan) && inode->i_nlink) {
			handle = ext4_journal_start(inode, EXT4_HT_INODE, 2);

			if (IS_ERR(handle)) {
				ext4_orphan_del(NULL, inode);
				return PTR_ERR(handle);
			}

			ext4_orphan_del(handle, inode);
			ext4_journal_stop(handle);
		}

		return written;
	}

	if (written < 0)
		goto truncate;

	handle = ext4_journal_start(inode, EXT4_HT_INODE, 2);
	if (IS_ERR(handle)) {
		written = PTR_ERR(handle);
		goto truncate;
	}

	if (ext4_update_inode_size(inode, offset + written)) {
		ret = ext4_mark_inode_dirty(handle, inode);
		if (unlikely(ret)) {
			written = ret;
			ext4_journal_stop(handle);
			goto truncate;
		}
	}

	/*
	 * We may need to truncate allocated but not written blocks beyond EOF.
	 */
	written_blk = ALIGN(offset + written, 1 << blkbits);
	end_blk = ALIGN(offset + count, 1 << blkbits);
	if (written_blk < end_blk && ext4_can_truncate(inode))
		truncate = true;

	/*
	 * Remove the inode from the orphan list if it has been extended and
	 * everything went OK.
	 */
	if (!truncate && inode->i_nlink)
		ext4_orphan_del(handle, inode);
	ext4_journal_stop(handle);

	if (truncate) {
truncate:
		ext4_truncate_failed_write(inode);
		/*
		 * If the truncate operation failed early, then the inode may
		 * still be on the orphan list. In that case, we need to try
		 * to remove the inode from the in-memory linked list.
		 */
		if (inode->i_nlink)
			ext4_orphan_del(NULL, inode);
	}

	return written;
}

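/*
 * iomap direct I/O completion callback: convert any unwritten extents
 * covered by a successful write to written.
 */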
static int ext4_dio_write_end_io(struct kiocb *iocb, ssize_t size,
				 int error, unsigned int flags)
{
	loff_t offset = iocb->ki_pos;
	struct inode *inode = file_inode(iocb->ki_filp);

	if (error)
		return error;

	if (size && flags & IOMAP_DIO_UNWRITTEN)
		return ext4_convert_unwritten_extents(NULL, inode,
						      offset, size);

	return 0;
}

static const struct iomap_dio_ops ext4_dio_write_ops = {
	.end_io = ext4_dio_write_end_io,
};

/*
 * The intention here is to start with the shared lock acquired, then see
 * if any condition requires an exclusive inode lock. If so, we restart
 * the whole operation by releasing the shared lock and acquiring the
 * exclusive lock.
 *
 * - For unaligned IO we never take the shared lock, as it may cause data
 *   corruption when two unaligned IOs try to modify the same block, e.g.
 *   while zeroing.
 *
 * - For extending writes we don't take the shared lock either, since they
 *   require updating inode i_disksize and/or orphan handling with the
 *   exclusive lock.
 *
 * - Shared locking is therefore mostly used for overwrites. Otherwise we
 *   switch to the exclusive i_rwsem lock.
 */
static ssize_t ext4_dio_write_checks(struct kiocb *iocb, struct iov_iter *from,
				     bool *ilock_shared, bool *extend)
{
	struct file *file = iocb->ki_filp;
	struct inode *inode = file_inode(file);
	loff_t offset;
	size_t count;
	ssize_t ret;

restart:
	ret = ext4_generic_write_checks(iocb, from);
	if (ret <= 0)
		goto out;

	offset = iocb->ki_pos;
	count = ret;
	if (ext4_extending_io(inode, offset, count))
		*extend = true;
	/*
	 * Determine whether the IO operation will overwrite allocated
	 * and initialized blocks.
	 * We need exclusive i_rwsem for changing security info
	 * in file_modified().
	 */
	if (*ilock_shared && (!IS_NOSEC(inode) || *extend ||
	     !ext4_overwrite_io(inode, offset, count))) {
		inode_unlock_shared(inode);
		*ilock_shared = false;
		inode_lock(inode);
		goto restart;
	}

	ret = file_modified(file);
	if (ret < 0)
		goto out;

	return count;
out:
	if (*ilock_shared)
		inode_unlock_shared(inode);
	else
		inode_unlock(inode);
	return ret;
}

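/*
 * Direct write path: pick shared vs. exclusive locking based on whether
 * the IO is aligned and/or extending, wait out competing unaligned IOs,
 * add the inode to the orphan list ahead of an extending write, and fall
 * back to buffered I/O for any tail the direct write did not cover.
 */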
static ssize_t ext4_dio_write_iter(struct kiocb *iocb, struct iov_iter *from)
{
	ssize_t ret;
	handle_t *handle;
	struct inode *inode = file_inode(iocb->ki_filp);
	loff_t offset = iocb->ki_pos;
	size_t count = iov_iter_count(from);
	const struct iomap_ops *iomap_ops = &ext4_iomap_ops;
	bool extend = false, unaligned_io = false;
	bool ilock_shared = true;

	/*
	 * We initially start with the shared inode lock unless it is
	 * unaligned IO, which needs the exclusive lock anyway.
	 */
	if (ext4_unaligned_io(inode, from, offset)) {
		unaligned_io = true;
		ilock_shared = false;
	}
	/*
	 * Quick check here without any i_rwsem lock to see if it is extending
	 * IO. A more reliable check is done in ext4_dio_write_checks() with
	 * proper locking in place.
	 */
	if (offset + count > i_size_read(inode))
		ilock_shared = false;

	if (iocb->ki_flags & IOCB_NOWAIT) {
		if (ilock_shared) {
			if (!inode_trylock_shared(inode))
				return -EAGAIN;
		} else {
			if (!inode_trylock(inode))
				return -EAGAIN;
		}
	} else {
		if (ilock_shared)
			inode_lock_shared(inode);
		else
			inode_lock(inode);
	}

	/* Fall back to buffered I/O if the inode does not support direct I/O. */
	if (!ext4_dio_supported(inode)) {
		if (ilock_shared)
			inode_unlock_shared(inode);
		else
			inode_unlock(inode);
		return ext4_buffered_write_iter(iocb, from);
	}

	ret = ext4_dio_write_checks(iocb, from, &ilock_shared, &extend);
	if (ret <= 0)
		return ret;

	/* if we're going to block and IOCB_NOWAIT is set, return -EAGAIN */
	if ((iocb->ki_flags & IOCB_NOWAIT) && (unaligned_io || extend)) {
		ret = -EAGAIN;
		goto out;
	}

	offset = iocb->ki_pos;
	count = ret;

	/*
	 * Unaligned direct IO must be serialized; zeroing of partial blocks
	 * by two competing unaligned IOs can result in data corruption.
	 *
	 * So we make sure we don't allow any unaligned IO in flight.
	 * For IOs where we need not wait (like unaligned non-AIO DIO),
	 * the inode_dio_wait() below may anyway become a no-op, since we
	 * start with the exclusive lock.
	 */
	if (unaligned_io)
		inode_dio_wait(inode);

	if (extend) {
		handle = ext4_journal_start(inode, EXT4_HT_INODE, 2);
		if (IS_ERR(handle)) {
			ret = PTR_ERR(handle);
			goto out;
		}

		ret = ext4_orphan_add(handle, inode);
		if (ret) {
			ext4_journal_stop(handle);
			goto out;
		}

		ext4_journal_stop(handle);
	}

	if (ilock_shared)
		iomap_ops = &ext4_iomap_overwrite_ops;
	ret = iomap_dio_rw(iocb, from, iomap_ops, &ext4_dio_write_ops,
			   is_sync_kiocb(iocb) || unaligned_io || extend);

	if (extend)
		ret = ext4_handle_inode_extension(inode, offset, ret, count);

out:
	if (ilock_shared)
		inode_unlock_shared(inode);
	else
		inode_unlock(inode);

	if (ret >= 0 && iov_iter_count(from)) {
		ssize_t err;
		loff_t endbyte;

		offset = iocb->ki_pos;
		err = ext4_buffered_write_iter(iocb, from);
		if (err < 0)
			return err;

		/*
		 * We need to ensure that the pages within the page cache for
		 * the range covered by this I/O are written to disk and
		 * invalidated. This is an attempt to preserve the expected
		 * direct I/O semantics in the case we fall back to buffered
		 * I/O to complete the request.
		 */
		ret += err;
		endbyte = offset + err - 1;
		err = filemap_write_and_wait_range(iocb->ki_filp->f_mapping,
						   offset, endbyte);
		if (!err)
			invalidate_mapping_pages(iocb->ki_filp->f_mapping,
						 offset >> PAGE_SHIFT,
						 endbyte >> PAGE_SHIFT);
	}

	return ret;
}

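/*
 * DAX write path: always takes the exclusive inode lock. As in the
 * direct path, an extending write parks the inode on the orphan list
 * for the duration of the write.
 */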
#ifdef CONFIG_FS_DAX
static ssize_t
ext4_dax_write_iter(struct kiocb *iocb, struct iov_iter *from)
{
	ssize_t ret;
	size_t count;
	loff_t offset;
	handle_t *handle;
	bool extend = false;
	struct inode *inode = file_inode(iocb->ki_filp);

	if (iocb->ki_flags & IOCB_NOWAIT) {
		if (!inode_trylock(inode))
			return -EAGAIN;
	} else {
		inode_lock(inode);
	}

	ret = ext4_write_checks(iocb, from);
	if (ret <= 0)
		goto out;

	offset = iocb->ki_pos;
	count = iov_iter_count(from);

	if (offset + count > EXT4_I(inode)->i_disksize) {
		handle = ext4_journal_start(inode, EXT4_HT_INODE, 2);
		if (IS_ERR(handle)) {
			ret = PTR_ERR(handle);
			goto out;
		}

		ret = ext4_orphan_add(handle, inode);
		if (ret) {
			ext4_journal_stop(handle);
			goto out;
		}

		extend = true;
		ext4_journal_stop(handle);
	}

	ret = dax_iomap_rw(iocb, from, &ext4_iomap_ops);

	if (extend)
		ret = ext4_handle_inode_extension(inode, offset, ret, count);
out:
	inode_unlock(inode);
	if (ret > 0)
		ret = generic_write_sync(iocb, ret);
	return ret;
}
#endif

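/*
 * Top-level write entry point: dispatch to the DAX, direct or buffered
 * write path depending on the inode and kiocb flags.
 */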
static ssize_t
ext4_file_write_iter(struct kiocb *iocb, struct iov_iter *from)
{
	struct inode *inode = file_inode(iocb->ki_filp);

	if (unlikely(ext4_forced_shutdown(EXT4_SB(inode->i_sb))))
		return -EIO;

#ifdef CONFIG_FS_DAX
	if (IS_DAX(inode))
		return ext4_dax_write_iter(iocb, from);
#endif
	if (iocb->ki_flags & IOCB_DIRECT)
		return ext4_dio_write_iter(iocb, from);

	return ext4_buffered_write_iter(iocb, from);
}

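/*
 * DAX page fault handler. Write faults run under a journal handle and
 * are retried on ENOSPC; synchronous (MAP_SYNC) faults additionally go
 * through dax_finish_sync_fault() before the mapping is installed. Read
 * faults only take i_mmap_sem.
 */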
#ifdef CONFIG_FS_DAX
static vm_fault_t ext4_dax_huge_fault(struct vm_fault *vmf,
		enum page_entry_size pe_size)
{
	int error = 0;
	vm_fault_t result;
	int retries = 0;
	handle_t *handle = NULL;
	struct inode *inode = file_inode(vmf->vma->vm_file);
	struct super_block *sb = inode->i_sb;

	/*
	 * We have to distinguish real writes from writes which will result in a
	 * COW page; COW writes should *not* poke the journal (the file will not
	 * be changed). Doing so would cause unintended failures when mounted
	 * read-only.
	 *
	 * We check for VM_SHARED rather than vmf->cow_page since the latter is
	 * unset for pe_size != PE_SIZE_PTE (i.e. only in do_cow_fault); for
	 * other sizes, dax_iomap_fault will handle splitting / fallback so that
	 * we eventually come back with a COW page.
	 */
	bool write = (vmf->flags & FAULT_FLAG_WRITE) &&
		(vmf->vma->vm_flags & VM_SHARED);
	pfn_t pfn;

	if (write) {
		sb_start_pagefault(sb);
		file_update_time(vmf->vma->vm_file);
		down_read(&EXT4_I(inode)->i_mmap_sem);
retry:
		handle = ext4_journal_start_sb(sb, EXT4_HT_WRITE_PAGE,
					       EXT4_DATA_TRANS_BLOCKS(sb));
		if (IS_ERR(handle)) {
			up_read(&EXT4_I(inode)->i_mmap_sem);
			sb_end_pagefault(sb);
			return VM_FAULT_SIGBUS;
		}
	} else {
		down_read(&EXT4_I(inode)->i_mmap_sem);
	}
	result = dax_iomap_fault(vmf, pe_size, &pfn, &error, &ext4_iomap_ops);
	if (write) {
		ext4_journal_stop(handle);

		if ((result & VM_FAULT_ERROR) && error == -ENOSPC &&
		    ext4_should_retry_alloc(sb, &retries))
			goto retry;
		/* Handling synchronous page fault? */
		if (result & VM_FAULT_NEEDDSYNC)
			result = dax_finish_sync_fault(vmf, pe_size, pfn);
		up_read(&EXT4_I(inode)->i_mmap_sem);
		sb_end_pagefault(sb);
	} else {
		up_read(&EXT4_I(inode)->i_mmap_sem);
	}

	return result;
}

static vm_fault_t ext4_dax_fault(struct vm_fault *vmf)
{
	return ext4_dax_huge_fault(vmf, PE_SIZE_PTE);
}

static const struct vm_operations_struct ext4_dax_vm_ops = {
	.fault		= ext4_dax_fault,
	.huge_fault	= ext4_dax_huge_fault,
	.page_mkwrite	= ext4_dax_fault,
	.pfn_mkwrite	= ext4_dax_fault,
};
#else
#define ext4_dax_vm_ops	ext4_file_vm_ops
#endif

static const struct vm_operations_struct ext4_file_vm_ops = {
	.fault		= ext4_filemap_fault,
	.map_pages	= filemap_map_pages,
	.page_mkwrite	= ext4_page_mkwrite,
};

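/*
 * mmap entry point: reject MAP_SYNC mappings unless the file is DAX on a
 * synchronous dax_device, then install the DAX or regular vm_ops.
 */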
static int ext4_file_mmap(struct file *file, struct vm_area_struct *vma)
{
	struct inode *inode = file->f_mapping->host;
	struct ext4_sb_info *sbi = EXT4_SB(inode->i_sb);
	struct dax_device *dax_dev = sbi->s_daxdev;

	if (unlikely(ext4_forced_shutdown(sbi)))
		return -EIO;

	/*
	 * We don't support synchronous mappings for non-DAX files, nor
	 * for DAX files if the underlying dax_device is not synchronous.
	 */
	if (!daxdev_mapping_supported(vma, dax_dev))
		return -EOPNOTSUPP;

	file_accessed(file);
	if (IS_DAX(file_inode(file))) {
		vma->vm_ops = &ext4_dax_vm_ops;
		vma->vm_flags |= VM_HUGEPAGE;
	} else {
		vma->vm_ops = &ext4_file_vm_ops;
	}
	return 0;
}

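/*
 * Record the mount point in the superblock's s_last_mounted field the
 * first time a file is opened after mount (skipped on read-only mounts).
 */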
static int ext4_sample_last_mounted(struct super_block *sb,
				    struct vfsmount *mnt)
{
	struct ext4_sb_info *sbi = EXT4_SB(sb);
	struct path path;
	char buf[64], *cp;
	handle_t *handle;
	int err;

	if (likely(sbi->s_mount_flags & EXT4_MF_MNTDIR_SAMPLED))
		return 0;

	if (sb_rdonly(sb) || !sb_start_intwrite_trylock(sb))
		return 0;

	sbi->s_mount_flags |= EXT4_MF_MNTDIR_SAMPLED;
	/*
	 * Sample where the filesystem has been mounted and
	 * store it in the superblock for sysadmin convenience
	 * when trying to sort through large numbers of block
	 * devices or filesystem images.
	 */
	memset(buf, 0, sizeof(buf));
	path.mnt = mnt;
	path.dentry = mnt->mnt_root;
	cp = d_path(&path, buf, sizeof(buf));
	err = 0;
	if (IS_ERR(cp))
		goto out;

	handle = ext4_journal_start_sb(sb, EXT4_HT_MISC, 1);
	err = PTR_ERR(handle);
	if (IS_ERR(handle))
		goto out;
	BUFFER_TRACE(sbi->s_sbh, "get_write_access");
	err = ext4_journal_get_write_access(handle, sbi->s_sbh);
	if (err)
		goto out_journal;
	strlcpy(sbi->s_es->s_last_mounted, cp,
		sizeof(sbi->s_es->s_last_mounted));
	ext4_handle_dirty_super(handle, sb);
out_journal:
	ext4_journal_stop(handle);
out:
	sb_end_intwrite(sb);
	return err;
}

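/*
 * Per-open setup: sample the mount point, run the fscrypt and fsverity
 * open checks, attach the jbd2 inode for writers, and mark the file as
 * supporting IOCB_NOWAIT.
 */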
static int ext4_file_open(struct inode *inode, struct file *filp)
{
	int ret;

	if (unlikely(ext4_forced_shutdown(EXT4_SB(inode->i_sb))))
		return -EIO;

	ret = ext4_sample_last_mounted(inode->i_sb, filp->f_path.mnt);
	if (ret)
		return ret;

	ret = fscrypt_file_open(inode, filp);
	if (ret)
		return ret;

	ret = fsverity_file_open(inode, filp);
	if (ret)
		return ret;

	/*
	 * Set up the jbd2_inode if we are opening the inode for
	 * writing and the journal is present
	 */
	if (filp->f_mode & FMODE_WRITE) {
		ret = ext4_inode_attach_jinode(inode);
		if (ret < 0)
			return ret;
	}

	filp->f_mode |= FMODE_NOWAIT;
	return dquot_file_open(inode, filp);
}

/*
 * ext4_llseek() handles both block-mapped and extent-mapped maxbytes values
 * by calling generic_file_llseek_size() with the appropriate maxbytes
 * value for each.
 */
loff_t ext4_llseek(struct file *file, loff_t offset, int whence)
{
	struct inode *inode = file->f_mapping->host;
	loff_t maxbytes;

	if (!(ext4_test_inode_flag(inode, EXT4_INODE_EXTENTS)))
		maxbytes = EXT4_SB(inode->i_sb)->s_bitmap_maxbytes;
	else
		maxbytes = inode->i_sb->s_maxbytes;

	switch (whence) {
	default:
		return generic_file_llseek_size(file, offset, whence,
						maxbytes, i_size_read(inode));
	case SEEK_HOLE:
		inode_lock_shared(inode);
		offset = iomap_seek_hole(inode, offset,
					 &ext4_iomap_report_ops);
		inode_unlock_shared(inode);
		break;
	case SEEK_DATA:
		inode_lock_shared(inode);
		offset = iomap_seek_data(inode, offset,
					 &ext4_iomap_report_ops);
		inode_unlock_shared(inode);
		break;
	}

	if (offset < 0)
		return offset;
	return vfs_setpos(file, offset, maxbytes);
}

const struct file_operations ext4_file_operations = {
	.llseek		= ext4_llseek,
	.read_iter	= ext4_file_read_iter,
	.write_iter	= ext4_file_write_iter,
	.iopoll		= iomap_dio_iopoll,
	.unlocked_ioctl = ext4_ioctl,
#ifdef CONFIG_COMPAT
	.compat_ioctl	= ext4_compat_ioctl,
#endif
	.mmap		= ext4_file_mmap,
	.mmap_supported_flags = MAP_SYNC,
	.open		= ext4_file_open,
	.release	= ext4_release_file,
	.fsync		= ext4_sync_file,
	.get_unmapped_area = thp_get_unmapped_area,
	.splice_read	= generic_file_splice_read,
	.splice_write	= iter_file_splice_write,
	.fallocate	= ext4_fallocate,
};

const struct inode_operations ext4_file_inode_operations = {
	.setattr	= ext4_setattr,
	.getattr	= ext4_file_getattr,
	.listxattr	= ext4_listxattr,
	.get_acl	= ext4_get_acl,
	.set_acl	= ext4_set_acl,
	.fiemap		= ext4_fiemap,
};