Blame - fs/ext4/file.c - SHIFTPHONES/mainline/linux

blob: 8cc11715518ac1a460070d76e26caee32a9b9d16 [file] [log] [blame]

Greg Kroah-Hartman	b244131	2017-11-01 15:07:57 +0100	[diff] [blame]	1	// SPDX-License-Identifier: GPL-2.0
Dave Kleikamp	ac27a0e	2006-10-11 01:20:50 -0700	[diff] [blame]	2	/*
Mingming Cao	617ba13	2006-10-11 01:20:53 -0700	[diff] [blame]	3	* linux/fs/ext4/file.c
Dave Kleikamp	ac27a0e	2006-10-11 01:20:50 -0700	[diff] [blame]	4	*
				5	* Copyright (C) 1992, 1993, 1994, 1995
				6	* Remy Card (card@masi.ibp.fr)
				7	* Laboratoire MASI - Institut Blaise Pascal
				8	* Universite Pierre et Marie Curie (Paris VI)
				9	*
				10	* from
				11	*
				12	* linux/fs/minix/file.c
				13	*
				14	* Copyright (C) 1991, 1992 Linus Torvalds
				15	*
Mingming Cao	617ba13	2006-10-11 01:20:53 -0700	[diff] [blame]	16	* ext4 fs regular file handling primitives
Dave Kleikamp	ac27a0e	2006-10-11 01:20:50 -0700	[diff] [blame]	17	*
				18	* 64-bit file support on 64-bit platforms by Jakub Jelinek
				19	* (jj@sunsite.ms.mff.cuni.cz)
				20	*/
				21
				22	#include <linux/time.h>
				23	#include <linux/fs.h>
Christoph Hellwig	545052e	2017-10-01 17:58:54 -0400	[diff] [blame]	24	#include <linux/iomap.h>
Theodore Ts'o	bc0b0d6	2009-06-13 10:09:48 -0400	[diff] [blame]	25	#include <linux/mount.h>
				26	#include <linux/path.h>
Matthew Wilcox	c94c2ac	2015-09-08 14:58:40 -0700	[diff] [blame]	27	#include <linux/dax.h>
Christoph Hellwig	871a293	2010-03-03 09:05:07 -0500	[diff] [blame]	28	#include <linux/quotaops.h>
Zheng Liu	c8c0df2	2012-11-08 21:57:40 -0500	[diff] [blame]	29	#include <linux/pagevec.h>
Christoph Hellwig	e2e40f2	2015-02-22 08:58:50 -0800	[diff] [blame]	30	#include <linux/uio.h>
Jan Kara	b8a6176	2017-11-01 16:36:45 +0100	[diff] [blame]	31	#include <linux/mman.h>
Matthew Bobrowski	378f32b	2019-11-05 23:02:39 +1100	[diff] [blame]	32	#include <linux/backing-dev.h>
Christoph Hellwig	3dcf545	2008-04-29 18:13:32 -0400	[diff] [blame]	33	#include "ext4.h"
				34	#include "ext4_jbd2.h"
Dave Kleikamp	ac27a0e	2006-10-11 01:20:50 -0700	[diff] [blame]	35	#include "xattr.h"
				36	#include "acl.h"
Matthew Bobrowski	569342d	2019-11-05 23:01:51 +1100	[diff] [blame]	37	#include "truncate.h"
Dave Kleikamp	ac27a0e	2006-10-11 01:20:50 -0700	[diff] [blame]	38
Matthew Bobrowski	b1b4705	2019-11-05 23:01:37 +1100	[diff] [blame]	39	static bool ext4_dio_supported(struct inode *inode)
				40	{
				41	if (IS_ENABLED(CONFIG_FS_ENCRYPTION) && IS_ENCRYPTED(inode))
				42	return false;
				43	if (fsverity_active(inode))
				44	return false;
				45	if (ext4_should_journal_data(inode))
				46	return false;
				47	if (ext4_has_inline_data(inode))
				48	return false;
				49	return true;
				50	}
				51
				52	static ssize_t ext4_dio_read_iter(struct kiocb iocb, struct iov_iter to)
				53	{
				54	ssize_t ret;
				55	struct inode *inode = file_inode(iocb->ki_filp);
				56
				57	if (iocb->ki_flags & IOCB_NOWAIT) {
				58	if (!inode_trylock_shared(inode))
				59	return -EAGAIN;
				60	} else {
				61	inode_lock_shared(inode);
				62	}
				63
				64	if (!ext4_dio_supported(inode)) {
				65	inode_unlock_shared(inode);
				66	/*
				67	* Fallback to buffered I/O if the operation being performed on
				68	* the inode is not supported by direct I/O. The IOCB_DIRECT
				69	* flag needs to be cleared here in order to ensure that the
				70	* direct I/O path within generic_file_read_iter() is not
				71	* taken.
				72	*/
				73	iocb->ki_flags &= ~IOCB_DIRECT;
				74	return generic_file_read_iter(iocb, to);
				75	}
				76
Andreas Gruenbacher	4fdccaa	2021-07-24 12:26:41 +0200	[diff] [blame]	77	ret = iomap_dio_rw(iocb, to, &ext4_iomap_ops, NULL, 0, 0);
Matthew Bobrowski	b1b4705	2019-11-05 23:01:37 +1100	[diff] [blame]	78	inode_unlock_shared(inode);
				79
				80	file_accessed(iocb->ki_filp);
				81	return ret;
				82	}
				83
#ifdef CONFIG_FS_DAX
/*
 * DAX read.
 *
 * @iocb: kernel I/O control block describing the request
 * @to:   destination iterator
 *
 * Takes the inode lock shared (try-lock only, returning -EAGAIN on failure,
 * when IOCB_NOWAIT is set) and reads through dax_iomap_rw(). If the inode
 * turns out not to be DAX once the lock is held, the read is handed to
 * generic_file_read_iter() instead.
 */
static ssize_t ext4_dax_read_iter(struct kiocb *iocb, struct iov_iter *to)
{
	struct inode *inode = file_inode(iocb->ki_filp);
	ssize_t ret;

	if (iocb->ki_flags & IOCB_NOWAIT) {
		if (!inode_trylock_shared(inode))
			return -EAGAIN;
	} else {
		inode_lock_shared(inode);
	}
	/*
	 * Recheck under inode lock - at this point we are sure it cannot
	 * change anymore
	 */
	if (!IS_DAX(inode)) {
		inode_unlock_shared(inode);
		/* Fallback to buffered IO in case we cannot support DAX */
		return generic_file_read_iter(iocb, to);
	}
	ret = dax_iomap_rw(iocb, to, &ext4_iomap_ops);
	inode_unlock_shared(inode);

	file_accessed(iocb->ki_filp);
	return ret;
}
#endif
				112
				113	static ssize_t ext4_file_read_iter(struct kiocb iocb, struct iov_iter to)
				114	{
Matthew Bobrowski	b1b4705	2019-11-05 23:01:37 +1100	[diff] [blame]	115	struct inode *inode = file_inode(iocb->ki_filp);
				116
				117	if (unlikely(ext4_forced_shutdown(EXT4_SB(inode->i_sb))))
Theodore Ts'o	0db1ff2	2017-02-05 01:28:48 -0500	[diff] [blame]	118	return -EIO;
				119
Jan Kara	364443c	2016-11-20 17:36:06 -0500	[diff] [blame]	120	if (!iov_iter_count(to))
				121	return 0; /* skip atime */
				122
				123	#ifdef CONFIG_FS_DAX
Matthew Bobrowski	b1b4705	2019-11-05 23:01:37 +1100	[diff] [blame]	124	if (IS_DAX(inode))
Jan Kara	364443c	2016-11-20 17:36:06 -0500	[diff] [blame]	125	return ext4_dax_read_iter(iocb, to);
				126	#endif
Matthew Bobrowski	b1b4705	2019-11-05 23:01:37 +1100	[diff] [blame]	127	if (iocb->ki_flags & IOCB_DIRECT)
				128	return ext4_dio_read_iter(iocb, to);
				129
Jan Kara	364443c	2016-11-20 17:36:06 -0500	[diff] [blame]	130	return generic_file_read_iter(iocb, to);
				131	}
				132
Dave Kleikamp	ac27a0e	2006-10-11 01:20:50 -0700	[diff] [blame]	133	/*
				134	* Called when an inode is released. Note that this is different
Mingming Cao	617ba13	2006-10-11 01:20:53 -0700	[diff] [blame]	135	* from ext4_file_open: open gets called at every open, but release
Dave Kleikamp	ac27a0e	2006-10-11 01:20:50 -0700	[diff] [blame]	136	* gets called only when /all/ the files are closed.
				137	*/
Theodore Ts'o	af5bc92	2008-09-08 22:25:24 -0400	[diff] [blame]	138	static int ext4_release_file(struct inode inode, struct file filp)
Dave Kleikamp	ac27a0e	2006-10-11 01:20:50 -0700	[diff] [blame]	139	{
Theodore Ts'o	19f5fb7	2010-01-24 14:34:07 -0500	[diff] [blame]	140	if (ext4_test_inode_state(inode, EXT4_STATE_DA_ALLOC_CLOSE)) {
Theodore Ts'o	7d8f9f7	2009-02-24 08:21:14 -0500	[diff] [blame]	141	ext4_alloc_da_blocks(inode);
Theodore Ts'o	19f5fb7	2010-01-24 14:34:07 -0500	[diff] [blame]	142	ext4_clear_inode_state(inode, EXT4_STATE_DA_ALLOC_CLOSE);
Theodore Ts'o	7d8f9f7	2009-02-24 08:21:14 -0500	[diff] [blame]	143	}
Dave Kleikamp	ac27a0e	2006-10-11 01:20:50 -0700	[diff] [blame]	144	/* if we are the last writer on the inode, drop the block reservation */
				145	if ((filp->f_mode & FMODE_WRITE) &&
Aneesh Kumar K.V	d601430	2009-03-27 22:36:43 -0400	[diff] [blame]	146	(atomic_read(&inode->i_writecount) == 1) &&
Dio Putra	e030a28	2020-06-14 11:45:44 +0700	[diff] [blame]	147	!EXT4_I(inode)->i_reserved_data_blocks) {
Aneesh Kumar K.V	0e855ac	2008-01-28 23:58:26 -0500	[diff] [blame]	148	down_write(&EXT4_I(inode)->i_data_sem);
brookxu	27bc446	2020-08-17 15:36:15 +0800	[diff] [blame]	149	ext4_discard_preallocations(inode, 0);
Aneesh Kumar K.V	0e855ac	2008-01-28 23:58:26 -0500	[diff] [blame]	150	up_write(&EXT4_I(inode)->i_data_sem);
Dave Kleikamp	ac27a0e	2006-10-11 01:20:50 -0700	[diff] [blame]	151	}
				152	if (is_dx(inode) && filp->private_data)
Mingming Cao	617ba13	2006-10-11 01:20:53 -0700	[diff] [blame]	153	ext4_htree_free_dir_info(filp->private_data);
Dave Kleikamp	ac27a0e	2006-10-11 01:20:50 -0700	[diff] [blame]	154
				155	return 0;
				156	}
				157
Eric Sandeen	e9e3bce	2011-02-12 08:17:34 -0500	[diff] [blame]	158	/*
				159	* This tests whether the IO in question is block-aligned or not.
				160	* Ext4 utilizes unwritten extents when hole-filling during direct IO, and they
				161	* are converted to written only after the IO is complete. Until they are
				162	* mapped, these blocks appear as holes, so dio_zero_block() will assume that
				163	* it needs to zero out portions of the start and/or end block. If 2 AIO
				164	* threads are at work on the same unwritten block, they must be synchronized
				165	* or one thread will zero the other's data, causing corruption.
				166	*/
Ritesh Harjani	aa9714d0	2019-12-12 11:25:56 +0530	[diff] [blame]	167	static bool
				168	ext4_unaligned_io(struct inode inode, struct iov_iter from, loff_t pos)
Eric Sandeen	e9e3bce	2011-02-12 08:17:34 -0500	[diff] [blame]	169	{
				170	struct super_block *sb = inode->i_sb;
Ritesh Harjani	aa9714d0	2019-12-12 11:25:56 +0530	[diff] [blame]	171	unsigned long blockmask = sb->s_blocksize - 1;
Eric Sandeen	e9e3bce	2011-02-12 08:17:34 -0500	[diff] [blame]	172
Al Viro	9b88416	2014-04-17 16:09:22 -0400	[diff] [blame]	173	if ((pos \| iov_iter_alignment(from)) & blockmask)
Ritesh Harjani	aa9714d0	2019-12-12 11:25:56 +0530	[diff] [blame]	174	return true;
Eric Sandeen	e9e3bce	2011-02-12 08:17:34 -0500	[diff] [blame]	175
Ritesh Harjani	aa9714d0	2019-12-12 11:25:56 +0530	[diff] [blame]	176	return false;
				177	}
				178
				179	static bool
				180	ext4_extending_io(struct inode *inode, loff_t offset, size_t len)
				181	{
				182	if (offset + len > i_size_read(inode) \|\|
				183	offset + len > EXT4_I(inode)->i_disksize)
				184	return true;
				185	return false;
Eric Sandeen	e9e3bce	2011-02-12 08:17:34 -0500	[diff] [blame]	186	}
				187
Jan Kara	213bcd9	2016-11-20 17:29:51 -0500	[diff] [blame]	188	/* Is IO overwriting allocated and initialized blocks? */
				189	static bool ext4_overwrite_io(struct inode *inode, loff_t pos, loff_t len)
				190	{
				191	struct ext4_map_blocks map;
				192	unsigned int blkbits = inode->i_blkbits;
				193	int err, blklen;
				194
				195	if (pos + len > i_size_read(inode))
				196	return false;
				197
				198	map.m_lblk = pos >> blkbits;
				199	map.m_len = EXT4_MAX_BLOCKS(len, pos, blkbits);
				200	blklen = map.m_len;
				201
				202	err = ext4_map_blocks(NULL, inode, &map, 0);
				203	/*
				204	* 'err==len' means that all of the blocks have been preallocated,
				205	* regardless of whether they have been initialized or not. To exclude
				206	* unwritten extents, we need to check m_flags.
				207	*/
				208	return err == blklen && (map.m_flags & EXT4_MAP_MAPPED);
				209	}
				210
Ritesh Harjani	aa9714d0	2019-12-12 11:25:56 +0530	[diff] [blame]	211	static ssize_t ext4_generic_write_checks(struct kiocb *iocb,
				212	struct iov_iter *from)
Jan Kara	213bcd9	2016-11-20 17:29:51 -0500	[diff] [blame]	213	{
				214	struct inode *inode = file_inode(iocb->ki_filp);
				215	ssize_t ret;
				216
Matthew Bobrowski	378f32b	2019-11-05 23:02:39 +1100	[diff] [blame]	217	if (unlikely(IS_IMMUTABLE(inode)))
				218	return -EPERM;
				219
Jan Kara	213bcd9	2016-11-20 17:29:51 -0500	[diff] [blame]	220	ret = generic_write_checks(iocb, from);
				221	if (ret <= 0)
				222	return ret;
Theodore Ts'o	02b016c	2019-06-09 22:04:33 -0400	[diff] [blame]	223
Jan Kara	213bcd9	2016-11-20 17:29:51 -0500	[diff] [blame]	224	/*
				225	* If we have encountered a bitmap-format file, the size limit
				226	* is smaller than s_maxbytes, which is for extent-mapped files.
				227	*/
				228	if (!(ext4_test_inode_flag(inode, EXT4_INODE_EXTENTS))) {
				229	struct ext4_sb_info *sbi = EXT4_SB(inode->i_sb);
				230
				231	if (iocb->ki_pos >= sbi->s_bitmap_maxbytes)
				232	return -EFBIG;
				233	iov_iter_truncate(from, sbi->s_bitmap_maxbytes - iocb->ki_pos);
				234	}
Matthew Bobrowski	378f32b	2019-11-05 23:02:39 +1100	[diff] [blame]	235
Ritesh Harjani	aa9714d0	2019-12-12 11:25:56 +0530	[diff] [blame]	236	return iov_iter_count(from);
				237	}
				238
				239	static ssize_t ext4_write_checks(struct kiocb iocb, struct iov_iter from)
				240	{
				241	ssize_t ret, count;
				242
				243	count = ext4_generic_write_checks(iocb, from);
				244	if (count <= 0)
				245	return count;
				246
Matthew Bobrowski	378f32b	2019-11-05 23:02:39 +1100	[diff] [blame]	247	ret = file_modified(iocb->ki_filp);
				248	if (ret)
				249	return ret;
Ritesh Harjani	aa9714d0	2019-12-12 11:25:56 +0530	[diff] [blame]	250	return count;
Jan Kara	213bcd9	2016-11-20 17:29:51 -0500	[diff] [blame]	251	}
				252
Matthew Bobrowski	378f32b	2019-11-05 23:02:39 +1100	[diff] [blame]	253	static ssize_t ext4_buffered_write_iter(struct kiocb *iocb,
				254	struct iov_iter *from)
				255	{
				256	ssize_t ret;
				257	struct inode *inode = file_inode(iocb->ki_filp);
				258
				259	if (iocb->ki_flags & IOCB_NOWAIT)
				260	return -EOPNOTSUPP;
				261
				262	inode_lock(inode);
				263	ret = ext4_write_checks(iocb, from);
				264	if (ret <= 0)
				265	goto out;
				266
				267	current->backing_dev_info = inode_to_bdi(inode);
				268	ret = generic_perform_write(iocb->ki_filp, from, iocb->ki_pos);
				269	current->backing_dev_info = NULL;
				270
				271	out:
				272	inode_unlock(inode);
				273	if (likely(ret > 0)) {
				274	iocb->ki_pos += ret;
				275	ret = generic_write_sync(iocb, ret);
				276	}
				277
				278	return ret;
				279	}
				280
Matthew Bobrowski	569342d	2019-11-05 23:01:51 +1100	[diff] [blame]	281	static ssize_t ext4_handle_inode_extension(struct inode *inode, loff_t offset,
				282	ssize_t written, size_t count)
				283	{
				284	handle_t *handle;
				285	bool truncate = false;
				286	u8 blkbits = inode->i_blkbits;
				287	ext4_lblk_t written_blk, end_blk;
Harshad Shirwadkar	4209ae1	2020-04-26 18:34:37 -0700	[diff] [blame]	288	int ret;
Matthew Bobrowski	569342d	2019-11-05 23:01:51 +1100	[diff] [blame]	289
				290	/*
				291	* Note that EXT4_I(inode)->i_disksize can get extended up to
				292	* inode->i_size while the I/O was running due to writeback of delalloc
				293	* blocks. But, the code in ext4_iomap_alloc() is careful to use
				294	* zeroed/unwritten extents if this is possible; thus we won't leave
				295	* uninitialized blocks in a file even if we didn't succeed in writing
				296	* as much as we intended.
				297	*/
				298	WARN_ON_ONCE(i_size_read(inode) < EXT4_I(inode)->i_disksize);
				299	if (offset + count <= EXT4_I(inode)->i_disksize) {
				300	/*
				301	* We need to ensure that the inode is removed from the orphan
				302	* list if it has been added prematurely, due to writeback of
				303	* delalloc blocks.
				304	*/
				305	if (!list_empty(&EXT4_I(inode)->i_orphan) && inode->i_nlink) {
				306	handle = ext4_journal_start(inode, EXT4_HT_INODE, 2);
				307
				308	if (IS_ERR(handle)) {
				309	ext4_orphan_del(NULL, inode);
				310	return PTR_ERR(handle);
				311	}
				312
				313	ext4_orphan_del(handle, inode);
				314	ext4_journal_stop(handle);
				315	}
				316
				317	return written;
				318	}
				319
				320	if (written < 0)
				321	goto truncate;
				322
				323	handle = ext4_journal_start(inode, EXT4_HT_INODE, 2);
				324	if (IS_ERR(handle)) {
				325	written = PTR_ERR(handle);
				326	goto truncate;
				327	}
				328
Harshad Shirwadkar	4209ae1	2020-04-26 18:34:37 -0700	[diff] [blame]	329	if (ext4_update_inode_size(inode, offset + written)) {
				330	ret = ext4_mark_inode_dirty(handle, inode);
				331	if (unlikely(ret)) {
				332	written = ret;
				333	ext4_journal_stop(handle);
				334	goto truncate;
				335	}
				336	}
Matthew Bobrowski	569342d	2019-11-05 23:01:51 +1100	[diff] [blame]	337
				338	/*
				339	* We may need to truncate allocated but not written blocks beyond EOF.
				340	*/
				341	written_blk = ALIGN(offset + written, 1 << blkbits);
				342	end_blk = ALIGN(offset + count, 1 << blkbits);
				343	if (written_blk < end_blk && ext4_can_truncate(inode))
				344	truncate = true;
				345
				346	/*
				347	* Remove the inode from the orphan list if it has been extended and
				348	* everything went OK.
				349	*/
				350	if (!truncate && inode->i_nlink)
				351	ext4_orphan_del(handle, inode);
				352	ext4_journal_stop(handle);
				353
				354	if (truncate) {
				355	truncate:
				356	ext4_truncate_failed_write(inode);
				357	/*
				358	* If the truncate operation failed early, then the inode may
				359	* still be on the orphan list. In that case, we need to try
				360	* remove the inode from the in-memory linked list.
				361	*/
				362	if (inode->i_nlink)
				363	ext4_orphan_del(NULL, inode);
				364	}
				365
				366	return written;
				367	}
				368
Matthew Bobrowski	378f32b	2019-11-05 23:02:39 +1100	[diff] [blame]	369	static int ext4_dio_write_end_io(struct kiocb *iocb, ssize_t size,
				370	int error, unsigned int flags)
				371	{
Jan Kara	5899593	2021-04-15 17:54:17 +0200	[diff] [blame]	372	loff_t pos = iocb->ki_pos;
Matthew Bobrowski	378f32b	2019-11-05 23:02:39 +1100	[diff] [blame]	373	struct inode *inode = file_inode(iocb->ki_filp);
				374
				375	if (error)
				376	return error;
				377
Jan Kara	5899593	2021-04-15 17:54:17 +0200	[diff] [blame]	378	if (size && flags & IOMAP_DIO_UNWRITTEN) {
				379	error = ext4_convert_unwritten_extents(NULL, inode, pos, size);
				380	if (error < 0)
				381	return error;
				382	}
				383	/*
				384	* If we are extending the file, we have to update i_size here before
				385	* page cache gets invalidated in iomap_dio_rw(). Otherwise racing
				386	* buffered reads could zero out too much from page cache pages. Update
				387	* of on-disk size will happen later in ext4_dio_write_iter() where
				388	* we have enough information to also perform orphan list handling etc.
				389	* Note that we perform all extending writes synchronously under
				390	* i_rwsem held exclusively so i_size update is safe here in that case.
				391	* If the write was not extending, we cannot see pos > i_size here
				392	* because operations reducing i_size like truncate wait for all
				393	* outstanding DIO before updating i_size.
				394	*/
				395	pos += size;
				396	if (pos > i_size_read(inode))
				397	i_size_write(inode, pos);
Matthew Bobrowski	378f32b	2019-11-05 23:02:39 +1100	[diff] [blame]	398
				399	return 0;
				400	}
				401
				402	static const struct iomap_dio_ops ext4_dio_write_ops = {
				403	.end_io = ext4_dio_write_end_io,
				404	};
				405
Ritesh Harjani	aa9714d0	2019-12-12 11:25:56 +0530	[diff] [blame]	406	/*
				407	* The intention here is to start with shared lock acquired then see if any
				408	* condition requires an exclusive inode lock. If yes, then we restart the
				409	* whole operation by releasing the shared lock and acquiring exclusive lock.
				410	*
				411	* - For unaligned_io we never take shared lock as it may cause data corruption
				412	* when two unaligned IO tries to modify the same block e.g. while zeroing.
				413	*
				414	* - For extending writes case we don't take the shared lock, since it requires
				415	* updating inode i_disksize and/or orphan handling with exclusive lock.
				416	*
Ritesh Harjani	bc6385d	2019-12-12 11:25:57 +0530	[diff] [blame]	417	* - shared locking will only be true mostly with overwrites. Otherwise we will
				418	* switch to exclusive i_rwsem lock.
Ritesh Harjani	aa9714d0	2019-12-12 11:25:56 +0530	[diff] [blame]	419	*/
				420	static ssize_t ext4_dio_write_checks(struct kiocb iocb, struct iov_iter from,
				421	bool ilock_shared, bool extend)
				422	{
				423	struct file *file = iocb->ki_filp;
				424	struct inode *inode = file_inode(file);
				425	loff_t offset;
				426	size_t count;
				427	ssize_t ret;
				428
				429	restart:
				430	ret = ext4_generic_write_checks(iocb, from);
				431	if (ret <= 0)
				432	goto out;
				433
				434	offset = iocb->ki_pos;
				435	count = ret;
				436	if (ext4_extending_io(inode, offset, count))
				437	*extend = true;
				438	/*
				439	* Determine whether the IO operation will overwrite allocated
Ritesh Harjani	bc6385d	2019-12-12 11:25:57 +0530	[diff] [blame]	440	* and initialized blocks.
Ritesh Harjani	aa9714d0	2019-12-12 11:25:56 +0530	[diff] [blame]	441	* We need exclusive i_rwsem for changing security info
				442	* in file_modified().
				443	*/
				444	if (ilock_shared && (!IS_NOSEC(inode) \|\| extend \|\|
Ritesh Harjani	aa9714d0	2019-12-12 11:25:56 +0530	[diff] [blame]	445	!ext4_overwrite_io(inode, offset, count))) {
Jan Kara	0b3171b	2020-07-08 17:35:16 +0200	[diff] [blame]	446	if (iocb->ki_flags & IOCB_NOWAIT) {
				447	ret = -EAGAIN;
				448	goto out;
				449	}
Ritesh Harjani	aa9714d0	2019-12-12 11:25:56 +0530	[diff] [blame]	450	inode_unlock_shared(inode);
				451	*ilock_shared = false;
				452	inode_lock(inode);
				453	goto restart;
				454	}
				455
				456	ret = file_modified(file);
				457	if (ret < 0)
				458	goto out;
				459
				460	return count;
				461	out:
				462	if (*ilock_shared)
				463	inode_unlock_shared(inode);
				464	else
				465	inode_unlock(inode);
				466	return ret;
				467	}
				468
Matthew Bobrowski	378f32b	2019-11-05 23:02:39 +1100	[diff] [blame]	469	static ssize_t ext4_dio_write_iter(struct kiocb iocb, struct iov_iter from)
				470	{
				471	ssize_t ret;
Matthew Bobrowski	378f32b	2019-11-05 23:02:39 +1100	[diff] [blame]	472	handle_t *handle;
				473	struct inode *inode = file_inode(iocb->ki_filp);
Ritesh Harjani	aa9714d0	2019-12-12 11:25:56 +0530	[diff] [blame]	474	loff_t offset = iocb->ki_pos;
				475	size_t count = iov_iter_count(from);
Jan Kara	8cd115b	2019-12-18 18:44:33 +0100	[diff] [blame]	476	const struct iomap_ops *iomap_ops = &ext4_iomap_ops;
Ritesh Harjani	aa9714d0	2019-12-12 11:25:56 +0530	[diff] [blame]	477	bool extend = false, unaligned_io = false;
				478	bool ilock_shared = true;
				479
				480	/*
				481	* We initially start with shared inode lock unless it is
				482	* unaligned IO which needs exclusive lock anyways.
				483	*/
				484	if (ext4_unaligned_io(inode, from, offset)) {
				485	unaligned_io = true;
				486	ilock_shared = false;
				487	}
				488	/*
				489	* Quick check here without any i_rwsem lock to see if it is extending
				490	* IO. A more reliable check is done in ext4_dio_write_checks() with
				491	* proper locking in place.
				492	*/
				493	if (offset + count > i_size_read(inode))
				494	ilock_shared = false;
Matthew Bobrowski	378f32b	2019-11-05 23:02:39 +1100	[diff] [blame]	495
				496	if (iocb->ki_flags & IOCB_NOWAIT) {
Ritesh Harjani	aa9714d0	2019-12-12 11:25:56 +0530	[diff] [blame]	497	if (ilock_shared) {
				498	if (!inode_trylock_shared(inode))
				499	return -EAGAIN;
				500	} else {
				501	if (!inode_trylock(inode))
				502	return -EAGAIN;
				503	}
Matthew Bobrowski	378f32b	2019-11-05 23:02:39 +1100	[diff] [blame]	504	} else {
Ritesh Harjani	aa9714d0	2019-12-12 11:25:56 +0530	[diff] [blame]	505	if (ilock_shared)
				506	inode_lock_shared(inode);
				507	else
				508	inode_lock(inode);
Matthew Bobrowski	378f32b	2019-11-05 23:02:39 +1100	[diff] [blame]	509	}
				510
Ritesh Harjani	aa9714d0	2019-12-12 11:25:56 +0530	[diff] [blame]	511	/* Fallback to buffered I/O if the inode does not support direct I/O. */
Matthew Bobrowski	378f32b	2019-11-05 23:02:39 +1100	[diff] [blame]	512	if (!ext4_dio_supported(inode)) {
Ritesh Harjani	aa9714d0	2019-12-12 11:25:56 +0530	[diff] [blame]	513	if (ilock_shared)
				514	inode_unlock_shared(inode);
				515	else
				516	inode_unlock(inode);
Matthew Bobrowski	378f32b	2019-11-05 23:02:39 +1100	[diff] [blame]	517	return ext4_buffered_write_iter(iocb, from);
				518	}
				519
Ritesh Harjani	aa9714d0	2019-12-12 11:25:56 +0530	[diff] [blame]	520	ret = ext4_dio_write_checks(iocb, from, &ilock_shared, &extend);
				521	if (ret <= 0)
Matthew Bobrowski	378f32b	2019-11-05 23:02:39 +1100	[diff] [blame]	522	return ret;
Matthew Bobrowski	378f32b	2019-11-05 23:02:39 +1100	[diff] [blame]	523
Jens Axboe	6e014c6	2020-05-24 16:53:16 -0600	[diff] [blame]	524	/* if we're going to block and IOCB_NOWAIT is set, return -EAGAIN */
				525	if ((iocb->ki_flags & IOCB_NOWAIT) && (unaligned_io \|\| extend)) {
				526	ret = -EAGAIN;
				527	goto out;
				528	}
				529
Matthew Bobrowski	378f32b	2019-11-05 23:02:39 +1100	[diff] [blame]	530	offset = iocb->ki_pos;
Ritesh Harjani	aa9714d0	2019-12-12 11:25:56 +0530	[diff] [blame]	531	count = ret;
Matthew Bobrowski	378f32b	2019-11-05 23:02:39 +1100	[diff] [blame]	532
				533	/*
Ritesh Harjani	aa9714d0	2019-12-12 11:25:56 +0530	[diff] [blame]	534	* Unaligned direct IO must be serialized among each other as zeroing
				535	* of partial blocks of two competing unaligned IOs can result in data
				536	* corruption.
				537	*
				538	* So we make sure we don't allow any unaligned IO in flight.
				539	* For IOs where we need not wait (like unaligned non-AIO DIO),
				540	* below inode_dio_wait() may anyway become a no-op, since we start
				541	* with exclusive lock.
Matthew Bobrowski	378f32b	2019-11-05 23:02:39 +1100	[diff] [blame]	542	*/
Ritesh Harjani	aa9714d0	2019-12-12 11:25:56 +0530	[diff] [blame]	543	if (unaligned_io)
				544	inode_dio_wait(inode);
Matthew Bobrowski	378f32b	2019-11-05 23:02:39 +1100	[diff] [blame]	545
Ritesh Harjani	aa9714d0	2019-12-12 11:25:56 +0530	[diff] [blame]	546	if (extend) {
Matthew Bobrowski	378f32b	2019-11-05 23:02:39 +1100	[diff] [blame]	547	handle = ext4_journal_start(inode, EXT4_HT_INODE, 2);
				548	if (IS_ERR(handle)) {
				549	ret = PTR_ERR(handle);
				550	goto out;
				551	}
				552
				553	ret = ext4_orphan_add(handle, inode);
				554	if (ret) {
				555	ext4_journal_stop(handle);
				556	goto out;
				557	}
				558
Matthew Bobrowski	378f32b	2019-11-05 23:02:39 +1100	[diff] [blame]	559	ext4_journal_stop(handle);
				560	}
				561
Jan Kara	8cd115b	2019-12-18 18:44:33 +0100	[diff] [blame]	562	if (ilock_shared)
				563	iomap_ops = &ext4_iomap_overwrite_ops;
				564	ret = iomap_dio_rw(iocb, from, iomap_ops, &ext4_dio_write_ops,
Andreas Gruenbacher	4fdccaa	2021-07-24 12:26:41 +0200	[diff] [blame]	565	(unaligned_io \|\| extend) ? IOMAP_DIO_FORCE_WAIT : 0,
				566	0);
Christoph Hellwig	60263d5	2020-07-23 22:45:59 -0700	[diff] [blame]	567	if (ret == -ENOTBLK)
				568	ret = 0;
Matthew Bobrowski	378f32b	2019-11-05 23:02:39 +1100	[diff] [blame]	569
				570	if (extend)
				571	ret = ext4_handle_inode_extension(inode, offset, ret, count);
				572
				573	out:
Ritesh Harjani	aa9714d0	2019-12-12 11:25:56 +0530	[diff] [blame]	574	if (ilock_shared)
Matthew Bobrowski	378f32b	2019-11-05 23:02:39 +1100	[diff] [blame]	575	inode_unlock_shared(inode);
				576	else
				577	inode_unlock(inode);
				578
				579	if (ret >= 0 && iov_iter_count(from)) {
				580	ssize_t err;
				581	loff_t endbyte;
				582
				583	offset = iocb->ki_pos;
				584	err = ext4_buffered_write_iter(iocb, from);
				585	if (err < 0)
				586	return err;
				587
				588	/*
				589	* We need to ensure that the pages within the page cache for
				590	* the range covered by this I/O are written to disk and
				591	* invalidated. This is in attempt to preserve the expected
				592	* direct I/O semantics in the case we fallback to buffered I/O
				593	* to complete off the I/O request.
				594	*/
				595	ret += err;
				596	endbyte = offset + err - 1;
				597	err = filemap_write_and_wait_range(iocb->ki_filp->f_mapping,
				598	offset, endbyte);
				599	if (!err)
				600	invalidate_mapping_pages(iocb->ki_filp->f_mapping,
				601	offset >> PAGE_SHIFT,
				602	endbyte >> PAGE_SHIFT);
				603	}
				604
				605	return ret;
				606	}
				607
#ifdef CONFIG_FS_DAX
/*
 * DAX write.
 *
 * @iocb: kernel I/O control block describing the write
 * @from: source iterator
 *
 * Runs under the exclusive inode lock (try-lock only, returning -EAGAIN on
 * failure, when IOCB_NOWAIT is set). A write reaching beyond i_disksize first
 * puts the inode on the orphan list and is post-processed by
 * ext4_handle_inode_extension(). A positive result is passed through
 * generic_write_sync(). Returns bytes written or a negative error.
 */
static ssize_t
ext4_dax_write_iter(struct kiocb *iocb, struct iov_iter *from)
{
	ssize_t ret;
	size_t count;
	loff_t offset;
	handle_t *handle;
	bool extend = false;
	struct inode *inode = file_inode(iocb->ki_filp);

	if (iocb->ki_flags & IOCB_NOWAIT) {
		if (!inode_trylock(inode))
			return -EAGAIN;
	} else {
		inode_lock(inode);
	}

	ret = ext4_write_checks(iocb, from);
	if (ret <= 0)
		goto out;

	offset = iocb->ki_pos;
	count = iov_iter_count(from);

	if (offset + count > EXT4_I(inode)->i_disksize) {
		handle = ext4_journal_start(inode, EXT4_HT_INODE, 2);
		if (IS_ERR(handle)) {
			ret = PTR_ERR(handle);
			goto out;
		}

		ret = ext4_orphan_add(handle, inode);
		if (ret) {
			ext4_journal_stop(handle);
			goto out;
		}

		extend = true;
		ext4_journal_stop(handle);
	}

	ret = dax_iomap_rw(iocb, from, &ext4_iomap_ops);

	if (extend)
		ret = ext4_handle_inode_extension(inode, offset, ret, count);
out:
	inode_unlock(inode);
	if (ret > 0)
		ret = generic_write_sync(iocb, ret);
	return ret;
}
#endif
				661
Dave Kleikamp	ac27a0e	2006-10-11 01:20:50 -0700	[diff] [blame]	662	static ssize_t
Al Viro	9b88416	2014-04-17 16:09:22 -0400	[diff] [blame]	663	ext4_file_write_iter(struct kiocb iocb, struct iov_iter from)
Dave Kleikamp	ac27a0e	2006-10-11 01:20:50 -0700	[diff] [blame]	664	{
Al Viro	496ad9a	2013-01-23 17:07:38 -0500	[diff] [blame]	665	struct inode *inode = file_inode(iocb->ki_filp);
Theodore Ts'o	7608e61	2014-04-21 14:26:28 -0400	[diff] [blame]	666
Theodore Ts'o	0db1ff2	2017-02-05 01:28:48 -0500	[diff] [blame]	667	if (unlikely(ext4_forced_shutdown(EXT4_SB(inode->i_sb))))
				668	return -EIO;
				669
Jan Kara	776722e	2016-11-20 18:09:11 -0500	[diff] [blame]	670	#ifdef CONFIG_FS_DAX
				671	if (IS_DAX(inode))
				672	return ext4_dax_write_iter(iocb, from);
				673	#endif
Matthew Bobrowski	378f32b	2019-11-05 23:02:39 +1100	[diff] [blame]	674	if (iocb->ki_flags & IOCB_DIRECT)
				675	return ext4_dio_write_iter(iocb, from);
Harshad Shirwadkar	aa75f4d	2020-10-15 13:37:57 -0700	[diff] [blame]	676	else
				677	return ext4_buffered_write_iter(iocb, from);
Dave Kleikamp	ac27a0e	2006-10-11 01:20:50 -0700	[diff] [blame]	678	}
				679
Ross Zwisler	923ae0f	2015-02-16 15:59:38 -0800	[diff] [blame]	680	#ifdef CONFIG_FS_DAX
Souptick Joarder	71fe9899	2018-05-13 16:01:49 -0400	[diff] [blame]	681	static vm_fault_t ext4_dax_huge_fault(struct vm_fault *vmf,
Dave Jiang	c791ace	2017-02-24 14:57:08 -0800	[diff] [blame]	682	enum page_entry_size pe_size)
Ross Zwisler	923ae0f	2015-02-16 15:59:38 -0800	[diff] [blame]	683	{
Souptick Joarder	71fe9899	2018-05-13 16:01:49 -0400	[diff] [blame]	684	int error = 0;
				685	vm_fault_t result;
Jan Kara	2244642	2018-01-07 16:41:01 -0500	[diff] [blame]	686	int retries = 0;
Jan Kara	fb26a1c	2017-05-12 15:46:54 -0700	[diff] [blame]	687	handle_t *handle = NULL;
Dave Jiang	11bac80	2017-02-24 14:56:41 -0800	[diff] [blame]	688	struct inode *inode = file_inode(vmf->vma->vm_file);
Jan Kara	ea3d720	2015-12-07 14:28:03 -0500	[diff] [blame]	689	struct super_block *sb = inode->i_sb;
Randy Dodgen	fd96b8d	2017-08-24 15:26:01 -0400	[diff] [blame]	690
				691	/*
				692	* We have to distinguish real writes from writes which will result in a
				693	* COW page; COW writes should not poke the journal (the file will not
				694	* be changed). Doing so would cause unintended failures when mounted
				695	* read-only.
				696	*
				697	* We check for VM_SHARED rather than vmf->cow_page since the latter is
				698	* unset for pe_size != PE_SIZE_PTE (i.e. only in do_cow_fault); for
				699	* other sizes, dax_iomap_fault will handle splitting / fallback so that
				700	* we eventually come back with a COW page.
				701	*/
				702	bool write = (vmf->flags & FAULT_FLAG_WRITE) &&
				703	(vmf->vma->vm_flags & VM_SHARED);
Jan Kara	d4f5258	2021-02-04 18:05:42 +0100	[diff] [blame]	704	struct address_space *mapping = vmf->vma->vm_file->f_mapping;
Jan Kara	b8a6176	2017-11-01 16:36:45 +0100	[diff] [blame]	705	pfn_t pfn;
Matthew Wilcox	01a33b4	2015-09-08 14:59:22 -0700	[diff] [blame]	706
				707	if (write) {
				708	sb_start_pagefault(sb);
Dave Jiang	11bac80	2017-02-24 14:56:41 -0800	[diff] [blame]	709	file_update_time(vmf->vma->vm_file);
Jan Kara	d4f5258	2021-02-04 18:05:42 +0100	[diff] [blame]	710	filemap_invalidate_lock_shared(mapping);
Jan Kara	2244642	2018-01-07 16:41:01 -0500	[diff] [blame]	711	retry:
Jan Kara	fb26a1c	2017-05-12 15:46:54 -0700	[diff] [blame]	712	handle = ext4_journal_start_sb(sb, EXT4_HT_WRITE_PAGE,
				713	EXT4_DATA_TRANS_BLOCKS(sb));
Jan Kara	497f692	2017-11-01 16:36:44 +0100	[diff] [blame]	714	if (IS_ERR(handle)) {
Jan Kara	d4f5258	2021-02-04 18:05:42 +0100	[diff] [blame]	715	filemap_invalidate_unlock_shared(mapping);
Jan Kara	497f692	2017-11-01 16:36:44 +0100	[diff] [blame]	716	sb_end_pagefault(sb);
				717	return VM_FAULT_SIGBUS;
				718	}
Jan Kara	fb26a1c	2017-05-12 15:46:54 -0700	[diff] [blame]	719	} else {
Jan Kara	d4f5258	2021-02-04 18:05:42 +0100	[diff] [blame]	720	filemap_invalidate_lock_shared(mapping);
Jan Kara	1db1754	2016-10-21 11:33:49 +0200	[diff] [blame]	721	}
Jan Kara	2244642	2018-01-07 16:41:01 -0500	[diff] [blame]	722	result = dax_iomap_fault(vmf, pe_size, &pfn, &error, &ext4_iomap_ops);
Jan Kara	fb26a1c	2017-05-12 15:46:54 -0700	[diff] [blame]	723	if (write) {
Jan Kara	497f692	2017-11-01 16:36:44 +0100	[diff] [blame]	724	ext4_journal_stop(handle);
Jan Kara	2244642	2018-01-07 16:41:01 -0500	[diff] [blame]	725
				726	if ((result & VM_FAULT_ERROR) && error == -ENOSPC &&
				727	ext4_should_retry_alloc(sb, &retries))
				728	goto retry;
Jan Kara	b8a6176	2017-11-01 16:36:45 +0100	[diff] [blame]	729	/* Handling synchronous page fault? */
				730	if (result & VM_FAULT_NEEDDSYNC)
				731	result = dax_finish_sync_fault(vmf, pe_size, pfn);
Jan Kara	d4f5258	2021-02-04 18:05:42 +0100	[diff] [blame]	732	filemap_invalidate_unlock_shared(mapping);
Matthew Wilcox	01a33b4	2015-09-08 14:59:22 -0700	[diff] [blame]	733	sb_end_pagefault(sb);
Jan Kara	fb26a1c	2017-05-12 15:46:54 -0700	[diff] [blame]	734	} else {
Jan Kara	d4f5258	2021-02-04 18:05:42 +0100	[diff] [blame]	735	filemap_invalidate_unlock_shared(mapping);
Jan Kara	fb26a1c	2017-05-12 15:46:54 -0700	[diff] [blame]	736	}
Matthew Wilcox	01a33b4	2015-09-08 14:59:22 -0700	[diff] [blame]	737
				738	return result;
Ross Zwisler	923ae0f	2015-02-16 15:59:38 -0800	[diff] [blame]	739	}
				740
Souptick Joarder	71fe9899	2018-05-13 16:01:49 -0400	[diff] [blame]	741	static vm_fault_t ext4_dax_fault(struct vm_fault *vmf)
Dave Jiang	c791ace	2017-02-24 14:57:08 -0800	[diff] [blame]	742	{
				743	return ext4_dax_huge_fault(vmf, PE_SIZE_PTE);
				744	}
				745
Ross Zwisler	923ae0f	2015-02-16 15:59:38 -0800	[diff] [blame]	746	static const struct vm_operations_struct ext4_dax_vm_ops = {
				747	.fault = ext4_dax_fault,
Dave Jiang	c791ace	2017-02-24 14:57:08 -0800	[diff] [blame]	748	.huge_fault = ext4_dax_huge_fault,
Ross Zwisler	1e9d180	2016-02-27 14:01:13 -0500	[diff] [blame]	749	.page_mkwrite = ext4_dax_fault,
Ross Zwisler	91d25ba	2017-09-06 16:18:43 -0700	[diff] [blame]	750	.pfn_mkwrite = ext4_dax_fault,
Ross Zwisler	923ae0f	2015-02-16 15:59:38 -0800	[diff] [blame]	751	};
				752	#else
				753	#define ext4_dax_vm_ops ext4_file_vm_ops
				754	#endif
				755
Alexey Dobriyan	f0f37e2f	2009-09-27 22:29:37 +0400	[diff] [blame]	756	static const struct vm_operations_struct ext4_file_vm_ops = {
Jan Kara	d4f5258	2021-02-04 18:05:42 +0100	[diff] [blame]	757	.fault = filemap_fault,
Kirill A. Shutemov	f182036	2014-04-07 15:37:19 -0700	[diff] [blame]	758	.map_pages = filemap_map_pages,
Aneesh Kumar K.V	2e9ee85	2008-07-11 19:27:31 -0400	[diff] [blame]	759	.page_mkwrite = ext4_page_mkwrite,
				760	};
				761
				762	static int ext4_file_mmap(struct file file, struct vm_area_struct vma)
				763	{
Michael Halcrow	c9c7429	2015-04-12 00:56:10 -0400	[diff] [blame]	764	struct inode *inode = file->f_mapping->host;
Pankaj Gupta	e46bfc3	2019-07-05 19:33:27 +0530	[diff] [blame]	765	struct ext4_sb_info *sbi = EXT4_SB(inode->i_sb);
				766	struct dax_device *dax_dev = sbi->s_daxdev;
Michael Halcrow	c9c7429	2015-04-12 00:56:10 -0400	[diff] [blame]	767
Pankaj Gupta	e46bfc3	2019-07-05 19:33:27 +0530	[diff] [blame]	768	if (unlikely(ext4_forced_shutdown(sbi)))
Theodore Ts'o	0db1ff2	2017-02-05 01:28:48 -0500	[diff] [blame]	769	return -EIO;
				770
Jan Kara	b8a6176	2017-11-01 16:36:45 +0100	[diff] [blame]	771	/*
Pankaj Gupta	e46bfc3	2019-07-05 19:33:27 +0530	[diff] [blame]	772	* We don't support synchronous mappings for non-DAX files and
				773	* for DAX files if underneath dax_device is not synchronous.
Jan Kara	b8a6176	2017-11-01 16:36:45 +0100	[diff] [blame]	774	*/
Pankaj Gupta	e46bfc3	2019-07-05 19:33:27 +0530	[diff] [blame]	775	if (!daxdev_mapping_supported(vma, dax_dev))
Jan Kara	b8a6176	2017-11-01 16:36:45 +0100	[diff] [blame]	776	return -EOPNOTSUPP;
				777
Aneesh Kumar K.V	2e9ee85	2008-07-11 19:27:31 -0400	[diff] [blame]	778	file_accessed(file);
Ross Zwisler	923ae0f	2015-02-16 15:59:38 -0800	[diff] [blame]	779	if (IS_DAX(file_inode(file))) {
				780	vma->vm_ops = &ext4_dax_vm_ops;
Dave Jiang	e1fb4a0	2018-08-17 15:43:40 -0700	[diff] [blame]	781	vma->vm_flags \|= VM_HUGEPAGE;
Ross Zwisler	923ae0f	2015-02-16 15:59:38 -0800	[diff] [blame]	782	} else {
				783	vma->vm_ops = &ext4_file_vm_ops;
				784	}
Aneesh Kumar K.V	2e9ee85	2008-07-11 19:27:31 -0400	[diff] [blame]	785	return 0;
				786	}
				787
Amir Goldstein	833a950	2018-05-13 22:44:23 -0400	[diff] [blame]	788	static int ext4_sample_last_mounted(struct super_block *sb,
				789	struct vfsmount *mnt)
Theodore Ts'o	bc0b0d6	2009-06-13 10:09:48 -0400	[diff] [blame]	790	{
Amir Goldstein	833a950	2018-05-13 22:44:23 -0400	[diff] [blame]	791	struct ext4_sb_info *sbi = EXT4_SB(sb);
Theodore Ts'o	bc0b0d6	2009-06-13 10:09:48 -0400	[diff] [blame]	792	struct path path;
				793	char buf[64], *cp;
Amir Goldstein	833a950	2018-05-13 22:44:23 -0400	[diff] [blame]	794	handle_t *handle;
				795	int err;
				796
Harshad Shirwadkar	9b5f6c9	2020-11-05 19:59:09 -0800	[diff] [blame]	797	if (likely(ext4_test_mount_flag(sb, EXT4_MF_MNTDIR_SAMPLED)))
Amir Goldstein	833a950	2018-05-13 22:44:23 -0400	[diff] [blame]	798	return 0;
				799
Amir Goldstein	db6516a	2018-05-13 22:54:44 -0400	[diff] [blame]	800	if (sb_rdonly(sb) \|\| !sb_start_intwrite_trylock(sb))
Amir Goldstein	833a950	2018-05-13 22:44:23 -0400	[diff] [blame]	801	return 0;
				802
Harshad Shirwadkar	9b5f6c9	2020-11-05 19:59:09 -0800	[diff] [blame]	803	ext4_set_mount_flag(sb, EXT4_MF_MNTDIR_SAMPLED);
Amir Goldstein	833a950	2018-05-13 22:44:23 -0400	[diff] [blame]	804	/*
				805	* Sample where the filesystem has been mounted and
				806	* store it in the superblock for sysadmin convenience
				807	* when trying to sort through large numbers of block
				808	* devices or filesystem images.
				809	*/
				810	memset(buf, 0, sizeof(buf));
				811	path.mnt = mnt;
				812	path.dentry = mnt->mnt_root;
				813	cp = d_path(&path, buf, sizeof(buf));
Amir Goldstein	db6516a	2018-05-13 22:54:44 -0400	[diff] [blame]	814	err = 0;
Amir Goldstein	833a950	2018-05-13 22:44:23 -0400	[diff] [blame]	815	if (IS_ERR(cp))
Amir Goldstein	db6516a	2018-05-13 22:54:44 -0400	[diff] [blame]	816	goto out;
Amir Goldstein	833a950	2018-05-13 22:44:23 -0400	[diff] [blame]	817
				818	handle = ext4_journal_start_sb(sb, EXT4_HT_MISC, 1);
Amir Goldstein	db6516a	2018-05-13 22:54:44 -0400	[diff] [blame]	819	err = PTR_ERR(handle);
Amir Goldstein	833a950	2018-05-13 22:44:23 -0400	[diff] [blame]	820	if (IS_ERR(handle))
Amir Goldstein	db6516a	2018-05-13 22:54:44 -0400	[diff] [blame]	821	goto out;
Amir Goldstein	833a950	2018-05-13 22:44:23 -0400	[diff] [blame]	822	BUFFER_TRACE(sbi->s_sbh, "get_write_access");
Jan Kara	188c299	2021-08-16 11:57:04 +0200	[diff] [blame]	823	err = ext4_journal_get_write_access(handle, sb, sbi->s_sbh,
				824	EXT4_JTR_NONE);
Amir Goldstein	833a950	2018-05-13 22:44:23 -0400	[diff] [blame]	825	if (err)
Amir Goldstein	db6516a	2018-05-13 22:54:44 -0400	[diff] [blame]	826	goto out_journal;
Jan Kara	05c2c00	2020-12-16 11:18:39 +0100	[diff] [blame]	827	lock_buffer(sbi->s_sbh);
Theodore Ts'o	5a3b590	2020-12-17 13:24:15 -0500	[diff] [blame]	828	strncpy(sbi->s_es->s_last_mounted, cp,
Amir Goldstein	833a950	2018-05-13 22:44:23 -0400	[diff] [blame]	829	sizeof(sbi->s_es->s_last_mounted));
Jan Kara	05c2c00	2020-12-16 11:18:39 +0100	[diff] [blame]	830	ext4_superblock_csum_set(sb);
				831	unlock_buffer(sbi->s_sbh);
Jan Kara	a3f5cf1	2020-12-16 11:18:44 +0100	[diff] [blame]	832	ext4_handle_dirty_metadata(handle, NULL, sbi->s_sbh);
Amir Goldstein	db6516a	2018-05-13 22:54:44 -0400	[diff] [blame]	833	out_journal:
Amir Goldstein	833a950	2018-05-13 22:44:23 -0400	[diff] [blame]	834	ext4_journal_stop(handle);
Amir Goldstein	db6516a	2018-05-13 22:54:44 -0400	[diff] [blame]	835	out:
				836	sb_end_intwrite(sb);
Amir Goldstein	833a950	2018-05-13 22:44:23 -0400	[diff] [blame]	837	return err;
				838	}
				839
Dio Putra	e030a28	2020-06-14 11:45:44 +0700	[diff] [blame]	840	static int ext4_file_open(struct inode inode, struct file filp)
Amir Goldstein	833a950	2018-05-13 22:44:23 -0400	[diff] [blame]	841	{
Michael Halcrow	c9c7429	2015-04-12 00:56:10 -0400	[diff] [blame]	842	int ret;
Theodore Ts'o	bc0b0d6	2009-06-13 10:09:48 -0400	[diff] [blame]	843
Theodore Ts'o	0db1ff2	2017-02-05 01:28:48 -0500	[diff] [blame]	844	if (unlikely(ext4_forced_shutdown(EXT4_SB(inode->i_sb))))
				845	return -EIO;
				846
Amir Goldstein	833a950	2018-05-13 22:44:23 -0400	[diff] [blame]	847	ret = ext4_sample_last_mounted(inode->i_sb, filp->f_path.mnt);
				848	if (ret)
				849	return ret;
Miklos Szeredi	9dd78d8	2016-03-26 16:14:41 -0400	[diff] [blame]	850
Eric Biggers	09a5c31	2017-10-18 20:21:57 -0400	[diff] [blame]	851	ret = fscrypt_file_open(inode, filp);
				852	if (ret)
				853	return ret;
				854
Eric Biggers	c93d8f8	2019-07-22 09:26:24 -0700	[diff] [blame]	855	ret = fsverity_file_open(inode, filp);
				856	if (ret)
				857	return ret;
				858
Theodore Ts'o	8aefcd5	2011-01-10 12:29:43 -0500	[diff] [blame]	859	/*
				860	* Set up the jbd2_inode if we are opening the inode for
				861	* writing and the journal is present
				862	*/
Jan Kara	a361293	2013-08-16 21:19:41 -0400	[diff] [blame]	863	if (filp->f_mode & FMODE_WRITE) {
Michael Halcrow	c9c7429	2015-04-12 00:56:10 -0400	[diff] [blame]	864	ret = ext4_inode_attach_jinode(inode);
Jan Kara	a361293	2013-08-16 21:19:41 -0400	[diff] [blame]	865	if (ret < 0)
				866	return ret;
Theodore Ts'o	8aefcd5	2011-01-10 12:29:43 -0500	[diff] [blame]	867	}
Goldwyn Rodrigues	728fbc0	2017-06-20 07:05:47 -0500	[diff] [blame]	868
Jens Axboe	766ef1e	2020-08-03 17:02:11 -0600	[diff] [blame]	869	filp->f_mode \|= FMODE_NOWAIT \| FMODE_BUF_RASYNC;
Theodore Ts'o	abdd438	2015-05-31 13:35:39 -0400	[diff] [blame]	870	return dquot_file_open(inode, filp);
Theodore Ts'o	bc0b0d6	2009-06-13 10:09:48 -0400	[diff] [blame]	871	}
				872
Toshiyuki Okajima	e0d10bf	2010-10-27 21:30:06 -0400	[diff] [blame]	873	/*
Eric Sandeen	ec7268c	2012-04-30 13:14:03 -0500	[diff] [blame]	874	* ext4_llseek() handles both block-mapped and extent-mapped maxbytes values
				875	* by calling generic_file_llseek_size() with the appropriate maxbytes
				876	* value for each.
Toshiyuki Okajima	e0d10bf	2010-10-27 21:30:06 -0400	[diff] [blame]	877	*/
Andrew Morton	965c8e5	2012-12-17 15:59:39 -0800	[diff] [blame]	878	loff_t ext4_llseek(struct file *file, loff_t offset, int whence)
Toshiyuki Okajima	e0d10bf	2010-10-27 21:30:06 -0400	[diff] [blame]	879	{
				880	struct inode *inode = file->f_mapping->host;
				881	loff_t maxbytes;
				882
				883	if (!(ext4_test_inode_flag(inode, EXT4_INODE_EXTENTS)))
				884	maxbytes = EXT4_SB(inode->i_sb)->s_bitmap_maxbytes;
				885	else
				886	maxbytes = inode->i_sb->s_maxbytes;
Toshiyuki Okajima	e0d10bf	2010-10-27 21:30:06 -0400	[diff] [blame]	887
Andrew Morton	965c8e5	2012-12-17 15:59:39 -0800	[diff] [blame]	888	switch (whence) {
Christoph Hellwig	545052e	2017-10-01 17:58:54 -0400	[diff] [blame]	889	default:
Andrew Morton	965c8e5	2012-12-17 15:59:39 -0800	[diff] [blame]	890	return generic_file_llseek_size(file, offset, whence,
Zheng Liu	c8c0df2	2012-11-08 21:57:40 -0500	[diff] [blame]	891	maxbytes, i_size_read(inode));
Zheng Liu	c8c0df2	2012-11-08 21:57:40 -0500	[diff] [blame]	892	case SEEK_HOLE:
Christoph Hellwig	545052e	2017-10-01 17:58:54 -0400	[diff] [blame]	893	inode_lock_shared(inode);
Matthew Bobrowski	09edf4d	2019-11-05 23:03:31 +1100	[diff] [blame]	894	offset = iomap_seek_hole(inode, offset,
				895	&ext4_iomap_report_ops);
Christoph Hellwig	545052e	2017-10-01 17:58:54 -0400	[diff] [blame]	896	inode_unlock_shared(inode);
				897	break;
				898	case SEEK_DATA:
				899	inode_lock_shared(inode);
Matthew Bobrowski	09edf4d	2019-11-05 23:03:31 +1100	[diff] [blame]	900	offset = iomap_seek_data(inode, offset,
				901	&ext4_iomap_report_ops);
Christoph Hellwig	545052e	2017-10-01 17:58:54 -0400	[diff] [blame]	902	inode_unlock_shared(inode);
				903	break;
Zheng Liu	c8c0df2	2012-11-08 21:57:40 -0500	[diff] [blame]	904	}
				905
Christoph Hellwig	545052e	2017-10-01 17:58:54 -0400	[diff] [blame]	906	if (offset < 0)
				907	return offset;
				908	return vfs_setpos(file, offset, maxbytes);
Toshiyuki Okajima	e0d10bf	2010-10-27 21:30:06 -0400	[diff] [blame]	909	}
				910
Mingming Cao	617ba13	2006-10-11 01:20:53 -0700	[diff] [blame]	911	const struct file_operations ext4_file_operations = {
Toshiyuki Okajima	e0d10bf	2010-10-27 21:30:06 -0400	[diff] [blame]	912	.llseek = ext4_llseek,
Jan Kara	364443c	2016-11-20 17:36:06 -0500	[diff] [blame]	913	.read_iter = ext4_file_read_iter,
Al Viro	9b88416	2014-04-17 16:09:22 -0400	[diff] [blame]	914	.write_iter = ext4_file_write_iter,
Christoph Hellwig	3e08773	2021-10-12 13:12:24 +0200	[diff] [blame]	915	.iopoll = iocb_bio_iopoll,
Andi Kleen	5cdd7b2	2008-04-29 22:03:54 -0400	[diff] [blame]	916	.unlocked_ioctl = ext4_ioctl,
Dave Kleikamp	ac27a0e	2006-10-11 01:20:50 -0700	[diff] [blame]	917	#ifdef CONFIG_COMPAT
Mingming Cao	617ba13	2006-10-11 01:20:53 -0700	[diff] [blame]	918	.compat_ioctl = ext4_compat_ioctl,
Dave Kleikamp	ac27a0e	2006-10-11 01:20:50 -0700	[diff] [blame]	919	#endif
Aneesh Kumar K.V	2e9ee85	2008-07-11 19:27:31 -0400	[diff] [blame]	920	.mmap = ext4_file_mmap,
Jan Kara	b8a6176	2017-11-01 16:36:45 +0100	[diff] [blame]	921	.mmap_supported_flags = MAP_SYNC,
Theodore Ts'o	bc0b0d6	2009-06-13 10:09:48 -0400	[diff] [blame]	922	.open = ext4_file_open,
Mingming Cao	617ba13	2006-10-11 01:20:53 -0700	[diff] [blame]	923	.release = ext4_release_file,
				924	.fsync = ext4_sync_file,
Toshi Kani	dbe6ec8	2016-10-07 16:59:59 -0700	[diff] [blame]	925	.get_unmapped_area = thp_get_unmapped_area,
Dave Kleikamp	ac27a0e	2006-10-11 01:20:50 -0700	[diff] [blame]	926	.splice_read = generic_file_splice_read,
Al Viro	8d02076	2014-04-05 04:27:08 -0400	[diff] [blame]	927	.splice_write = iter_file_splice_write,
Christoph Hellwig	2fe17c1	2011-01-14 13:07:43 +0100	[diff] [blame]	928	.fallocate = ext4_fallocate,
Dave Kleikamp	ac27a0e	2006-10-11 01:20:50 -0700	[diff] [blame]	929	};
				930
Arjan van de Ven	754661f	2007-02-12 00:55:38 -0800	[diff] [blame]	931	const struct inode_operations ext4_file_inode_operations = {
Mingming Cao	617ba13	2006-10-11 01:20:53 -0700	[diff] [blame]	932	.setattr = ext4_setattr,
David Howells	99652ea	2017-03-31 18:31:56 +0100	[diff] [blame]	933	.getattr = ext4_file_getattr,
Mingming Cao	617ba13	2006-10-11 01:20:53 -0700	[diff] [blame]	934	.listxattr = ext4_listxattr,
Christoph Hellwig	4e34e71	2011-07-23 17:37:31 +0200	[diff] [blame]	935	.get_acl = ext4_get_acl,
Christoph Hellwig	64e178a	2013-12-20 05:16:44 -0800	[diff] [blame]	936	.set_acl = ext4_set_acl,
Eric Sandeen	6873fa0	2008-10-07 00:46:36 -0400	[diff] [blame]	937	.fiemap = ext4_fiemap,
Miklos Szeredi	4db5c2e	2021-04-07 14:36:43 +0200	[diff] [blame]	938	.fileattr_get = ext4_fileattr_get,
				939	.fileattr_set = ext4_fileattr_set,
Dave Kleikamp	ac27a0e	2006-10-11 01:20:50 -0700	[diff] [blame]	940	};
				941