blob: 4774c7172ef46ff95d83896d469308e950c1c201 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
Nathan Scott7b718762005-11-02 14:58:39 +11002 * Copyright (c) 2000-2005 Silicon Graphics, Inc.
3 * All Rights Reserved.
Linus Torvalds1da177e2005-04-16 15:20:36 -07004 *
Nathan Scott7b718762005-11-02 14:58:39 +11005 * This program is free software; you can redistribute it and/or
6 * modify it under the terms of the GNU General Public License as
Linus Torvalds1da177e2005-04-16 15:20:36 -07007 * published by the Free Software Foundation.
8 *
Nathan Scott7b718762005-11-02 14:58:39 +11009 * This program is distributed in the hope that it would be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 * GNU General Public License for more details.
Linus Torvalds1da177e2005-04-16 15:20:36 -070013 *
Nathan Scott7b718762005-11-02 14:58:39 +110014 * You should have received a copy of the GNU General Public License
15 * along with this program; if not, write the Free Software Foundation,
16 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
Linus Torvalds1da177e2005-04-16 15:20:36 -070017 */
Linus Torvalds1da177e2005-04-16 15:20:36 -070018#include "xfs.h"
Christoph Hellwigdda35b82010-02-15 09:44:46 +000019#include "xfs_fs.h"
Dave Chinner70a98832013-10-23 10:36:05 +110020#include "xfs_shared.h"
Dave Chinnera4fbe6a2013-10-23 10:51:50 +110021#include "xfs_format.h"
Dave Chinner239880e2013-10-23 10:50:10 +110022#include "xfs_log_format.h"
23#include "xfs_trans_resv.h"
Linus Torvalds1da177e2005-04-16 15:20:36 -070024#include "xfs_mount.h"
Dave Chinner57062782013-10-15 09:17:51 +110025#include "xfs_da_format.h"
26#include "xfs_da_btree.h"
Linus Torvalds1da177e2005-04-16 15:20:36 -070027#include "xfs_inode.h"
Dave Chinner239880e2013-10-23 10:50:10 +110028#include "xfs_trans.h"
Christoph Hellwigfd3200b2010-02-15 09:44:48 +000029#include "xfs_inode_item.h"
Christoph Hellwigdda35b82010-02-15 09:44:46 +000030#include "xfs_bmap.h"
Dave Chinnerc24b5df2013-08-12 20:49:45 +100031#include "xfs_bmap_util.h"
Linus Torvalds1da177e2005-04-16 15:20:36 -070032#include "xfs_error.h"
Dave Chinner2b9ab5a2013-08-12 20:49:37 +100033#include "xfs_dir2.h"
Dave Chinnerc24b5df2013-08-12 20:49:45 +100034#include "xfs_dir2_priv.h"
Christoph Hellwigddcd8562008-12-03 07:55:34 -050035#include "xfs_ioctl.h"
Christoph Hellwigdda35b82010-02-15 09:44:46 +000036#include "xfs_trace.h"
Dave Chinner239880e2013-10-23 10:50:10 +110037#include "xfs_log.h"
Brian Fosterdc06f3982014-07-24 19:49:28 +100038#include "xfs_icache.h"
Christoph Hellwig781355c2015-02-16 11:59:50 +110039#include "xfs_pnfs.h"
Christoph Hellwig68a9f5e2016-06-21 09:53:44 +100040#include "xfs_iomap.h"
Darrick J. Wong0613f162016-10-03 09:11:37 -070041#include "xfs_reflink.h"
Linus Torvalds1da177e2005-04-16 15:20:36 -070042
43#include <linux/dcache.h>
Christoph Hellwig2fe17c12011-01-14 13:07:43 +010044#include <linux/falloc.h>
Jeff Liud126d432012-08-21 17:11:57 +080045#include <linux/pagevec.h>
Tejun Heo66114ca2015-05-22 17:13:32 -040046#include <linux/backing-dev.h>
Christoph Hellwiga39e5962017-11-01 16:36:47 +010047#include <linux/mman.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070048
Alexey Dobriyanf0f37e2f2009-09-27 22:29:37 +040049static const struct vm_operations_struct xfs_file_vm_ops;
Linus Torvalds1da177e2005-04-16 15:20:36 -070050
Christoph Hellwig8add71c2015-02-02 09:53:56 +110051int
52xfs_update_prealloc_flags(
53 struct xfs_inode *ip,
54 enum xfs_prealloc_flags flags)
55{
56 struct xfs_trans *tp;
57 int error;
58
Christoph Hellwig253f4912016-04-06 09:19:55 +100059 error = xfs_trans_alloc(ip->i_mount, &M_RES(ip->i_mount)->tr_writeid,
60 0, 0, 0, &tp);
61 if (error)
Christoph Hellwig8add71c2015-02-02 09:53:56 +110062 return error;
Christoph Hellwig8add71c2015-02-02 09:53:56 +110063
64 xfs_ilock(ip, XFS_ILOCK_EXCL);
65 xfs_trans_ijoin(tp, ip, XFS_ILOCK_EXCL);
66
67 if (!(flags & XFS_PREALLOC_INVISIBLE)) {
Dave Chinnerc19b3b052016-02-09 16:54:58 +110068 VFS_I(ip)->i_mode &= ~S_ISUID;
69 if (VFS_I(ip)->i_mode & S_IXGRP)
70 VFS_I(ip)->i_mode &= ~S_ISGID;
Christoph Hellwig8add71c2015-02-02 09:53:56 +110071 xfs_trans_ichgtime(tp, ip, XFS_ICHGTIME_MOD | XFS_ICHGTIME_CHG);
72 }
73
74 if (flags & XFS_PREALLOC_SET)
75 ip->i_d.di_flags |= XFS_DIFLAG_PREALLOC;
76 if (flags & XFS_PREALLOC_CLEAR)
77 ip->i_d.di_flags &= ~XFS_DIFLAG_PREALLOC;
78
79 xfs_trans_log_inode(tp, ip, XFS_ILOG_CORE);
80 if (flags & XFS_PREALLOC_SYNC)
81 xfs_trans_set_sync(tp);
Christoph Hellwig70393312015-06-04 13:48:08 +100082 return xfs_trans_commit(tp);
Christoph Hellwig8add71c2015-02-02 09:53:56 +110083}
84
Christoph Hellwig1da2f2d2011-10-02 14:25:16 +000085/*
86 * Fsync operations on directories are much simpler than on regular files,
87 * as there is no file data to flush, and thus also no need for explicit
88 * cache flush operations, and there are no non-transaction metadata updates
89 * on directories either.
90 */
91STATIC int
92xfs_dir_fsync(
93 struct file *file,
94 loff_t start,
95 loff_t end,
96 int datasync)
97{
98 struct xfs_inode *ip = XFS_I(file->f_mapping->host);
99 struct xfs_mount *mp = ip->i_mount;
100 xfs_lsn_t lsn = 0;
101
102 trace_xfs_dir_fsync(ip);
103
104 xfs_ilock(ip, XFS_ILOCK_SHARED);
105 if (xfs_ipincount(ip))
106 lsn = ip->i_itemp->ili_last_lsn;
107 xfs_iunlock(ip, XFS_ILOCK_SHARED);
108
109 if (!lsn)
110 return 0;
Christoph Hellwig656de4f2018-03-13 23:15:28 -0700111 return xfs_log_force_lsn(mp, lsn, XFS_LOG_SYNC, NULL);
Christoph Hellwig1da2f2d2011-10-02 14:25:16 +0000112}
113
Christoph Hellwigfd3200b2010-02-15 09:44:48 +0000114STATIC int
115xfs_file_fsync(
116 struct file *file,
Josef Bacik02c24a82011-07-16 20:44:56 -0400117 loff_t start,
118 loff_t end,
Christoph Hellwigfd3200b2010-02-15 09:44:48 +0000119 int datasync)
120{
Christoph Hellwig7ea80852010-05-26 17:53:25 +0200121 struct inode *inode = file->f_mapping->host;
122 struct xfs_inode *ip = XFS_I(inode);
Christoph Hellwiga27a2632011-06-16 12:02:23 +0000123 struct xfs_mount *mp = ip->i_mount;
Christoph Hellwigfd3200b2010-02-15 09:44:48 +0000124 int error = 0;
125 int log_flushed = 0;
Christoph Hellwigb1037052011-09-19 14:55:51 +0000126 xfs_lsn_t lsn = 0;
Christoph Hellwigfd3200b2010-02-15 09:44:48 +0000127
Christoph Hellwigcca28fb2010-06-24 11:57:09 +1000128 trace_xfs_file_fsync(ip);
Christoph Hellwigfd3200b2010-02-15 09:44:48 +0000129
Jeff Layton1b180272017-07-06 07:02:30 -0400130 error = file_write_and_wait_range(file, start, end);
Josef Bacik02c24a82011-07-16 20:44:56 -0400131 if (error)
132 return error;
133
Christoph Hellwiga27a2632011-06-16 12:02:23 +0000134 if (XFS_FORCED_SHUTDOWN(mp))
Eric Sandeenb474c7a2014-06-22 15:04:54 +1000135 return -EIO;
Christoph Hellwigfd3200b2010-02-15 09:44:48 +0000136
137 xfs_iflags_clear(ip, XFS_ITRUNCATED);
138
Dave Chinner2291dab2016-12-09 16:49:54 +1100139 /*
140 * If we have an RT and/or log subvolume we need to make sure to flush
141 * the write cache the device used for file data first. This is to
142 * ensure newly written file data make it to disk before logging the new
143 * inode size in case of an extending write.
144 */
145 if (XFS_IS_REALTIME_INODE(ip))
146 xfs_blkdev_issue_flush(mp->m_rtdev_targp);
147 else if (mp->m_logdev_targp != mp->m_ddev_targp)
148 xfs_blkdev_issue_flush(mp->m_ddev_targp);
Christoph Hellwiga27a2632011-06-16 12:02:23 +0000149
Christoph Hellwigfd3200b2010-02-15 09:44:48 +0000150 /*
Dave Chinnerfc0561c2015-11-03 13:14:59 +1100151 * All metadata updates are logged, which means that we just have to
152 * flush the log up to the latest LSN that touched the inode. If we have
153 * concurrent fsync/fdatasync() calls, we need them to all block on the
154 * log force before we clear the ili_fsync_fields field. This ensures
155 * that we don't get a racing sync operation that does not wait for the
156 * metadata to hit the journal before returning. If we race with
157 * clearing the ili_fsync_fields, then all that will happen is the log
158 * force will do nothing as the lsn will already be on disk. We can't
159 * race with setting ili_fsync_fields because that is done under
160 * XFS_ILOCK_EXCL, and that can't happen because we hold the lock shared
161 * until after the ili_fsync_fields is cleared.
Christoph Hellwigfd3200b2010-02-15 09:44:48 +0000162 */
163 xfs_ilock(ip, XFS_ILOCK_SHARED);
Christoph Hellwig8f639dd2012-02-29 09:53:55 +0000164 if (xfs_ipincount(ip)) {
165 if (!datasync ||
Dave Chinnerfc0561c2015-11-03 13:14:59 +1100166 (ip->i_itemp->ili_fsync_fields & ~XFS_ILOG_TIMESTAMP))
Christoph Hellwig8f639dd2012-02-29 09:53:55 +0000167 lsn = ip->i_itemp->ili_last_lsn;
168 }
Christoph Hellwigfd3200b2010-02-15 09:44:48 +0000169
Dave Chinnerfc0561c2015-11-03 13:14:59 +1100170 if (lsn) {
Christoph Hellwig656de4f2018-03-13 23:15:28 -0700171 error = xfs_log_force_lsn(mp, lsn, XFS_LOG_SYNC, &log_flushed);
Dave Chinnerfc0561c2015-11-03 13:14:59 +1100172 ip->i_itemp->ili_fsync_fields = 0;
173 }
174 xfs_iunlock(ip, XFS_ILOCK_SHARED);
Christoph Hellwigb1037052011-09-19 14:55:51 +0000175
Christoph Hellwiga27a2632011-06-16 12:02:23 +0000176 /*
177 * If we only have a single device, and the log force about was
178 * a no-op we might have to flush the data device cache here.
179 * This can only happen for fdatasync/O_DSYNC if we were overwriting
180 * an already allocated file and thus do not have any metadata to
181 * commit.
182 */
Dave Chinner2291dab2016-12-09 16:49:54 +1100183 if (!log_flushed && !XFS_IS_REALTIME_INODE(ip) &&
184 mp->m_logdev_targp == mp->m_ddev_targp)
Christoph Hellwiga27a2632011-06-16 12:02:23 +0000185 xfs_blkdev_issue_flush(mp->m_ddev_targp);
Christoph Hellwigfd3200b2010-02-15 09:44:48 +0000186
Dave Chinner24513372014-06-25 14:58:08 +1000187 return error;
Christoph Hellwigfd3200b2010-02-15 09:44:48 +0000188}
189
Christoph Hellwig00258e32010-02-15 09:44:47 +0000190STATIC ssize_t
Christoph Hellwigbbc5a742016-07-20 11:35:42 +1000191xfs_file_dio_aio_read(
Christoph Hellwigdda35b82010-02-15 09:44:46 +0000192 struct kiocb *iocb,
Al Virob4f5d2c2014-04-02 14:37:59 -0400193 struct iov_iter *to)
Christoph Hellwigdda35b82010-02-15 09:44:46 +0000194{
Christoph Hellwigacdda3a2016-11-30 14:37:15 +1100195 struct xfs_inode *ip = XFS_I(file_inode(iocb->ki_filp));
Christoph Hellwigbbc5a742016-07-20 11:35:42 +1000196 size_t count = iov_iter_count(to);
Christoph Hellwigacdda3a2016-11-30 14:37:15 +1100197 ssize_t ret;
Christoph Hellwigdda35b82010-02-15 09:44:46 +0000198
Christoph Hellwigbbc5a742016-07-20 11:35:42 +1000199 trace_xfs_file_direct_read(ip, count, iocb->ki_pos);
Christoph Hellwigdda35b82010-02-15 09:44:46 +0000200
Christoph Hellwigf1285ff2016-07-20 11:36:57 +1000201 if (!count)
202 return 0; /* skip atime */
Christoph Hellwig00258e32010-02-15 09:44:47 +0000203
Christoph Hellwiga447d7c2016-10-03 09:47:34 +1100204 file_accessed(iocb->ki_filp);
205
Christoph Hellwig65523212016-11-30 14:33:25 +1100206 xfs_ilock(ip, XFS_IOLOCK_SHARED);
Christoph Hellwigacdda3a2016-11-30 14:37:15 +1100207 ret = iomap_dio_rw(iocb, to, &xfs_iomap_ops, NULL);
Christoph Hellwig65523212016-11-30 14:33:25 +1100208 xfs_iunlock(ip, XFS_IOLOCK_SHARED);
Christoph Hellwigacdda3a2016-11-30 14:37:15 +1100209
Christoph Hellwig16d4d432016-07-20 11:38:55 +1000210 return ret;
211}
212
Arnd Bergmannf021bd02016-07-22 09:50:55 +1000213static noinline ssize_t
Christoph Hellwig16d4d432016-07-20 11:38:55 +1000214xfs_file_dax_read(
215 struct kiocb *iocb,
216 struct iov_iter *to)
217{
Christoph Hellwig6c31f4952016-09-19 11:28:38 +1000218 struct xfs_inode *ip = XFS_I(iocb->ki_filp->f_mapping->host);
Christoph Hellwig16d4d432016-07-20 11:38:55 +1000219 size_t count = iov_iter_count(to);
220 ssize_t ret = 0;
221
222 trace_xfs_file_dax_read(ip, count, iocb->ki_pos);
223
224 if (!count)
225 return 0; /* skip atime */
226
Christoph Hellwig942491c2017-10-23 18:31:50 -0700227 if (iocb->ki_flags & IOCB_NOWAIT) {
228 if (!xfs_ilock_nowait(ip, XFS_IOLOCK_SHARED))
Goldwyn Rodrigues29a5d292017-06-20 07:05:48 -0500229 return -EAGAIN;
Christoph Hellwig942491c2017-10-23 18:31:50 -0700230 } else {
Goldwyn Rodrigues29a5d292017-06-20 07:05:48 -0500231 xfs_ilock(ip, XFS_IOLOCK_SHARED);
232 }
Christoph Hellwig942491c2017-10-23 18:31:50 -0700233
Ross Zwisler11c59c92016-11-08 11:32:46 +1100234 ret = dax_iomap_rw(iocb, to, &xfs_iomap_ops);
Christoph Hellwig65523212016-11-30 14:33:25 +1100235 xfs_iunlock(ip, XFS_IOLOCK_SHARED);
Christoph Hellwigbbc5a742016-07-20 11:35:42 +1000236
Christoph Hellwigf1285ff2016-07-20 11:36:57 +1000237 file_accessed(iocb->ki_filp);
Christoph Hellwigbbc5a742016-07-20 11:35:42 +1000238 return ret;
239}
240
241STATIC ssize_t
242xfs_file_buffered_aio_read(
243 struct kiocb *iocb,
244 struct iov_iter *to)
245{
246 struct xfs_inode *ip = XFS_I(file_inode(iocb->ki_filp));
247 ssize_t ret;
248
249 trace_xfs_file_buffered_read(ip, iov_iter_count(to), iocb->ki_pos);
250
Christoph Hellwig942491c2017-10-23 18:31:50 -0700251 if (iocb->ki_flags & IOCB_NOWAIT) {
252 if (!xfs_ilock_nowait(ip, XFS_IOLOCK_SHARED))
Christoph Hellwig91f99432017-08-29 16:13:20 +0200253 return -EAGAIN;
Christoph Hellwig942491c2017-10-23 18:31:50 -0700254 } else {
Christoph Hellwig91f99432017-08-29 16:13:20 +0200255 xfs_ilock(ip, XFS_IOLOCK_SHARED);
256 }
Al Virob4f5d2c2014-04-02 14:37:59 -0400257 ret = generic_file_read_iter(iocb, to);
Christoph Hellwig65523212016-11-30 14:33:25 +1100258 xfs_iunlock(ip, XFS_IOLOCK_SHARED);
Christoph Hellwigbbc5a742016-07-20 11:35:42 +1000259
260 return ret;
261}
262
263STATIC ssize_t
264xfs_file_read_iter(
265 struct kiocb *iocb,
266 struct iov_iter *to)
267{
Christoph Hellwig16d4d432016-07-20 11:38:55 +1000268 struct inode *inode = file_inode(iocb->ki_filp);
269 struct xfs_mount *mp = XFS_I(inode)->i_mount;
Christoph Hellwigbbc5a742016-07-20 11:35:42 +1000270 ssize_t ret = 0;
271
272 XFS_STATS_INC(mp, xs_read_calls);
273
274 if (XFS_FORCED_SHUTDOWN(mp))
275 return -EIO;
276
Christoph Hellwig16d4d432016-07-20 11:38:55 +1000277 if (IS_DAX(inode))
278 ret = xfs_file_dax_read(iocb, to);
279 else if (iocb->ki_flags & IOCB_DIRECT)
Christoph Hellwigbbc5a742016-07-20 11:35:42 +1000280 ret = xfs_file_dio_aio_read(iocb, to);
281 else
282 ret = xfs_file_buffered_aio_read(iocb, to);
283
Christoph Hellwigdda35b82010-02-15 09:44:46 +0000284 if (ret > 0)
Bill O'Donnellff6d6af2015-10-12 18:21:22 +1100285 XFS_STATS_ADD(mp, xs_read_bytes, ret);
Christoph Hellwigdda35b82010-02-15 09:44:46 +0000286 return ret;
287}
288
Dave Chinner4c5cfd12011-01-11 10:14:16 +1100289/*
Dave Chinner4d8d1582011-01-11 10:23:42 +1100290 * Common pre-write limit and setup checks.
291 *
Christoph Hellwig5bf1f262011-12-18 20:00:13 +0000292 * Called with the iolocked held either shared and exclusive according to
293 * @iolock, and returns with it held. Might upgrade the iolock to exclusive
294 * if called for a direct write beyond i_size.
Dave Chinner4d8d1582011-01-11 10:23:42 +1100295 */
296STATIC ssize_t
297xfs_file_aio_write_checks(
Al Viro99733fa2015-04-07 14:25:18 -0400298 struct kiocb *iocb,
299 struct iov_iter *from,
Dave Chinner4d8d1582011-01-11 10:23:42 +1100300 int *iolock)
301{
Al Viro99733fa2015-04-07 14:25:18 -0400302 struct file *file = iocb->ki_filp;
Dave Chinner4d8d1582011-01-11 10:23:42 +1100303 struct inode *inode = file->f_mapping->host;
304 struct xfs_inode *ip = XFS_I(inode);
Al Viro3309dd02015-04-09 12:55:47 -0400305 ssize_t error = 0;
Al Viro99733fa2015-04-07 14:25:18 -0400306 size_t count = iov_iter_count(from);
Brian Foster3136e8b2015-10-12 16:02:05 +1100307 bool drained_dio = false;
Christoph Hellwigf5c547172018-03-13 23:15:32 -0700308 loff_t isize;
Dave Chinner4d8d1582011-01-11 10:23:42 +1100309
Dave Chinner7271d242011-08-25 07:17:02 +0000310restart:
Al Viro3309dd02015-04-09 12:55:47 -0400311 error = generic_write_checks(iocb, from);
312 if (error <= 0)
Dave Chinner4d8d1582011-01-11 10:23:42 +1100313 return error;
Dave Chinner4d8d1582011-01-11 10:23:42 +1100314
Dan Williams69eb5fa2018-03-20 14:42:38 -0700315 error = xfs_break_layouts(inode, iolock, BREAK_WRITE);
Christoph Hellwig781355c2015-02-16 11:59:50 +1100316 if (error)
317 return error;
318
Christoph Hellwig65523212016-11-30 14:33:25 +1100319 /*
320 * For changing security info in file_remove_privs() we need i_rwsem
321 * exclusively.
322 */
Jan Karaa6de82c2015-05-21 16:05:56 +0200323 if (*iolock == XFS_IOLOCK_SHARED && !IS_NOSEC(inode)) {
Christoph Hellwig65523212016-11-30 14:33:25 +1100324 xfs_iunlock(ip, *iolock);
Jan Karaa6de82c2015-05-21 16:05:56 +0200325 *iolock = XFS_IOLOCK_EXCL;
Christoph Hellwig65523212016-11-30 14:33:25 +1100326 xfs_ilock(ip, *iolock);
Jan Karaa6de82c2015-05-21 16:05:56 +0200327 goto restart;
328 }
Dave Chinner4d8d1582011-01-11 10:23:42 +1100329 /*
330 * If the offset is beyond the size of the file, we need to zero any
331 * blocks that fall between the existing EOF and the start of this
Christoph Hellwig2813d682011-12-18 20:00:12 +0000332 * write. If zeroing is needed and we are currently holding the
Christoph Hellwig467f7892012-03-27 10:34:47 -0400333 * iolock shared, we need to update it to exclusive which implies
334 * having to redo all checks before.
Dave Chinnerb9d59842015-04-16 22:03:07 +1000335 *
336 * We need to serialise against EOF updates that occur in IO
337 * completions here. We want to make sure that nobody is changing the
338 * size while we do this check until we have placed an IO barrier (i.e.
339 * hold the XFS_IOLOCK_EXCL) that prevents new IO from being dispatched.
340 * The spinlock effectively forms a memory barrier once we have the
341 * XFS_IOLOCK_EXCL so we are guaranteed to see the latest EOF value
342 * and hence be able to correctly determine if we need to run zeroing.
Dave Chinner4d8d1582011-01-11 10:23:42 +1100343 */
Dave Chinnerb9d59842015-04-16 22:03:07 +1000344 spin_lock(&ip->i_flags_lock);
Christoph Hellwigf5c547172018-03-13 23:15:32 -0700345 isize = i_size_read(inode);
346 if (iocb->ki_pos > isize) {
Dave Chinnerb9d59842015-04-16 22:03:07 +1000347 spin_unlock(&ip->i_flags_lock);
Brian Foster3136e8b2015-10-12 16:02:05 +1100348 if (!drained_dio) {
349 if (*iolock == XFS_IOLOCK_SHARED) {
Christoph Hellwig65523212016-11-30 14:33:25 +1100350 xfs_iunlock(ip, *iolock);
Brian Foster3136e8b2015-10-12 16:02:05 +1100351 *iolock = XFS_IOLOCK_EXCL;
Christoph Hellwig65523212016-11-30 14:33:25 +1100352 xfs_ilock(ip, *iolock);
Brian Foster3136e8b2015-10-12 16:02:05 +1100353 iov_iter_reexpand(from, count);
354 }
Dave Chinner40c63fb2015-04-16 22:03:17 +1000355 /*
356 * We now have an IO submission barrier in place, but
357 * AIO can do EOF updates during IO completion and hence
358 * we now need to wait for all of them to drain. Non-AIO
359 * DIO will have drained before we are given the
360 * XFS_IOLOCK_EXCL, and so for most cases this wait is a
361 * no-op.
362 */
363 inode_dio_wait(inode);
Brian Foster3136e8b2015-10-12 16:02:05 +1100364 drained_dio = true;
Dave Chinner7271d242011-08-25 07:17:02 +0000365 goto restart;
366 }
Christoph Hellwigf5c547172018-03-13 23:15:32 -0700367
368 trace_xfs_zero_eof(ip, isize, iocb->ki_pos - isize);
369 error = iomap_zero_range(inode, isize, iocb->ki_pos - isize,
370 NULL, &xfs_iomap_ops);
Christoph Hellwig467f7892012-03-27 10:34:47 -0400371 if (error)
372 return error;
Dave Chinnerb9d59842015-04-16 22:03:07 +1000373 } else
374 spin_unlock(&ip->i_flags_lock);
Dave Chinner4d8d1582011-01-11 10:23:42 +1100375
376 /*
Christoph Hellwig8a9c9982012-02-29 09:53:52 +0000377 * Updating the timestamps will grab the ilock again from
378 * xfs_fs_dirty_inode, so we have to call it after dropping the
379 * lock above. Eventually we should look into a way to avoid
380 * the pointless lock roundtrip.
381 */
Josef Bacikc3b2da32012-03-26 09:59:21 -0400382 if (likely(!(file->f_mode & FMODE_NOCMTIME))) {
383 error = file_update_time(file);
384 if (error)
385 return error;
386 }
Christoph Hellwig8a9c9982012-02-29 09:53:52 +0000387
388 /*
Dave Chinner4d8d1582011-01-11 10:23:42 +1100389 * If we're writing the file then make sure to clear the setuid and
390 * setgid bits if the process is not being run by root. This keeps
391 * people from modifying setuid and setgid binaries.
392 */
Jan Karaa6de82c2015-05-21 16:05:56 +0200393 if (!IS_NOSEC(inode))
394 return file_remove_privs(file);
395 return 0;
Dave Chinner4d8d1582011-01-11 10:23:42 +1100396}
397
Christoph Hellwigacdda3a2016-11-30 14:37:15 +1100398static int
399xfs_dio_write_end_io(
400 struct kiocb *iocb,
401 ssize_t size,
402 unsigned flags)
403{
404 struct inode *inode = file_inode(iocb->ki_filp);
405 struct xfs_inode *ip = XFS_I(inode);
406 loff_t offset = iocb->ki_pos;
Christoph Hellwigacdda3a2016-11-30 14:37:15 +1100407 int error = 0;
408
409 trace_xfs_end_io_direct_write(ip, offset, size);
410
411 if (XFS_FORCED_SHUTDOWN(ip->i_mount))
412 return -EIO;
413
414 if (size <= 0)
415 return size;
416
Eryu Guanee70daa2017-09-21 11:26:18 -0700417 if (flags & IOMAP_DIO_COW) {
418 error = xfs_reflink_end_cow(ip, offset, size);
419 if (error)
420 return error;
421 }
422
423 /*
424 * Unwritten conversion updates the in-core isize after extent
425 * conversion but before updating the on-disk size. Updating isize any
426 * earlier allows a racing dio read to find unwritten extents before
427 * they are converted.
428 */
429 if (flags & IOMAP_DIO_UNWRITTEN)
430 return xfs_iomap_write_unwritten(ip, offset, size, true);
431
Christoph Hellwigacdda3a2016-11-30 14:37:15 +1100432 /*
433 * We need to update the in-core inode size here so that we don't end up
434 * with the on-disk inode size being outside the in-core inode size. We
435 * have no other method of updating EOF for AIO, so always do it here
436 * if necessary.
437 *
438 * We need to lock the test/set EOF update as we can be racing with
439 * other IO completions here to update the EOF. Failing to serialise
440 * here can result in EOF moving backwards and Bad Things Happen when
441 * that occurs.
442 */
443 spin_lock(&ip->i_flags_lock);
444 if (offset + size > i_size_read(inode)) {
445 i_size_write(inode, offset + size);
Eryu Guanee70daa2017-09-21 11:26:18 -0700446 spin_unlock(&ip->i_flags_lock);
Christoph Hellwigacdda3a2016-11-30 14:37:15 +1100447 error = xfs_setfilesize(ip, offset, size);
Eryu Guanee70daa2017-09-21 11:26:18 -0700448 } else {
449 spin_unlock(&ip->i_flags_lock);
450 }
Christoph Hellwigacdda3a2016-11-30 14:37:15 +1100451
452 return error;
453}
454
Dave Chinner4d8d1582011-01-11 10:23:42 +1100455/*
Dave Chinnerf0d26e82011-01-11 10:15:36 +1100456 * xfs_file_dio_aio_write - handle direct IO writes
457 *
458 * Lock the inode appropriately to prepare for and issue a direct IO write.
Dave Chinnereda77982011-01-11 10:22:40 +1100459 * By separating it from the buffered write path we remove all the tricky to
Dave Chinnerf0d26e82011-01-11 10:15:36 +1100460 * follow locking changes and looping.
461 *
Dave Chinnereda77982011-01-11 10:22:40 +1100462 * If there are cached pages or we're extending the file, we need IOLOCK_EXCL
463 * until we're sure the bytes at the new EOF have been zeroed and/or the cached
464 * pages are flushed out.
465 *
466 * In most cases the direct IO writes will be done holding IOLOCK_SHARED
467 * allowing them to be done in parallel with reads and other direct IO writes.
468 * However, if the IO is not aligned to filesystem blocks, the direct IO layer
469 * needs to do sub-block zeroing and that requires serialisation against other
470 * direct IOs to the same block. In this case we need to serialise the
471 * submission of the unaligned IOs so that we don't get racing block zeroing in
472 * the dio layer. To avoid the problem with aio, we also need to wait for
473 * outstanding IOs to complete so that unwritten extent conversion is completed
474 * before we try to map the overlapping block. This is currently implemented by
Christoph Hellwig4a06fd22011-08-23 08:28:13 +0000475 * hitting it with a big hammer (i.e. inode_dio_wait()).
Dave Chinnereda77982011-01-11 10:22:40 +1100476 *
Dave Chinnerf0d26e82011-01-11 10:15:36 +1100477 * Returns with locks held indicated by @iolock and errors indicated by
478 * negative return values.
479 */
480STATIC ssize_t
481xfs_file_dio_aio_write(
482 struct kiocb *iocb,
Al Virob3188912014-04-02 07:06:30 -0400483 struct iov_iter *from)
Dave Chinnerf0d26e82011-01-11 10:15:36 +1100484{
485 struct file *file = iocb->ki_filp;
486 struct address_space *mapping = file->f_mapping;
487 struct inode *inode = mapping->host;
488 struct xfs_inode *ip = XFS_I(inode);
489 struct xfs_mount *mp = ip->i_mount;
490 ssize_t ret = 0;
Dave Chinnereda77982011-01-11 10:22:40 +1100491 int unaligned_io = 0;
Christoph Hellwigd0606462011-12-18 20:00:14 +0000492 int iolock;
Al Virob3188912014-04-02 07:06:30 -0400493 size_t count = iov_iter_count(from);
Christoph Hellwigacdda3a2016-11-30 14:37:15 +1100494 struct xfs_buftarg *target = XFS_IS_REALTIME_INODE(ip) ?
Dave Chinnerf0d26e82011-01-11 10:15:36 +1100495 mp->m_rtdev_targp : mp->m_ddev_targp;
496
Eric Sandeen7c71ee72014-01-21 16:46:23 -0600497 /* DIO must be aligned to device logical sector size */
Christoph Hellwig16d4d432016-07-20 11:38:55 +1000498 if ((iocb->ki_pos | count) & target->bt_logical_sectormask)
Eric Sandeenb474c7a2014-06-22 15:04:54 +1000499 return -EINVAL;
Dave Chinnerf0d26e82011-01-11 10:15:36 +1100500
Christoph Hellwig0ee7a3f2016-10-20 15:44:14 +1100501 /*
502 * Don't take the exclusive iolock here unless the I/O is unaligned to
503 * the file system block size. We don't need to consider the EOF
504 * extension case here because xfs_file_aio_write_checks() will relock
505 * the inode as necessary for EOF zeroing cases and fill out the new
506 * inode size as appropriate.
507 */
Christoph Hellwig13712712016-04-07 08:51:57 -0700508 if ((iocb->ki_pos & mp->m_blockmask) ||
Christoph Hellwig0ee7a3f2016-10-20 15:44:14 +1100509 ((iocb->ki_pos + count) & mp->m_blockmask)) {
Dave Chinnereda77982011-01-11 10:22:40 +1100510 unaligned_io = 1;
Christoph Hellwig54a4ef82017-02-06 13:00:54 -0800511
512 /*
513 * We can't properly handle unaligned direct I/O to reflink
514 * files yet, as we can't unshare a partial block.
515 */
516 if (xfs_is_reflink_inode(ip)) {
517 trace_xfs_reflink_bounce_dio_write(ip, iocb->ki_pos, count);
518 return -EREMCHG;
519 }
Christoph Hellwigd0606462011-12-18 20:00:14 +0000520 iolock = XFS_IOLOCK_EXCL;
Christoph Hellwig0ee7a3f2016-10-20 15:44:14 +1100521 } else {
Christoph Hellwigd0606462011-12-18 20:00:14 +0000522 iolock = XFS_IOLOCK_SHARED;
Christoph Hellwigc58cb162011-08-27 14:42:53 +0000523 }
Dave Chinnerf0d26e82011-01-11 10:15:36 +1100524
Christoph Hellwig942491c2017-10-23 18:31:50 -0700525 if (iocb->ki_flags & IOCB_NOWAIT) {
526 if (!xfs_ilock_nowait(ip, iolock))
Goldwyn Rodrigues29a5d292017-06-20 07:05:48 -0500527 return -EAGAIN;
Christoph Hellwig942491c2017-10-23 18:31:50 -0700528 } else {
Goldwyn Rodrigues29a5d292017-06-20 07:05:48 -0500529 xfs_ilock(ip, iolock);
530 }
Christoph Hellwig0ee7a3f2016-10-20 15:44:14 +1100531
Al Viro99733fa2015-04-07 14:25:18 -0400532 ret = xfs_file_aio_write_checks(iocb, from, &iolock);
Dave Chinner4d8d1582011-01-11 10:23:42 +1100533 if (ret)
Christoph Hellwigd0606462011-12-18 20:00:14 +0000534 goto out;
Al Viro99733fa2015-04-07 14:25:18 -0400535 count = iov_iter_count(from);
Dave Chinnerf0d26e82011-01-11 10:15:36 +1100536
Dave Chinnereda77982011-01-11 10:22:40 +1100537 /*
538 * If we are doing unaligned IO, wait for all other IO to drain,
Christoph Hellwig0ee7a3f2016-10-20 15:44:14 +1100539 * otherwise demote the lock if we had to take the exclusive lock
540 * for other reasons in xfs_file_aio_write_checks.
Dave Chinnereda77982011-01-11 10:22:40 +1100541 */
Goldwyn Rodrigues29a5d292017-06-20 07:05:48 -0500542 if (unaligned_io) {
543 /* If we are going to wait for other DIO to finish, bail */
544 if (iocb->ki_flags & IOCB_NOWAIT) {
545 if (atomic_read(&inode->i_dio_count))
546 return -EAGAIN;
547 } else {
548 inode_dio_wait(inode);
549 }
550 } else if (iolock == XFS_IOLOCK_EXCL) {
Christoph Hellwig65523212016-11-30 14:33:25 +1100551 xfs_ilock_demote(ip, XFS_IOLOCK_EXCL);
Christoph Hellwigd0606462011-12-18 20:00:14 +0000552 iolock = XFS_IOLOCK_SHARED;
Dave Chinnerf0d26e82011-01-11 10:15:36 +1100553 }
554
Christoph Hellwig3176c3e2016-07-20 11:31:42 +1000555 trace_xfs_file_direct_write(ip, count, iocb->ki_pos);
Christoph Hellwigacdda3a2016-11-30 14:37:15 +1100556 ret = iomap_dio_rw(iocb, from, &xfs_iomap_ops, xfs_dio_write_end_io);
Christoph Hellwigd0606462011-12-18 20:00:14 +0000557out:
Christoph Hellwig65523212016-11-30 14:33:25 +1100558 xfs_iunlock(ip, iolock);
Christoph Hellwigd0606462011-12-18 20:00:14 +0000559
Dave Chinner6b698ed2015-06-04 09:18:53 +1000560 /*
Christoph Hellwig16d4d432016-07-20 11:38:55 +1000561 * No fallback to buffered IO on errors for XFS, direct IO will either
562 * complete fully or fail.
Dave Chinner6b698ed2015-06-04 09:18:53 +1000563 */
Christoph Hellwig16d4d432016-07-20 11:38:55 +1000564 ASSERT(ret < 0 || ret == count);
565 return ret;
566}
567
Arnd Bergmannf021bd02016-07-22 09:50:55 +1000568static noinline ssize_t
Christoph Hellwig16d4d432016-07-20 11:38:55 +1000569xfs_file_dax_write(
570 struct kiocb *iocb,
571 struct iov_iter *from)
572{
Christoph Hellwig6c31f4952016-09-19 11:28:38 +1000573 struct inode *inode = iocb->ki_filp->f_mapping->host;
Christoph Hellwig16d4d432016-07-20 11:38:55 +1000574 struct xfs_inode *ip = XFS_I(inode);
Christoph Hellwig17879e82016-09-19 11:24:50 +1000575 int iolock = XFS_IOLOCK_EXCL;
Christoph Hellwig6c31f4952016-09-19 11:28:38 +1000576 ssize_t ret, error = 0;
577 size_t count;
578 loff_t pos;
Christoph Hellwig16d4d432016-07-20 11:38:55 +1000579
Christoph Hellwig942491c2017-10-23 18:31:50 -0700580 if (iocb->ki_flags & IOCB_NOWAIT) {
581 if (!xfs_ilock_nowait(ip, iolock))
Goldwyn Rodrigues29a5d292017-06-20 07:05:48 -0500582 return -EAGAIN;
Christoph Hellwig942491c2017-10-23 18:31:50 -0700583 } else {
Goldwyn Rodrigues29a5d292017-06-20 07:05:48 -0500584 xfs_ilock(ip, iolock);
585 }
586
Christoph Hellwig16d4d432016-07-20 11:38:55 +1000587 ret = xfs_file_aio_write_checks(iocb, from, &iolock);
588 if (ret)
589 goto out;
590
Christoph Hellwig6c31f4952016-09-19 11:28:38 +1000591 pos = iocb->ki_pos;
592 count = iov_iter_count(from);
Dave Chinner8b2180b2016-08-17 08:31:33 +1000593
Christoph Hellwig6c31f4952016-09-19 11:28:38 +1000594 trace_xfs_file_dax_write(ip, count, pos);
Ross Zwisler11c59c92016-11-08 11:32:46 +1100595 ret = dax_iomap_rw(iocb, from, &xfs_iomap_ops);
Christoph Hellwig6c31f4952016-09-19 11:28:38 +1000596 if (ret > 0 && iocb->ki_pos > i_size_read(inode)) {
597 i_size_write(inode, iocb->ki_pos);
598 error = xfs_setfilesize(ip, pos, ret);
Christoph Hellwig16d4d432016-07-20 11:38:55 +1000599 }
Christoph Hellwig16d4d432016-07-20 11:38:55 +1000600out:
Christoph Hellwig65523212016-11-30 14:33:25 +1100601 xfs_iunlock(ip, iolock);
Christoph Hellwig6c31f4952016-09-19 11:28:38 +1000602 return error ? error : ret;
Dave Chinnerf0d26e82011-01-11 10:15:36 +1100603}
604
Christoph Hellwig00258e32010-02-15 09:44:47 +0000605STATIC ssize_t
Dave Chinner637bbc72011-01-11 10:17:30 +1100606xfs_file_buffered_aio_write(
607 struct kiocb *iocb,
Al Virob3188912014-04-02 07:06:30 -0400608 struct iov_iter *from)
Dave Chinner637bbc72011-01-11 10:17:30 +1100609{
610 struct file *file = iocb->ki_filp;
611 struct address_space *mapping = file->f_mapping;
612 struct inode *inode = mapping->host;
613 struct xfs_inode *ip = XFS_I(inode);
614 ssize_t ret;
615 int enospc = 0;
Brian Fosterc3155092017-01-27 23:22:56 -0800616 int iolock;
Dave Chinner637bbc72011-01-11 10:17:30 +1100617
Christoph Hellwig91f99432017-08-29 16:13:20 +0200618 if (iocb->ki_flags & IOCB_NOWAIT)
619 return -EOPNOTSUPP;
620
Brian Fosterc3155092017-01-27 23:22:56 -0800621write_retry:
622 iolock = XFS_IOLOCK_EXCL;
Christoph Hellwig65523212016-11-30 14:33:25 +1100623 xfs_ilock(ip, iolock);
Dave Chinner637bbc72011-01-11 10:17:30 +1100624
Al Viro99733fa2015-04-07 14:25:18 -0400625 ret = xfs_file_aio_write_checks(iocb, from, &iolock);
Dave Chinner4d8d1582011-01-11 10:23:42 +1100626 if (ret)
Christoph Hellwigd0606462011-12-18 20:00:14 +0000627 goto out;
Dave Chinner637bbc72011-01-11 10:17:30 +1100628
629 /* We can write back this queue in page reclaim */
Christoph Hellwigde1414a2015-01-14 10:42:36 +0100630 current->backing_dev_info = inode_to_bdi(inode);
Dave Chinner637bbc72011-01-11 10:17:30 +1100631
Christoph Hellwig3176c3e2016-07-20 11:31:42 +1000632 trace_xfs_file_buffered_write(ip, iov_iter_count(from), iocb->ki_pos);
Christoph Hellwig68a9f5e2016-06-21 09:53:44 +1000633 ret = iomap_file_buffered_write(iocb, from, &xfs_iomap_ops);
Al Viro0a64bc22014-02-11 22:25:22 -0500634 if (likely(ret >= 0))
Al Viro99733fa2015-04-07 14:25:18 -0400635 iocb->ki_pos += ret;
Brian Fosterdc06f3982014-07-24 19:49:28 +1000636
Dave Chinner637bbc72011-01-11 10:17:30 +1100637 /*
Brian Fosterdc06f3982014-07-24 19:49:28 +1000638 * If we hit a space limit, try to free up some lingering preallocated
639 * space before returning an error. In the case of ENOSPC, first try to
640 * write back all dirty inodes to free up some of the excess reserved
641 * metadata space. This reduces the chances that the eofblocks scan
642 * waits on dirty mappings. Since xfs_flush_inodes() is serialized, this
643 * also behaves as a filter to prevent too many eofblocks scans from
644 * running at the same time.
Dave Chinner637bbc72011-01-11 10:17:30 +1100645 */
Brian Fosterdc06f3982014-07-24 19:49:28 +1000646 if (ret == -EDQUOT && !enospc) {
Brian Fosterc3155092017-01-27 23:22:56 -0800647 xfs_iunlock(ip, iolock);
Brian Fosterdc06f3982014-07-24 19:49:28 +1000648 enospc = xfs_inode_free_quota_eofblocks(ip);
649 if (enospc)
650 goto write_retry;
Darrick J. Wong83104d42016-10-03 09:11:46 -0700651 enospc = xfs_inode_free_quota_cowblocks(ip);
652 if (enospc)
653 goto write_retry;
Brian Fosterc3155092017-01-27 23:22:56 -0800654 iolock = 0;
Brian Fosterdc06f3982014-07-24 19:49:28 +1000655 } else if (ret == -ENOSPC && !enospc) {
656 struct xfs_eofblocks eofb = {0};
657
Dave Chinner637bbc72011-01-11 10:17:30 +1100658 enospc = 1;
Dave Chinner9aa05002012-10-08 21:56:04 +1100659 xfs_flush_inodes(ip->i_mount);
Brian Fosterc3155092017-01-27 23:22:56 -0800660
661 xfs_iunlock(ip, iolock);
Brian Fosterdc06f3982014-07-24 19:49:28 +1000662 eofb.eof_flags = XFS_EOF_FLAGS_SYNC;
663 xfs_icache_free_eofblocks(ip->i_mount, &eofb);
Brian Fostercf2cb782017-06-20 14:36:19 -0700664 xfs_icache_free_cowblocks(ip->i_mount, &eofb);
Dave Chinner9aa05002012-10-08 21:56:04 +1100665 goto write_retry;
Dave Chinner637bbc72011-01-11 10:17:30 +1100666 }
Christoph Hellwigd0606462011-12-18 20:00:14 +0000667
Dave Chinner637bbc72011-01-11 10:17:30 +1100668 current->backing_dev_info = NULL;
Christoph Hellwigd0606462011-12-18 20:00:14 +0000669out:
Brian Fosterc3155092017-01-27 23:22:56 -0800670 if (iolock)
671 xfs_iunlock(ip, iolock);
Dave Chinner637bbc72011-01-11 10:17:30 +1100672 return ret;
673}
674
675STATIC ssize_t
Al Virobf97f3bc2014-04-03 14:20:23 -0400676xfs_file_write_iter(
Christoph Hellwigdda35b82010-02-15 09:44:46 +0000677 struct kiocb *iocb,
Al Virobf97f3bc2014-04-03 14:20:23 -0400678 struct iov_iter *from)
Christoph Hellwigdda35b82010-02-15 09:44:46 +0000679{
680 struct file *file = iocb->ki_filp;
681 struct address_space *mapping = file->f_mapping;
682 struct inode *inode = mapping->host;
Christoph Hellwig00258e32010-02-15 09:44:47 +0000683 struct xfs_inode *ip = XFS_I(inode);
Dave Chinner637bbc72011-01-11 10:17:30 +1100684 ssize_t ret;
Al Virobf97f3bc2014-04-03 14:20:23 -0400685 size_t ocount = iov_iter_count(from);
Christoph Hellwigdda35b82010-02-15 09:44:46 +0000686
Bill O'Donnellff6d6af2015-10-12 18:21:22 +1100687 XFS_STATS_INC(ip->i_mount, xs_write_calls);
Christoph Hellwigdda35b82010-02-15 09:44:46 +0000688
Dave Chinner637bbc72011-01-11 10:17:30 +1100689 if (ocount == 0)
Christoph Hellwigdda35b82010-02-15 09:44:46 +0000690 return 0;
691
Al Virobf97f3bc2014-04-03 14:20:23 -0400692 if (XFS_FORCED_SHUTDOWN(ip->i_mount))
693 return -EIO;
Christoph Hellwigdda35b82010-02-15 09:44:46 +0000694
Christoph Hellwig16d4d432016-07-20 11:38:55 +1000695 if (IS_DAX(inode))
696 ret = xfs_file_dax_write(iocb, from);
Darrick J. Wong0613f162016-10-03 09:11:37 -0700697 else if (iocb->ki_flags & IOCB_DIRECT) {
698 /*
699 * Allow a directio write to fall back to a buffered
700 * write *only* in the case that we're doing a reflink
701 * CoW. In all other directio scenarios we do not
702 * allow an operation to fall back to buffered mode.
703 */
Al Virobf97f3bc2014-04-03 14:20:23 -0400704 ret = xfs_file_dio_aio_write(iocb, from);
Darrick J. Wong0613f162016-10-03 09:11:37 -0700705 if (ret == -EREMCHG)
706 goto buffered;
707 } else {
708buffered:
Al Virobf97f3bc2014-04-03 14:20:23 -0400709 ret = xfs_file_buffered_aio_write(iocb, from);
Darrick J. Wong0613f162016-10-03 09:11:37 -0700710 }
Christoph Hellwigdda35b82010-02-15 09:44:46 +0000711
Christoph Hellwigd0606462011-12-18 20:00:14 +0000712 if (ret > 0) {
Bill O'Donnellff6d6af2015-10-12 18:21:22 +1100713 XFS_STATS_ADD(ip->i_mount, xs_write_bytes, ret);
Christoph Hellwigce7ae1512011-12-18 20:00:11 +0000714
Christoph Hellwigd0606462011-12-18 20:00:14 +0000715 /* Handle various SYNC-type writes */
Christoph Hellwige2592212016-04-07 08:52:01 -0700716 ret = generic_write_sync(iocb, ret);
Christoph Hellwigdda35b82010-02-15 09:44:46 +0000717 }
Dave Chinnera363f0c2011-01-11 10:13:53 +1100718 return ret;
Christoph Hellwigdda35b82010-02-15 09:44:46 +0000719}
720
Dan Williams69eb5fa2018-03-20 14:42:38 -0700721int
722xfs_break_layouts(
723 struct inode *inode,
724 uint *iolock,
725 enum layout_break_reason reason)
726{
727 bool retry;
728
729 ASSERT(xfs_isilocked(XFS_I(inode), XFS_IOLOCK_SHARED|XFS_IOLOCK_EXCL));
730
731 switch (reason) {
732 case BREAK_UNMAP:
733 ASSERT(xfs_isilocked(XFS_I(inode), XFS_MMAPLOCK_EXCL));
734 /* fall through */
735 case BREAK_WRITE:
736 return xfs_break_leased_layouts(inode, iolock, &retry);
737 default:
738 WARN_ON_ONCE(1);
739 return -EINVAL;
740 }
741}
742
Namjae Jeona904b1c2015-03-25 15:08:56 +1100743#define XFS_FALLOC_FL_SUPPORTED \
744 (FALLOC_FL_KEEP_SIZE | FALLOC_FL_PUNCH_HOLE | \
745 FALLOC_FL_COLLAPSE_RANGE | FALLOC_FL_ZERO_RANGE | \
Darrick J. Wong98cc2db2016-10-03 09:11:43 -0700746 FALLOC_FL_INSERT_RANGE | FALLOC_FL_UNSHARE_RANGE)
Namjae Jeona904b1c2015-03-25 15:08:56 +1100747
Christoph Hellwig2fe17c12011-01-14 13:07:43 +0100748STATIC long
749xfs_file_fallocate(
Christoph Hellwig83aee9e2013-10-12 00:55:07 -0700750 struct file *file,
751 int mode,
752 loff_t offset,
753 loff_t len)
Christoph Hellwig2fe17c12011-01-14 13:07:43 +0100754{
Christoph Hellwig83aee9e2013-10-12 00:55:07 -0700755 struct inode *inode = file_inode(file);
756 struct xfs_inode *ip = XFS_I(inode);
Christoph Hellwig83aee9e2013-10-12 00:55:07 -0700757 long error;
Christoph Hellwig8add71c2015-02-02 09:53:56 +1100758 enum xfs_prealloc_flags flags = 0;
Dan Williamsc63a8ea2018-03-12 14:12:29 -0700759 uint iolock = XFS_IOLOCK_EXCL | XFS_MMAPLOCK_EXCL;
Christoph Hellwig83aee9e2013-10-12 00:55:07 -0700760 loff_t new_size = 0;
Thomas Meyer749f24f2017-10-09 11:38:54 -0700761 bool do_file_insert = false;
Christoph Hellwig2fe17c12011-01-14 13:07:43 +0100762
Christoph Hellwig83aee9e2013-10-12 00:55:07 -0700763 if (!S_ISREG(inode->i_mode))
764 return -EINVAL;
Namjae Jeona904b1c2015-03-25 15:08:56 +1100765 if (mode & ~XFS_FALLOC_FL_SUPPORTED)
Christoph Hellwig2fe17c12011-01-14 13:07:43 +0100766 return -EOPNOTSUPP;
767
Christoph Hellwig781355c2015-02-16 11:59:50 +1100768 xfs_ilock(ip, iolock);
Dan Williams69eb5fa2018-03-20 14:42:38 -0700769 error = xfs_break_layouts(inode, &iolock, BREAK_UNMAP);
Christoph Hellwig781355c2015-02-16 11:59:50 +1100770 if (error)
771 goto out_unlock;
772
Christoph Hellwig83aee9e2013-10-12 00:55:07 -0700773 if (mode & FALLOC_FL_PUNCH_HOLE) {
774 error = xfs_free_file_space(ip, offset, len);
775 if (error)
776 goto out_unlock;
Namjae Jeone1d8fb82014-02-24 10:58:19 +1100777 } else if (mode & FALLOC_FL_COLLAPSE_RANGE) {
Fabian Frederick93407472017-02-27 14:28:32 -0800778 unsigned int blksize_mask = i_blocksize(inode) - 1;
Namjae Jeone1d8fb82014-02-24 10:58:19 +1100779
780 if (offset & blksize_mask || len & blksize_mask) {
Dave Chinner24513372014-06-25 14:58:08 +1000781 error = -EINVAL;
Namjae Jeone1d8fb82014-02-24 10:58:19 +1100782 goto out_unlock;
783 }
784
Lukas Czerner23fffa92014-04-12 09:56:41 -0400785 /*
786 * There is no need to overlap collapse range with EOF,
787 * in which case it is effectively a truncate operation
788 */
789 if (offset + len >= i_size_read(inode)) {
Dave Chinner24513372014-06-25 14:58:08 +1000790 error = -EINVAL;
Lukas Czerner23fffa92014-04-12 09:56:41 -0400791 goto out_unlock;
792 }
793
Namjae Jeone1d8fb82014-02-24 10:58:19 +1100794 new_size = i_size_read(inode) - len;
795
796 error = xfs_collapse_file_space(ip, offset, len);
797 if (error)
798 goto out_unlock;
Namjae Jeona904b1c2015-03-25 15:08:56 +1100799 } else if (mode & FALLOC_FL_INSERT_RANGE) {
Fabian Frederick93407472017-02-27 14:28:32 -0800800 unsigned int blksize_mask = i_blocksize(inode) - 1;
Namjae Jeona904b1c2015-03-25 15:08:56 +1100801
802 new_size = i_size_read(inode) + len;
803 if (offset & blksize_mask || len & blksize_mask) {
804 error = -EINVAL;
805 goto out_unlock;
806 }
807
808 /* check the new inode size does not wrap through zero */
809 if (new_size > inode->i_sb->s_maxbytes) {
810 error = -EFBIG;
811 goto out_unlock;
812 }
813
814 /* Offset should be less than i_size */
815 if (offset >= i_size_read(inode)) {
816 error = -EINVAL;
817 goto out_unlock;
818 }
Thomas Meyer749f24f2017-10-09 11:38:54 -0700819 do_file_insert = true;
Christoph Hellwig83aee9e2013-10-12 00:55:07 -0700820 } else {
Christoph Hellwig8add71c2015-02-02 09:53:56 +1100821 flags |= XFS_PREALLOC_SET;
822
Christoph Hellwig83aee9e2013-10-12 00:55:07 -0700823 if (!(mode & FALLOC_FL_KEEP_SIZE) &&
824 offset + len > i_size_read(inode)) {
825 new_size = offset + len;
Dave Chinner24513372014-06-25 14:58:08 +1000826 error = inode_newsize_ok(inode, new_size);
Christoph Hellwig83aee9e2013-10-12 00:55:07 -0700827 if (error)
828 goto out_unlock;
829 }
Christoph Hellwig2fe17c12011-01-14 13:07:43 +0100830
Lukas Czerner376ba312014-03-13 19:07:58 +1100831 if (mode & FALLOC_FL_ZERO_RANGE)
832 error = xfs_zero_file_space(ip, offset, len);
Darrick J. Wong98cc2db2016-10-03 09:11:43 -0700833 else {
834 if (mode & FALLOC_FL_UNSHARE_RANGE) {
835 error = xfs_reflink_unshare(ip, offset, len);
836 if (error)
837 goto out_unlock;
838 }
Lukas Czerner376ba312014-03-13 19:07:58 +1100839 error = xfs_alloc_file_space(ip, offset, len,
840 XFS_BMAPI_PREALLOC);
Darrick J. Wong98cc2db2016-10-03 09:11:43 -0700841 }
Christoph Hellwig2fe17c12011-01-14 13:07:43 +0100842 if (error)
843 goto out_unlock;
844 }
845
Christoph Hellwig83aee9e2013-10-12 00:55:07 -0700846 if (file->f_flags & O_DSYNC)
Christoph Hellwig8add71c2015-02-02 09:53:56 +1100847 flags |= XFS_PREALLOC_SYNC;
848
849 error = xfs_update_prealloc_flags(ip, flags);
Christoph Hellwig2fe17c12011-01-14 13:07:43 +0100850 if (error)
851 goto out_unlock;
852
853 /* Change file size if needed */
854 if (new_size) {
855 struct iattr iattr;
856
857 iattr.ia_valid = ATTR_SIZE;
858 iattr.ia_size = new_size;
Jan Kara69bca802016-05-26 14:46:43 +0200859 error = xfs_vn_setattr_size(file_dentry(file), &iattr);
Namjae Jeona904b1c2015-03-25 15:08:56 +1100860 if (error)
861 goto out_unlock;
Christoph Hellwig2fe17c12011-01-14 13:07:43 +0100862 }
863
Namjae Jeona904b1c2015-03-25 15:08:56 +1100864 /*
865 * Perform hole insertion now that the file size has been
866 * updated so that if we crash during the operation we don't
867 * leave shifted extents past EOF and hence losing access to
868 * the data that is contained within them.
869 */
870 if (do_file_insert)
871 error = xfs_insert_file_space(ip, offset, len);
872
Christoph Hellwig2fe17c12011-01-14 13:07:43 +0100873out_unlock:
Christoph Hellwig781355c2015-02-16 11:59:50 +1100874 xfs_iunlock(ip, iolock);
Dave Chinner24513372014-06-25 14:58:08 +1000875 return error;
Christoph Hellwig2fe17c12011-01-14 13:07:43 +0100876}
877
Darrick J. Wong9fe26042016-10-03 09:11:40 -0700878STATIC int
879xfs_file_clone_range(
880 struct file *file_in,
881 loff_t pos_in,
882 struct file *file_out,
883 loff_t pos_out,
884 u64 len)
885{
Christoph Hellwig5faaf4f2016-10-20 15:50:07 +1100886 return xfs_reflink_remap_range(file_in, pos_in, file_out, pos_out,
Darrick J. Wongcc714662016-10-03 09:11:41 -0700887 len, false);
888}
889
Darrick J. Wongcc714662016-10-03 09:11:41 -0700890STATIC ssize_t
891xfs_file_dedupe_range(
892 struct file *src_file,
893 u64 loff,
894 u64 len,
895 struct file *dst_file,
896 u64 dst_loff)
897{
898 int error;
899
Christoph Hellwig5faaf4f2016-10-20 15:50:07 +1100900 error = xfs_reflink_remap_range(src_file, loff, dst_file, dst_loff,
Darrick J. Wongcc714662016-10-03 09:11:41 -0700901 len, true);
902 if (error)
903 return error;
904 return len;
Darrick J. Wong9fe26042016-10-03 09:11:40 -0700905}
Christoph Hellwig2fe17c12011-01-14 13:07:43 +0100906
Linus Torvalds1da177e2005-04-16 15:20:36 -0700907STATIC int
Nathan Scott3562fd42006-03-14 14:00:35 +1100908xfs_file_open(
Linus Torvalds1da177e2005-04-16 15:20:36 -0700909 struct inode *inode,
Christoph Hellwigf999a5b2008-11-28 14:23:32 +1100910 struct file *file)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700911{
Christoph Hellwigf999a5b2008-11-28 14:23:32 +1100912 if (!(file->f_flags & O_LARGEFILE) && i_size_read(inode) > MAX_NON_LFS)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700913 return -EFBIG;
Christoph Hellwigf999a5b2008-11-28 14:23:32 +1100914 if (XFS_FORCED_SHUTDOWN(XFS_M(inode->i_sb)))
915 return -EIO;
Christoph Hellwig91f99432017-08-29 16:13:20 +0200916 file->f_mode |= FMODE_NOWAIT;
Christoph Hellwigf999a5b2008-11-28 14:23:32 +1100917 return 0;
918}
919
920STATIC int
921xfs_dir_open(
922 struct inode *inode,
923 struct file *file)
924{
925 struct xfs_inode *ip = XFS_I(inode);
926 int mode;
927 int error;
928
929 error = xfs_file_open(inode, file);
930 if (error)
931 return error;
932
933 /*
934 * If there are any blocks, read-ahead block 0 as we're almost
935 * certain to have the next operation be a read there.
936 */
Christoph Hellwig309ecac82013-12-06 12:30:09 -0800937 mode = xfs_ilock_data_map_shared(ip);
Christoph Hellwigf999a5b2008-11-28 14:23:32 +1100938 if (ip->i_d.di_nextents > 0)
Darrick J. Wong7a652bb2017-02-02 15:13:58 -0800939 error = xfs_dir3_data_readahead(ip, 0, -1);
Christoph Hellwigf999a5b2008-11-28 14:23:32 +1100940 xfs_iunlock(ip, mode);
Darrick J. Wong7a652bb2017-02-02 15:13:58 -0800941 return error;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700942}
943
Linus Torvalds1da177e2005-04-16 15:20:36 -0700944STATIC int
Nathan Scott3562fd42006-03-14 14:00:35 +1100945xfs_file_release(
Linus Torvalds1da177e2005-04-16 15:20:36 -0700946 struct inode *inode,
947 struct file *filp)
948{
Dave Chinner24513372014-06-25 14:58:08 +1000949 return xfs_release(XFS_I(inode));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700950}
951
Linus Torvalds1da177e2005-04-16 15:20:36 -0700952STATIC int
Nathan Scott3562fd42006-03-14 14:00:35 +1100953xfs_file_readdir(
Al Virob8227552013-05-22 17:07:56 -0400954 struct file *file,
955 struct dir_context *ctx)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700956{
Al Virob8227552013-05-22 17:07:56 -0400957 struct inode *inode = file_inode(file);
Christoph Hellwig739bfb22007-08-29 10:58:01 +1000958 xfs_inode_t *ip = XFS_I(inode);
Christoph Hellwig051e7cd2007-08-28 13:58:24 +1000959 size_t bufsize;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700960
Christoph Hellwig051e7cd2007-08-28 13:58:24 +1000961 /*
962 * The Linux API doesn't pass down the total size of the buffer
963 * we read into down to the filesystem. With the filldir concept
964 * it's not needed for correct information, but the XFS dir2 leaf
965 * code wants an estimate of the buffer size to calculate it's
966 * readahead window and size the buffers used for mapping to
967 * physical blocks.
968 *
969 * Try to give it an estimate that's good enough, maybe at some
970 * point we can change the ->readdir prototype to include the
Eric Sandeena9cc7992010-02-03 17:50:13 +0000971 * buffer size. For now we use the current glibc buffer size.
Christoph Hellwig051e7cd2007-08-28 13:58:24 +1000972 */
Darrick J. Wonga5c46e52017-10-17 21:37:44 -0700973 bufsize = (size_t)min_t(loff_t, XFS_READDIR_BUFSIZE, ip->i_d.di_size);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700974
Darrick J. Wongacb95532017-06-16 11:00:14 -0700975 return xfs_readdir(NULL, ip, ctx, bufsize);
Jeff Liu3fe3e6b2012-05-10 21:29:17 +0800976}
977
978STATIC loff_t
979xfs_file_llseek(
980 struct file *file,
981 loff_t offset,
Eric Sandeen59f9c002014-09-09 11:57:10 +1000982 int whence)
Jeff Liu3fe3e6b2012-05-10 21:29:17 +0800983{
Christoph Hellwig9b2970a2017-06-29 11:43:21 -0700984 struct inode *inode = file->f_mapping->host;
985
986 if (XFS_FORCED_SHUTDOWN(XFS_I(inode)->i_mount))
987 return -EIO;
988
Eric Sandeen59f9c002014-09-09 11:57:10 +1000989 switch (whence) {
Christoph Hellwig9b2970a2017-06-29 11:43:21 -0700990 default:
Eric Sandeen59f9c002014-09-09 11:57:10 +1000991 return generic_file_llseek(file, offset, whence);
Jeff Liu3fe3e6b2012-05-10 21:29:17 +0800992 case SEEK_HOLE:
Christoph Hellwig9b2970a2017-06-29 11:43:21 -0700993 offset = iomap_seek_hole(inode, offset, &xfs_iomap_ops);
994 break;
Eric Sandeen49c69592014-09-09 11:56:48 +1000995 case SEEK_DATA:
Christoph Hellwig9b2970a2017-06-29 11:43:21 -0700996 offset = iomap_seek_data(inode, offset, &xfs_iomap_ops);
997 break;
Jeff Liu3fe3e6b2012-05-10 21:29:17 +0800998 }
Christoph Hellwig9b2970a2017-06-29 11:43:21 -0700999
1000 if (offset < 0)
1001 return offset;
1002 return vfs_setpos(file, offset, inode->i_sb->s_maxbytes);
Jeff Liu3fe3e6b2012-05-10 21:29:17 +08001003}
1004
Dave Chinnerde0e8c22015-02-23 21:44:19 +11001005/*
1006 * Locking for serialisation of IO during page faults. This results in a lock
1007 * ordering of:
1008 *
1009 * mmap_sem (MM)
Dave Chinner6b698ed2015-06-04 09:18:53 +10001010 * sb_start_pagefault(vfs, freeze)
Dave Chinner13ad4fe2015-11-03 12:37:02 +11001011 * i_mmaplock (XFS - truncate serialisation)
Dave Chinner6b698ed2015-06-04 09:18:53 +10001012 * page_lock (MM)
1013 * i_lock (XFS - extent map serialisation)
Dave Chinnerde0e8c22015-02-23 21:44:19 +11001014 */
Christoph Hellwigd522d562017-08-29 10:08:41 -07001015static int
1016__xfs_filemap_fault(
Dave Jiangc791ace2017-02-24 14:57:08 -08001017 struct vm_fault *vmf,
Christoph Hellwigd522d562017-08-29 10:08:41 -07001018 enum page_entry_size pe_size,
1019 bool write_fault)
Matthew Wilcoxacd76e72015-09-08 14:59:06 -07001020{
Dave Jiangf4200392017-02-22 15:40:06 -08001021 struct inode *inode = file_inode(vmf->vma->vm_file);
Matthew Wilcoxacd76e72015-09-08 14:59:06 -07001022 struct xfs_inode *ip = XFS_I(inode);
1023 int ret;
1024
Christoph Hellwigd522d562017-08-29 10:08:41 -07001025 trace_xfs_filemap_fault(ip, pe_size, write_fault);
Matthew Wilcoxacd76e72015-09-08 14:59:06 -07001026
Christoph Hellwigd522d562017-08-29 10:08:41 -07001027 if (write_fault) {
Dave Chinner13ad4fe2015-11-03 12:37:02 +11001028 sb_start_pagefault(inode->i_sb);
Dave Jiangf4200392017-02-22 15:40:06 -08001029 file_update_time(vmf->vma->vm_file);
Dave Chinner13ad4fe2015-11-03 12:37:02 +11001030 }
1031
Matthew Wilcoxacd76e72015-09-08 14:59:06 -07001032 xfs_ilock(XFS_I(inode), XFS_MMAPLOCK_SHARED);
Christoph Hellwigd522d562017-08-29 10:08:41 -07001033 if (IS_DAX(inode)) {
Christoph Hellwiga39e5962017-11-01 16:36:47 +01001034 pfn_t pfn;
1035
Jan Karac0b24622018-01-07 16:38:43 -05001036 ret = dax_iomap_fault(vmf, pe_size, &pfn, NULL, &xfs_iomap_ops);
Christoph Hellwiga39e5962017-11-01 16:36:47 +01001037 if (ret & VM_FAULT_NEEDDSYNC)
1038 ret = dax_finish_sync_fault(vmf, pe_size, pfn);
Christoph Hellwigd522d562017-08-29 10:08:41 -07001039 } else {
1040 if (write_fault)
1041 ret = iomap_page_mkwrite(vmf, &xfs_iomap_ops);
1042 else
1043 ret = filemap_fault(vmf);
1044 }
Matthew Wilcoxacd76e72015-09-08 14:59:06 -07001045 xfs_iunlock(XFS_I(inode), XFS_MMAPLOCK_SHARED);
Dave Chinner13ad4fe2015-11-03 12:37:02 +11001046
Christoph Hellwigd522d562017-08-29 10:08:41 -07001047 if (write_fault)
Dave Chinner13ad4fe2015-11-03 12:37:02 +11001048 sb_end_pagefault(inode->i_sb);
Matthew Wilcoxacd76e72015-09-08 14:59:06 -07001049 return ret;
1050}
1051
Christoph Hellwigd522d562017-08-29 10:08:41 -07001052static int
1053xfs_filemap_fault(
1054 struct vm_fault *vmf)
1055{
1056 /* DAX can shortcut the normal fault path on write faults! */
1057 return __xfs_filemap_fault(vmf, PE_SIZE_PTE,
1058 IS_DAX(file_inode(vmf->vma->vm_file)) &&
1059 (vmf->flags & FAULT_FLAG_WRITE));
1060}
1061
1062static int
1063xfs_filemap_huge_fault(
1064 struct vm_fault *vmf,
1065 enum page_entry_size pe_size)
1066{
1067 if (!IS_DAX(file_inode(vmf->vma->vm_file)))
1068 return VM_FAULT_FALLBACK;
1069
1070 /* DAX can shortcut the normal fault path on write faults! */
1071 return __xfs_filemap_fault(vmf, pe_size,
1072 (vmf->flags & FAULT_FLAG_WRITE));
1073}
1074
1075static int
1076xfs_filemap_page_mkwrite(
1077 struct vm_fault *vmf)
1078{
1079 return __xfs_filemap_fault(vmf, PE_SIZE_PTE, true);
1080}
1081
Dave Chinner3af49282015-11-03 12:37:02 +11001082/*
Jan Kara7b565c92017-11-01 16:36:46 +01001083 * pfn_mkwrite was originally intended to ensure we capture time stamp updates
1084 * on write faults. In reality, it needs to serialise against truncate and
1085 * prepare memory for writing so handle is as standard write fault.
Dave Chinner3af49282015-11-03 12:37:02 +11001086 */
1087static int
1088xfs_filemap_pfn_mkwrite(
Dave Chinner3af49282015-11-03 12:37:02 +11001089 struct vm_fault *vmf)
1090{
1091
Jan Kara7b565c92017-11-01 16:36:46 +01001092 return __xfs_filemap_fault(vmf, PE_SIZE_PTE, true);
Dave Chinner3af49282015-11-03 12:37:02 +11001093}
1094
Dave Chinner6b698ed2015-06-04 09:18:53 +10001095static const struct vm_operations_struct xfs_file_vm_ops = {
1096 .fault = xfs_filemap_fault,
Dave Jianga2d58162017-02-24 14:56:59 -08001097 .huge_fault = xfs_filemap_huge_fault,
Dave Chinner6b698ed2015-06-04 09:18:53 +10001098 .map_pages = filemap_map_pages,
1099 .page_mkwrite = xfs_filemap_page_mkwrite,
Dave Chinner3af49282015-11-03 12:37:02 +11001100 .pfn_mkwrite = xfs_filemap_pfn_mkwrite,
Dave Chinner6b698ed2015-06-04 09:18:53 +10001101};
1102
1103STATIC int
1104xfs_file_mmap(
1105 struct file *filp,
1106 struct vm_area_struct *vma)
1107{
Christoph Hellwiga39e5962017-11-01 16:36:47 +01001108 /*
1109 * We don't support synchronous mappings for non-DAX files. At least
1110 * until someone comes with a sensible use case.
1111 */
1112 if (!IS_DAX(file_inode(filp)) && (vma->vm_flags & VM_SYNC))
1113 return -EOPNOTSUPP;
1114
Dave Chinner6b698ed2015-06-04 09:18:53 +10001115 file_accessed(filp);
1116 vma->vm_ops = &xfs_file_vm_ops;
1117 if (IS_DAX(file_inode(filp)))
Matthew Wilcoxacd76e72015-09-08 14:59:06 -07001118 vma->vm_flags |= VM_MIXEDMAP | VM_HUGEPAGE;
Dave Chinner6b698ed2015-06-04 09:18:53 +10001119 return 0;
Dave Chinner075a9242015-02-23 21:44:54 +11001120}
1121
Arjan van de Ven4b6f5d22006-03-28 01:56:42 -08001122const struct file_operations xfs_file_operations = {
Jeff Liu3fe3e6b2012-05-10 21:29:17 +08001123 .llseek = xfs_file_llseek,
Al Virob4f5d2c2014-04-02 14:37:59 -04001124 .read_iter = xfs_file_read_iter,
Al Virobf97f3bc2014-04-03 14:20:23 -04001125 .write_iter = xfs_file_write_iter,
Al Viro82c156f2016-09-22 23:35:42 -04001126 .splice_read = generic_file_splice_read,
Al Viro8d020762014-04-05 04:27:08 -04001127 .splice_write = iter_file_splice_write,
Nathan Scott3562fd42006-03-14 14:00:35 +11001128 .unlocked_ioctl = xfs_file_ioctl,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001129#ifdef CONFIG_COMPAT
Nathan Scott3562fd42006-03-14 14:00:35 +11001130 .compat_ioctl = xfs_file_compat_ioctl,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001131#endif
Nathan Scott3562fd42006-03-14 14:00:35 +11001132 .mmap = xfs_file_mmap,
Christoph Hellwiga39e5962017-11-01 16:36:47 +01001133 .mmap_supported_flags = MAP_SYNC,
Nathan Scott3562fd42006-03-14 14:00:35 +11001134 .open = xfs_file_open,
1135 .release = xfs_file_release,
1136 .fsync = xfs_file_fsync,
Toshi Kanidbe6ec82016-10-07 16:59:59 -07001137 .get_unmapped_area = thp_get_unmapped_area,
Christoph Hellwig2fe17c12011-01-14 13:07:43 +01001138 .fallocate = xfs_file_fallocate,
Darrick J. Wong9fe26042016-10-03 09:11:40 -07001139 .clone_file_range = xfs_file_clone_range,
Darrick J. Wongcc714662016-10-03 09:11:41 -07001140 .dedupe_file_range = xfs_file_dedupe_range,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001141};
1142
Arjan van de Ven4b6f5d22006-03-28 01:56:42 -08001143const struct file_operations xfs_dir_file_operations = {
Christoph Hellwigf999a5b2008-11-28 14:23:32 +11001144 .open = xfs_dir_open,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001145 .read = generic_read_dir,
Al Viro3b0a3c12016-04-20 23:42:46 -04001146 .iterate_shared = xfs_file_readdir,
Al Viro59af1582008-08-24 07:24:41 -04001147 .llseek = generic_file_llseek,
Nathan Scott3562fd42006-03-14 14:00:35 +11001148 .unlocked_ioctl = xfs_file_ioctl,
Nathan Scottd3870392005-05-06 06:44:46 -07001149#ifdef CONFIG_COMPAT
Nathan Scott3562fd42006-03-14 14:00:35 +11001150 .compat_ioctl = xfs_file_compat_ioctl,
Nathan Scottd3870392005-05-06 06:44:46 -07001151#endif
Christoph Hellwig1da2f2d2011-10-02 14:25:16 +00001152 .fsync = xfs_dir_fsync,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001153};