blob: aadb25413e6e6a4e9dc20e46831be4a30b9f0ba1 [file] [log] [blame]
/*
 *
 * Copyright (C) 2011 Novell Inc.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 as published by
 * the Free Software Foundation.
 */
9
10#include <linux/fs.h>
11#include <linux/namei.h>
12#include <linux/xattr.h>
Miklos Szeredie9be9d52014-10-24 00:14:38 +020013#include <linux/mount.h>
Miklos Szeredie9be9d52014-10-24 00:14:38 +020014#include <linux/parser.h>
15#include <linux/module.h>
Andy Whitcroftcc259632014-10-24 00:14:38 +020016#include <linux/statfs.h>
Erez Zadokf45827e82014-10-24 00:14:38 +020017#include <linux/seq_file.h>
Miklos Szeredid837a492016-07-29 12:05:24 +020018#include <linux/posix_acl_xattr.h>
Miklos Szeredie9be9d52014-10-24 00:14:38 +020019#include "overlayfs.h"
Miklos Szeredibbb1e542016-12-16 11:02:56 +010020#include "ovl_entry.h"
Miklos Szeredie9be9d52014-10-24 00:14:38 +020021
22MODULE_AUTHOR("Miklos Szeredi <miklos@szeredi.hu>");
23MODULE_DESCRIPTION("Overlay filesystem");
24MODULE_LICENSE("GPL");
25
Miklos Szeredie9be9d52014-10-24 00:14:38 +020026
27struct ovl_dir_cache;
28
Miklos Szeredia78d9f02014-12-13 00:59:52 +010029#define OVL_MAX_STACK 500
30
Miklos Szeredie9be9d52014-10-24 00:14:38 +020031
32static void ovl_dentry_release(struct dentry *dentry)
33{
34 struct ovl_entry *oe = dentry->d_fsdata;
35
36 if (oe) {
Miklos Szeredidd662662014-12-13 00:59:43 +010037 unsigned int i;
38
Miklos Szeredie9be9d52014-10-24 00:14:38 +020039 dput(oe->__upperdentry);
Miklos Szeredidd662662014-12-13 00:59:43 +010040 for (i = 0; i < oe->numlower; i++)
41 dput(oe->lowerstack[i].dentry);
Miklos Szeredie9be9d52014-10-24 00:14:38 +020042 kfree_rcu(oe, rcu);
43 }
44}
45
Miklos Szeredi2d902672016-06-30 08:53:27 +020046static struct dentry *ovl_d_real(struct dentry *dentry,
47 const struct inode *inode,
48 unsigned int open_flags)
Miklos Szeredid101a122016-03-26 16:14:37 -040049{
50 struct dentry *real;
51
Miklos Szeredica4c8a32016-12-16 11:02:55 +010052 if (!d_is_reg(dentry)) {
Miklos Szeredid101a122016-03-26 16:14:37 -040053 if (!inode || inode == d_inode(dentry))
54 return dentry;
55 goto bug;
56 }
57
Miklos Szeredi2d902672016-06-30 08:53:27 +020058 if (d_is_negative(dentry))
59 return dentry;
60
61 if (open_flags) {
62 int err = ovl_open_maybe_copy_up(dentry, open_flags);
63
64 if (err)
65 return ERR_PTR(err);
66 }
67
Miklos Szeredid101a122016-03-26 16:14:37 -040068 real = ovl_dentry_upper(dentry);
69 if (real && (!inode || inode == d_inode(real)))
70 return real;
71
72 real = ovl_dentry_lower(dentry);
73 if (!real)
74 goto bug;
75
Miklos Szeredic4fcfc12016-11-29 10:20:24 +010076 /* Handle recursion */
77 real = d_real(real, inode, open_flags);
78
Miklos Szeredid101a122016-03-26 16:14:37 -040079 if (!inode || inode == d_inode(real))
80 return real;
Miklos Szeredid101a122016-03-26 16:14:37 -040081bug:
Miklos Szeredi656189d2016-07-29 12:05:24 +020082 WARN(1, "ovl_d_real(%pd4, %s:%lu): real dentry not found\n", dentry,
Miklos Szeredid101a122016-03-26 16:14:37 -040083 inode ? inode->i_sb->s_id : "NULL", inode ? inode->i_ino : 0);
84 return dentry;
85}
86
Miklos Szeredi7c03b5d2015-06-22 13:53:48 +020087static int ovl_dentry_revalidate(struct dentry *dentry, unsigned int flags)
88{
89 struct ovl_entry *oe = dentry->d_fsdata;
90 unsigned int i;
91 int ret = 1;
92
93 for (i = 0; i < oe->numlower; i++) {
94 struct dentry *d = oe->lowerstack[i].dentry;
95
96 if (d->d_flags & DCACHE_OP_REVALIDATE) {
97 ret = d->d_op->d_revalidate(d, flags);
98 if (ret < 0)
99 return ret;
100 if (!ret) {
101 if (!(flags & LOOKUP_RCU))
102 d_invalidate(d);
103 return -ESTALE;
104 }
105 }
106 }
107 return 1;
108}
109
110static int ovl_dentry_weak_revalidate(struct dentry *dentry, unsigned int flags)
111{
112 struct ovl_entry *oe = dentry->d_fsdata;
113 unsigned int i;
114 int ret = 1;
115
116 for (i = 0; i < oe->numlower; i++) {
117 struct dentry *d = oe->lowerstack[i].dentry;
118
119 if (d->d_flags & DCACHE_OP_WEAK_REVALIDATE) {
120 ret = d->d_op->d_weak_revalidate(d, flags);
121 if (ret <= 0)
122 break;
123 }
124 }
125 return ret;
126}
127
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200128static const struct dentry_operations ovl_dentry_operations = {
129 .d_release = ovl_dentry_release,
Miklos Szeredid101a122016-03-26 16:14:37 -0400130 .d_real = ovl_d_real,
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200131};
132
Miklos Szeredi7c03b5d2015-06-22 13:53:48 +0200133static const struct dentry_operations ovl_reval_dentry_operations = {
134 .d_release = ovl_dentry_release,
Miklos Szeredid101a122016-03-26 16:14:37 -0400135 .d_real = ovl_d_real,
Miklos Szeredi7c03b5d2015-06-22 13:53:48 +0200136 .d_revalidate = ovl_dentry_revalidate,
137 .d_weak_revalidate = ovl_dentry_weak_revalidate,
138};
139
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200140static void ovl_put_super(struct super_block *sb)
141{
142 struct ovl_fs *ufs = sb->s_fs_info;
Miklos Szeredidd662662014-12-13 00:59:43 +0100143 unsigned i;
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200144
145 dput(ufs->workdir);
146 mntput(ufs->upper_mnt);
Miklos Szeredidd662662014-12-13 00:59:43 +0100147 for (i = 0; i < ufs->numlower; i++)
148 mntput(ufs->lower_mnt[i]);
Konstantin Khlebnikov5ffdbe82015-08-24 15:57:19 +0300149 kfree(ufs->lower_mnt);
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200150
Erez Zadokf45827e82014-10-24 00:14:38 +0200151 kfree(ufs->config.lowerdir);
152 kfree(ufs->config.upperdir);
153 kfree(ufs->config.workdir);
Antonio Murdaca3fe6e522016-04-07 15:48:25 +0200154 put_cred(ufs->creator_cred);
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200155 kfree(ufs);
156}
157
Andy Whitcroftcc259632014-10-24 00:14:38 +0200158/**
159 * ovl_statfs
160 * @sb: The overlayfs super block
161 * @buf: The struct kstatfs to fill in with stats
162 *
163 * Get the filesystem statistics. As writes always target the upper layer
Miklos Szeredi4ebc5812014-12-13 00:59:46 +0100164 * filesystem pass the statfs to the upper filesystem (if it exists)
Andy Whitcroftcc259632014-10-24 00:14:38 +0200165 */
166static int ovl_statfs(struct dentry *dentry, struct kstatfs *buf)
167{
168 struct ovl_fs *ofs = dentry->d_sb->s_fs_info;
169 struct dentry *root_dentry = dentry->d_sb->s_root;
170 struct path path;
171 int err;
172
Miklos Szeredi4ebc5812014-12-13 00:59:46 +0100173 ovl_path_real(root_dentry, &path);
Andy Whitcroftcc259632014-10-24 00:14:38 +0200174
175 err = vfs_statfs(&path, buf);
176 if (!err) {
Miklos Szeredi6b2d5fe2016-12-16 11:02:56 +0100177 buf->f_namelen = ofs->namelen;
Andy Whitcroftcc259632014-10-24 00:14:38 +0200178 buf->f_type = OVERLAYFS_SUPER_MAGIC;
179 }
180
181 return err;
182}
183
Erez Zadokf45827e82014-10-24 00:14:38 +0200184/**
185 * ovl_show_options
186 *
187 * Prints the mount options for a given superblock.
188 * Returns zero; does not fail.
189 */
190static int ovl_show_options(struct seq_file *m, struct dentry *dentry)
191{
192 struct super_block *sb = dentry->d_sb;
193 struct ovl_fs *ufs = sb->s_fs_info;
194
Kees Cooka068acf2015-09-04 15:44:57 -0700195 seq_show_option(m, "lowerdir", ufs->config.lowerdir);
Miklos Szeredi53a08cb2014-12-13 00:59:51 +0100196 if (ufs->config.upperdir) {
Kees Cooka068acf2015-09-04 15:44:57 -0700197 seq_show_option(m, "upperdir", ufs->config.upperdir);
198 seq_show_option(m, "workdir", ufs->config.workdir);
Miklos Szeredi53a08cb2014-12-13 00:59:51 +0100199 }
Miklos Szeredi8d3095f2015-10-12 17:11:44 +0200200 if (ufs->config.default_permissions)
201 seq_puts(m, ",default_permissions");
Erez Zadokf45827e82014-10-24 00:14:38 +0200202 return 0;
203}
204
Seunghun Lee3cdf6fe2015-01-03 02:26:49 +0900205static int ovl_remount(struct super_block *sb, int *flags, char *data)
206{
207 struct ovl_fs *ufs = sb->s_fs_info;
208
Miklos Szeredicc6f67b2015-05-19 14:30:12 +0200209 if (!(*flags & MS_RDONLY) && (!ufs->upper_mnt || !ufs->workdir))
Seunghun Lee3cdf6fe2015-01-03 02:26:49 +0900210 return -EROFS;
211
212 return 0;
213}
214
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200215static const struct super_operations ovl_super_operations = {
216 .put_super = ovl_put_super,
Andy Whitcroftcc259632014-10-24 00:14:38 +0200217 .statfs = ovl_statfs,
Erez Zadokf45827e82014-10-24 00:14:38 +0200218 .show_options = ovl_show_options,
Seunghun Lee3cdf6fe2015-01-03 02:26:49 +0900219 .remount_fs = ovl_remount,
Miklos Szeredieead4f22016-07-29 12:05:22 +0200220 .drop_inode = generic_delete_inode,
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200221};
222
/* Mount option tokens; OPT_ERR marks an unrecognised option. */
enum {
	OPT_LOWERDIR,
	OPT_UPPERDIR,
	OPT_WORKDIR,
	OPT_DEFAULT_PERMISSIONS,
	OPT_ERR,
};
230
231static const match_table_t ovl_tokens = {
232 {OPT_LOWERDIR, "lowerdir=%s"},
233 {OPT_UPPERDIR, "upperdir=%s"},
234 {OPT_WORKDIR, "workdir=%s"},
Miklos Szeredi8d3095f2015-10-12 17:11:44 +0200235 {OPT_DEFAULT_PERMISSIONS, "default_permissions"},
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200236 {OPT_ERR, NULL}
237};
238
/*
 * Split the next option off a comma separated option string.
 *
 * @s: in/out cursor.  On entry *s points at the unparsed remainder (or is
 *     NULL when nothing is left).  On return it points just past the
 *     comma that ended the option, or is NULL if the option ran to the end
 *     of the string.
 *
 * The separating comma is overwritten with '\0'.  A backslash makes the
 * following character part of the option (so "\," does not split); the
 * backslash itself is left in place.
 *
 * Returns the start of the option, or NULL when *s was NULL.
 */
static char *ovl_next_opt(char **s)
{
	char *sbegin = *s;
	char *p;

	if (sbegin == NULL)
		return NULL;

	for (p = sbegin; *p; p++) {
		if (*p == '\\') {
			/* Skip the escaped character, unless the string ends here. */
			p++;
			if (!*p)
				break;
		} else if (*p == ',') {
			*p = '\0';
			*s = p + 1;
			return sbegin;
		}
	}
	*s = NULL;
	return sbegin;
}
261
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200262static int ovl_parse_opt(char *opt, struct ovl_config *config)
263{
264 char *p;
265
Miklos Szeredi91c77942014-11-20 16:40:00 +0100266 while ((p = ovl_next_opt(&opt)) != NULL) {
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200267 int token;
268 substring_t args[MAX_OPT_ARGS];
269
270 if (!*p)
271 continue;
272
273 token = match_token(p, ovl_tokens, args);
274 switch (token) {
275 case OPT_UPPERDIR:
276 kfree(config->upperdir);
277 config->upperdir = match_strdup(&args[0]);
278 if (!config->upperdir)
279 return -ENOMEM;
280 break;
281
282 case OPT_LOWERDIR:
283 kfree(config->lowerdir);
284 config->lowerdir = match_strdup(&args[0]);
285 if (!config->lowerdir)
286 return -ENOMEM;
287 break;
288
289 case OPT_WORKDIR:
290 kfree(config->workdir);
291 config->workdir = match_strdup(&args[0]);
292 if (!config->workdir)
293 return -ENOMEM;
294 break;
295
Miklos Szeredi8d3095f2015-10-12 17:11:44 +0200296 case OPT_DEFAULT_PERMISSIONS:
297 config->default_permissions = true;
298 break;
299
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200300 default:
hujianyangbead55e2015-01-15 13:17:36 +0800301 pr_err("overlayfs: unrecognized mount option \"%s\" or missing value\n", p);
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200302 return -EINVAL;
303 }
304 }
hujianyang71cbad72015-01-15 13:20:57 +0800305
306 /* Workdir is useless in non-upper mount */
307 if (!config->upperdir && config->workdir) {
308 pr_info("overlayfs: option \"workdir=%s\" is useless in a non-upper mount, ignore\n",
309 config->workdir);
310 kfree(config->workdir);
311 config->workdir = NULL;
312 }
313
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200314 return 0;
315}
316
317#define OVL_WORKDIR_NAME "work"
318
319static struct dentry *ovl_workdir_create(struct vfsmount *mnt,
320 struct dentry *dentry)
321{
322 struct inode *dir = dentry->d_inode;
323 struct dentry *work;
324 int err;
325 bool retried = false;
326
327 err = mnt_want_write(mnt);
328 if (err)
329 return ERR_PTR(err);
330
Al Viro59551022016-01-22 15:40:57 -0500331 inode_lock_nested(dir, I_MUTEX_PARENT);
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200332retry:
333 work = lookup_one_len(OVL_WORKDIR_NAME, dentry,
334 strlen(OVL_WORKDIR_NAME));
335
336 if (!IS_ERR(work)) {
337 struct kstat stat = {
338 .mode = S_IFDIR | 0,
339 };
Miklos Szeredic11b9fd2016-09-01 11:11:59 +0200340 struct iattr attr = {
341 .ia_valid = ATTR_MODE,
342 .ia_mode = stat.mode,
343 };
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200344
345 if (work->d_inode) {
346 err = -EEXIST;
347 if (retried)
348 goto out_dput;
349
350 retried = true;
Miklos Szeredieea2fb42016-09-01 11:11:59 +0200351 ovl_workdir_cleanup(dir, mnt, work, 0);
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200352 dput(work);
353 goto retry;
354 }
355
356 err = ovl_create_real(dir, work, &stat, NULL, NULL, true);
357 if (err)
358 goto out_dput;
Miklos Szeredic11b9fd2016-09-01 11:11:59 +0200359
Miklos Szeredicb348ed2016-10-04 14:40:44 +0200360 /*
361 * Try to remove POSIX ACL xattrs from workdir. We are good if:
362 *
363 * a) success (there was a POSIX ACL xattr and was removed)
364 * b) -ENODATA (there was no POSIX ACL xattr)
365 * c) -EOPNOTSUPP (POSIX ACL xattrs are not supported)
366 *
367 * There are various other error values that could effectively
368 * mean that the xattr doesn't exist (e.g. -ERANGE is returned
369 * if the xattr name is too long), but the set of filesystems
370 * allowed as upper are limited to "normal" ones, where checking
371 * for the above two errors is sufficient.
372 */
Miklos Szeredic11b9fd2016-09-01 11:11:59 +0200373 err = vfs_removexattr(work, XATTR_NAME_POSIX_ACL_DEFAULT);
Miklos Szeredie1ff3dd2016-09-05 13:55:20 +0200374 if (err && err != -ENODATA && err != -EOPNOTSUPP)
Miklos Szeredic11b9fd2016-09-01 11:11:59 +0200375 goto out_dput;
376
377 err = vfs_removexattr(work, XATTR_NAME_POSIX_ACL_ACCESS);
Miklos Szeredie1ff3dd2016-09-05 13:55:20 +0200378 if (err && err != -ENODATA && err != -EOPNOTSUPP)
Miklos Szeredic11b9fd2016-09-01 11:11:59 +0200379 goto out_dput;
380
381 /* Clear any inherited mode bits */
382 inode_lock(work->d_inode);
383 err = notify_change(work, &attr, NULL);
384 inode_unlock(work->d_inode);
385 if (err)
386 goto out_dput;
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200387 }
388out_unlock:
Al Viro59551022016-01-22 15:40:57 -0500389 inode_unlock(dir);
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200390 mnt_drop_write(mnt);
391
392 return work;
393
394out_dput:
395 dput(work);
396 work = ERR_PTR(err);
397 goto out_unlock;
398}
399
/*
 * Remove backslash escapes from @s in place.
 *
 * Each backslash is dropped and the character after it is copied
 * verbatim, so "\\" becomes a single backslash and "\:" becomes ':'.
 * A lone backslash at the end of the string is simply dropped.
 */
static void ovl_unescape(char *s)
{
	char *d = s;

	for (;; s++, d++) {
		if (*s == '\\')
			s++;
		*d = *s;
		if (!*s)
			break;
	}
}
412
Miklos Szerediab508822014-12-13 00:59:49 +0100413static int ovl_mount_dir_noesc(const char *name, struct path *path)
414{
Miklos Szeredia78d9f02014-12-13 00:59:52 +0100415 int err = -EINVAL;
Miklos Szerediab508822014-12-13 00:59:49 +0100416
Miklos Szeredia78d9f02014-12-13 00:59:52 +0100417 if (!*name) {
418 pr_err("overlayfs: empty lowerdir\n");
419 goto out;
420 }
Miklos Szerediab508822014-12-13 00:59:49 +0100421 err = kern_path(name, LOOKUP_FOLLOW, path);
422 if (err) {
423 pr_err("overlayfs: failed to resolve '%s': %i\n", name, err);
424 goto out;
425 }
426 err = -EINVAL;
Miklos Szeredi7c03b5d2015-06-22 13:53:48 +0200427 if (ovl_dentry_weird(path->dentry)) {
Miklos Szerediab508822014-12-13 00:59:49 +0100428 pr_err("overlayfs: filesystem on '%s' not supported\n", name);
429 goto out_put;
430 }
Miklos Szeredi2b8c30e2016-12-16 11:02:56 +0100431 if (!d_is_dir(path->dentry)) {
Miklos Szerediab508822014-12-13 00:59:49 +0100432 pr_err("overlayfs: '%s' not a directory\n", name);
433 goto out_put;
434 }
435 return 0;
436
437out_put:
438 path_put(path);
439out:
440 return err;
441}
442
443static int ovl_mount_dir(const char *name, struct path *path)
444{
445 int err = -ENOMEM;
446 char *tmp = kstrdup(name, GFP_KERNEL);
447
448 if (tmp) {
449 ovl_unescape(tmp);
450 err = ovl_mount_dir_noesc(tmp, path);
Miklos Szeredi7c03b5d2015-06-22 13:53:48 +0200451
452 if (!err)
453 if (ovl_dentry_remote(path->dentry)) {
454 pr_err("overlayfs: filesystem on '%s' not supported as upperdir\n",
455 tmp);
456 path_put(path);
457 err = -EINVAL;
458 }
Miklos Szerediab508822014-12-13 00:59:49 +0100459 kfree(tmp);
460 }
461 return err;
462}
463
Miklos Szeredi6b2d5fe2016-12-16 11:02:56 +0100464static int ovl_check_namelen(struct path *path, struct ovl_fs *ofs,
465 const char *name)
466{
467 struct kstatfs statfs;
468 int err = vfs_statfs(path, &statfs);
469
470 if (err)
471 pr_err("overlayfs: statfs failed on '%s'\n", name);
472 else
473 ofs->namelen = max(ofs->namelen, statfs.f_namelen);
474
475 return err;
476}
477
478static int ovl_lower_dir(const char *name, struct path *path,
479 struct ovl_fs *ofs, int *stack_depth, bool *remote)
Miklos Szerediab508822014-12-13 00:59:49 +0100480{
481 int err;
Miklos Szerediab508822014-12-13 00:59:49 +0100482
Miklos Szeredia78d9f02014-12-13 00:59:52 +0100483 err = ovl_mount_dir_noesc(name, path);
Miklos Szerediab508822014-12-13 00:59:49 +0100484 if (err)
485 goto out;
486
Miklos Szeredi6b2d5fe2016-12-16 11:02:56 +0100487 err = ovl_check_namelen(path, ofs, name);
488 if (err)
Miklos Szerediab508822014-12-13 00:59:49 +0100489 goto out_put;
Miklos Szeredi6b2d5fe2016-12-16 11:02:56 +0100490
Miklos Szerediab508822014-12-13 00:59:49 +0100491 *stack_depth = max(*stack_depth, path->mnt->mnt_sb->s_stack_depth);
492
Miklos Szeredi7c03b5d2015-06-22 13:53:48 +0200493 if (ovl_dentry_remote(path->dentry))
494 *remote = true;
495
Miklos Szerediab508822014-12-13 00:59:49 +0100496 return 0;
497
498out_put:
499 path_put(path);
500out:
501 return err;
502}
503
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200504/* Workdir should not be subdir of upperdir and vice versa */
505static bool ovl_workdir_ok(struct dentry *workdir, struct dentry *upperdir)
506{
507 bool ok = false;
508
509 if (workdir != upperdir) {
510 ok = (lock_rename(workdir, upperdir) == NULL);
511 unlock_rename(workdir, upperdir);
512 }
513 return ok;
514}
515
/*
 * Split a colon separated list of directories in place.
 *
 * Every unescaped ':' in @str is replaced by '\0', so the buffer ends up
 * holding the names back to back, each NUL terminated.  Backslash escapes
 * are removed on the way: the backslash is dropped and the following
 * character is kept verbatim, so "\:" yields a literal ':' inside a name.
 *
 * Returns the number of names, which is at least 1 (an empty @str counts
 * as one empty name).
 */
static unsigned int ovl_split_lowerdirs(char *str)
{
	unsigned int ctr = 1;
	char *s, *d;

	for (s = d = str;; s++, d++) {
		if (*s == '\\') {
			s++;
		} else if (*s == ':') {
			*d = '\0';
			ctr++;
			continue;
		}
		*d = *s;
		if (!*s)
			break;
	}
	return ctr;
}
535
Andreas Gruenbacher0c97be22016-08-22 16:36:49 +0200536static int __maybe_unused
Andreas Gruenbacher0eb45fc2016-08-22 17:52:55 +0200537ovl_posix_acl_xattr_get(const struct xattr_handler *handler,
538 struct dentry *dentry, struct inode *inode,
539 const char *name, void *buffer, size_t size)
540{
541 return ovl_xattr_get(dentry, handler->name, buffer, size);
542}
543
544static int __maybe_unused
Andreas Gruenbacher0c97be22016-08-22 16:36:49 +0200545ovl_posix_acl_xattr_set(const struct xattr_handler *handler,
546 struct dentry *dentry, struct inode *inode,
547 const char *name, const void *value,
548 size_t size, int flags)
Miklos Szeredid837a492016-07-29 12:05:24 +0200549{
550 struct dentry *workdir = ovl_workdir(dentry);
551 struct inode *realinode = ovl_inode_real(inode, NULL);
552 struct posix_acl *acl = NULL;
553 int err;
554
555 /* Check that everything is OK before copy-up */
556 if (value) {
557 acl = posix_acl_from_xattr(&init_user_ns, value, size);
558 if (IS_ERR(acl))
559 return PTR_ERR(acl);
560 }
561 err = -EOPNOTSUPP;
562 if (!IS_POSIXACL(d_inode(workdir)))
563 goto out_acl_release;
564 if (!realinode->i_op->set_acl)
565 goto out_acl_release;
566 if (handler->flags == ACL_TYPE_DEFAULT && !S_ISDIR(inode->i_mode)) {
567 err = acl ? -EACCES : 0;
568 goto out_acl_release;
569 }
570 err = -EPERM;
571 if (!inode_owner_or_capable(inode))
572 goto out_acl_release;
573
574 posix_acl_release(acl);
575
Miklos Szeredifd3220d2016-10-31 14:42:14 +0100576 /*
577 * Check if sgid bit needs to be cleared (actual setacl operation will
578 * be done with mounter's capabilities and so that won't do it for us).
579 */
580 if (unlikely(inode->i_mode & S_ISGID) &&
581 handler->flags == ACL_TYPE_ACCESS &&
582 !in_group_p(inode->i_gid) &&
583 !capable_wrt_inode_uidgid(inode, CAP_FSETID)) {
584 struct iattr iattr = { .ia_valid = ATTR_KILL_SGID };
585
586 err = ovl_setattr(dentry, &iattr);
587 if (err)
588 return err;
589 }
590
Miklos Szeredice315132016-09-01 11:12:00 +0200591 err = ovl_xattr_set(dentry, handler->name, value, size, flags);
592 if (!err)
593 ovl_copyattr(ovl_inode_real(inode, NULL), inode);
594
595 return err;
Miklos Szeredid837a492016-07-29 12:05:24 +0200596
597out_acl_release:
598 posix_acl_release(acl);
599 return err;
600}
601
Andreas Gruenbacher0eb45fc2016-08-22 17:52:55 +0200602static int ovl_own_xattr_get(const struct xattr_handler *handler,
603 struct dentry *dentry, struct inode *inode,
604 const char *name, void *buffer, size_t size)
605{
Amir Goldstein48fab5d2016-11-16 11:22:39 +0200606 return -EOPNOTSUPP;
Andreas Gruenbacher0eb45fc2016-08-22 17:52:55 +0200607}
608
Miklos Szeredid837a492016-07-29 12:05:24 +0200609static int ovl_own_xattr_set(const struct xattr_handler *handler,
610 struct dentry *dentry, struct inode *inode,
611 const char *name, const void *value,
612 size_t size, int flags)
613{
Amir Goldstein48fab5d2016-11-16 11:22:39 +0200614 return -EOPNOTSUPP;
Miklos Szeredid837a492016-07-29 12:05:24 +0200615}
616
Andreas Gruenbacher0eb45fc2016-08-22 17:52:55 +0200617static int ovl_other_xattr_get(const struct xattr_handler *handler,
618 struct dentry *dentry, struct inode *inode,
619 const char *name, void *buffer, size_t size)
620{
621 return ovl_xattr_get(dentry, name, buffer, size);
622}
623
Andreas Gruenbacher0e585cc2016-08-22 17:22:11 +0200624static int ovl_other_xattr_set(const struct xattr_handler *handler,
625 struct dentry *dentry, struct inode *inode,
626 const char *name, const void *value,
627 size_t size, int flags)
628{
629 return ovl_xattr_set(dentry, name, value, size, flags);
630}
631
Andreas Gruenbacher0c97be22016-08-22 16:36:49 +0200632static const struct xattr_handler __maybe_unused
633ovl_posix_acl_access_xattr_handler = {
Miklos Szeredid837a492016-07-29 12:05:24 +0200634 .name = XATTR_NAME_POSIX_ACL_ACCESS,
635 .flags = ACL_TYPE_ACCESS,
Andreas Gruenbacher0eb45fc2016-08-22 17:52:55 +0200636 .get = ovl_posix_acl_xattr_get,
Miklos Szeredid837a492016-07-29 12:05:24 +0200637 .set = ovl_posix_acl_xattr_set,
638};
639
Andreas Gruenbacher0c97be22016-08-22 16:36:49 +0200640static const struct xattr_handler __maybe_unused
641ovl_posix_acl_default_xattr_handler = {
Miklos Szeredid837a492016-07-29 12:05:24 +0200642 .name = XATTR_NAME_POSIX_ACL_DEFAULT,
643 .flags = ACL_TYPE_DEFAULT,
Andreas Gruenbacher0eb45fc2016-08-22 17:52:55 +0200644 .get = ovl_posix_acl_xattr_get,
Miklos Szeredid837a492016-07-29 12:05:24 +0200645 .set = ovl_posix_acl_xattr_set,
646};
647
648static const struct xattr_handler ovl_own_xattr_handler = {
649 .prefix = OVL_XATTR_PREFIX,
Andreas Gruenbacher0eb45fc2016-08-22 17:52:55 +0200650 .get = ovl_own_xattr_get,
Miklos Szeredid837a492016-07-29 12:05:24 +0200651 .set = ovl_own_xattr_set,
652};
653
654static const struct xattr_handler ovl_other_xattr_handler = {
655 .prefix = "", /* catch all */
Andreas Gruenbacher0eb45fc2016-08-22 17:52:55 +0200656 .get = ovl_other_xattr_get,
Miklos Szeredid837a492016-07-29 12:05:24 +0200657 .set = ovl_other_xattr_set,
658};
659
660static const struct xattr_handler *ovl_xattr_handlers[] = {
Andreas Gruenbacher0c97be22016-08-22 16:36:49 +0200661#ifdef CONFIG_FS_POSIX_ACL
Miklos Szeredid837a492016-07-29 12:05:24 +0200662 &ovl_posix_acl_access_xattr_handler,
663 &ovl_posix_acl_default_xattr_handler,
Andreas Gruenbacher0c97be22016-08-22 16:36:49 +0200664#endif
Miklos Szeredid837a492016-07-29 12:05:24 +0200665 &ovl_own_xattr_handler,
666 &ovl_other_xattr_handler,
667 NULL
668};
669
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200670static int ovl_fill_super(struct super_block *sb, void *data, int silent)
671{
Miklos Szeredi53a08cb2014-12-13 00:59:51 +0100672 struct path upperpath = { NULL, NULL };
673 struct path workpath = { NULL, NULL };
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200674 struct dentry *root_dentry;
Miklos Szeredi39b681f2016-07-29 12:05:24 +0200675 struct inode *realinode;
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200676 struct ovl_entry *oe;
677 struct ovl_fs *ufs;
Miklos Szeredia78d9f02014-12-13 00:59:52 +0100678 struct path *stack = NULL;
679 char *lowertmp;
680 char *lower;
681 unsigned int numlower;
682 unsigned int stacklen = 0;
Miklos Szeredidd662662014-12-13 00:59:43 +0100683 unsigned int i;
Miklos Szeredi7c03b5d2015-06-22 13:53:48 +0200684 bool remote = false;
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200685 int err;
686
Erez Zadokf45827e82014-10-24 00:14:38 +0200687 err = -ENOMEM;
688 ufs = kzalloc(sizeof(struct ovl_fs), GFP_KERNEL);
689 if (!ufs)
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200690 goto out;
691
Erez Zadokf45827e82014-10-24 00:14:38 +0200692 err = ovl_parse_opt((char *) data, &ufs->config);
693 if (err)
694 goto out_free_config;
695
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200696 err = -EINVAL;
Miklos Szeredi53a08cb2014-12-13 00:59:51 +0100697 if (!ufs->config.lowerdir) {
Konstantin Khlebnikov07f2af72015-06-29 20:18:56 +0300698 if (!silent)
699 pr_err("overlayfs: missing 'lowerdir'\n");
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200700 goto out_free_config;
701 }
702
Miklos Szeredi53a08cb2014-12-13 00:59:51 +0100703 sb->s_stack_depth = 0;
Miklos Szeredicf9a6782015-12-11 16:30:49 +0100704 sb->s_maxbytes = MAX_LFS_FILESIZE;
Miklos Szeredi53a08cb2014-12-13 00:59:51 +0100705 if (ufs->config.upperdir) {
Miklos Szeredi53a08cb2014-12-13 00:59:51 +0100706 if (!ufs->config.workdir) {
707 pr_err("overlayfs: missing 'workdir'\n");
708 goto out_free_config;
709 }
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200710
Miklos Szeredi53a08cb2014-12-13 00:59:51 +0100711 err = ovl_mount_dir(ufs->config.upperdir, &upperpath);
712 if (err)
713 goto out_free_config;
Miklos Szeredi3b7a9a22014-12-13 00:59:48 +0100714
hujianyang71cbad72015-01-15 13:20:57 +0800715 /* Upper fs should not be r/o */
716 if (upperpath.mnt->mnt_sb->s_flags & MS_RDONLY) {
717 pr_err("overlayfs: upper fs is r/o, try multi-lower layers mount\n");
718 err = -EINVAL;
719 goto out_put_upperpath;
720 }
721
Miklos Szeredi6b2d5fe2016-12-16 11:02:56 +0100722 err = ovl_check_namelen(&upperpath, ufs, ufs->config.upperdir);
723 if (err)
724 goto out_put_upperpath;
725
Miklos Szeredi53a08cb2014-12-13 00:59:51 +0100726 err = ovl_mount_dir(ufs->config.workdir, &workpath);
727 if (err)
728 goto out_put_upperpath;
729
hujianyang2f83fd82015-01-06 12:52:13 +0800730 err = -EINVAL;
Miklos Szeredi53a08cb2014-12-13 00:59:51 +0100731 if (upperpath.mnt != workpath.mnt) {
732 pr_err("overlayfs: workdir and upperdir must reside under the same mount\n");
733 goto out_put_workpath;
734 }
735 if (!ovl_workdir_ok(workpath.dentry, upperpath.dentry)) {
736 pr_err("overlayfs: workdir and upperdir must be separate subtrees\n");
737 goto out_put_workpath;
738 }
739 sb->s_stack_depth = upperpath.mnt->mnt_sb->s_stack_depth;
Miklos Szerediab508822014-12-13 00:59:49 +0100740 }
Miklos Szeredia78d9f02014-12-13 00:59:52 +0100741 err = -ENOMEM;
742 lowertmp = kstrdup(ufs->config.lowerdir, GFP_KERNEL);
743 if (!lowertmp)
Miklos Szeredi3b7a9a22014-12-13 00:59:48 +0100744 goto out_put_workpath;
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200745
746 err = -EINVAL;
Miklos Szeredia78d9f02014-12-13 00:59:52 +0100747 stacklen = ovl_split_lowerdirs(lowertmp);
hujianyang6be45062015-01-15 13:19:21 +0800748 if (stacklen > OVL_MAX_STACK) {
Colin Ian Kingfd365702016-08-18 16:58:35 +0100749 pr_err("overlayfs: too many lower directories, limit is %d\n",
hujianyang6be45062015-01-15 13:19:21 +0800750 OVL_MAX_STACK);
Miklos Szeredia78d9f02014-12-13 00:59:52 +0100751 goto out_free_lowertmp;
hujianyang6be45062015-01-15 13:19:21 +0800752 } else if (!ufs->config.upperdir && stacklen == 1) {
753 pr_err("overlayfs: at least 2 lowerdir are needed while upperdir nonexistent\n");
754 goto out_free_lowertmp;
755 }
Miklos Szeredia78d9f02014-12-13 00:59:52 +0100756
757 stack = kcalloc(stacklen, sizeof(struct path), GFP_KERNEL);
758 if (!stack)
759 goto out_free_lowertmp;
760
761 lower = lowertmp;
762 for (numlower = 0; numlower < stacklen; numlower++) {
Miklos Szeredi6b2d5fe2016-12-16 11:02:56 +0100763 err = ovl_lower_dir(lower, &stack[numlower], ufs,
764 &sb->s_stack_depth, &remote);
Miklos Szeredia78d9f02014-12-13 00:59:52 +0100765 if (err)
766 goto out_put_lowerpath;
767
768 lower = strchr(lower, '\0') + 1;
769 }
770
771 err = -EINVAL;
Miklos Szerediab508822014-12-13 00:59:49 +0100772 sb->s_stack_depth++;
Miklos Szeredi69c433e2014-10-24 00:14:39 +0200773 if (sb->s_stack_depth > FILESYSTEM_MAX_STACK_DEPTH) {
774 pr_err("overlayfs: maximum fs stacking depth exceeded\n");
Miklos Szeredi3b7a9a22014-12-13 00:59:48 +0100775 goto out_put_lowerpath;
Miklos Szeredi69c433e2014-10-24 00:14:39 +0200776 }
777
Miklos Szeredi53a08cb2014-12-13 00:59:51 +0100778 if (ufs->config.upperdir) {
779 ufs->upper_mnt = clone_private_mount(&upperpath);
780 err = PTR_ERR(ufs->upper_mnt);
781 if (IS_ERR(ufs->upper_mnt)) {
782 pr_err("overlayfs: failed to clone upperpath\n");
783 goto out_put_lowerpath;
784 }
Miklos Szeredid719e8f2016-07-29 12:05:23 +0200785 /* Don't inherit atime flags */
786 ufs->upper_mnt->mnt_flags &= ~(MNT_NOATIME | MNT_NODIRATIME | MNT_RELATIME);
787
788 sb->s_time_gran = ufs->upper_mnt->mnt_sb->s_time_gran;
Miklos Szeredi3b7a9a22014-12-13 00:59:48 +0100789
Miklos Szeredi53a08cb2014-12-13 00:59:51 +0100790 ufs->workdir = ovl_workdir_create(ufs->upper_mnt, workpath.dentry);
791 err = PTR_ERR(ufs->workdir);
792 if (IS_ERR(ufs->workdir)) {
Miklos Szeredicc6f67b2015-05-19 14:30:12 +0200793 pr_warn("overlayfs: failed to create directory %s/%s (errno: %i); mounting read-only\n",
794 ufs->config.workdir, OVL_WORKDIR_NAME, -err);
795 sb->s_flags |= MS_RDONLY;
796 ufs->workdir = NULL;
Miklos Szeredi53a08cb2014-12-13 00:59:51 +0100797 }
Vivek Goyal45aebea2016-02-22 09:28:34 -0500798
799 /*
800 * Upper should support d_type, else whiteouts are visible.
801 * Given workdir and upper are on same fs, we can do
Vivek Goyal21765192016-05-20 09:04:26 -0400802 * iterate_dir() on workdir. This check requires successful
803 * creation of workdir in previous step.
Vivek Goyal45aebea2016-02-22 09:28:34 -0500804 */
Vivek Goyal21765192016-05-20 09:04:26 -0400805 if (ufs->workdir) {
806 err = ovl_check_d_type_supported(&workpath);
807 if (err < 0)
808 goto out_put_workdir;
Vivek Goyal45aebea2016-02-22 09:28:34 -0500809
Vivek Goyale7c0b592016-07-01 10:02:44 -0400810 /*
811 * We allowed this configuration and don't want to
812 * break users over kernel upgrade. So warn instead
813 * of erroring out.
814 */
815 if (!err)
816 pr_warn("overlayfs: upper fs needs to support d_type.\n");
Vivek Goyal45aebea2016-02-22 09:28:34 -0500817 }
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200818 }
819
hujianyang2f83fd82015-01-06 12:52:13 +0800820 err = -ENOMEM;
Miklos Szeredia78d9f02014-12-13 00:59:52 +0100821 ufs->lower_mnt = kcalloc(numlower, sizeof(struct vfsmount *), GFP_KERNEL);
Miklos Szeredidd662662014-12-13 00:59:43 +0100822 if (ufs->lower_mnt == NULL)
Miklos Szeredi3b7a9a22014-12-13 00:59:48 +0100823 goto out_put_workdir;
Miklos Szeredia78d9f02014-12-13 00:59:52 +0100824 for (i = 0; i < numlower; i++) {
825 struct vfsmount *mnt = clone_private_mount(&stack[i]);
Miklos Szeredidd662662014-12-13 00:59:43 +0100826
hujianyang2f83fd82015-01-06 12:52:13 +0800827 err = PTR_ERR(mnt);
Miklos Szeredia78d9f02014-12-13 00:59:52 +0100828 if (IS_ERR(mnt)) {
829 pr_err("overlayfs: failed to clone lowerpath\n");
830 goto out_put_lower_mnt;
831 }
832 /*
833 * Make lower_mnt R/O. That way fchmod/fchown on lower file
834 * will fail instead of modifying lower fs.
835 */
Miklos Szeredid719e8f2016-07-29 12:05:23 +0200836 mnt->mnt_flags |= MNT_READONLY | MNT_NOATIME;
Miklos Szeredia78d9f02014-12-13 00:59:52 +0100837
838 ufs->lower_mnt[ufs->numlower] = mnt;
839 ufs->numlower++;
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200840 }
841
hujianyang71cbad72015-01-15 13:20:57 +0800842 /* If the upper fs is nonexistent, we mark overlayfs r/o too */
843 if (!ufs->upper_mnt)
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200844 sb->s_flags |= MS_RDONLY;
845
Miklos Szeredi7c03b5d2015-06-22 13:53:48 +0200846 if (remote)
847 sb->s_d_op = &ovl_reval_dentry_operations;
848 else
849 sb->s_d_op = &ovl_dentry_operations;
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200850
Antonio Murdaca3fe6e522016-04-07 15:48:25 +0200851 ufs->creator_cred = prepare_creds();
852 if (!ufs->creator_cred)
853 goto out_put_lower_mnt;
854
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200855 err = -ENOMEM;
Miklos Szeredia78d9f02014-12-13 00:59:52 +0100856 oe = ovl_alloc_entry(numlower);
Miklos Szeredi3b7a9a22014-12-13 00:59:48 +0100857 if (!oe)
Antonio Murdaca3fe6e522016-04-07 15:48:25 +0200858 goto out_put_cred;
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200859
Vivek Goyal655042c2016-10-14 03:03:36 +0200860 sb->s_magic = OVERLAYFS_SUPER_MAGIC;
861 sb->s_op = &ovl_super_operations;
862 sb->s_xattr = ovl_xattr_handlers;
863 sb->s_fs_info = ufs;
864 sb->s_flags |= MS_POSIXACL | MS_NOREMOTELOCK;
865
Miklos Szeredica4c8a32016-12-16 11:02:55 +0100866 root_dentry = d_make_root(ovl_new_inode(sb, S_IFDIR, 0));
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200867 if (!root_dentry)
Miklos Szeredi3b7a9a22014-12-13 00:59:48 +0100868 goto out_free_oe;
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200869
870 mntput(upperpath.mnt);
Miklos Szeredia78d9f02014-12-13 00:59:52 +0100871 for (i = 0; i < numlower; i++)
872 mntput(stack[i].mnt);
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200873 path_put(&workpath);
Miklos Szeredia78d9f02014-12-13 00:59:52 +0100874 kfree(lowertmp);
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200875
876 oe->__upperdentry = upperpath.dentry;
Miklos Szeredia78d9f02014-12-13 00:59:52 +0100877 for (i = 0; i < numlower; i++) {
878 oe->lowerstack[i].dentry = stack[i].dentry;
879 oe->lowerstack[i].mnt = ufs->lower_mnt[i];
880 }
Konstantin Khlebnikov0f955022015-08-24 15:57:18 +0300881 kfree(stack);
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200882
883 root_dentry->d_fsdata = oe;
884
Miklos Szeredi39b681f2016-07-29 12:05:24 +0200885 realinode = d_inode(ovl_dentry_real(root_dentry));
886 ovl_inode_init(d_inode(root_dentry), realinode, !!upperpath.dentry);
887 ovl_copyattr(realinode, d_inode(root_dentry));
Miklos Szeredied06e062015-12-09 16:11:59 +0100888
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200889 sb->s_root = root_dentry;
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200890
891 return 0;
892
Miklos Szeredi3b7a9a22014-12-13 00:59:48 +0100893out_free_oe:
894 kfree(oe);
Antonio Murdaca3fe6e522016-04-07 15:48:25 +0200895out_put_cred:
896 put_cred(ufs->creator_cred);
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200897out_put_lower_mnt:
Miklos Szeredidd662662014-12-13 00:59:43 +0100898 for (i = 0; i < ufs->numlower; i++)
899 mntput(ufs->lower_mnt[i]);
900 kfree(ufs->lower_mnt);
Miklos Szeredi3b7a9a22014-12-13 00:59:48 +0100901out_put_workdir:
902 dput(ufs->workdir);
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200903 mntput(ufs->upper_mnt);
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200904out_put_lowerpath:
Miklos Szeredia78d9f02014-12-13 00:59:52 +0100905 for (i = 0; i < numlower; i++)
906 path_put(&stack[i]);
907 kfree(stack);
908out_free_lowertmp:
909 kfree(lowertmp);
Miklos Szeredi3b7a9a22014-12-13 00:59:48 +0100910out_put_workpath:
911 path_put(&workpath);
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200912out_put_upperpath:
913 path_put(&upperpath);
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200914out_free_config:
Erez Zadokf45827e82014-10-24 00:14:38 +0200915 kfree(ufs->config.lowerdir);
916 kfree(ufs->config.upperdir);
917 kfree(ufs->config.workdir);
918 kfree(ufs);
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200919out:
920 return err;
921}
922
923static struct dentry *ovl_mount(struct file_system_type *fs_type, int flags,
924 const char *dev_name, void *raw_data)
925{
926 return mount_nodev(fs_type, flags, raw_data, ovl_fill_super);
927}
928
929static struct file_system_type ovl_fs_type = {
930 .owner = THIS_MODULE,
Miklos Szeredief94b182014-11-20 16:39:59 +0100931 .name = "overlay",
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200932 .mount = ovl_mount,
933 .kill_sb = kill_anon_super,
934};
Miklos Szeredief94b182014-11-20 16:39:59 +0100935MODULE_ALIAS_FS("overlay");
Miklos Szeredie9be9d52014-10-24 00:14:38 +0200936
937static int __init ovl_init(void)
938{
939 return register_filesystem(&ovl_fs_type);
940}
941
942static void __exit ovl_exit(void)
943{
944 unregister_filesystem(&ovl_fs_type);
945}
946
/* Hook the init and exit routines into the module loader. */
module_init(ovl_init);
module_exit(ovl_exit);