blob: fa323589704f828c808127304af1615ca0f3f6df [file] [log] [blame]
Tejun Heob8441ed2013-11-24 09:54:58 -05001/*
2 * fs/kernfs/mount.c - kernfs mount implementation
3 *
4 * Copyright (c) 2001-3 Patrick Mochel
5 * Copyright (c) 2007 SUSE Linux Products GmbH
6 * Copyright (c) 2007, 2013 Tejun Heo <tj@kernel.org>
7 *
8 * This file is released under the GPLv2.
9 */
Tejun Heofa736a92013-11-28 14:54:44 -050010
11#include <linux/fs.h>
12#include <linux/mount.h>
13#include <linux/init.h>
14#include <linux/magic.h>
15#include <linux/slab.h>
16#include <linux/pagemap.h>
Aditya Kalifb3c8312016-01-29 02:54:08 -060017#include <linux/namei.h>
Serge E. Hallyn4f41fc52016-05-09 09:59:55 -050018#include <linux/seq_file.h>
Shaohua Liaa818822017-07-12 11:49:51 -070019#include <linux/exportfs.h>
Tejun Heofa736a92013-11-28 14:54:44 -050020
21#include "kernfs-internal.h"
22
Tejun Heoa797bfc2013-12-11 14:11:57 -050023struct kmem_cache *kernfs_node_cache;
Tejun Heofa736a92013-11-28 14:54:44 -050024
Tejun Heo6a7fed42014-02-03 14:09:10 -050025static int kernfs_sop_remount_fs(struct super_block *sb, int *flags, char *data)
26{
27 struct kernfs_root *root = kernfs_info(sb)->root;
28 struct kernfs_syscall_ops *scops = root->syscall_ops;
29
30 if (scops && scops->remount_fs)
31 return scops->remount_fs(root, flags, data);
32 return 0;
33}
34
35static int kernfs_sop_show_options(struct seq_file *sf, struct dentry *dentry)
36{
Shaohua Li319ba912017-07-12 11:49:49 -070037 struct kernfs_root *root = kernfs_root(kernfs_dentry_node(dentry));
Tejun Heo6a7fed42014-02-03 14:09:10 -050038 struct kernfs_syscall_ops *scops = root->syscall_ops;
39
40 if (scops && scops->show_options)
41 return scops->show_options(sf, root);
42 return 0;
43}
44
Serge E. Hallyn4f41fc52016-05-09 09:59:55 -050045static int kernfs_sop_show_path(struct seq_file *sf, struct dentry *dentry)
46{
Shaohua Li319ba912017-07-12 11:49:49 -070047 struct kernfs_node *node = kernfs_dentry_node(dentry);
Serge E. Hallyn4f41fc52016-05-09 09:59:55 -050048 struct kernfs_root *root = kernfs_root(node);
49 struct kernfs_syscall_ops *scops = root->syscall_ops;
50
51 if (scops && scops->show_path)
52 return scops->show_path(sf, node, root);
53
Serge E. Hallyn3cc9b232016-05-12 00:29:45 -050054 seq_dentry(sf, dentry, " \t\n\\");
55 return 0;
Serge E. Hallyn4f41fc52016-05-09 09:59:55 -050056}
57
Li Zefanf41c5932014-02-14 16:57:27 +080058const struct super_operations kernfs_sops = {
Tejun Heofa736a92013-11-28 14:54:44 -050059 .statfs = simple_statfs,
60 .drop_inode = generic_delete_inode,
Tejun Heoc637b8a2013-12-11 14:11:58 -050061 .evict_inode = kernfs_evict_inode,
Tejun Heo6a7fed42014-02-03 14:09:10 -050062
63 .remount_fs = kernfs_sop_remount_fs,
64 .show_options = kernfs_sop_show_options,
Serge E. Hallyn4f41fc52016-05-09 09:59:55 -050065 .show_path = kernfs_sop_show_path,
Tejun Heofa736a92013-11-28 14:54:44 -050066};
67
Shaohua Liaa818822017-07-12 11:49:51 -070068static struct inode *kernfs_fh_get_inode(struct super_block *sb,
69 u64 ino, u32 generation)
70{
71 struct kernfs_super_info *info = kernfs_info(sb);
72 struct inode *inode;
73 struct kernfs_node *kn;
74
75 if (ino == 0)
76 return ERR_PTR(-ESTALE);
77
78 kn = kernfs_find_and_get_node_by_ino(info->root, ino);
79 if (!kn)
80 return ERR_PTR(-ESTALE);
81 inode = kernfs_get_inode(sb, kn);
82 kernfs_put(kn);
83 if (IS_ERR(inode))
84 return ERR_CAST(inode);
85
86 if (generation && inode->i_generation != generation) {
87 /* we didn't find the right inode.. */
88 iput(inode);
89 return ERR_PTR(-ESTALE);
90 }
91 return inode;
92}
93
94static struct dentry *kernfs_fh_to_dentry(struct super_block *sb, struct fid *fid,
95 int fh_len, int fh_type)
96{
97 return generic_fh_to_dentry(sb, fid, fh_len, fh_type,
98 kernfs_fh_get_inode);
99}
100
101static struct dentry *kernfs_fh_to_parent(struct super_block *sb, struct fid *fid,
102 int fh_len, int fh_type)
103{
104 return generic_fh_to_parent(sb, fid, fh_len, fh_type,
105 kernfs_fh_get_inode);
106}
107
108static struct dentry *kernfs_get_parent_dentry(struct dentry *child)
109{
110 struct kernfs_node *kn = kernfs_dentry_node(child);
111
112 return d_obtain_alias(kernfs_get_inode(child->d_sb, kn->parent));
113}
114
115static const struct export_operations kernfs_export_ops = {
116 .fh_to_dentry = kernfs_fh_to_dentry,
117 .fh_to_parent = kernfs_fh_to_parent,
118 .get_parent = kernfs_get_parent_dentry,
119};
120
Tejun Heo0c23b222014-02-03 14:09:15 -0500121/**
122 * kernfs_root_from_sb - determine kernfs_root associated with a super_block
123 * @sb: the super_block in question
124 *
125 * Return the kernfs_root associated with @sb. If @sb is not a kernfs one,
126 * %NULL is returned.
127 */
128struct kernfs_root *kernfs_root_from_sb(struct super_block *sb)
129{
130 if (sb->s_op == &kernfs_sops)
131 return kernfs_info(sb)->root;
132 return NULL;
133}
134
Aditya Kalifb3c8312016-01-29 02:54:08 -0600135/*
136 * find the next ancestor in the path down to @child, where @parent was the
137 * ancestor whose descendant we want to find.
138 *
139 * Say the path is /a/b/c/d. @child is d, @parent is NULL. We return the root
140 * node. If @parent is b, then we return the node for c.
141 * Passing in d as @parent is not ok.
142 */
143static struct kernfs_node *find_next_ancestor(struct kernfs_node *child,
144 struct kernfs_node *parent)
145{
146 if (child == parent) {
147 pr_crit_once("BUG in find_next_ancestor: called with parent == child");
148 return NULL;
149 }
150
151 while (child->parent != parent) {
152 if (!child->parent)
153 return NULL;
154 child = child->parent;
155 }
156
157 return child;
158}
159
160/**
161 * kernfs_node_dentry - get a dentry for the given kernfs_node
162 * @kn: kernfs_node for which a dentry is needed
163 * @sb: the kernfs super_block
164 */
165struct dentry *kernfs_node_dentry(struct kernfs_node *kn,
166 struct super_block *sb)
167{
168 struct dentry *dentry;
169 struct kernfs_node *knparent = NULL;
170
171 BUG_ON(sb->s_op != &kernfs_sops);
172
173 dentry = dget(sb->s_root);
174
175 /* Check if this is the root kernfs_node */
176 if (!kn->parent)
177 return dentry;
178
179 knparent = find_next_ancestor(kn, NULL);
180 if (WARN_ON(!knparent))
181 return ERR_PTR(-EINVAL);
182
183 do {
184 struct dentry *dtmp;
185 struct kernfs_node *kntmp;
186
187 if (kn == knparent)
188 return dentry;
189 kntmp = find_next_ancestor(kn, knparent);
190 if (WARN_ON(!kntmp))
191 return ERR_PTR(-EINVAL);
Al Viro779b8392016-04-11 08:42:55 -0400192 dtmp = lookup_one_len_unlocked(kntmp->name, dentry,
193 strlen(kntmp->name));
Aditya Kalifb3c8312016-01-29 02:54:08 -0600194 dput(dentry);
195 if (IS_ERR(dtmp))
196 return dtmp;
197 knparent = kntmp;
198 dentry = dtmp;
199 } while (true);
200}
201
Jianyu Zhan26fc9cd2014-04-26 15:40:28 +0800202static int kernfs_fill_super(struct super_block *sb, unsigned long magic)
Tejun Heofa736a92013-11-28 14:54:44 -0500203{
Tejun Heoc525aad2013-12-11 14:11:55 -0500204 struct kernfs_super_info *info = kernfs_info(sb);
Tejun Heofa736a92013-11-28 14:54:44 -0500205 struct inode *inode;
206 struct dentry *root;
207
Tejun Heo7d568a82014-04-09 11:07:30 -0400208 info->sb = sb;
Eric W. Biedermana2982cc2016-06-09 15:34:02 -0500209 /* Userspace would break if executables or devices appear on sysfs */
210 sb->s_iflags |= SB_I_NOEXEC | SB_I_NODEV;
Kirill A. Shutemov09cbfea2016-04-01 15:29:47 +0300211 sb->s_blocksize = PAGE_SIZE;
212 sb->s_blocksize_bits = PAGE_SHIFT;
Jianyu Zhan26fc9cd2014-04-26 15:40:28 +0800213 sb->s_magic = magic;
Tejun Heoa797bfc2013-12-11 14:11:57 -0500214 sb->s_op = &kernfs_sops;
Andreas Gruenbachere72a1a82016-09-29 17:48:33 +0200215 sb->s_xattr = kernfs_xattr_handlers;
Shaohua Liaa818822017-07-12 11:49:51 -0700216 if (info->root->flags & KERNFS_ROOT_SUPPORT_EXPORTOP)
217 sb->s_export_op = &kernfs_export_ops;
Tejun Heofa736a92013-11-28 14:54:44 -0500218 sb->s_time_gran = 1;
219
220 /* get root inode, initialize and unlock it */
Tejun Heoa797bfc2013-12-11 14:11:57 -0500221 mutex_lock(&kernfs_mutex);
Tejun Heoc637b8a2013-12-11 14:11:58 -0500222 inode = kernfs_get_inode(sb, info->root->kn);
Tejun Heoa797bfc2013-12-11 14:11:57 -0500223 mutex_unlock(&kernfs_mutex);
Tejun Heofa736a92013-11-28 14:54:44 -0500224 if (!inode) {
Tejun Heoc637b8a2013-12-11 14:11:58 -0500225 pr_debug("kernfs: could not get root inode\n");
Tejun Heofa736a92013-11-28 14:54:44 -0500226 return -ENOMEM;
227 }
228
229 /* instantiate and link root dentry */
230 root = d_make_root(inode);
231 if (!root) {
232 pr_debug("%s: could not get root dentry!\n", __func__);
233 return -ENOMEM;
234 }
Tejun Heofa736a92013-11-28 14:54:44 -0500235 sb->s_root = root;
Tejun Heoa797bfc2013-12-11 14:11:57 -0500236 sb->s_d_op = &kernfs_dops;
Tejun Heofa736a92013-11-28 14:54:44 -0500237 return 0;
238}
239
Tejun Heoc637b8a2013-12-11 14:11:58 -0500240static int kernfs_test_super(struct super_block *sb, void *data)
Tejun Heofa736a92013-11-28 14:54:44 -0500241{
Tejun Heoc525aad2013-12-11 14:11:55 -0500242 struct kernfs_super_info *sb_info = kernfs_info(sb);
243 struct kernfs_super_info *info = data;
Tejun Heofa736a92013-11-28 14:54:44 -0500244
245 return sb_info->root == info->root && sb_info->ns == info->ns;
246}
247
Tejun Heoc637b8a2013-12-11 14:11:58 -0500248static int kernfs_set_super(struct super_block *sb, void *data)
Tejun Heofa736a92013-11-28 14:54:44 -0500249{
250 int error;
251 error = set_anon_super(sb, data);
252 if (!error)
253 sb->s_fs_info = data;
254 return error;
255}
256
257/**
258 * kernfs_super_ns - determine the namespace tag of a kernfs super_block
259 * @sb: super_block of interest
260 *
261 * Return the namespace tag associated with kernfs super_block @sb.
262 */
263const void *kernfs_super_ns(struct super_block *sb)
264{
Tejun Heoc525aad2013-12-11 14:11:55 -0500265 struct kernfs_super_info *info = kernfs_info(sb);
Tejun Heofa736a92013-11-28 14:54:44 -0500266
267 return info->ns;
268}
269
270/**
271 * kernfs_mount_ns - kernfs mount helper
272 * @fs_type: file_system_type of the fs being mounted
273 * @flags: mount flags specified for the mount
274 * @root: kernfs_root of the hierarchy being mounted
Jianyu Zhan26fc9cd2014-04-26 15:40:28 +0800275 * @magic: file system specific magic number
Li Zefanfed95ba2014-02-25 19:28:44 +0800276 * @new_sb_created: tell the caller if we allocated a new superblock
Tejun Heofa736a92013-11-28 14:54:44 -0500277 * @ns: optional namespace tag of the mount
278 *
279 * This is to be called from each kernfs user's file_system_type->mount()
280 * implementation, which should pass through the specified @fs_type and
281 * @flags, and specify the hierarchy and namespace tag to mount via @root
282 * and @ns, respectively.
283 *
284 * The return value can be passed to the vfs layer verbatim.
285 */
286struct dentry *kernfs_mount_ns(struct file_system_type *fs_type, int flags,
Jianyu Zhan26fc9cd2014-04-26 15:40:28 +0800287 struct kernfs_root *root, unsigned long magic,
288 bool *new_sb_created, const void *ns)
Tejun Heofa736a92013-11-28 14:54:44 -0500289{
290 struct super_block *sb;
Tejun Heoc525aad2013-12-11 14:11:55 -0500291 struct kernfs_super_info *info;
Tejun Heofa736a92013-11-28 14:54:44 -0500292 int error;
293
294 info = kzalloc(sizeof(*info), GFP_KERNEL);
295 if (!info)
296 return ERR_PTR(-ENOMEM);
297
298 info->root = root;
299 info->ns = ns;
300
Eric W. Biederman6e4eab52016-05-24 09:29:01 -0500301 sb = sget_userns(fs_type, kernfs_test_super, kernfs_set_super, flags,
302 &init_user_ns, info);
Tejun Heofa736a92013-11-28 14:54:44 -0500303 if (IS_ERR(sb) || sb->s_fs_info != info)
304 kfree(info);
305 if (IS_ERR(sb))
306 return ERR_CAST(sb);
Li Zefanfed95ba2014-02-25 19:28:44 +0800307
308 if (new_sb_created)
309 *new_sb_created = !sb->s_root;
310
Tejun Heofa736a92013-11-28 14:54:44 -0500311 if (!sb->s_root) {
Tejun Heo7d568a82014-04-09 11:07:30 -0400312 struct kernfs_super_info *info = kernfs_info(sb);
313
Jianyu Zhan26fc9cd2014-04-26 15:40:28 +0800314 error = kernfs_fill_super(sb, magic);
Tejun Heofa736a92013-11-28 14:54:44 -0500315 if (error) {
316 deactivate_locked_super(sb);
317 return ERR_PTR(error);
318 }
319 sb->s_flags |= MS_ACTIVE;
Tejun Heo7d568a82014-04-09 11:07:30 -0400320
321 mutex_lock(&kernfs_mutex);
322 list_add(&info->node, &root->supers);
323 mutex_unlock(&kernfs_mutex);
Tejun Heofa736a92013-11-28 14:54:44 -0500324 }
325
326 return dget(sb->s_root);
327}
328
329/**
330 * kernfs_kill_sb - kill_sb for kernfs
331 * @sb: super_block being killed
332 *
333 * This can be used directly for file_system_type->kill_sb(). If a kernfs
334 * user needs extra cleanup, it can implement its own kill_sb() and call
335 * this function at the end.
336 */
337void kernfs_kill_sb(struct super_block *sb)
338{
Tejun Heoc525aad2013-12-11 14:11:55 -0500339 struct kernfs_super_info *info = kernfs_info(sb);
Tejun Heofa736a92013-11-28 14:54:44 -0500340
Tejun Heo7d568a82014-04-09 11:07:30 -0400341 mutex_lock(&kernfs_mutex);
342 list_del(&info->node);
343 mutex_unlock(&kernfs_mutex);
344
Tejun Heofa736a92013-11-28 14:54:44 -0500345 /*
346 * Remove the superblock from fs_supers/s_instances
Tejun Heoc525aad2013-12-11 14:11:55 -0500347 * so we can't find it, before freeing kernfs_super_info.
Tejun Heofa736a92013-11-28 14:54:44 -0500348 */
349 kill_anon_super(sb);
350 kfree(info);
Tejun Heofa736a92013-11-28 14:54:44 -0500351}
352
Li Zefan4e264452014-06-30 11:50:28 +0800353/**
354 * kernfs_pin_sb: try to pin the superblock associated with a kernfs_root
355 * @kernfs_root: the kernfs_root in question
356 * @ns: the namespace tag
357 *
358 * Pin the superblock so the superblock won't be destroyed in subsequent
359 * operations. This can be used to block ->kill_sb() which may be useful
360 * for kernfs users which dynamically manage superblocks.
361 *
362 * Returns NULL if there's no superblock associated to this kernfs_root, or
363 * -EINVAL if the superblock is being freed.
364 */
365struct super_block *kernfs_pin_sb(struct kernfs_root *root, const void *ns)
366{
367 struct kernfs_super_info *info;
368 struct super_block *sb = NULL;
369
370 mutex_lock(&kernfs_mutex);
371 list_for_each_entry(info, &root->supers, node) {
372 if (info->ns == ns) {
373 sb = info->sb;
374 if (!atomic_inc_not_zero(&info->sb->s_active))
375 sb = ERR_PTR(-EINVAL);
376 break;
377 }
378 }
379 mutex_unlock(&kernfs_mutex);
380 return sb;
381}
382
Tejun Heofa736a92013-11-28 14:54:44 -0500383void __init kernfs_init(void)
384{
Shaohua Liba16b282017-07-12 11:49:48 -0700385
386 /*
387 * the slab is freed in RCU context, so kernfs_find_and_get_node_by_ino
388 * can access the slab lock free. This could introduce stale nodes,
389 * please see how kernfs_find_and_get_node_by_ino filters out stale
390 * nodes.
391 */
Tejun Heoa797bfc2013-12-11 14:11:57 -0500392 kernfs_node_cache = kmem_cache_create("kernfs_node_cache",
Tejun Heo324a56e2013-12-11 14:11:53 -0500393 sizeof(struct kernfs_node),
Shaohua Liba16b282017-07-12 11:49:48 -0700394 0,
395 SLAB_PANIC | SLAB_TYPESAFE_BY_RCU,
396 NULL);
Tejun Heofa736a92013-11-28 14:54:44 -0500397}