blob: 0e8622a4341c0bec29d8f5fdf8e63c71dd9836bb [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
Linus Torvalds1da177e2005-04-16 15:20:36 -07002 * Central processing for nfsd.
3 *
4 * Authors: Olaf Kirch (okir@monad.swb.de)
5 *
6 * Copyright (C) 1995, 1996, 1997 Olaf Kirch <okir@monad.swb.de>
7 */
8
Alexey Dobriyane8edc6e2007-05-21 01:22:52 +04009#include <linux/sched.h>
Rafael J. Wysocki83144182007-07-17 04:03:35 -070010#include <linux/freezer.h>
Paul Gortmaker143cb492011-07-01 14:23:34 -040011#include <linux/module.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070012#include <linux/fs_struct.h>
Andy Adamsonc3d06f92009-04-03 08:28:18 +030013#include <linux/swap.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070014
Linus Torvalds1da177e2005-04-16 15:20:36 -070015#include <linux/sunrpc/stats.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070016#include <linux/sunrpc/svcsock.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070017#include <linux/lockd/bind.h>
Andreas Gruenbachera257cdd2005-06-22 17:16:26 +000018#include <linux/nfsacl.h>
Ryusei Yamaguchied2d8ae2009-08-16 00:54:41 +090019#include <linux/seq_file.h>
Pavel Emelyanovfc5d00b2010-09-29 16:03:50 +040020#include <net/net_namespace.h>
Boaz Harrosh9a74af22009-12-03 20:30:56 +020021#include "nfsd.h"
22#include "cache.h"
J. Bruce Fields0a3adad2009-11-04 18:12:35 -050023#include "vfs.h"
Stanislav Kinsbursky2c2fe292012-12-06 14:23:14 +030024#include "netns.h"
Linus Torvalds1da177e2005-04-16 15:20:36 -070025
26#define NFSDDBG_FACILITY NFSDDBG_SVC
27
Linus Torvalds1da177e2005-04-16 15:20:36 -070028extern struct svc_program nfsd_program;
Jeff Layton9867d762008-06-10 08:40:38 -040029static int nfsd(void *vrqstp);
Linus Torvalds1da177e2005-04-16 15:20:36 -070030
/*
 * nfsd_mutex guards nn->nfsd_serv: the pointer itself as well as the members
 * of the svc_serv it points to -- ->sv_nrthreads in particular, and to some
 * extent ->sv_temp_socks and ->sv_permsocks.  nfsdstats.th_cnt is covered by
 * the same mutex.
 *
 * Whenever nn->nfsd_serv is observed non-NULL outside the lock, it must point
 * to a properly initialised 'struct svc_serv' with ->sv_nrthreads > 0.  That
 * many nfsd threads must exist, and each must be listed in ->sp_all_threads
 * in each entry of ->sv_pools[].
 *
 * Transitions of the thread count between zero and non-zero deserve special
 * care, because that is when the svc_serv has to be created and initialised,
 * or freed.
 *
 * Finally, nfsd_mutex also protects some of the global variables that are
 * read when nfsd starts and that can be set through the write_* routines in
 * nfsctl.c.  In particular:
 *
 *	user_recovery_dirname
 *	user_lease_time
 *	nfsd_versions
 */
DEFINE_MUTEX(nfsd_mutex);
Neil Brownbedbdd82008-06-10 08:40:35 -040054
Andy Adamson4bd9b0f42009-06-24 15:37:45 -040055/*
56 * nfsd_drc_lock protects nfsd_drc_max_pages and nfsd_drc_pages_used.
57 * nfsd_drc_max_pages limits the total amount of memory available for
58 * version 4.1 DRC caches.
59 * nfsd_drc_pages_used tracks the current version 4.1 DRC memory usage.
60 */
61spinlock_t nfsd_drc_lock;
Andy Adamson0c193052009-07-27 19:09:19 -040062unsigned int nfsd_drc_max_mem;
63unsigned int nfsd_drc_mem_used;
Andy Adamson4bd9b0f42009-06-24 15:37:45 -040064
#if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
/*
 * Tentative definition: nfsd_acl_program and nfsd_acl_svcstats refer to
 * each other, so one of them has to be announced before it is initialised.
 */
static struct svc_stat	nfsd_acl_svcstats;

/* Every NFSACL version known to this file, indexed by version number. */
static struct svc_version *nfsd_acl_version[] = {
	[2] = &nfsd_acl_version2,
	[3] = &nfsd_acl_version3,
};

#define NFSD_ACL_MINVERS	2
#define NFSD_ACL_NRVERS		ARRAY_SIZE(nfsd_acl_version)

/*
 * The table actually handed to the RPC layer; its slots are filled in and
 * cleared by nfsd_vers() and nfsd_reset_versions().
 */
static struct svc_version *nfsd_acl_versions[NFSD_ACL_NRVERS];

static struct svc_program nfsd_acl_program = {
	.pg_prog		= NFS_ACL_PROGRAM,
	.pg_nvers		= NFSD_ACL_NRVERS,
	.pg_vers		= nfsd_acl_versions,
	.pg_name		= "nfsacl",
	.pg_class		= "nfsd",
	.pg_stats		= &nfsd_acl_svcstats,
	.pg_authenticate	= &svc_set_client,
};

static struct svc_stat nfsd_acl_svcstats = {
	.program	= &nfsd_acl_program,
};
#endif /* defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL) */
90
NeilBrown70c3b762005-11-07 01:00:25 -080091static struct svc_version * nfsd_version[] = {
92 [2] = &nfsd_version2,
93#if defined(CONFIG_NFSD_V3)
94 [3] = &nfsd_version3,
95#endif
96#if defined(CONFIG_NFSD_V4)
97 [4] = &nfsd_version4,
98#endif
99};
100
101#define NFSD_MINVERS 2
Tobias Klausere8c96f82006-03-24 03:15:34 -0800102#define NFSD_NRVERS ARRAY_SIZE(nfsd_version)
NeilBrown70c3b762005-11-07 01:00:25 -0800103static struct svc_version *nfsd_versions[NFSD_NRVERS];
104
105struct svc_program nfsd_program = {
Andreas Gruenbacher3fb803a2006-02-01 03:04:34 -0800106#if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
107 .pg_next = &nfsd_acl_program,
108#endif
NeilBrown70c3b762005-11-07 01:00:25 -0800109 .pg_prog = NFS_PROGRAM, /* program number */
110 .pg_nvers = NFSD_NRVERS, /* nr of entries in nfsd_version */
111 .pg_vers = nfsd_versions, /* version table */
112 .pg_name = "nfsd", /* program name */
113 .pg_class = "nfsd", /* authentication class */
114 .pg_stats = &nfsd_svcstats, /* version table */
115 .pg_authenticate = &svc_set_client, /* export authentication */
116
117};
118
Benny Halevy8daf2202009-04-03 08:28:59 +0300119u32 nfsd_supported_minorversion;
120
NeilBrown6658d3a2006-10-02 02:17:46 -0700121int nfsd_vers(int vers, enum vers_op change)
122{
123 if (vers < NFSD_MINVERS || vers >= NFSD_NRVERS)
Pavel Emelyanov15ddb4a2010-05-14 15:33:36 +0400124 return 0;
NeilBrown6658d3a2006-10-02 02:17:46 -0700125 switch(change) {
126 case NFSD_SET:
127 nfsd_versions[vers] = nfsd_version[vers];
NeilBrown6658d3a2006-10-02 02:17:46 -0700128#if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
129 if (vers < NFSD_ACL_NRVERS)
NeilBrown1a8eff62007-01-26 00:56:58 -0800130 nfsd_acl_versions[vers] = nfsd_acl_version[vers];
NeilBrown6658d3a2006-10-02 02:17:46 -0700131#endif
NeilBrown1a8eff62007-01-26 00:56:58 -0800132 break;
NeilBrown6658d3a2006-10-02 02:17:46 -0700133 case NFSD_CLEAR:
134 nfsd_versions[vers] = NULL;
135#if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
136 if (vers < NFSD_ACL_NRVERS)
NeilBrown1a8eff62007-01-26 00:56:58 -0800137 nfsd_acl_versions[vers] = NULL;
NeilBrown6658d3a2006-10-02 02:17:46 -0700138#endif
139 break;
140 case NFSD_TEST:
141 return nfsd_versions[vers] != NULL;
142 case NFSD_AVAIL:
143 return nfsd_version[vers] != NULL;
144 }
145 return 0;
146}
Benny Halevy8daf2202009-04-03 08:28:59 +0300147
148int nfsd_minorversion(u32 minorversion, enum vers_op change)
149{
150 if (minorversion > NFSD_SUPPORTED_MINOR_VERSION)
151 return -1;
152 switch(change) {
153 case NFSD_SET:
154 nfsd_supported_minorversion = minorversion;
155 break;
156 case NFSD_CLEAR:
157 if (minorversion == 0)
158 return -1;
159 nfsd_supported_minorversion = minorversion - 1;
160 break;
161 case NFSD_TEST:
162 return minorversion <= nfsd_supported_minorversion;
163 case NFSD_AVAIL:
164 return minorversion <= NFSD_SUPPORTED_MINOR_VERSION;
165 }
166 return 0;
167}
168
/*
 * Upper bound on the number of nfsd threads; requests above it are
 * clamped by nfsd_svc() and nfsd_set_nrthreads().
 */
#define	NFSD_MAXSERVS		8192
173
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300174int nfsd_nrthreads(struct net *net)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700175{
Neil Brownc7d106c2008-06-12 13:38:42 +1000176 int rv = 0;
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300177 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
178
Neil Brownc7d106c2008-06-12 13:38:42 +1000179 mutex_lock(&nfsd_mutex);
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300180 if (nn->nfsd_serv)
181 rv = nn->nfsd_serv->sv_nrthreads;
Neil Brownc7d106c2008-06-12 13:38:42 +1000182 mutex_unlock(&nfsd_mutex);
183 return rv;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700184}
185
Stanislav Kinsburskydb6e1822012-12-10 12:19:09 +0300186static int nfsd_init_socks(struct net *net)
J. Bruce Fields59db4a02010-07-21 18:29:25 -0400187{
188 int error;
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300189 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
190
191 if (!list_empty(&nn->nfsd_serv->sv_permsocks))
J. Bruce Fields59db4a02010-07-21 18:29:25 -0400192 return 0;
193
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300194 error = svc_create_xprt(nn->nfsd_serv, "udp", net, PF_INET, NFS_PORT,
J. Bruce Fields59db4a02010-07-21 18:29:25 -0400195 SVC_SOCK_DEFAULTS);
196 if (error < 0)
197 return error;
198
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300199 error = svc_create_xprt(nn->nfsd_serv, "tcp", net, PF_INET, NFS_PORT,
J. Bruce Fields59db4a02010-07-21 18:29:25 -0400200 SVC_SOCK_DEFAULTS);
201 if (error < 0)
202 return error;
203
204 return 0;
205}
206
Jeff Layton4ad9a342010-07-19 16:50:04 -0400207static bool nfsd_up = false;
208
Stanislav Kinsbursky6ff50b32012-12-06 14:23:09 +0300209static int nfsd_startup_net(struct net *net)
210{
Stanislav Kinsbursky2c2fe292012-12-06 14:23:14 +0300211 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
Stanislav Kinsbursky6ff50b32012-12-06 14:23:09 +0300212 int ret;
213
Stanislav Kinsbursky2c2fe292012-12-06 14:23:14 +0300214 if (nn->nfsd_net_up)
215 return 0;
216
Stanislav Kinsbursky6ff50b32012-12-06 14:23:09 +0300217 ret = nfsd_init_socks(net);
218 if (ret)
219 return ret;
220 ret = lockd_up(net);
221 if (ret)
222 return ret;
223 ret = nfs4_state_start_net(net);
224 if (ret)
225 goto out_lockd;
226
Stanislav Kinsbursky2c2fe292012-12-06 14:23:14 +0300227 nn->nfsd_net_up = true;
Stanislav Kinsbursky6ff50b32012-12-06 14:23:09 +0300228 return 0;
229
230out_lockd:
231 lockd_down(net);
232 return ret;
233}
234
Stanislav Kinsburskydb42d1a2012-12-10 12:19:14 +0300235static int nfsd_startup(int nrservs, struct net *net)
Jeff Layton4ad9a342010-07-19 16:50:04 -0400236{
237 int ret;
J. Bruce Fields774f8bb2010-08-02 14:12:44 -0400238
239 if (nfsd_up)
240 return 0;
J. Bruce Fields59db4a02010-07-21 18:29:25 -0400241 /*
242 * Readahead param cache - will no-op if it already exists.
243 * (Note therefore results will be suboptimal if number of
244 * threads is modified after nfsd start.)
245 */
246 ret = nfsd_racache_init(2*nrservs);
247 if (ret)
248 return ret;
Jeff Layton4ad9a342010-07-19 16:50:04 -0400249 ret = nfs4_state_start();
Jeff Laytonac77efb2010-07-20 14:10:22 -0400250 if (ret)
Stanislav Kinsbursky6ff50b32012-12-06 14:23:09 +0300251 goto out_racache;
252 ret = nfsd_startup_net(net);
Stanislav Kinsburskyf252bc62012-11-26 15:22:18 +0300253 if (ret)
Stanislav Kinsbursky6ff50b32012-12-06 14:23:09 +0300254 goto out_net;
Stanislav Kinsburskyf252bc62012-11-26 15:22:18 +0300255
Jeff Layton4ad9a342010-07-19 16:50:04 -0400256 nfsd_up = true;
Jeff Laytonac77efb2010-07-20 14:10:22 -0400257 return 0;
Stanislav Kinsbursky6ff50b32012-12-06 14:23:09 +0300258
259out_net:
Stanislav Kinsburskyf252bc62012-11-26 15:22:18 +0300260 nfs4_state_shutdown();
J. Bruce Fields59db4a02010-07-21 18:29:25 -0400261out_racache:
262 nfsd_racache_shutdown();
Jeff Layton4ad9a342010-07-19 16:50:04 -0400263 return ret;
264}
265
Stanislav Kinsbursky6ff50b32012-12-06 14:23:09 +0300266static void nfsd_shutdown_net(struct net *net)
267{
Stanislav Kinsbursky2c2fe292012-12-06 14:23:14 +0300268 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
269
270 if (!nn->nfsd_net_up)
271 return;
272
Stanislav Kinsbursky6ff50b32012-12-06 14:23:09 +0300273 nfs4_state_shutdown_net(net);
274 lockd_down(net);
Stanislav Kinsbursky2c2fe292012-12-06 14:23:14 +0300275 nn->nfsd_net_up = false;
Stanislav Kinsbursky6ff50b32012-12-06 14:23:09 +0300276}
277
Stanislav Kinsburskydb42d1a2012-12-10 12:19:14 +0300278static void nfsd_shutdown(struct net *net)
Jeff Layton4ad9a342010-07-19 16:50:04 -0400279{
280 /*
281 * write_ports can create the server without actually starting
282 * any threads--if we get shut down before any threads are
283 * started, then nfsd_last_thread will be run before any of this
284 * other initialization has been done.
285 */
286 if (!nfsd_up)
287 return;
Stanislav Kinsbursky6ff50b32012-12-06 14:23:09 +0300288 nfsd_shutdown_net(net);
Jeff Layton4ad9a342010-07-19 16:50:04 -0400289 nfs4_state_shutdown();
J. Bruce Fields59db4a02010-07-21 18:29:25 -0400290 nfsd_racache_shutdown();
Jeff Layton4ad9a342010-07-19 16:50:04 -0400291 nfsd_up = false;
292}
293
Stanislav Kinsbursky5ecebb72012-01-13 14:03:04 +0400294static void nfsd_last_thread(struct svc_serv *serv, struct net *net)
NeilBrownbc591cc2006-10-02 02:17:44 -0700295{
Stanislav Kinsburskydb42d1a2012-12-10 12:19:14 +0300296 nfsd_shutdown(net);
NeilBrownbc591cc2006-10-02 02:17:44 -0700297
Stanislav Kinsbursky5ecebb72012-01-13 14:03:04 +0400298 svc_rpcb_cleanup(serv, net);
Stanislav Kinsbursky16d05872011-10-25 14:17:28 +0300299
Jeff Laytone096bbc2008-06-10 08:40:37 -0400300 printk(KERN_WARNING "nfsd: last server has exited, flushing export "
301 "cache\n");
Stanislav Kinsburskyb3853e02012-04-11 15:13:21 +0400302 nfsd_export_flush(net);
NeilBrownbc591cc2006-10-02 02:17:44 -0700303}
NeilBrown6658d3a2006-10-02 02:17:46 -0700304
305void nfsd_reset_versions(void)
306{
307 int found_one = 0;
308 int i;
309
310 for (i = NFSD_MINVERS; i < NFSD_NRVERS; i++) {
311 if (nfsd_program.pg_vers[i])
312 found_one = 1;
313 }
314
315 if (!found_one) {
316 for (i = NFSD_MINVERS; i < NFSD_NRVERS; i++)
317 nfsd_program.pg_vers[i] = nfsd_version[i];
318#if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
319 for (i = NFSD_ACL_MINVERS; i < NFSD_ACL_NRVERS; i++)
320 nfsd_acl_program.pg_vers[i] =
321 nfsd_acl_version[i];
322#endif
323 }
324}
325
Andy Adamsonc3d06f92009-04-03 08:28:18 +0300326/*
327 * Each session guarantees a negotiated per slot memory cache for replies
328 * which in turn consumes memory beyond the v2/v3/v4.0 server. A dedicated
329 * NFSv4.1 server might want to use more memory for a DRC than a machine
330 * with mutiple services.
331 *
332 * Impose a hard limit on the number of pages for the DRC which varies
333 * according to the machines free pages. This is of course only a default.
334 *
335 * For now this is a #defined shift which could be under admin control
336 * in the future.
337 */
338static void set_max_drc(void)
339{
Andy Adamson6a14dd12009-07-27 19:06:45 -0400340 #define NFSD_DRC_SIZE_SHIFT 10
Andy Adamson0c193052009-07-27 19:09:19 -0400341 nfsd_drc_max_mem = (nr_free_buffer_pages()
342 >> NFSD_DRC_SIZE_SHIFT) * PAGE_SIZE;
343 nfsd_drc_mem_used = 0;
Andy Adamson4bd9b0f42009-06-24 15:37:45 -0400344 spin_lock_init(&nfsd_drc_lock);
Andy Adamson0c193052009-07-27 19:09:19 -0400345 dprintk("%s nfsd_drc_max_mem %u \n", __func__, nfsd_drc_max_mem);
Andy Adamsonc3d06f92009-04-03 08:28:18 +0300346}
Neil Brownbedbdd82008-06-10 08:40:35 -0400347
J. Bruce Fields87b0fc72012-01-30 16:18:35 -0500348static int nfsd_get_default_max_blksize(void)
349{
350 struct sysinfo i;
351 unsigned long long target;
352 unsigned long ret;
353
354 si_meminfo(&i);
J. Bruce Fields508f9222012-01-30 16:21:11 -0500355 target = (i.totalram - i.totalhigh) << PAGE_SHIFT;
J. Bruce Fields87b0fc72012-01-30 16:18:35 -0500356 /*
357 * Aim for 1/4096 of memory per thread This gives 1MB on 4Gig
358 * machines, but only uses 32K on 128M machines. Bottom out at
359 * 8K on 32M and smaller. Of course, this is only a default.
360 */
361 target >>= 12;
362
363 ret = NFSSVC_MAXBLKSIZE;
364 while (ret > target && ret >= 8*1024*2)
365 ret /= 2;
366 return ret;
367}
368
Stanislav Kinsbursky67774362012-12-10 12:19:20 +0300369int nfsd_create_serv(struct net *net)
NeilBrown02a375f2006-10-02 02:17:46 -0700370{
Stanislav Kinsbursky9793f7c2012-05-02 16:08:38 +0400371 int error;
Stanislav Kinsburskyb9c0ef82012-12-06 14:23:19 +0300372 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
Stanislav Kinsbursky9793f7c2012-05-02 16:08:38 +0400373
Neil Brownbedbdd82008-06-10 08:40:35 -0400374 WARN_ON(!mutex_is_locked(&nfsd_mutex));
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300375 if (nn->nfsd_serv) {
376 svc_get(nn->nfsd_serv);
NeilBrown02a375f2006-10-02 02:17:46 -0700377 return 0;
378 }
J. Bruce Fields87b0fc72012-01-30 16:18:35 -0500379 if (nfsd_max_blksize == 0)
380 nfsd_max_blksize = nfsd_get_default_max_blksize();
J. Bruce Fieldse844a7b2010-08-06 15:48:03 -0400381 nfsd_reset_versions();
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300382 nn->nfsd_serv = svc_create_pooled(&nfsd_program, nfsd_max_blksize,
Jeff Laytona75c5d02008-06-10 08:40:39 -0400383 nfsd_last_thread, nfsd, THIS_MODULE);
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300384 if (nn->nfsd_serv == NULL)
Jeff Layton628b3682010-07-21 16:40:08 -0400385 return -ENOMEM;
Neil Brownbedbdd82008-06-10 08:40:35 -0400386
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300387 error = svc_bind(nn->nfsd_serv, net);
Stanislav Kinsbursky9793f7c2012-05-02 16:08:38 +0400388 if (error < 0) {
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300389 svc_destroy(nn->nfsd_serv);
Stanislav Kinsbursky9793f7c2012-05-02 16:08:38 +0400390 return error;
391 }
392
Jeff Layton628b3682010-07-21 16:40:08 -0400393 set_max_drc();
Stanislav Kinsburskyb9c0ef82012-12-06 14:23:19 +0300394 do_gettimeofday(&nn->nfssvc_boot); /* record boot time */
J. Bruce Fields87b0fc72012-01-30 16:18:35 -0500395 return 0;
NeilBrown02a375f2006-10-02 02:17:46 -0700396}
397
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300398int nfsd_nrpools(struct net *net)
Greg Bankseed29652006-10-02 02:18:02 -0700399{
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300400 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
401
402 if (nn->nfsd_serv == NULL)
Greg Bankseed29652006-10-02 02:18:02 -0700403 return 0;
404 else
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300405 return nn->nfsd_serv->sv_nrpools;
Greg Bankseed29652006-10-02 02:18:02 -0700406}
407
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300408int nfsd_get_nrthreads(int n, int *nthreads, struct net *net)
Greg Bankseed29652006-10-02 02:18:02 -0700409{
410 int i = 0;
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300411 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
Greg Bankseed29652006-10-02 02:18:02 -0700412
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300413 if (nn->nfsd_serv != NULL) {
414 for (i = 0; i < nn->nfsd_serv->sv_nrpools && i < n; i++)
415 nthreads[i] = nn->nfsd_serv->sv_pools[i].sp_nrthreads;
Greg Bankseed29652006-10-02 02:18:02 -0700416 }
417
418 return 0;
419}
420
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300421void nfsd_destroy(struct net *net)
422{
423 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
424 int destroy = (nn->nfsd_serv->sv_nrthreads == 1);
425
426 if (destroy)
427 svc_shutdown_net(nn->nfsd_serv, net);
428 svc_destroy(nn->nfsd_serv);
429 if (destroy)
430 nn->nfsd_serv = NULL;
431}
432
Stanislav Kinsbursky3938a0d2012-12-10 12:19:30 +0300433int nfsd_set_nrthreads(int n, int *nthreads, struct net *net)
Greg Bankseed29652006-10-02 02:18:02 -0700434{
435 int i = 0;
436 int tot = 0;
437 int err = 0;
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300438 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
Greg Bankseed29652006-10-02 02:18:02 -0700439
Neil Brownbedbdd82008-06-10 08:40:35 -0400440 WARN_ON(!mutex_is_locked(&nfsd_mutex));
441
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300442 if (nn->nfsd_serv == NULL || n <= 0)
Greg Bankseed29652006-10-02 02:18:02 -0700443 return 0;
444
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300445 if (n > nn->nfsd_serv->sv_nrpools)
446 n = nn->nfsd_serv->sv_nrpools;
Greg Bankseed29652006-10-02 02:18:02 -0700447
448 /* enforce a global maximum number of threads */
449 tot = 0;
450 for (i = 0; i < n; i++) {
451 if (nthreads[i] > NFSD_MAXSERVS)
452 nthreads[i] = NFSD_MAXSERVS;
453 tot += nthreads[i];
454 }
455 if (tot > NFSD_MAXSERVS) {
456 /* total too large: scale down requested numbers */
457 for (i = 0; i < n && tot > 0; i++) {
458 int new = nthreads[i] * NFSD_MAXSERVS / tot;
459 tot -= (nthreads[i] - new);
460 nthreads[i] = new;
461 }
462 for (i = 0; i < n && tot > 0; i++) {
463 nthreads[i]--;
464 tot--;
465 }
466 }
467
468 /*
469 * There must always be a thread in pool 0; the admin
470 * can't shut down NFS completely using pool_threads.
471 */
472 if (nthreads[0] == 0)
473 nthreads[0] = 1;
474
475 /* apply the new numbers */
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300476 svc_get(nn->nfsd_serv);
Greg Bankseed29652006-10-02 02:18:02 -0700477 for (i = 0; i < n; i++) {
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300478 err = svc_set_num_threads(nn->nfsd_serv, &nn->nfsd_serv->sv_pools[i],
Greg Bankseed29652006-10-02 02:18:02 -0700479 nthreads[i]);
480 if (err)
481 break;
482 }
Stanislav Kinsbursky19f7e2c2012-07-03 16:46:41 +0400483 nfsd_destroy(net);
Greg Bankseed29652006-10-02 02:18:02 -0700484 return err;
485}
486
Jeff Laytonac77efb2010-07-20 14:10:22 -0400487/*
488 * Adjust the number of threads and return the new number of threads.
489 * This is also the function that starts the server if necessary, if
490 * this is the first time nrservs is nonzero.
491 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700492int
Stanislav Kinsburskyd41a9412012-12-10 12:19:25 +0300493nfsd_svc(int nrservs, struct net *net)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700494{
495 int error;
J. Bruce Fields774f8bb2010-08-02 14:12:44 -0400496 bool nfsd_up_before;
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300497 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
Neil Brownbedbdd82008-06-10 08:40:35 -0400498
499 mutex_lock(&nfsd_mutex);
NeilBrown6658d3a2006-10-02 02:17:46 -0700500 dprintk("nfsd: creating service\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700501 if (nrservs <= 0)
502 nrservs = 0;
503 if (nrservs > NFSD_MAXSERVS)
504 nrservs = NFSD_MAXSERVS;
NeilBrown671e1fc2009-06-16 11:03:20 +1000505 error = 0;
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300506 if (nrservs == 0 && nn->nfsd_serv == NULL)
NeilBrown671e1fc2009-06-16 11:03:20 +1000507 goto out;
508
Stanislav Kinsbursky67774362012-12-10 12:19:20 +0300509 error = nfsd_create_serv(net);
NeilBrown02a375f2006-10-02 02:17:46 -0700510 if (error)
J. Bruce Fields774f8bb2010-08-02 14:12:44 -0400511 goto out;
512
513 nfsd_up_before = nfsd_up;
514
Stanislav Kinsburskydb42d1a2012-12-10 12:19:14 +0300515 error = nfsd_startup(nrservs, net);
J. Bruce Fieldsaf4718f2010-07-21 18:31:42 -0400516 if (error)
517 goto out_destroy;
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300518 error = svc_set_num_threads(nn->nfsd_serv, NULL, nrservs);
J. Bruce Fields774f8bb2010-08-02 14:12:44 -0400519 if (error)
520 goto out_shutdown;
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300521 /* We are holding a reference to nn->nfsd_serv which
J. Bruce Fieldsaf4718f2010-07-21 18:31:42 -0400522 * we don't want to count in the return value,
523 * so subtract 1
524 */
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300525 error = nn->nfsd_serv->sv_nrthreads - 1;
J. Bruce Fields774f8bb2010-08-02 14:12:44 -0400526out_shutdown:
527 if (error < 0 && !nfsd_up_before)
Stanislav Kinsburskydb42d1a2012-12-10 12:19:14 +0300528 nfsd_shutdown(net);
Jeff Layton4ad9a342010-07-19 16:50:04 -0400529out_destroy:
Stanislav Kinsbursky19f7e2c2012-07-03 16:46:41 +0400530 nfsd_destroy(net); /* Release server */
Jeff Layton4ad9a342010-07-19 16:50:04 -0400531out:
Neil Brownbedbdd82008-06-10 08:40:35 -0400532 mutex_unlock(&nfsd_mutex);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700533 return error;
534}
535
Linus Torvalds1da177e2005-04-16 15:20:36 -0700536
537/*
538 * This is the NFS server kernel thread
539 */
Jeff Layton9867d762008-06-10 08:40:38 -0400540static int
541nfsd(void *vrqstp)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700542{
Jeff Layton9867d762008-06-10 08:40:38 -0400543 struct svc_rqst *rqstp = (struct svc_rqst *) vrqstp;
J. Bruce Fields5b444cc2012-08-17 21:47:53 -0400544 int err;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700545
546 /* Lock module and set up kernel thread */
Neil Brownbedbdd82008-06-10 08:40:35 -0400547 mutex_lock(&nfsd_mutex);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700548
Jeff Layton9867d762008-06-10 08:40:38 -0400549 /* At this point, the thread shares current->fs
Linus Torvalds1da177e2005-04-16 15:20:36 -0700550 * with the init process. We need to create files with a
551 * umask of 0 instead of init's umask. */
Al Viro3e93cd62009-03-29 19:00:13 -0400552 if (unshare_fs_struct() < 0) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700553 printk("Unable to start nfsd thread: out of memory\n");
554 goto out;
555 }
Al Viro3e93cd62009-03-29 19:00:13 -0400556
Linus Torvalds1da177e2005-04-16 15:20:36 -0700557 current->fs->umask = 0;
558
Jeff Layton9867d762008-06-10 08:40:38 -0400559 /*
560 * thread is spawned with all signals set to SIG_IGN, re-enable
Jeff Layton100766f2008-06-30 14:09:46 -0400561 * the ones that will bring down the thread
Jeff Layton9867d762008-06-10 08:40:38 -0400562 */
Jeff Layton100766f2008-06-30 14:09:46 -0400563 allow_signal(SIGKILL);
564 allow_signal(SIGHUP);
565 allow_signal(SIGINT);
566 allow_signal(SIGQUIT);
Neil Brownbedbdd82008-06-10 08:40:35 -0400567
Linus Torvalds1da177e2005-04-16 15:20:36 -0700568 nfsdstats.th_cnt++;
Neil Brownbedbdd82008-06-10 08:40:35 -0400569 mutex_unlock(&nfsd_mutex);
570
Linus Torvalds1da177e2005-04-16 15:20:36 -0700571 /*
572 * We want less throttling in balance_dirty_pages() so that nfs to
573 * localhost doesn't cause nfsd to lock up due to all the client's
574 * dirty pages.
575 */
576 current->flags |= PF_LESS_THROTTLE;
Rafael J. Wysocki83144182007-07-17 04:03:35 -0700577 set_freezable();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700578
579 /*
580 * The main request loop
581 */
582 for (;;) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700583 /*
584 * Find a socket with data available and call its
585 * recvfrom routine.
586 */
NeilBrown6fb2b472006-10-02 02:17:50 -0700587 while ((err = svc_recv(rqstp, 60*60*HZ)) == -EAGAIN)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700588 ;
Jeff Layton9867d762008-06-10 08:40:38 -0400589 if (err == -EINTR)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700590 break;
David Howellse0e81732009-09-02 09:13:40 +0100591 validate_process_creds();
NeilBrown6fb2b472006-10-02 02:17:50 -0700592 svc_process(rqstp);
David Howellse0e81732009-09-02 09:13:40 +0100593 validate_process_creds();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700594 }
595
NeilBrown24e36662006-10-02 02:17:45 -0700596 /* Clear signals before calling svc_exit_thread() */
NeilBrown9e4160522005-04-16 15:26:37 -0700597 flush_signals(current);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700598
Neil Brownbedbdd82008-06-10 08:40:35 -0400599 mutex_lock(&nfsd_mutex);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700600 nfsdstats.th_cnt --;
601
602out:
Stanislav Kinsbursky57c8b13e2012-07-03 16:46:41 +0400603 rqstp->rq_server = NULL;
Stanislav Kinsbursky786185b2012-05-04 12:49:41 +0400604
Linus Torvalds1da177e2005-04-16 15:20:36 -0700605 /* Release the thread */
606 svc_exit_thread(rqstp);
607
Stanislav Kinsbursky57c8b13e2012-07-03 16:46:41 +0400608 nfsd_destroy(&init_net);
609
Linus Torvalds1da177e2005-04-16 15:20:36 -0700610 /* Release module */
Neil Brownbedbdd82008-06-10 08:40:35 -0400611 mutex_unlock(&nfsd_mutex);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700612 module_put_and_exit(0);
Jeff Layton9867d762008-06-10 08:40:38 -0400613 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700614}
615
Andy Adamson32c1eb02007-07-17 04:04:48 -0700616static __be32 map_new_errors(u32 vers, __be32 nfserr)
617{
618 if (nfserr == nfserr_jukebox && vers == 2)
619 return nfserr_dropit;
620 if (nfserr == nfserr_wrongsec && vers < 4)
621 return nfserr_acces;
622 return nfserr;
623}
624
Linus Torvalds1da177e2005-04-16 15:20:36 -0700625int
Al Viroc7afef12006-10-19 23:29:02 -0700626nfsd_dispatch(struct svc_rqst *rqstp, __be32 *statp)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700627{
628 struct svc_procedure *proc;
629 kxdrproc_t xdr;
Al Viroad451d32006-10-19 23:28:55 -0700630 __be32 nfserr;
631 __be32 *nfserrp;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700632
633 dprintk("nfsd_dispatch: vers %d proc %d\n",
634 rqstp->rq_vers, rqstp->rq_proc);
635 proc = rqstp->rq_procinfo;
636
J. Bruce Fields10910062011-01-24 12:11:02 -0500637 /*
638 * Give the xdr decoder a chance to change this if it wants
639 * (necessary in the NFSv4.0 compound case)
640 */
641 rqstp->rq_cachetype = proc->pc_cachetype;
642 /* Decode arguments */
643 xdr = proc->pc_decode;
644 if (xdr && !xdr(rqstp, (__be32*)rqstp->rq_arg.head[0].iov_base,
645 rqstp->rq_argp)) {
646 dprintk("nfsd: failed to decode arguments!\n");
647 *statp = rpc_garbage_args;
648 return 1;
649 }
650
Linus Torvalds1da177e2005-04-16 15:20:36 -0700651 /* Check whether we have this call in the cache. */
J. Bruce Fields10910062011-01-24 12:11:02 -0500652 switch (nfsd_cache_lookup(rqstp)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700653 case RC_INTR:
654 case RC_DROPIT:
655 return 0;
656 case RC_REPLY:
657 return 1;
658 case RC_DOIT:;
659 /* do it */
660 }
661
Linus Torvalds1da177e2005-04-16 15:20:36 -0700662 /* need to grab the location to store the status, as
663 * nfsv4 does some encoding while processing
664 */
665 nfserrp = rqstp->rq_res.head[0].iov_base
666 + rqstp->rq_res.head[0].iov_len;
Al Viroad451d32006-10-19 23:28:55 -0700667 rqstp->rq_res.head[0].iov_len += sizeof(__be32);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700668
669 /* Now call the procedure handler, and encode NFS status. */
670 nfserr = proc->pc_func(rqstp, rqstp->rq_argp, rqstp->rq_resp);
Andy Adamson32c1eb02007-07-17 04:04:48 -0700671 nfserr = map_new_errors(rqstp->rq_vers, nfserr);
J. Bruce Fields9e701c62011-01-02 21:56:36 -0500672 if (nfserr == nfserr_dropit || rqstp->rq_dropme) {
J. Bruce Fields45457e02007-06-22 17:26:32 -0400673 dprintk("nfsd: Dropping request; may be revisited later\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700674 nfsd_cache_update(rqstp, RC_NOCACHE, NULL);
675 return 0;
676 }
677
678 if (rqstp->rq_proc != 0)
679 *nfserrp++ = nfserr;
680
681 /* Encode result.
682 * For NFSv2, additional info is never returned in case of an error.
683 */
684 if (!(nfserr && rqstp->rq_vers == 2)) {
685 xdr = proc->pc_encode;
686 if (xdr && !xdr(rqstp, nfserrp,
687 rqstp->rq_resp)) {
688 /* Failed to encode result. Release cache entry */
689 dprintk("nfsd: failed to encode result!\n");
690 nfsd_cache_update(rqstp, RC_NOCACHE, NULL);
691 *statp = rpc_system_err;
692 return 1;
693 }
694 }
695
696 /* Store reply in cache. */
J. Bruce Fields57d276d2012-11-16 15:22:43 -0500697 nfsd_cache_update(rqstp, rqstp->rq_cachetype, statp + 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700698 return 1;
699}
Greg Banks03cf6c92009-01-13 21:26:36 +1100700
701int nfsd_pool_stats_open(struct inode *inode, struct file *file)
702{
Ryusei Yamaguchied2d8ae2009-08-16 00:54:41 +0900703 int ret;
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300704 struct net *net = &init_net;
705 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
706
Ryusei Yamaguchied2d8ae2009-08-16 00:54:41 +0900707 mutex_lock(&nfsd_mutex);
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300708 if (nn->nfsd_serv == NULL) {
Ryusei Yamaguchied2d8ae2009-08-16 00:54:41 +0900709 mutex_unlock(&nfsd_mutex);
Greg Banks03cf6c92009-01-13 21:26:36 +1100710 return -ENODEV;
Ryusei Yamaguchied2d8ae2009-08-16 00:54:41 +0900711 }
712 /* bump up the psudo refcount while traversing */
Stanislav Kinsbursky9dd98452012-12-06 14:23:24 +0300713 svc_get(nn->nfsd_serv);
714 ret = svc_pool_stats_open(nn->nfsd_serv, file);
Ryusei Yamaguchied2d8ae2009-08-16 00:54:41 +0900715 mutex_unlock(&nfsd_mutex);
716 return ret;
717}
718
719int nfsd_pool_stats_release(struct inode *inode, struct file *file)
720{
721 int ret = seq_release(inode, file);
Stanislav Kinsbursky786185b2012-05-04 12:49:41 +0400722 struct net *net = &init_net;
723
Ryusei Yamaguchied2d8ae2009-08-16 00:54:41 +0900724 mutex_lock(&nfsd_mutex);
725 /* this function really, really should have been called svc_put() */
Stanislav Kinsbursky19f7e2c2012-07-03 16:46:41 +0400726 nfsd_destroy(net);
Ryusei Yamaguchied2d8ae2009-08-16 00:54:41 +0900727 mutex_unlock(&nfsd_mutex);
728 return ret;
Greg Banks03cf6c92009-01-13 21:26:36 +1100729}