Merge tag 'libnvdimm-fixes-4.20-rc3' of git://git.kernel.org/pub/scm/linux/kernel...
[linux-2.6-block.git] / fs / nfsd / nfssvc.c
CommitLineData
b2441318 1// SPDX-License-Identifier: GPL-2.0
1da177e4 2/*
1da177e4
LT
3 * Central processing for nfsd.
4 *
5 * Authors: Olaf Kirch (okir@monad.swb.de)
6 *
7 * Copyright (C) 1995, 1996, 1997 Olaf Kirch <okir@monad.swb.de>
8 */
9
3f07c014 10#include <linux/sched/signal.h>
83144186 11#include <linux/freezer.h>
143cb494 12#include <linux/module.h>
1da177e4 13#include <linux/fs_struct.h>
c3d06f9c 14#include <linux/swap.h>
1da177e4 15
1da177e4 16#include <linux/sunrpc/stats.h>
1da177e4 17#include <linux/sunrpc/svcsock.h>
36684996 18#include <linux/sunrpc/svc_xprt.h>
1da177e4 19#include <linux/lockd/bind.h>
a257cdd0 20#include <linux/nfsacl.h>
ed2d8aed 21#include <linux/seq_file.h>
36684996
SM
22#include <linux/inetdevice.h>
23#include <net/addrconf.h>
24#include <net/ipv6.h>
fc5d00b0 25#include <net/net_namespace.h>
9a74af21
BH
26#include "nfsd.h"
27#include "cache.h"
0a3adade 28#include "vfs.h"
2c2fe290 29#include "netns.h"
1da177e4
LT
30
31#define NFSDDBG_FACILITY NFSDDBG_SVC
32
1da177e4 33extern struct svc_program nfsd_program;
9867d76c 34static int nfsd(void *vrqstp);
1da177e4 35
/*
 * nfsd_mutex protects nn->nfsd_serv -- both the pointer itself and the members
 * of the svc_serv struct. In particular, ->sv_nrthreads but also to some
 * extent ->sv_temp_socks and ->sv_permsocks. It also protects nfsdstats.th_cnt
 *
 * If (outside the lock) nn->nfsd_serv is non-NULL, then it must point to a
 * properly initialised 'struct svc_serv' with ->sv_nrthreads > 0. That number
 * of nfsd threads must exist and each must be listed in ->sp_all_threads in
 * each entry of ->sv_pools[].
 *
 * Transitions of the thread count between zero and non-zero are of particular
 * interest since the svc_serv needs to be created and initialized at that
 * point, or freed.
 *
 * Finally, the nfsd_mutex also protects some of the global variables that are
 * accessed when nfsd starts and that are settable via the write_* routines in
 * nfsctl.c. In particular:
 *
 *	user_recovery_dirname
 *	user_lease_time
 *	nfsd_versions
 */
DEFINE_MUTEX(nfsd_mutex);
bedbdd8b 59
4bd9b0f4
AA
60/*
61 * nfsd_drc_lock protects nfsd_drc_max_pages and nfsd_drc_pages_used.
62 * nfsd_drc_max_pages limits the total amount of memory available for
63 * version 4.1 DRC caches.
64 * nfsd_drc_pages_used tracks the current version 4.1 DRC memory usage.
65 */
66spinlock_t nfsd_drc_lock;
697ce9be
ZY
67unsigned long nfsd_drc_max_mem;
68unsigned long nfsd_drc_mem_used;
4bd9b0f4 69
#if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
/* Forward declaration: the program and its stats point at each other. */
static struct svc_stat	nfsd_acl_svcstats;

/* NFSACL versions built into this file, indexed by version number. */
static const struct svc_version *nfsd_acl_version[] = {
	[2] = &nfsd_acl_version2,
	[3] = &nfsd_acl_version3,
};

#define NFSD_ACL_MINVERS	2
#define NFSD_ACL_NRVERS		ARRAY_SIZE(nfsd_acl_version)

/* NFSACL versions currently enabled; filled in and cleared by nfsd_vers(). */
static const struct svc_version *nfsd_acl_versions[NFSD_ACL_NRVERS];

static struct svc_program	nfsd_acl_program = {
	.pg_prog		= NFS_ACL_PROGRAM,
	.pg_nvers		= NFSD_ACL_NRVERS,
	.pg_vers		= nfsd_acl_versions,
	.pg_name		= "nfsacl",
	.pg_class		= "nfsd",
	.pg_stats		= &nfsd_acl_svcstats,
	.pg_authenticate	= &svc_set_client,
};

static struct svc_stat	nfsd_acl_svcstats = {
	.program	= &nfsd_acl_program,
};
#endif /* defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL) */
95
e9679189 96static const struct svc_version *nfsd_version[] = {
70c3b76c
N
97 [2] = &nfsd_version2,
98#if defined(CONFIG_NFSD_V3)
99 [3] = &nfsd_version3,
100#endif
101#if defined(CONFIG_NFSD_V4)
102 [4] = &nfsd_version4,
103#endif
104};
105
106#define NFSD_MINVERS 2
e8c96f8c 107#define NFSD_NRVERS ARRAY_SIZE(nfsd_version)
e9679189 108static const struct svc_version *nfsd_versions[NFSD_NRVERS];
70c3b76c
N
109
110struct svc_program nfsd_program = {
3fb803a9
AG
111#if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
112 .pg_next = &nfsd_acl_program,
113#endif
70c3b76c
N
114 .pg_prog = NFS_PROGRAM, /* program number */
115 .pg_nvers = NFSD_NRVERS, /* nr of entries in nfsd_version */
116 .pg_vers = nfsd_versions, /* version table */
117 .pg_name = "nfsd", /* program name */
118 .pg_class = "nfsd", /* authentication class */
119 .pg_stats = &nfsd_svcstats, /* version table */
120 .pg_authenticate = &svc_set_client, /* export authentication */
121
122};
123
35f7a14f
BF
124static bool nfsd_supported_minorversions[NFSD_SUPPORTED_MINOR_VERSION + 1] = {
125 [0] = 1,
126 [1] = 1,
c23ae601 127 [2] = 1,
35f7a14f 128};
8daf220a 129
6658d3a7
N
130int nfsd_vers(int vers, enum vers_op change)
131{
132 if (vers < NFSD_MINVERS || vers >= NFSD_NRVERS)
15ddb4ae 133 return 0;
6658d3a7
N
134 switch(change) {
135 case NFSD_SET:
136 nfsd_versions[vers] = nfsd_version[vers];
6658d3a7
N
137#if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
138 if (vers < NFSD_ACL_NRVERS)
1a8eff6d 139 nfsd_acl_versions[vers] = nfsd_acl_version[vers];
6658d3a7 140#endif
1a8eff6d 141 break;
6658d3a7
N
142 case NFSD_CLEAR:
143 nfsd_versions[vers] = NULL;
144#if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
145 if (vers < NFSD_ACL_NRVERS)
1a8eff6d 146 nfsd_acl_versions[vers] = NULL;
6658d3a7
N
147#endif
148 break;
149 case NFSD_TEST:
150 return nfsd_versions[vers] != NULL;
151 case NFSD_AVAIL:
152 return nfsd_version[vers] != NULL;
153 }
154 return 0;
155}
8daf220a 156
d3635ff0
TM
157static void
158nfsd_adjust_nfsd_versions4(void)
159{
160 unsigned i;
161
162 for (i = 0; i <= NFSD_SUPPORTED_MINOR_VERSION; i++) {
163 if (nfsd_supported_minorversions[i])
164 return;
165 }
166 nfsd_vers(4, NFSD_CLEAR);
167}
168
8daf220a
BH
169int nfsd_minorversion(u32 minorversion, enum vers_op change)
170{
928c6fb3
N
171 if (minorversion > NFSD_SUPPORTED_MINOR_VERSION &&
172 change != NFSD_AVAIL)
8daf220a
BH
173 return -1;
174 switch(change) {
175 case NFSD_SET:
35f7a14f 176 nfsd_supported_minorversions[minorversion] = true;
d3635ff0 177 nfsd_vers(4, NFSD_SET);
8daf220a
BH
178 break;
179 case NFSD_CLEAR:
35f7a14f 180 nfsd_supported_minorversions[minorversion] = false;
d3635ff0 181 nfsd_adjust_nfsd_versions4();
8daf220a
BH
182 break;
183 case NFSD_TEST:
35f7a14f 184 return nfsd_supported_minorversions[minorversion];
8daf220a
BH
185 case NFSD_AVAIL:
186 return minorversion <= NFSD_SUPPORTED_MINOR_VERSION;
187 }
188 return 0;
189}
190
1da177e4
LT
191/*
192 * Maximum number of nfsd processes
193 */
194#define NFSD_MAXSERVS 8192
195
9dd9845f 196int nfsd_nrthreads(struct net *net)
1da177e4 197{
c7d106c9 198 int rv = 0;
9dd9845f
SK
199 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
200
c7d106c9 201 mutex_lock(&nfsd_mutex);
9dd9845f
SK
202 if (nn->nfsd_serv)
203 rv = nn->nfsd_serv->sv_nrthreads;
c7d106c9
NB
204 mutex_unlock(&nfsd_mutex);
205 return rv;
1da177e4
LT
206}
207
db6e182c 208static int nfsd_init_socks(struct net *net)
59db4a0c
BF
209{
210 int error;
9dd9845f
SK
211 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
212
213 if (!list_empty(&nn->nfsd_serv->sv_permsocks))
59db4a0c
BF
214 return 0;
215
9dd9845f 216 error = svc_create_xprt(nn->nfsd_serv, "udp", net, PF_INET, NFS_PORT,
59db4a0c
BF
217 SVC_SOCK_DEFAULTS);
218 if (error < 0)
219 return error;
220
9dd9845f 221 error = svc_create_xprt(nn->nfsd_serv, "tcp", net, PF_INET, NFS_PORT,
59db4a0c
BF
222 SVC_SOCK_DEFAULTS);
223 if (error < 0)
224 return error;
225
226 return 0;
227}
228
4539f149 229static int nfsd_users = 0;
4ad9a344 230
bda9cac1
SK
231static int nfsd_startup_generic(int nrservs)
232{
233 int ret;
234
4539f149 235 if (nfsd_users++)
bda9cac1
SK
236 return 0;
237
238 /*
239 * Readahead param cache - will no-op if it already exists.
240 * (Note therefore results will be suboptimal if number of
241 * threads is modified after nfsd start.)
242 */
243 ret = nfsd_racache_init(2*nrservs);
244 if (ret)
d9499a95
KM
245 goto dec_users;
246
bda9cac1
SK
247 ret = nfs4_state_start();
248 if (ret)
249 goto out_racache;
250 return 0;
251
252out_racache:
253 nfsd_racache_shutdown();
d9499a95
KM
254dec_users:
255 nfsd_users--;
bda9cac1
SK
256 return ret;
257}
258
259static void nfsd_shutdown_generic(void)
260{
4539f149
SK
261 if (--nfsd_users)
262 return;
263
bda9cac1
SK
264 nfs4_state_shutdown();
265 nfsd_racache_shutdown();
266}
267
8ef66714
KM
268static bool nfsd_needs_lockd(void)
269{
ff88825f 270#if defined(CONFIG_NFSD_V3)
8ef66714 271 return (nfsd_versions[2] != NULL) || (nfsd_versions[3] != NULL);
ff88825f
KM
272#else
273 return (nfsd_versions[2] != NULL);
274#endif
8ef66714
KM
275}
276
903d9bf0 277static int nfsd_startup_net(int nrservs, struct net *net)
6ff50b3d 278{
2c2fe290 279 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
6ff50b3d
SK
280 int ret;
281
2c2fe290
SK
282 if (nn->nfsd_net_up)
283 return 0;
284
903d9bf0 285 ret = nfsd_startup_generic(nrservs);
6ff50b3d
SK
286 if (ret)
287 return ret;
903d9bf0
SK
288 ret = nfsd_init_socks(net);
289 if (ret)
290 goto out_socks;
8ef66714
KM
291
292 if (nfsd_needs_lockd() && !nn->lockd_up) {
293 ret = lockd_up(net);
294 if (ret)
295 goto out_socks;
296 nn->lockd_up = 1;
297 }
298
6ff50b3d
SK
299 ret = nfs4_state_start_net(net);
300 if (ret)
301 goto out_lockd;
302
2c2fe290 303 nn->nfsd_net_up = true;
6ff50b3d
SK
304 return 0;
305
306out_lockd:
8ef66714
KM
307 if (nn->lockd_up) {
308 lockd_down(net);
309 nn->lockd_up = 0;
310 }
903d9bf0 311out_socks:
bda9cac1 312 nfsd_shutdown_generic();
4ad9a344
JL
313 return ret;
314}
315
6ff50b3d
SK
316static void nfsd_shutdown_net(struct net *net)
317{
2c2fe290
SK
318 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
319
6ff50b3d 320 nfs4_state_shutdown_net(net);
8ef66714
KM
321 if (nn->lockd_up) {
322 lockd_down(net);
323 nn->lockd_up = 0;
324 }
2c2fe290 325 nn->nfsd_net_up = false;
903d9bf0 326 nfsd_shutdown_generic();
6ff50b3d
SK
327}
328
36684996
SM
329static int nfsd_inetaddr_event(struct notifier_block *this, unsigned long event,
330 void *ptr)
331{
332 struct in_ifaddr *ifa = (struct in_ifaddr *)ptr;
333 struct net_device *dev = ifa->ifa_dev->dev;
334 struct net *net = dev_net(dev);
335 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
336 struct sockaddr_in sin;
337
2317dc55
VA
338 if ((event != NETDEV_DOWN) ||
339 !atomic_inc_not_zero(&nn->ntf_refcnt))
36684996
SM
340 goto out;
341
342 if (nn->nfsd_serv) {
343 dprintk("nfsd_inetaddr_event: removed %pI4\n", &ifa->ifa_local);
344 sin.sin_family = AF_INET;
345 sin.sin_addr.s_addr = ifa->ifa_local;
346 svc_age_temp_xprts_now(nn->nfsd_serv, (struct sockaddr *)&sin);
347 }
2317dc55
VA
348 atomic_dec(&nn->ntf_refcnt);
349 wake_up(&nn->ntf_wq);
36684996
SM
350
351out:
352 return NOTIFY_DONE;
353}
354
355static struct notifier_block nfsd_inetaddr_notifier = {
356 .notifier_call = nfsd_inetaddr_event,
357};
358
359#if IS_ENABLED(CONFIG_IPV6)
360static int nfsd_inet6addr_event(struct notifier_block *this,
361 unsigned long event, void *ptr)
362{
363 struct inet6_ifaddr *ifa = (struct inet6_ifaddr *)ptr;
364 struct net_device *dev = ifa->idev->dev;
365 struct net *net = dev_net(dev);
366 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
367 struct sockaddr_in6 sin6;
368
2317dc55
VA
369 if ((event != NETDEV_DOWN) ||
370 !atomic_inc_not_zero(&nn->ntf_refcnt))
36684996
SM
371 goto out;
372
373 if (nn->nfsd_serv) {
374 dprintk("nfsd_inet6addr_event: removed %pI6\n", &ifa->addr);
375 sin6.sin6_family = AF_INET6;
376 sin6.sin6_addr = ifa->addr;
7b19824d
SM
377 if (ipv6_addr_type(&sin6.sin6_addr) & IPV6_ADDR_LINKLOCAL)
378 sin6.sin6_scope_id = ifa->idev->dev->ifindex;
36684996
SM
379 svc_age_temp_xprts_now(nn->nfsd_serv, (struct sockaddr *)&sin6);
380 }
2317dc55
VA
381 atomic_dec(&nn->ntf_refcnt);
382 wake_up(&nn->ntf_wq);
36684996
SM
383out:
384 return NOTIFY_DONE;
385}
386
387static struct notifier_block nfsd_inet6addr_notifier = {
388 .notifier_call = nfsd_inet6addr_event,
389};
390#endif
391
1eca45f8
VA
392/* Only used under nfsd_mutex, so this atomic may be overkill: */
393static atomic_t nfsd_notifier_refcount = ATOMIC_INIT(0);
394
541e864f 395static void nfsd_last_thread(struct svc_serv *serv, struct net *net)
4ad9a344 396{
903d9bf0
SK
397 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
398
2317dc55 399 atomic_dec(&nn->ntf_refcnt);
1eca45f8
VA
400 /* check if the notifier still has clients */
401 if (atomic_dec_return(&nfsd_notifier_refcount) == 0) {
402 unregister_inetaddr_notifier(&nfsd_inetaddr_notifier);
36684996 403#if IS_ENABLED(CONFIG_IPV6)
1eca45f8 404 unregister_inet6addr_notifier(&nfsd_inet6addr_notifier);
36684996 405#endif
1eca45f8 406 }
2317dc55 407 wait_event(nn->ntf_wq, atomic_read(&nn->ntf_refcnt) == 0);
1eca45f8 408
4ad9a344
JL
409 /*
410 * write_ports can create the server without actually starting
411 * any threads--if we get shut down before any threads are
412 * started, then nfsd_last_thread will be run before any of this
691412b4 413 * other initialization has been done except the rpcb information.
4ad9a344 414 */
691412b4 415 svc_rpcb_cleanup(serv, net);
903d9bf0 416 if (!nn->nfsd_net_up)
4ad9a344 417 return;
16d05870 418
691412b4 419 nfsd_shutdown_net(net);
e096bbc6
JL
420 printk(KERN_WARNING "nfsd: last server has exited, flushing export "
421 "cache\n");
b3853e0e 422 nfsd_export_flush(net);
bc591ccf 423}
6658d3a7
N
424
425void nfsd_reset_versions(void)
426{
6658d3a7
N
427 int i;
428
800a938f
N
429 for (i = 0; i < NFSD_NRVERS; i++)
430 if (nfsd_vers(i, NFSD_TEST))
431 return;
6658d3a7 432
800a938f
N
433 for (i = 0; i < NFSD_NRVERS; i++)
434 if (i != 4)
435 nfsd_vers(i, NFSD_SET);
436 else {
437 int minor = 0;
438 while (nfsd_minorversion(minor, NFSD_SET) >= 0)
439 minor++;
440 }
6658d3a7
N
441}
442
c3d06f9c
AA
443/*
444 * Each session guarantees a negotiated per slot memory cache for replies
445 * which in turn consumes memory beyond the v2/v3/v4.0 server. A dedicated
446 * NFSv4.1 server might want to use more memory for a DRC than a machine
447 * with mutiple services.
448 *
449 * Impose a hard limit on the number of pages for the DRC which varies
450 * according to the machines free pages. This is of course only a default.
451 *
452 * For now this is a #defined shift which could be under admin control
453 * in the future.
454 */
455static void set_max_drc(void)
456{
44d8660d 457 #define NFSD_DRC_SIZE_SHIFT 7
0c193054
AA
458 nfsd_drc_max_mem = (nr_free_buffer_pages()
459 >> NFSD_DRC_SIZE_SHIFT) * PAGE_SIZE;
460 nfsd_drc_mem_used = 0;
4bd9b0f4 461 spin_lock_init(&nfsd_drc_lock);
697ce9be 462 dprintk("%s nfsd_drc_max_mem %lu \n", __func__, nfsd_drc_max_mem);
c3d06f9c 463}
bedbdd8b 464
87b0fc7d 465static int nfsd_get_default_max_blksize(void)
02a375f0 466{
87b0fc7d
BF
467 struct sysinfo i;
468 unsigned long long target;
469 unsigned long ret;
bedbdd8b 470
87b0fc7d 471 si_meminfo(&i);
508f9227 472 target = (i.totalram - i.totalhigh) << PAGE_SHIFT;
87b0fc7d
BF
473 /*
474 * Aim for 1/4096 of memory per thread This gives 1MB on 4Gig
475 * machines, but only uses 32K on 128M machines. Bottom out at
476 * 8K on 32M and smaller. Of course, this is only a default.
477 */
478 target >>= 12;
479
480 ret = NFSSVC_MAXBLKSIZE;
481 while (ret > target && ret >= 8*1024*2)
482 ret /= 2;
483 return ret;
484}
485
afea5657 486static const struct svc_serv_ops nfsd_thread_sv_ops = {
b9e13cdf
JL
487 .svo_shutdown = nfsd_last_thread,
488 .svo_function = nfsd,
489 .svo_enqueue_xprt = svc_xprt_do_enqueue,
598e2359 490 .svo_setup = svc_set_num_threads,
b9e13cdf 491 .svo_module = THIS_MODULE,
ea126e74
JL
492};
493
6777436b 494int nfsd_create_serv(struct net *net)
87b0fc7d 495{
9793f7c8 496 int error;
b9c0ef85 497 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
9793f7c8 498
bedbdd8b 499 WARN_ON(!mutex_is_locked(&nfsd_mutex));
9dd9845f
SK
500 if (nn->nfsd_serv) {
501 svc_get(nn->nfsd_serv);
02a375f0
N
502 return 0;
503 }
87b0fc7d
BF
504 if (nfsd_max_blksize == 0)
505 nfsd_max_blksize = nfsd_get_default_max_blksize();
e844a7b9 506 nfsd_reset_versions();
9dd9845f 507 nn->nfsd_serv = svc_create_pooled(&nfsd_program, nfsd_max_blksize,
b9e13cdf 508 &nfsd_thread_sv_ops);
9dd9845f 509 if (nn->nfsd_serv == NULL)
628b3687 510 return -ENOMEM;
bedbdd8b 511
5b8db00b 512 nn->nfsd_serv->sv_maxconn = nn->max_connections;
9dd9845f 513 error = svc_bind(nn->nfsd_serv, net);
9793f7c8 514 if (error < 0) {
9dd9845f 515 svc_destroy(nn->nfsd_serv);
9793f7c8
SK
516 return error;
517 }
518
628b3687 519 set_max_drc();
1eca45f8
VA
520 /* check if the notifier is already set */
521 if (atomic_inc_return(&nfsd_notifier_refcount) == 1) {
522 register_inetaddr_notifier(&nfsd_inetaddr_notifier);
36684996 523#if IS_ENABLED(CONFIG_IPV6)
1eca45f8 524 register_inet6addr_notifier(&nfsd_inet6addr_notifier);
36684996 525#endif
1eca45f8 526 }
2317dc55 527 atomic_inc(&nn->ntf_refcnt);
256a89fa 528 ktime_get_real_ts64(&nn->nfssvc_boot); /* record boot time */
87b0fc7d 529 return 0;
02a375f0
N
530}
531
9dd9845f 532int nfsd_nrpools(struct net *net)
eed2965a 533{
9dd9845f
SK
534 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
535
536 if (nn->nfsd_serv == NULL)
eed2965a
GB
537 return 0;
538 else
9dd9845f 539 return nn->nfsd_serv->sv_nrpools;
eed2965a
GB
540}
541
9dd9845f 542int nfsd_get_nrthreads(int n, int *nthreads, struct net *net)
eed2965a
GB
543{
544 int i = 0;
9dd9845f 545 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
eed2965a 546
9dd9845f
SK
547 if (nn->nfsd_serv != NULL) {
548 for (i = 0; i < nn->nfsd_serv->sv_nrpools && i < n; i++)
549 nthreads[i] = nn->nfsd_serv->sv_pools[i].sp_nrthreads;
eed2965a
GB
550 }
551
552 return 0;
553}
554
9dd9845f
SK
555void nfsd_destroy(struct net *net)
556{
557 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
558 int destroy = (nn->nfsd_serv->sv_nrthreads == 1);
559
560 if (destroy)
561 svc_shutdown_net(nn->nfsd_serv, net);
562 svc_destroy(nn->nfsd_serv);
563 if (destroy)
564 nn->nfsd_serv = NULL;
565}
566
3938a0d5 567int nfsd_set_nrthreads(int n, int *nthreads, struct net *net)
eed2965a
GB
568{
569 int i = 0;
570 int tot = 0;
571 int err = 0;
9dd9845f 572 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
eed2965a 573
bedbdd8b
NB
574 WARN_ON(!mutex_is_locked(&nfsd_mutex));
575
9dd9845f 576 if (nn->nfsd_serv == NULL || n <= 0)
eed2965a
GB
577 return 0;
578
9dd9845f
SK
579 if (n > nn->nfsd_serv->sv_nrpools)
580 n = nn->nfsd_serv->sv_nrpools;
eed2965a
GB
581
582 /* enforce a global maximum number of threads */
583 tot = 0;
584 for (i = 0; i < n; i++) {
3c7aa15d 585 nthreads[i] = min(nthreads[i], NFSD_MAXSERVS);
eed2965a
GB
586 tot += nthreads[i];
587 }
588 if (tot > NFSD_MAXSERVS) {
589 /* total too large: scale down requested numbers */
590 for (i = 0; i < n && tot > 0; i++) {
591 int new = nthreads[i] * NFSD_MAXSERVS / tot;
592 tot -= (nthreads[i] - new);
593 nthreads[i] = new;
594 }
595 for (i = 0; i < n && tot > 0; i++) {
596 nthreads[i]--;
597 tot--;
598 }
599 }
600
601 /*
602 * There must always be a thread in pool 0; the admin
603 * can't shut down NFS completely using pool_threads.
604 */
605 if (nthreads[0] == 0)
606 nthreads[0] = 1;
607
608 /* apply the new numbers */
9dd9845f 609 svc_get(nn->nfsd_serv);
eed2965a 610 for (i = 0; i < n; i++) {
598e2359
JL
611 err = nn->nfsd_serv->sv_ops->svo_setup(nn->nfsd_serv,
612 &nn->nfsd_serv->sv_pools[i], nthreads[i]);
eed2965a
GB
613 if (err)
614 break;
615 }
19f7e2ca 616 nfsd_destroy(net);
eed2965a
GB
617 return err;
618}
619
ac77efbe
JL
620/*
621 * Adjust the number of threads and return the new number of threads.
622 * This is also the function that starts the server if necessary, if
623 * this is the first time nrservs is nonzero.
624 */
1da177e4 625int
d41a9417 626nfsd_svc(int nrservs, struct net *net)
1da177e4
LT
627{
628 int error;
774f8bbd 629 bool nfsd_up_before;
9dd9845f 630 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
bedbdd8b
NB
631
632 mutex_lock(&nfsd_mutex);
6658d3a7 633 dprintk("nfsd: creating service\n");
3c7aa15d
KM
634
635 nrservs = max(nrservs, 0);
636 nrservs = min(nrservs, NFSD_MAXSERVS);
671e1fcf 637 error = 0;
3c7aa15d 638
9dd9845f 639 if (nrservs == 0 && nn->nfsd_serv == NULL)
671e1fcf
N
640 goto out;
641
6777436b 642 error = nfsd_create_serv(net);
02a375f0 643 if (error)
774f8bbd
BF
644 goto out;
645
903d9bf0 646 nfsd_up_before = nn->nfsd_net_up;
774f8bbd 647
903d9bf0 648 error = nfsd_startup_net(nrservs, net);
af4718f3
BF
649 if (error)
650 goto out_destroy;
598e2359
JL
651 error = nn->nfsd_serv->sv_ops->svo_setup(nn->nfsd_serv,
652 NULL, nrservs);
774f8bbd
BF
653 if (error)
654 goto out_shutdown;
9dd9845f 655 /* We are holding a reference to nn->nfsd_serv which
af4718f3
BF
656 * we don't want to count in the return value,
657 * so subtract 1
658 */
9dd9845f 659 error = nn->nfsd_serv->sv_nrthreads - 1;
4ad9a344 660out_shutdown:
774f8bbd 661 if (error < 0 && !nfsd_up_before)
541e864f 662 nfsd_shutdown_net(net);
774f8bbd 663out_destroy:
19f7e2ca 664 nfsd_destroy(net); /* Release server */
4ad9a344 665out:
bedbdd8b 666 mutex_unlock(&nfsd_mutex);
1da177e4
LT
667 return error;
668}
669
1da177e4
LT
670
671/*
672 * This is the NFS server kernel thread
673 */
9867d76c
JL
674static int
675nfsd(void *vrqstp)
1da177e4 676{
9867d76c 677 struct svc_rqst *rqstp = (struct svc_rqst *) vrqstp;
88c47666
SK
678 struct svc_xprt *perm_sock = list_entry(rqstp->rq_server->sv_permsocks.next, typeof(struct svc_xprt), xpt_list);
679 struct net *net = perm_sock->xpt_net;
5b8db00b 680 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
5b444cc9 681 int err;
1da177e4
LT
682
683 /* Lock module and set up kernel thread */
bedbdd8b 684 mutex_lock(&nfsd_mutex);
1da177e4 685
9867d76c 686 /* At this point, the thread shares current->fs
47057abd
AG
687 * with the init process. We need to create files with the
688 * umask as defined by the client instead of init's umask. */
3e93cd67 689 if (unshare_fs_struct() < 0) {
1da177e4
LT
690 printk("Unable to start nfsd thread: out of memory\n");
691 goto out;
692 }
3e93cd67 693
1da177e4
LT
694 current->fs->umask = 0;
695
9867d76c
JL
696 /*
697 * thread is spawned with all signals set to SIG_IGN, re-enable
100766f8 698 * the ones that will bring down the thread
9867d76c 699 */
100766f8
JL
700 allow_signal(SIGKILL);
701 allow_signal(SIGHUP);
702 allow_signal(SIGINT);
703 allow_signal(SIGQUIT);
bedbdd8b 704
1da177e4 705 nfsdstats.th_cnt++;
bedbdd8b
NB
706 mutex_unlock(&nfsd_mutex);
707
83144186 708 set_freezable();
1da177e4
LT
709
710 /*
711 * The main request loop
712 */
713 for (;;) {
5b8db00b
JL
714 /* Update sv_maxconn if it has changed */
715 rqstp->rq_server->sv_maxconn = nn->max_connections;
716
1da177e4
LT
717 /*
718 * Find a socket with data available and call its
719 * recvfrom routine.
720 */
6fb2b47f 721 while ((err = svc_recv(rqstp, 60*60*HZ)) == -EAGAIN)
1da177e4 722 ;
9867d76c 723 if (err == -EINTR)
1da177e4 724 break;
e0e81739 725 validate_process_creds();
6fb2b47f 726 svc_process(rqstp);
e0e81739 727 validate_process_creds();
1da177e4
LT
728 }
729
24e36663 730 /* Clear signals before calling svc_exit_thread() */
9e416052 731 flush_signals(current);
1da177e4 732
bedbdd8b 733 mutex_lock(&nfsd_mutex);
1da177e4
LT
734 nfsdstats.th_cnt --;
735
736out:
57c8b13e 737 rqstp->rq_server = NULL;
786185b5 738
1da177e4
LT
739 /* Release the thread */
740 svc_exit_thread(rqstp);
741
88c47666 742 nfsd_destroy(net);
57c8b13e 743
1da177e4 744 /* Release module */
bedbdd8b 745 mutex_unlock(&nfsd_mutex);
1da177e4 746 module_put_and_exit(0);
9867d76c 747 return 0;
1da177e4
LT
748}
749
32c1eb0c
AA
750static __be32 map_new_errors(u32 vers, __be32 nfserr)
751{
752 if (nfserr == nfserr_jukebox && vers == 2)
753 return nfserr_dropit;
754 if (nfserr == nfserr_wrongsec && vers < 4)
755 return nfserr_acces;
756 return nfserr;
757}
758
e6838a29
BF
759/*
760 * A write procedure can have a large argument, and a read procedure can
761 * have a large reply, but no NFSv2 or NFSv3 procedure has argument and
762 * reply that can both be larger than a page. The xdr code has taken
763 * advantage of this assumption to be a sloppy about bounds checking in
764 * some cases. Pending a rewrite of the NFSv2/v3 xdr code to fix that
765 * problem, we enforce these assumptions here:
766 */
767static bool nfs_request_too_big(struct svc_rqst *rqstp,
860bda29 768 const struct svc_procedure *proc)
e6838a29
BF
769{
770 /*
771 * The ACL code has more careful bounds-checking and is not
772 * susceptible to this problem:
773 */
774 if (rqstp->rq_prog != NFS_PROGRAM)
775 return false;
776 /*
777 * Ditto NFSv4 (which can in theory have argument and reply both
778 * more than a page):
779 */
780 if (rqstp->rq_vers >= 4)
781 return false;
782 /* The reply will be small, we're OK: */
783 if (proc->pc_xdrressize > 0 &&
784 proc->pc_xdrressize < XDR_QUADLEN(PAGE_SIZE))
785 return false;
786
787 return rqstp->rq_arg.len > PAGE_SIZE;
788}
789
1da177e4 790int
c7afef1f 791nfsd_dispatch(struct svc_rqst *rqstp, __be32 *statp)
1da177e4 792{
860bda29 793 const struct svc_procedure *proc;
ad451d38
AV
794 __be32 nfserr;
795 __be32 *nfserrp;
1da177e4
LT
796
797 dprintk("nfsd_dispatch: vers %d proc %d\n",
798 rqstp->rq_vers, rqstp->rq_proc);
799 proc = rqstp->rq_procinfo;
800
e6838a29
BF
801 if (nfs_request_too_big(rqstp, proc)) {
802 dprintk("nfsd: NFSv%d argument too large\n", rqstp->rq_vers);
803 *statp = rpc_garbage_args;
804 return 1;
805 }
1091006c
BF
806 /*
807 * Give the xdr decoder a chance to change this if it wants
808 * (necessary in the NFSv4.0 compound case)
809 */
810 rqstp->rq_cachetype = proc->pc_cachetype;
811 /* Decode arguments */
026fec7e
CH
812 if (proc->pc_decode &&
813 !proc->pc_decode(rqstp, (__be32*)rqstp->rq_arg.head[0].iov_base)) {
1091006c
BF
814 dprintk("nfsd: failed to decode arguments!\n");
815 *statp = rpc_garbage_args;
816 return 1;
817 }
818
1da177e4 819 /* Check whether we have this call in the cache. */
1091006c 820 switch (nfsd_cache_lookup(rqstp)) {
1da177e4
LT
821 case RC_DROPIT:
822 return 0;
823 case RC_REPLY:
824 return 1;
825 case RC_DOIT:;
826 /* do it */
827 }
828
1da177e4
LT
829 /* need to grab the location to store the status, as
830 * nfsv4 does some encoding while processing
831 */
832 nfserrp = rqstp->rq_res.head[0].iov_base
833 + rqstp->rq_res.head[0].iov_len;
ad451d38 834 rqstp->rq_res.head[0].iov_len += sizeof(__be32);
1da177e4
LT
835
836 /* Now call the procedure handler, and encode NFS status. */
a6beb732 837 nfserr = proc->pc_func(rqstp);
32c1eb0c 838 nfserr = map_new_errors(rqstp->rq_vers, nfserr);
78b65eb3 839 if (nfserr == nfserr_dropit || test_bit(RQ_DROPME, &rqstp->rq_flags)) {
45457e09 840 dprintk("nfsd: Dropping request; may be revisited later\n");
1da177e4
LT
841 nfsd_cache_update(rqstp, RC_NOCACHE, NULL);
842 return 0;
843 }
844
845 if (rqstp->rq_proc != 0)
846 *nfserrp++ = nfserr;
847
848 /* Encode result.
849 * For NFSv2, additional info is never returned in case of an error.
850 */
851 if (!(nfserr && rqstp->rq_vers == 2)) {
63f8de37 852 if (proc->pc_encode && !proc->pc_encode(rqstp, nfserrp)) {
1da177e4
LT
853 /* Failed to encode result. Release cache entry */
854 dprintk("nfsd: failed to encode result!\n");
855 nfsd_cache_update(rqstp, RC_NOCACHE, NULL);
856 *statp = rpc_system_err;
857 return 1;
858 }
859 }
860
861 /* Store reply in cache. */
57d276d7 862 nfsd_cache_update(rqstp, rqstp->rq_cachetype, statp + 1);
1da177e4
LT
863 return 1;
864}
03cf6c9f
GB
865
866int nfsd_pool_stats_open(struct inode *inode, struct file *file)
867{
ed2d8aed 868 int ret;
11f77942 869 struct nfsd_net *nn = net_generic(inode->i_sb->s_fs_info, nfsd_net_id);
9dd9845f 870
ed2d8aed 871 mutex_lock(&nfsd_mutex);
9dd9845f 872 if (nn->nfsd_serv == NULL) {
ed2d8aed 873 mutex_unlock(&nfsd_mutex);
03cf6c9f 874 return -ENODEV;
ed2d8aed
RY
875 }
876 /* bump up the psudo refcount while traversing */
9dd9845f
SK
877 svc_get(nn->nfsd_serv);
878 ret = svc_pool_stats_open(nn->nfsd_serv, file);
ed2d8aed
RY
879 mutex_unlock(&nfsd_mutex);
880 return ret;
881}
882
883int nfsd_pool_stats_release(struct inode *inode, struct file *file)
884{
885 int ret = seq_release(inode, file);
11f77942 886 struct net *net = inode->i_sb->s_fs_info;
786185b5 887
ed2d8aed
RY
888 mutex_lock(&nfsd_mutex);
889 /* this function really, really should have been called svc_put() */
19f7e2ca 890 nfsd_destroy(net);
ed2d8aed
RY
891 mutex_unlock(&nfsd_mutex);
892 return ret;
03cf6c9f 893}