SUNRPC: De-duplicate .pc_release() call sites
[linux-block.git] / fs / nfsd / nfssvc.c
CommitLineData
b2441318 1// SPDX-License-Identifier: GPL-2.0
1da177e4 2/*
1da177e4
LT
3 * Central processing for nfsd.
4 *
5 * Authors: Olaf Kirch (okir@monad.swb.de)
6 *
7 * Copyright (C) 1995, 1996, 1997 Olaf Kirch <okir@monad.swb.de>
8 */
9
3f07c014 10#include <linux/sched/signal.h>
83144186 11#include <linux/freezer.h>
143cb494 12#include <linux/module.h>
1da177e4 13#include <linux/fs_struct.h>
c3d06f9c 14#include <linux/swap.h>
1da177e4 15
1da177e4 16#include <linux/sunrpc/stats.h>
1da177e4 17#include <linux/sunrpc/svcsock.h>
36684996 18#include <linux/sunrpc/svc_xprt.h>
1da177e4 19#include <linux/lockd/bind.h>
a257cdd0 20#include <linux/nfsacl.h>
ed2d8aed 21#include <linux/seq_file.h>
36684996
SM
22#include <linux/inetdevice.h>
23#include <net/addrconf.h>
24#include <net/ipv6.h>
fc5d00b0 25#include <net/net_namespace.h>
9a74af21
BH
26#include "nfsd.h"
27#include "cache.h"
0a3adade 28#include "vfs.h"
2c2fe290 29#include "netns.h"
65294c1f 30#include "filecache.h"
1da177e4 31
0dfdad1c
CL
32#include "trace.h"
33
1da177e4
LT
34#define NFSDDBG_FACILITY NFSDDBG_SVC
35
1da177e4 36extern struct svc_program nfsd_program;
9867d76c 37static int nfsd(void *vrqstp);
029be5d0
TM
38#if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
39static int nfsd_acl_rpcbind_set(struct net *,
40 const struct svc_program *,
41 u32, int,
42 unsigned short,
43 unsigned short);
e333f3bb
TM
44static __be32 nfsd_acl_init_request(struct svc_rqst *,
45 const struct svc_program *,
46 struct svc_process_info *);
029be5d0
TM
47#endif
48static int nfsd_rpcbind_set(struct net *,
49 const struct svc_program *,
50 u32, int,
51 unsigned short,
52 unsigned short);
e333f3bb
TM
53static __be32 nfsd_init_request(struct svc_rqst *,
54 const struct svc_program *,
55 struct svc_process_info *);
1da177e4 56
bedbdd8b 57/*
9dd9845f 58 * nfsd_mutex protects nn->nfsd_serv -- both the pointer itself and the members
bedbdd8b
NB
59 * of the svc_serv struct. In particular, ->sv_nrthreads but also to some
60 * extent ->sv_temp_socks and ->sv_permsocks. It also protects nfsdstats.th_cnt
61 *
9dd9845f 62 * If (outside the lock) nn->nfsd_serv is non-NULL, then it must point to a
bedbdd8b
NB
63 * properly initialised 'struct svc_serv' with ->sv_nrthreads > 0. That number
64 * of nfsd threads must exist and each must be listed in ->sp_all_threads in each
65 * entry of ->sv_pools[].
66 *
67 * Transitions of the thread count between zero and non-zero are of particular
68 * interest since the svc_serv needs to be created and initialized at that
69 * point, or freed.
3dd98a3b
JL
70 *
71 * Finally, the nfsd_mutex also protects some of the global variables that are
72 * accessed when nfsd starts and that are settable via the write_* routines in
73 * nfsctl.c. In particular:
74 *
75 * user_recovery_dirname
76 * user_lease_time
77 * nfsd_versions
bedbdd8b
NB
78 */
79DEFINE_MUTEX(nfsd_mutex);
bedbdd8b 80
4bd9b0f4
AA
81/*
82 * nfsd_drc_lock protects nfsd_drc_max_pages and nfsd_drc_pages_used.
83 * nfsd_drc_max_pages limits the total amount of memory available for
84 * version 4.1 DRC caches.
85 * nfsd_drc_pages_used tracks the current version 4.1 DRC memory usage.
86 */
b73ac680 87DEFINE_SPINLOCK(nfsd_drc_lock);
697ce9be
ZY
88unsigned long nfsd_drc_max_mem;
89unsigned long nfsd_drc_mem_used;
4bd9b0f4 90
3fb803a9
AG
91#if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
92static struct svc_stat nfsd_acl_svcstats;
e9679189 93static const struct svc_version *nfsd_acl_version[] = {
3fb803a9
AG
94 [2] = &nfsd_acl_version2,
95 [3] = &nfsd_acl_version3,
96};
97
98#define NFSD_ACL_MINVERS 2
e8c96f8c 99#define NFSD_ACL_NRVERS ARRAY_SIZE(nfsd_acl_version)
3fb803a9
AG
100
101static struct svc_program nfsd_acl_program = {
102 .pg_prog = NFS_ACL_PROGRAM,
103 .pg_nvers = NFSD_ACL_NRVERS,
7c149057 104 .pg_vers = nfsd_acl_version,
1a8eff6d 105 .pg_name = "nfsacl",
3fb803a9
AG
106 .pg_class = "nfsd",
107 .pg_stats = &nfsd_acl_svcstats,
108 .pg_authenticate = &svc_set_client,
e333f3bb 109 .pg_init_request = nfsd_acl_init_request,
029be5d0 110 .pg_rpcbind_set = nfsd_acl_rpcbind_set,
3fb803a9
AG
111};
112
113static struct svc_stat nfsd_acl_svcstats = {
114 .program = &nfsd_acl_program,
115};
116#endif /* defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL) */
117
e9679189 118static const struct svc_version *nfsd_version[] = {
70c3b76c
N
119 [2] = &nfsd_version2,
120#if defined(CONFIG_NFSD_V3)
121 [3] = &nfsd_version3,
122#endif
123#if defined(CONFIG_NFSD_V4)
124 [4] = &nfsd_version4,
125#endif
126};
127
128#define NFSD_MINVERS 2
e8c96f8c 129#define NFSD_NRVERS ARRAY_SIZE(nfsd_version)
70c3b76c
N
130
131struct svc_program nfsd_program = {
3fb803a9
AG
132#if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
133 .pg_next = &nfsd_acl_program,
134#endif
70c3b76c
N
135 .pg_prog = NFS_PROGRAM, /* program number */
136 .pg_nvers = NFSD_NRVERS, /* nr of entries in nfsd_version */
e333f3bb 137 .pg_vers = nfsd_version, /* version table */
70c3b76c
N
138 .pg_name = "nfsd", /* program name */
139 .pg_class = "nfsd", /* authentication class */
140 .pg_stats = &nfsd_svcstats, /* RPC statistics */
141 .pg_authenticate = &svc_set_client, /* export authentication */
e333f3bb 142 .pg_init_request = nfsd_init_request,
029be5d0 143 .pg_rpcbind_set = nfsd_rpcbind_set,
70c3b76c
N
144};
145
e333f3bb
TM
146static bool
147nfsd_support_version(int vers)
148{
149 if (vers >= NFSD_MINVERS && vers < NFSD_NRVERS)
150 return nfsd_version[vers] != NULL;
151 return false;
152}
153
154static bool *
155nfsd_alloc_versions(void)
156{
157 bool *vers = kmalloc_array(NFSD_NRVERS, sizeof(bool), GFP_KERNEL);
158 unsigned i;
159
160 if (vers) {
161 /* All compiled versions are enabled by default */
162 for (i = 0; i < NFSD_NRVERS; i++)
163 vers[i] = nfsd_support_version(i);
164 }
165 return vers;
166}
167
168static bool *
169nfsd_alloc_minorversions(void)
170{
171 bool *vers = kmalloc_array(NFSD_SUPPORTED_MINOR_VERSION + 1,
172 sizeof(bool), GFP_KERNEL);
173 unsigned i;
8daf220a 174
e333f3bb
TM
175 if (vers) {
176 /* All minor versions are enabled by default */
177 for (i = 0; i <= NFSD_SUPPORTED_MINOR_VERSION; i++)
178 vers[i] = nfsd_support_version(4);
179 }
180 return vers;
181}
182
183void
184nfsd_netns_free_versions(struct nfsd_net *nn)
185{
186 kfree(nn->nfsd_versions);
187 kfree(nn->nfsd4_minorversions);
188 nn->nfsd_versions = NULL;
189 nn->nfsd4_minorversions = NULL;
190}
191
192static void
193nfsd_netns_init_versions(struct nfsd_net *nn)
194{
195 if (!nn->nfsd_versions) {
196 nn->nfsd_versions = nfsd_alloc_versions();
197 nn->nfsd4_minorversions = nfsd_alloc_minorversions();
198 if (!nn->nfsd_versions || !nn->nfsd4_minorversions)
199 nfsd_netns_free_versions(nn);
200 }
201}
202
203int nfsd_vers(struct nfsd_net *nn, int vers, enum vers_op change)
6658d3a7
N
204{
205 if (vers < NFSD_MINVERS || vers >= NFSD_NRVERS)
15ddb4ae 206 return 0;
6658d3a7
N
207 switch(change) {
208 case NFSD_SET:
e333f3bb
TM
209 if (nn->nfsd_versions)
210 nn->nfsd_versions[vers] = nfsd_support_version(vers);
1a8eff6d 211 break;
6658d3a7 212 case NFSD_CLEAR:
e333f3bb
TM
213 nfsd_netns_init_versions(nn);
214 if (nn->nfsd_versions)
215 nn->nfsd_versions[vers] = false;
6658d3a7
N
216 break;
217 case NFSD_TEST:
e333f3bb
TM
218 if (nn->nfsd_versions)
219 return nn->nfsd_versions[vers];
df561f66 220 fallthrough;
6658d3a7 221 case NFSD_AVAIL:
e333f3bb 222 return nfsd_support_version(vers);
6658d3a7
N
223 }
224 return 0;
225}
8daf220a 226
d3635ff0 227static void
e333f3bb 228nfsd_adjust_nfsd_versions4(struct nfsd_net *nn)
d3635ff0
TM
229{
230 unsigned i;
231
232 for (i = 0; i <= NFSD_SUPPORTED_MINOR_VERSION; i++) {
e333f3bb 233 if (nn->nfsd4_minorversions[i])
d3635ff0
TM
234 return;
235 }
e333f3bb 236 nfsd_vers(nn, 4, NFSD_CLEAR);
d3635ff0
TM
237}
238
e333f3bb 239int nfsd_minorversion(struct nfsd_net *nn, u32 minorversion, enum vers_op change)
8daf220a 240{
928c6fb3
N
241 if (minorversion > NFSD_SUPPORTED_MINOR_VERSION &&
242 change != NFSD_AVAIL)
8daf220a 243 return -1;
e333f3bb 244
8daf220a
BH
245 switch(change) {
246 case NFSD_SET:
e333f3bb
TM
247 if (nn->nfsd4_minorversions) {
248 nfsd_vers(nn, 4, NFSD_SET);
249 nn->nfsd4_minorversions[minorversion] =
250 nfsd_vers(nn, 4, NFSD_TEST);
251 }
8daf220a
BH
252 break;
253 case NFSD_CLEAR:
e333f3bb
TM
254 nfsd_netns_init_versions(nn);
255 if (nn->nfsd4_minorversions) {
256 nn->nfsd4_minorversions[minorversion] = false;
257 nfsd_adjust_nfsd_versions4(nn);
258 }
8daf220a
BH
259 break;
260 case NFSD_TEST:
e333f3bb
TM
261 if (nn->nfsd4_minorversions)
262 return nn->nfsd4_minorversions[minorversion];
263 return nfsd_vers(nn, 4, NFSD_TEST);
8daf220a 264 case NFSD_AVAIL:
e333f3bb
TM
265 return minorversion <= NFSD_SUPPORTED_MINOR_VERSION &&
266 nfsd_vers(nn, 4, NFSD_AVAIL);
8daf220a
BH
267 }
268 return 0;
269}
270
1da177e4
LT
271/*
272 * Maximum number of nfsd processes
273 */
274#define NFSD_MAXSERVS 8192
275
9dd9845f 276int nfsd_nrthreads(struct net *net)
1da177e4 277{
c7d106c9 278 int rv = 0;
9dd9845f
SK
279 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
280
c7d106c9 281 mutex_lock(&nfsd_mutex);
9dd9845f
SK
282 if (nn->nfsd_serv)
283 rv = nn->nfsd_serv->sv_nrthreads;
c7d106c9
NB
284 mutex_unlock(&nfsd_mutex);
285 return rv;
1da177e4
LT
286}
287
4df493a2 288static int nfsd_init_socks(struct net *net, const struct cred *cred)
59db4a0c
BF
289{
290 int error;
9dd9845f
SK
291 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
292
293 if (!list_empty(&nn->nfsd_serv->sv_permsocks))
59db4a0c
BF
294 return 0;
295
9dd9845f 296 error = svc_create_xprt(nn->nfsd_serv, "udp", net, PF_INET, NFS_PORT,
4df493a2 297 SVC_SOCK_DEFAULTS, cred);
59db4a0c
BF
298 if (error < 0)
299 return error;
300
9dd9845f 301 error = svc_create_xprt(nn->nfsd_serv, "tcp", net, PF_INET, NFS_PORT,
4df493a2 302 SVC_SOCK_DEFAULTS, cred);
59db4a0c
BF
303 if (error < 0)
304 return error;
305
306 return 0;
307}
308
4539f149 309static int nfsd_users = 0;
4ad9a344 310
70c53075 311static int nfsd_startup_generic(void)
bda9cac1
SK
312{
313 int ret;
314
4539f149 315 if (nfsd_users++)
bda9cac1
SK
316 return 0;
317
65294c1f
JL
318 ret = nfsd_file_cache_init();
319 if (ret)
320 goto dec_users;
d9499a95 321
bda9cac1
SK
322 ret = nfs4_state_start();
323 if (ret)
501cb184 324 goto out_file_cache;
bda9cac1
SK
325 return 0;
326
65294c1f
JL
327out_file_cache:
328 nfsd_file_cache_shutdown();
d9499a95
KM
329dec_users:
330 nfsd_users--;
bda9cac1
SK
331 return ret;
332}
333
334static void nfsd_shutdown_generic(void)
335{
4539f149
SK
336 if (--nfsd_users)
337 return;
338
bda9cac1 339 nfs4_state_shutdown();
65294c1f 340 nfsd_file_cache_shutdown();
bda9cac1
SK
341}
342
e333f3bb 343static bool nfsd_needs_lockd(struct nfsd_net *nn)
8ef66714 344{
e333f3bb 345 return nfsd_vers(nn, 2, NFSD_TEST) || nfsd_vers(nn, 3, NFSD_TEST);
8ef66714
KM
346}
347
27c438f5
TM
348void nfsd_copy_boot_verifier(__be32 verf[2], struct nfsd_net *nn)
349{
350 int seq = 0;
351
352 do {
353 read_seqbegin_or_lock(&nn->boot_lock, &seq);
354 /*
355 * This is opaque to client, so no need to byte-swap. Use
356 * __force to keep sparse happy. y2038 time_t overflow is
357 * irrelevant in this usage
358 */
359 verf[0] = (__force __be32)nn->nfssvc_boot.tv_sec;
360 verf[1] = (__force __be32)nn->nfssvc_boot.tv_nsec;
361 } while (need_seqretry(&nn->boot_lock, seq));
362 done_seqretry(&nn->boot_lock, seq);
363}
364
65643f4c 365static void nfsd_reset_boot_verifier_locked(struct nfsd_net *nn)
27c438f5
TM
366{
367 ktime_get_real_ts64(&nn->nfssvc_boot);
368}
369
370void nfsd_reset_boot_verifier(struct nfsd_net *nn)
371{
372 write_seqlock(&nn->boot_lock);
373 nfsd_reset_boot_verifier_locked(nn);
374 write_sequnlock(&nn->boot_lock);
375}
376
70c53075 377static int nfsd_startup_net(struct net *net, const struct cred *cred)
6ff50b3d 378{
2c2fe290 379 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
6ff50b3d
SK
380 int ret;
381
2c2fe290
SK
382 if (nn->nfsd_net_up)
383 return 0;
384
70c53075 385 ret = nfsd_startup_generic();
6ff50b3d
SK
386 if (ret)
387 return ret;
4df493a2 388 ret = nfsd_init_socks(net, cred);
903d9bf0
SK
389 if (ret)
390 goto out_socks;
8ef66714 391
e333f3bb 392 if (nfsd_needs_lockd(nn) && !nn->lockd_up) {
40373b12 393 ret = lockd_up(net, cred);
8ef66714
KM
394 if (ret)
395 goto out_socks;
e44b4bf2 396 nn->lockd_up = true;
8ef66714
KM
397 }
398
9542e6a6 399 ret = nfsd_file_cache_start_net(net);
6ff50b3d
SK
400 if (ret)
401 goto out_lockd;
9542e6a6
TM
402 ret = nfs4_state_start_net(net);
403 if (ret)
404 goto out_filecache;
6ff50b3d 405
f4e44b39
DN
406#ifdef CONFIG_NFSD_V4_2_INTER_SSC
407 nfsd4_ssc_init_umount_work(nn);
408#endif
2c2fe290 409 nn->nfsd_net_up = true;
6ff50b3d
SK
410 return 0;
411
9542e6a6
TM
412out_filecache:
413 nfsd_file_cache_shutdown_net(net);
6ff50b3d 414out_lockd:
8ef66714
KM
415 if (nn->lockd_up) {
416 lockd_down(net);
e44b4bf2 417 nn->lockd_up = false;
8ef66714 418 }
903d9bf0 419out_socks:
bda9cac1 420 nfsd_shutdown_generic();
4ad9a344
JL
421 return ret;
422}
423
6ff50b3d
SK
424static void nfsd_shutdown_net(struct net *net)
425{
2c2fe290
SK
426 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
427
9542e6a6 428 nfsd_file_cache_shutdown_net(net);
6ff50b3d 429 nfs4_state_shutdown_net(net);
8ef66714
KM
430 if (nn->lockd_up) {
431 lockd_down(net);
e44b4bf2 432 nn->lockd_up = false;
8ef66714 433 }
2c2fe290 434 nn->nfsd_net_up = false;
903d9bf0 435 nfsd_shutdown_generic();
6ff50b3d
SK
436}
437
36684996
SM
438static int nfsd_inetaddr_event(struct notifier_block *this, unsigned long event,
439 void *ptr)
440{
441 struct in_ifaddr *ifa = (struct in_ifaddr *)ptr;
442 struct net_device *dev = ifa->ifa_dev->dev;
443 struct net *net = dev_net(dev);
444 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
445 struct sockaddr_in sin;
446
2317dc55
VA
447 if ((event != NETDEV_DOWN) ||
448 !atomic_inc_not_zero(&nn->ntf_refcnt))
36684996
SM
449 goto out;
450
451 if (nn->nfsd_serv) {
452 dprintk("nfsd_inetaddr_event: removed %pI4\n", &ifa->ifa_local);
453 sin.sin_family = AF_INET;
454 sin.sin_addr.s_addr = ifa->ifa_local;
455 svc_age_temp_xprts_now(nn->nfsd_serv, (struct sockaddr *)&sin);
456 }
2317dc55
VA
457 atomic_dec(&nn->ntf_refcnt);
458 wake_up(&nn->ntf_wq);
36684996
SM
459
460out:
461 return NOTIFY_DONE;
462}
463
464static struct notifier_block nfsd_inetaddr_notifier = {
465 .notifier_call = nfsd_inetaddr_event,
466};
467
468#if IS_ENABLED(CONFIG_IPV6)
469static int nfsd_inet6addr_event(struct notifier_block *this,
470 unsigned long event, void *ptr)
471{
472 struct inet6_ifaddr *ifa = (struct inet6_ifaddr *)ptr;
473 struct net_device *dev = ifa->idev->dev;
474 struct net *net = dev_net(dev);
475 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
476 struct sockaddr_in6 sin6;
477
2317dc55
VA
478 if ((event != NETDEV_DOWN) ||
479 !atomic_inc_not_zero(&nn->ntf_refcnt))
36684996
SM
480 goto out;
481
482 if (nn->nfsd_serv) {
483 dprintk("nfsd_inet6addr_event: removed %pI6\n", &ifa->addr);
484 sin6.sin6_family = AF_INET6;
485 sin6.sin6_addr = ifa->addr;
7b19824d
SM
486 if (ipv6_addr_type(&sin6.sin6_addr) & IPV6_ADDR_LINKLOCAL)
487 sin6.sin6_scope_id = ifa->idev->dev->ifindex;
36684996
SM
488 svc_age_temp_xprts_now(nn->nfsd_serv, (struct sockaddr *)&sin6);
489 }
2317dc55
VA
490 atomic_dec(&nn->ntf_refcnt);
491 wake_up(&nn->ntf_wq);
36684996
SM
492out:
493 return NOTIFY_DONE;
494}
495
496static struct notifier_block nfsd_inet6addr_notifier = {
497 .notifier_call = nfsd_inet6addr_event,
498};
499#endif
500
1eca45f8
VA
501/* Only used under nfsd_mutex, so this atomic may be overkill: */
502static atomic_t nfsd_notifier_refcount = ATOMIC_INIT(0);
503
541e864f 504static void nfsd_last_thread(struct svc_serv *serv, struct net *net)
4ad9a344 505{
903d9bf0
SK
506 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
507
2317dc55 508 atomic_dec(&nn->ntf_refcnt);
1eca45f8
VA
509 /* check if the notifier still has clients */
510 if (atomic_dec_return(&nfsd_notifier_refcount) == 0) {
511 unregister_inetaddr_notifier(&nfsd_inetaddr_notifier);
36684996 512#if IS_ENABLED(CONFIG_IPV6)
1eca45f8 513 unregister_inet6addr_notifier(&nfsd_inet6addr_notifier);
36684996 514#endif
1eca45f8 515 }
2317dc55 516 wait_event(nn->ntf_wq, atomic_read(&nn->ntf_refcnt) == 0);
1eca45f8 517
4ad9a344
JL
518 /*
519 * write_ports can create the server without actually starting
520 * any threads--if we get shut down before any threads are
521 * started, then nfsd_last_thread will be run before any of this
691412b4 522 * other initialization has been done except the rpcb information.
4ad9a344 523 */
691412b4 524 svc_rpcb_cleanup(serv, net);
903d9bf0 525 if (!nn->nfsd_net_up)
4ad9a344 526 return;
16d05870 527
691412b4 528 nfsd_shutdown_net(net);
4420440c 529 pr_info("nfsd: last server has exited, flushing export cache\n");
b3853e0e 530 nfsd_export_flush(net);
bc591ccf 531}
6658d3a7 532
e333f3bb 533void nfsd_reset_versions(struct nfsd_net *nn)
6658d3a7 534{
6658d3a7
N
535 int i;
536
800a938f 537 for (i = 0; i < NFSD_NRVERS; i++)
e333f3bb 538 if (nfsd_vers(nn, i, NFSD_TEST))
800a938f 539 return;
6658d3a7 540
800a938f
N
541 for (i = 0; i < NFSD_NRVERS; i++)
542 if (i != 4)
e333f3bb 543 nfsd_vers(nn, i, NFSD_SET);
800a938f
N
544 else {
545 int minor = 0;
e333f3bb 546 while (nfsd_minorversion(nn, minor, NFSD_SET) >= 0)
800a938f
N
547 minor++;
548 }
6658d3a7
N
549}
550
c3d06f9c
AA
551/*
552 * Each session guarantees a negotiated per slot memory cache for replies
553 * which in turn consumes memory beyond the v2/v3/v4.0 server. A dedicated
554 * NFSv4.1 server might want to use more memory for a DRC than a machine
555 * with multiple services.
556 *
557 * Impose a hard limit on the number of pages for the DRC which varies
558 * according to the machine's free pages. This is of course only a default.
559 *
560 * For now this is a #defined shift which could be under admin control
561 * in the future.
562 */
563static void set_max_drc(void)
564{
44d8660d 565 #define NFSD_DRC_SIZE_SHIFT 7
0c193054
AA
566 nfsd_drc_max_mem = (nr_free_buffer_pages()
567 >> NFSD_DRC_SIZE_SHIFT) * PAGE_SIZE;
568 nfsd_drc_mem_used = 0;
697ce9be 569 dprintk("%s nfsd_drc_max_mem %lu \n", __func__, nfsd_drc_max_mem);
c3d06f9c 570}
bedbdd8b 571
87b0fc7d 572static int nfsd_get_default_max_blksize(void)
02a375f0 573{
87b0fc7d
BF
574 struct sysinfo i;
575 unsigned long long target;
576 unsigned long ret;
bedbdd8b 577
87b0fc7d 578 si_meminfo(&i);
508f9227 579 target = (i.totalram - i.totalhigh) << PAGE_SHIFT;
87b0fc7d
BF
580 /*
581 * Aim for 1/4096 of memory per thread This gives 1MB on 4Gig
582 * machines, but only uses 32K on 128M machines. Bottom out at
583 * 8K on 32M and smaller. Of course, this is only a default.
584 */
585 target >>= 12;
586
587 ret = NFSSVC_MAXBLKSIZE;
588 while (ret > target && ret >= 8*1024*2)
589 ret /= 2;
590 return ret;
591}
592
afea5657 593static const struct svc_serv_ops nfsd_thread_sv_ops = {
b9e13cdf
JL
594 .svo_shutdown = nfsd_last_thread,
595 .svo_function = nfsd,
596 .svo_enqueue_xprt = svc_xprt_do_enqueue,
598e2359 597 .svo_setup = svc_set_num_threads,
b9e13cdf 598 .svo_module = THIS_MODULE,
ea126e74
JL
599};
600
c6c7f2a8
TM
601static void nfsd_complete_shutdown(struct net *net)
602{
603 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
604
605 WARN_ON(!mutex_is_locked(&nfsd_mutex));
606
607 nn->nfsd_serv = NULL;
608 complete(&nn->nfsd_shutdown_complete);
609}
610
611void nfsd_shutdown_threads(struct net *net)
612{
613 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
614 struct svc_serv *serv;
615
616 mutex_lock(&nfsd_mutex);
617 serv = nn->nfsd_serv;
618 if (serv == NULL) {
619 mutex_unlock(&nfsd_mutex);
620 return;
621 }
622
623 svc_get(serv);
624 /* Kill outstanding nfsd threads */
625 serv->sv_ops->svo_setup(serv, NULL, 0);
626 nfsd_destroy(net);
627 mutex_unlock(&nfsd_mutex);
628 /* Wait for shutdown of nfsd_serv to complete */
629 wait_for_completion(&nn->nfsd_shutdown_complete);
630}
631
44fb26c6 632bool i_am_nfsd(void)
28df3d15
BF
633{
634 return kthread_func(current) == nfsd;
635}
636
6777436b 637int nfsd_create_serv(struct net *net)
87b0fc7d 638{
9793f7c8 639 int error;
b9c0ef85 640 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
9793f7c8 641
bedbdd8b 642 WARN_ON(!mutex_is_locked(&nfsd_mutex));
9dd9845f
SK
643 if (nn->nfsd_serv) {
644 svc_get(nn->nfsd_serv);
02a375f0
N
645 return 0;
646 }
87b0fc7d
BF
647 if (nfsd_max_blksize == 0)
648 nfsd_max_blksize = nfsd_get_default_max_blksize();
e333f3bb 649 nfsd_reset_versions(nn);
9dd9845f 650 nn->nfsd_serv = svc_create_pooled(&nfsd_program, nfsd_max_blksize,
b9e13cdf 651 &nfsd_thread_sv_ops);
9dd9845f 652 if (nn->nfsd_serv == NULL)
628b3687 653 return -ENOMEM;
c6c7f2a8 654 init_completion(&nn->nfsd_shutdown_complete);
bedbdd8b 655
5b8db00b 656 nn->nfsd_serv->sv_maxconn = nn->max_connections;
9dd9845f 657 error = svc_bind(nn->nfsd_serv, net);
9793f7c8 658 if (error < 0) {
9dd9845f 659 svc_destroy(nn->nfsd_serv);
c6c7f2a8 660 nfsd_complete_shutdown(net);
9793f7c8
SK
661 return error;
662 }
663
628b3687 664 set_max_drc();
1eca45f8
VA
665 /* check if the notifier is already set */
666 if (atomic_inc_return(&nfsd_notifier_refcount) == 1) {
667 register_inetaddr_notifier(&nfsd_inetaddr_notifier);
36684996 668#if IS_ENABLED(CONFIG_IPV6)
1eca45f8 669 register_inet6addr_notifier(&nfsd_inet6addr_notifier);
36684996 670#endif
1eca45f8 671 }
2317dc55 672 atomic_inc(&nn->ntf_refcnt);
27c438f5 673 nfsd_reset_boot_verifier(nn);
87b0fc7d 674 return 0;
02a375f0
N
675}
676
9dd9845f 677int nfsd_nrpools(struct net *net)
eed2965a 678{
9dd9845f
SK
679 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
680
681 if (nn->nfsd_serv == NULL)
eed2965a
GB
682 return 0;
683 else
9dd9845f 684 return nn->nfsd_serv->sv_nrpools;
eed2965a
GB
685}
686
9dd9845f 687int nfsd_get_nrthreads(int n, int *nthreads, struct net *net)
eed2965a
GB
688{
689 int i = 0;
9dd9845f 690 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
eed2965a 691
9dd9845f
SK
692 if (nn->nfsd_serv != NULL) {
693 for (i = 0; i < nn->nfsd_serv->sv_nrpools && i < n; i++)
694 nthreads[i] = nn->nfsd_serv->sv_pools[i].sp_nrthreads;
eed2965a
GB
695 }
696
697 return 0;
698}
699
9dd9845f
SK
700void nfsd_destroy(struct net *net)
701{
702 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
703 int destroy = (nn->nfsd_serv->sv_nrthreads == 1);
704
705 if (destroy)
706 svc_shutdown_net(nn->nfsd_serv, net);
707 svc_destroy(nn->nfsd_serv);
708 if (destroy)
c6c7f2a8 709 nfsd_complete_shutdown(net);
9dd9845f
SK
710}
711
3938a0d5 712int nfsd_set_nrthreads(int n, int *nthreads, struct net *net)
eed2965a
GB
713{
714 int i = 0;
715 int tot = 0;
716 int err = 0;
9dd9845f 717 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
eed2965a 718
bedbdd8b
NB
719 WARN_ON(!mutex_is_locked(&nfsd_mutex));
720
9dd9845f 721 if (nn->nfsd_serv == NULL || n <= 0)
eed2965a
GB
722 return 0;
723
9dd9845f
SK
724 if (n > nn->nfsd_serv->sv_nrpools)
725 n = nn->nfsd_serv->sv_nrpools;
eed2965a
GB
726
727 /* enforce a global maximum number of threads */
728 tot = 0;
729 for (i = 0; i < n; i++) {
3c7aa15d 730 nthreads[i] = min(nthreads[i], NFSD_MAXSERVS);
eed2965a
GB
731 tot += nthreads[i];
732 }
733 if (tot > NFSD_MAXSERVS) {
734 /* total too large: scale down requested numbers */
735 for (i = 0; i < n && tot > 0; i++) {
736 int new = nthreads[i] * NFSD_MAXSERVS / tot;
737 tot -= (nthreads[i] - new);
738 nthreads[i] = new;
739 }
740 for (i = 0; i < n && tot > 0; i++) {
741 nthreads[i]--;
742 tot--;
743 }
744 }
745
746 /*
747 * There must always be a thread in pool 0; the admin
748 * can't shut down NFS completely using pool_threads.
749 */
750 if (nthreads[0] == 0)
751 nthreads[0] = 1;
752
753 /* apply the new numbers */
9dd9845f 754 svc_get(nn->nfsd_serv);
eed2965a 755 for (i = 0; i < n; i++) {
598e2359
JL
756 err = nn->nfsd_serv->sv_ops->svo_setup(nn->nfsd_serv,
757 &nn->nfsd_serv->sv_pools[i], nthreads[i]);
eed2965a
GB
758 if (err)
759 break;
760 }
19f7e2ca 761 nfsd_destroy(net);
eed2965a
GB
762 return err;
763}
764
ac77efbe
JL
765/*
766 * Adjust the number of threads and return the new number of threads.
767 * This is also the function that starts the server if necessary, if
768 * this is the first time nrservs is nonzero.
769 */
1da177e4 770int
4df493a2 771nfsd_svc(int nrservs, struct net *net, const struct cred *cred)
1da177e4
LT
772{
773 int error;
774f8bbd 774 bool nfsd_up_before;
9dd9845f 775 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
bedbdd8b
NB
776
777 mutex_lock(&nfsd_mutex);
6658d3a7 778 dprintk("nfsd: creating service\n");
3c7aa15d
KM
779
780 nrservs = max(nrservs, 0);
781 nrservs = min(nrservs, NFSD_MAXSERVS);
671e1fcf 782 error = 0;
3c7aa15d 783
9dd9845f 784 if (nrservs == 0 && nn->nfsd_serv == NULL)
671e1fcf
N
785 goto out;
786
7627d7dc
SM
787 strlcpy(nn->nfsd_name, utsname()->nodename,
788 sizeof(nn->nfsd_name));
789
6777436b 790 error = nfsd_create_serv(net);
02a375f0 791 if (error)
774f8bbd
BF
792 goto out;
793
903d9bf0 794 nfsd_up_before = nn->nfsd_net_up;
774f8bbd 795
70c53075 796 error = nfsd_startup_net(net, cred);
af4718f3
BF
797 if (error)
798 goto out_destroy;
598e2359
JL
799 error = nn->nfsd_serv->sv_ops->svo_setup(nn->nfsd_serv,
800 NULL, nrservs);
774f8bbd
BF
801 if (error)
802 goto out_shutdown;
9dd9845f 803 /* We are holding a reference to nn->nfsd_serv which
af4718f3
BF
804 * we don't want to count in the return value,
805 * so subtract 1
806 */
9dd9845f 807 error = nn->nfsd_serv->sv_nrthreads - 1;
4ad9a344 808out_shutdown:
774f8bbd 809 if (error < 0 && !nfsd_up_before)
541e864f 810 nfsd_shutdown_net(net);
774f8bbd 811out_destroy:
19f7e2ca 812 nfsd_destroy(net); /* Release server */
4ad9a344 813out:
bedbdd8b 814 mutex_unlock(&nfsd_mutex);
1da177e4
LT
815 return error;
816}
817
029be5d0
TM
818#if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
819static bool
820nfsd_support_acl_version(int vers)
821{
822 if (vers >= NFSD_ACL_MINVERS && vers < NFSD_ACL_NRVERS)
823 return nfsd_acl_version[vers] != NULL;
824 return false;
825}
826
827static int
828nfsd_acl_rpcbind_set(struct net *net, const struct svc_program *progp,
829 u32 version, int family, unsigned short proto,
830 unsigned short port)
831{
832 if (!nfsd_support_acl_version(version) ||
e333f3bb 833 !nfsd_vers(net_generic(net, nfsd_net_id), version, NFSD_TEST))
029be5d0
TM
834 return 0;
835 return svc_generic_rpcbind_set(net, progp, version, family,
836 proto, port);
837}
e333f3bb
TM
838
839static __be32
840nfsd_acl_init_request(struct svc_rqst *rqstp,
841 const struct svc_program *progp,
842 struct svc_process_info *ret)
843{
844 struct nfsd_net *nn = net_generic(SVC_NET(rqstp), nfsd_net_id);
845 int i;
846
847 if (likely(nfsd_support_acl_version(rqstp->rq_vers) &&
848 nfsd_vers(nn, rqstp->rq_vers, NFSD_TEST)))
849 return svc_generic_init_request(rqstp, progp, ret);
850
851 ret->mismatch.lovers = NFSD_ACL_NRVERS;
852 for (i = NFSD_ACL_MINVERS; i < NFSD_ACL_NRVERS; i++) {
853 if (nfsd_support_acl_version(rqstp->rq_vers) &&
854 nfsd_vers(nn, i, NFSD_TEST)) {
855 ret->mismatch.lovers = i;
856 break;
857 }
858 }
859 if (ret->mismatch.lovers == NFSD_ACL_NRVERS)
860 return rpc_prog_unavail;
861 ret->mismatch.hivers = NFSD_ACL_MINVERS;
862 for (i = NFSD_ACL_NRVERS - 1; i >= NFSD_ACL_MINVERS; i--) {
863 if (nfsd_support_acl_version(rqstp->rq_vers) &&
864 nfsd_vers(nn, i, NFSD_TEST)) {
865 ret->mismatch.hivers = i;
866 break;
867 }
868 }
869 return rpc_prog_mismatch;
870}
029be5d0
TM
871#endif
872
873static int
874nfsd_rpcbind_set(struct net *net, const struct svc_program *progp,
875 u32 version, int family, unsigned short proto,
876 unsigned short port)
877{
e333f3bb 878 if (!nfsd_vers(net_generic(net, nfsd_net_id), version, NFSD_TEST))
029be5d0
TM
879 return 0;
880 return svc_generic_rpcbind_set(net, progp, version, family,
881 proto, port);
882}
1da177e4 883
e333f3bb
TM
884static __be32
885nfsd_init_request(struct svc_rqst *rqstp,
886 const struct svc_program *progp,
887 struct svc_process_info *ret)
888{
889 struct nfsd_net *nn = net_generic(SVC_NET(rqstp), nfsd_net_id);
890 int i;
891
892 if (likely(nfsd_vers(nn, rqstp->rq_vers, NFSD_TEST)))
893 return svc_generic_init_request(rqstp, progp, ret);
894
895 ret->mismatch.lovers = NFSD_NRVERS;
896 for (i = NFSD_MINVERS; i < NFSD_NRVERS; i++) {
897 if (nfsd_vers(nn, i, NFSD_TEST)) {
898 ret->mismatch.lovers = i;
899 break;
900 }
901 }
902 if (ret->mismatch.lovers == NFSD_NRVERS)
903 return rpc_prog_unavail;
904 ret->mismatch.hivers = NFSD_MINVERS;
905 for (i = NFSD_NRVERS - 1; i >= NFSD_MINVERS; i--) {
906 if (nfsd_vers(nn, i, NFSD_TEST)) {
907 ret->mismatch.hivers = i;
908 break;
909 }
910 }
911 return rpc_prog_mismatch;
912}
913
1da177e4
LT
914/*
915 * This is the NFS server kernel thread
916 */
9867d76c
JL
917static int
918nfsd(void *vrqstp)
1da177e4 919{
9867d76c 920 struct svc_rqst *rqstp = (struct svc_rqst *) vrqstp;
88c47666
SK
921 struct svc_xprt *perm_sock = list_entry(rqstp->rq_server->sv_permsocks.next, typeof(struct svc_xprt), xpt_list);
922 struct net *net = perm_sock->xpt_net;
5b8db00b 923 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
5b444cc9 924 int err;
1da177e4
LT
925
926 /* Lock module and set up kernel thread */
bedbdd8b 927 mutex_lock(&nfsd_mutex);
1da177e4 928
9867d76c 929 /* At this point, the thread shares current->fs
47057abd
AG
930 * with the init process. We need to create files with the
931 * umask as defined by the client instead of init's umask. */
3e93cd67 932 if (unshare_fs_struct() < 0) {
1da177e4
LT
933 printk("Unable to start nfsd thread: out of memory\n");
934 goto out;
935 }
3e93cd67 936
1da177e4
LT
937 current->fs->umask = 0;
938
9867d76c
JL
939 /*
940 * thread is spawned with all signals set to SIG_IGN, re-enable
100766f8 941 * the ones that will bring down the thread
9867d76c 942 */
100766f8
JL
943 allow_signal(SIGKILL);
944 allow_signal(SIGHUP);
945 allow_signal(SIGINT);
946 allow_signal(SIGQUIT);
bedbdd8b 947
1da177e4 948 nfsdstats.th_cnt++;
bedbdd8b
NB
949 mutex_unlock(&nfsd_mutex);
950
83144186 951 set_freezable();
1da177e4
LT
952
953 /*
954 * The main request loop
955 */
956 for (;;) {
5b8db00b
JL
957 /* Update sv_maxconn if it has changed */
958 rqstp->rq_server->sv_maxconn = nn->max_connections;
959
1da177e4
LT
960 /*
961 * Find a socket with data available and call its
962 * recvfrom routine.
963 */
6fb2b47f 964 while ((err = svc_recv(rqstp, 60*60*HZ)) == -EAGAIN)
1da177e4 965 ;
9867d76c 966 if (err == -EINTR)
1da177e4 967 break;
e0e81739 968 validate_process_creds();
6fb2b47f 969 svc_process(rqstp);
e0e81739 970 validate_process_creds();
1da177e4
LT
971 }
972
24e36663 973 /* Clear signals before calling svc_exit_thread() */
9e416052 974 flush_signals(current);
1da177e4 975
bedbdd8b 976 mutex_lock(&nfsd_mutex);
1da177e4
LT
977 nfsdstats.th_cnt --;
978
979out:
57c8b13e 980 rqstp->rq_server = NULL;
786185b5 981
1da177e4
LT
982 /* Release the thread */
983 svc_exit_thread(rqstp);
984
88c47666 985 nfsd_destroy(net);
57c8b13e 986
1da177e4 987 /* Release module */
bedbdd8b 988 mutex_unlock(&nfsd_mutex);
1da177e4 989 module_put_and_exit(0);
9867d76c 990 return 0;
1da177e4
LT
991}
992
383c440d
CL
993/**
994 * nfsd_dispatch - Process an NFS or NFSACL Request
995 * @rqstp: incoming request
996 * @statp: pointer to location of accept_stat field in RPC Reply buffer
997 *
998 * This RPC dispatcher integrates the NFS server's duplicate reply cache.
999 *
1000 * Return values:
1001 * %0: Processing complete; do not send a Reply
1002 * %1: Processing complete; send Reply in rqstp->rq_res
1003 */
1004int nfsd_dispatch(struct svc_rqst *rqstp, __be32 *statp)
1da177e4 1005{
4c96cb56
CL
1006 const struct svc_procedure *proc = rqstp->rq_procinfo;
1007 struct kvec *argv = &rqstp->rq_arg.head[0];
1008 struct kvec *resv = &rqstp->rq_res.head[0];
cc028a10 1009 __be32 *p;
1da177e4 1010
1091006c
BF
1011 /*
1012 * Give the xdr decoder a chance to change this if it wants
1013 * (necessary in the NFSv4.0 compound case)
1014 */
1015 rqstp->rq_cachetype = proc->pc_cachetype;
5191955d
CL
1016
1017 svcxdr_init_decode(rqstp);
85085aac
CL
1018 if (!proc->pc_decode(rqstp, argv->iov_base))
1019 goto out_decode_err;
1091006c 1020
1091006c 1021 switch (nfsd_cache_lookup(rqstp)) {
84c138e7
CL
1022 case RC_DOIT:
1023 break;
1da177e4 1024 case RC_REPLY:
85085aac 1025 goto out_cached_reply;
84c138e7 1026 case RC_DROPIT:
85085aac 1027 goto out_dropit;
1da177e4
LT
1028 }
1029
383c440d
CL
1030 /*
1031 * Need to grab the location to store the status, as
1032 * NFSv4 does some encoding while processing
1da177e4 1033 */
cc028a10 1034 p = resv->iov_base + resv->iov_len;
bddfdbcd 1035 svcxdr_init_encode(rqstp);
1da177e4 1036
cc028a10
CL
1037 *statp = proc->pc_func(rqstp);
1038 if (*statp == rpc_drop_reply || test_bit(RQ_DROPME, &rqstp->rq_flags))
85085aac 1039 goto out_update_drop;
1da177e4 1040
cc028a10 1041 if (!proc->pc_encode(rqstp, p))
f0af2210 1042 goto out_encode_err;
1da177e4 1043
57d276d7 1044 nfsd_cache_update(rqstp, rqstp->rq_cachetype, statp + 1);
85085aac
CL
1045out_cached_reply:
1046 return 1;
1047
85085aac 1048out_decode_err:
0dfdad1c 1049 trace_nfsd_garbage_args_err(rqstp);
85085aac
CL
1050 *statp = rpc_garbage_args;
1051 return 1;
1052
1053out_update_drop:
85085aac
CL
1054 nfsd_cache_update(rqstp, RC_NOCACHE, NULL);
1055out_dropit:
1056 return 0;
1057
1058out_encode_err:
0dfdad1c 1059 trace_nfsd_cant_encode_err(rqstp);
85085aac
CL
1060 nfsd_cache_update(rqstp, RC_NOCACHE, NULL);
1061 *statp = rpc_system_err;
1da177e4
LT
1062 return 1;
1063}
03cf6c9f 1064
788f7183
CL
1065/**
1066 * nfssvc_decode_voidarg - Decode void arguments
1067 * @rqstp: Server RPC transaction context
1068 * @p: buffer containing arguments to decode
1069 *
1070 * Return values:
1071 * %0: Arguments were not valid
1072 * %1: Decoding was successful
1073 */
1074int nfssvc_decode_voidarg(struct svc_rqst *rqstp, __be32 *p)
1075{
1076 return 1;
1077}
1078
1079/**
1080 * nfssvc_encode_voidres - Encode void results
1081 * @rqstp: Server RPC transaction context
1082 * @p: buffer in which to encode results
1083 *
1084 * Return values:
1085 * %0: Local error while encoding
1086 * %1: Encoding was successful
1087 */
1088int nfssvc_encode_voidres(struct svc_rqst *rqstp, __be32 *p)
1089{
bddfdbcd 1090 return 1;
788f7183
CL
1091}
1092
03cf6c9f
GB
1093int nfsd_pool_stats_open(struct inode *inode, struct file *file)
1094{
ed2d8aed 1095 int ret;
11f77942 1096 struct nfsd_net *nn = net_generic(inode->i_sb->s_fs_info, nfsd_net_id);
9dd9845f 1097
ed2d8aed 1098 mutex_lock(&nfsd_mutex);
9dd9845f 1099 if (nn->nfsd_serv == NULL) {
ed2d8aed 1100 mutex_unlock(&nfsd_mutex);
03cf6c9f 1101 return -ENODEV;
ed2d8aed
RY
1102 }
1103 /* bump up the psudo refcount while traversing */
9dd9845f
SK
1104 svc_get(nn->nfsd_serv);
1105 ret = svc_pool_stats_open(nn->nfsd_serv, file);
ed2d8aed
RY
1106 mutex_unlock(&nfsd_mutex);
1107 return ret;
1108}
1109
1110int nfsd_pool_stats_release(struct inode *inode, struct file *file)
1111{
1112 int ret = seq_release(inode, file);
11f77942 1113 struct net *net = inode->i_sb->s_fs_info;
786185b5 1114
ed2d8aed
RY
1115 mutex_lock(&nfsd_mutex);
1116 /* this function really, really should have been called svc_put() */
19f7e2ca 1117 nfsd_destroy(net);
ed2d8aed
RY
1118 mutex_unlock(&nfsd_mutex);
1119 return ret;
03cf6c9f 1120}