]>
Commit | Line | Data |
---|---|---|
b2441318 | 1 | // SPDX-License-Identifier: GPL-2.0 |
1da177e4 | 2 | /* |
1da177e4 LT |
3 | * Central processing for nfsd. |
4 | * | |
5 | * Authors: Olaf Kirch ([email protected]) | |
6 | * | |
7 | * Copyright (C) 1995, 1996, 1997 Olaf Kirch <[email protected]> | |
8 | */ | |
9 | ||
3f07c014 | 10 | #include <linux/sched/signal.h> |
83144186 | 11 | #include <linux/freezer.h> |
143cb494 | 12 | #include <linux/module.h> |
1da177e4 | 13 | #include <linux/fs_struct.h> |
c3d06f9c | 14 | #include <linux/swap.h> |
1da177e4 | 15 | |
1da177e4 | 16 | #include <linux/sunrpc/stats.h> |
1da177e4 | 17 | #include <linux/sunrpc/svcsock.h> |
36684996 | 18 | #include <linux/sunrpc/svc_xprt.h> |
1da177e4 | 19 | #include <linux/lockd/bind.h> |
a257cdd0 | 20 | #include <linux/nfsacl.h> |
ed2d8aed | 21 | #include <linux/seq_file.h> |
36684996 SM |
22 | #include <linux/inetdevice.h> |
23 | #include <net/addrconf.h> | |
24 | #include <net/ipv6.h> | |
fc5d00b0 | 25 | #include <net/net_namespace.h> |
9a74af21 BH |
26 | #include "nfsd.h" |
27 | #include "cache.h" | |
0a3adade | 28 | #include "vfs.h" |
2c2fe290 | 29 | #include "netns.h" |
1da177e4 LT |
30 | |
31 | #define NFSDDBG_FACILITY NFSDDBG_SVC | |
32 | ||
1da177e4 | 33 | extern struct svc_program nfsd_program; |
9867d76c | 34 | static int nfsd(void *vrqstp); |
1da177e4 | 35 | |
/*
 * nfsd_mutex protects nn->nfsd_serv -- the pointer itself as well as the
 * members of the svc_serv struct it points to: ->sv_nrthreads in particular,
 * but to some extent also ->sv_temp_socks and ->sv_permsocks.  It also
 * protects nfsdstats.th_cnt.
 *
 * If nn->nfsd_serv is seen to be non-NULL outside the lock, it must point to
 * a properly initialised 'struct svc_serv' with ->sv_nrthreads > 0.  That
 * number of nfsd threads must exist, and each must be listed in
 * ->sp_all_threads in each entry of ->sv_pools[].
 *
 * Transitions of the thread count between zero and non-zero are of
 * particular interest, because that is the point at which the svc_serv has
 * to be created and initialised, or freed.
 *
 * Finally, nfsd_mutex also protects some of the global variables that are
 * read when nfsd starts and that can be set through the write_* routines in
 * nfsctl.c.  In particular:
 *
 *	user_recovery_dirname
 *	user_lease_time
 *	nfsd_versions
 */
DEFINE_MUTEX(nfsd_mutex);
bedbdd8b | 59 | |
4bd9b0f4 AA |
60 | /* |
61 | * nfsd_drc_lock protects nfsd_drc_max_pages and nfsd_drc_pages_used. | |
62 | * nfsd_drc_max_pages limits the total amount of memory available for | |
63 | * version 4.1 DRC caches. | |
64 | * nfsd_drc_pages_used tracks the current version 4.1 DRC memory usage. | |
65 | */ | |
66 | spinlock_t nfsd_drc_lock; | |
697ce9be ZY |
67 | unsigned long nfsd_drc_max_mem; |
68 | unsigned long nfsd_drc_mem_used; | |
4bd9b0f4 | 69 | |
#if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
/* Defined below; nfsd_acl_program needs its address first. */
static struct svc_stat	nfsd_acl_svcstats;

/* Table of the known NFSACL versions, indexed by version number. */
static const struct svc_version *nfsd_acl_version[] = {
	[2] = &nfsd_acl_version2,
	[3] = &nfsd_acl_version3,
};

#define NFSD_ACL_MINVERS	2
#define NFSD_ACL_NRVERS		ARRAY_SIZE(nfsd_acl_version)

/* Version table of nfsd_acl_program; slots are set/cleared by nfsd_vers(). */
static const struct svc_version *nfsd_acl_versions[NFSD_ACL_NRVERS];

static struct svc_program	nfsd_acl_program = {
	.pg_prog		= NFS_ACL_PROGRAM,
	.pg_name		= "nfsacl",
	.pg_class		= "nfsd",
	.pg_nvers		= NFSD_ACL_NRVERS,
	.pg_vers		= nfsd_acl_versions,
	.pg_stats		= &nfsd_acl_svcstats,
	.pg_authenticate	= &svc_set_client,
};

static struct svc_stat	nfsd_acl_svcstats = {
	.program	= &nfsd_acl_program,
};
#endif /* defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL) */
95 | ||
e9679189 | 96 | static const struct svc_version *nfsd_version[] = { |
70c3b76c N |
97 | [2] = &nfsd_version2, |
98 | #if defined(CONFIG_NFSD_V3) | |
99 | [3] = &nfsd_version3, | |
100 | #endif | |
101 | #if defined(CONFIG_NFSD_V4) | |
102 | [4] = &nfsd_version4, | |
103 | #endif | |
104 | }; | |
105 | ||
106 | #define NFSD_MINVERS 2 | |
e8c96f8c | 107 | #define NFSD_NRVERS ARRAY_SIZE(nfsd_version) |
e9679189 | 108 | static const struct svc_version *nfsd_versions[NFSD_NRVERS]; |
70c3b76c N |
109 | |
110 | struct svc_program nfsd_program = { | |
3fb803a9 AG |
111 | #if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL) |
112 | .pg_next = &nfsd_acl_program, | |
113 | #endif | |
70c3b76c N |
114 | .pg_prog = NFS_PROGRAM, /* program number */ |
115 | .pg_nvers = NFSD_NRVERS, /* nr of entries in nfsd_version */ | |
116 | .pg_vers = nfsd_versions, /* version table */ | |
117 | .pg_name = "nfsd", /* program name */ | |
118 | .pg_class = "nfsd", /* authentication class */ | |
119 | .pg_stats = &nfsd_svcstats, /* version table */ | |
120 | .pg_authenticate = &svc_set_client, /* export authentication */ | |
121 | ||
122 | }; | |
123 | ||
35f7a14f BF |
124 | static bool nfsd_supported_minorversions[NFSD_SUPPORTED_MINOR_VERSION + 1] = { |
125 | [0] = 1, | |
126 | [1] = 1, | |
c23ae601 | 127 | [2] = 1, |
35f7a14f | 128 | }; |
8daf220a | 129 | |
6658d3a7 N |
130 | int nfsd_vers(int vers, enum vers_op change) |
131 | { | |
132 | if (vers < NFSD_MINVERS || vers >= NFSD_NRVERS) | |
15ddb4ae | 133 | return 0; |
6658d3a7 N |
134 | switch(change) { |
135 | case NFSD_SET: | |
136 | nfsd_versions[vers] = nfsd_version[vers]; | |
6658d3a7 N |
137 | #if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL) |
138 | if (vers < NFSD_ACL_NRVERS) | |
1a8eff6d | 139 | nfsd_acl_versions[vers] = nfsd_acl_version[vers]; |
6658d3a7 | 140 | #endif |
1a8eff6d | 141 | break; |
6658d3a7 N |
142 | case NFSD_CLEAR: |
143 | nfsd_versions[vers] = NULL; | |
144 | #if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL) | |
145 | if (vers < NFSD_ACL_NRVERS) | |
1a8eff6d | 146 | nfsd_acl_versions[vers] = NULL; |
6658d3a7 N |
147 | #endif |
148 | break; | |
149 | case NFSD_TEST: | |
150 | return nfsd_versions[vers] != NULL; | |
151 | case NFSD_AVAIL: | |
152 | return nfsd_version[vers] != NULL; | |
153 | } | |
154 | return 0; | |
155 | } | |
8daf220a | 156 | |
d3635ff0 TM |
157 | static void |
158 | nfsd_adjust_nfsd_versions4(void) | |
159 | { | |
160 | unsigned i; | |
161 | ||
162 | for (i = 0; i <= NFSD_SUPPORTED_MINOR_VERSION; i++) { | |
163 | if (nfsd_supported_minorversions[i]) | |
164 | return; | |
165 | } | |
166 | nfsd_vers(4, NFSD_CLEAR); | |
167 | } | |
168 | ||
8daf220a BH |
169 | int nfsd_minorversion(u32 minorversion, enum vers_op change) |
170 | { | |
928c6fb3 N |
171 | if (minorversion > NFSD_SUPPORTED_MINOR_VERSION && |
172 | change != NFSD_AVAIL) | |
8daf220a BH |
173 | return -1; |
174 | switch(change) { | |
175 | case NFSD_SET: | |
35f7a14f | 176 | nfsd_supported_minorversions[minorversion] = true; |
d3635ff0 | 177 | nfsd_vers(4, NFSD_SET); |
8daf220a BH |
178 | break; |
179 | case NFSD_CLEAR: | |
35f7a14f | 180 | nfsd_supported_minorversions[minorversion] = false; |
d3635ff0 | 181 | nfsd_adjust_nfsd_versions4(); |
8daf220a BH |
182 | break; |
183 | case NFSD_TEST: | |
35f7a14f | 184 | return nfsd_supported_minorversions[minorversion]; |
8daf220a BH |
185 | case NFSD_AVAIL: |
186 | return minorversion <= NFSD_SUPPORTED_MINOR_VERSION; | |
187 | } | |
188 | return 0; | |
189 | } | |
190 | ||
/* Upper limit on the number of nfsd threads. */
#define NFSD_MAXSERVS		8192
195 | ||
9dd9845f | 196 | int nfsd_nrthreads(struct net *net) |
1da177e4 | 197 | { |
c7d106c9 | 198 | int rv = 0; |
9dd9845f SK |
199 | struct nfsd_net *nn = net_generic(net, nfsd_net_id); |
200 | ||
c7d106c9 | 201 | mutex_lock(&nfsd_mutex); |
9dd9845f SK |
202 | if (nn->nfsd_serv) |
203 | rv = nn->nfsd_serv->sv_nrthreads; | |
c7d106c9 NB |
204 | mutex_unlock(&nfsd_mutex); |
205 | return rv; | |
1da177e4 LT |
206 | } |
207 | ||
db6e182c | 208 | static int nfsd_init_socks(struct net *net) |
59db4a0c BF |
209 | { |
210 | int error; | |
9dd9845f SK |
211 | struct nfsd_net *nn = net_generic(net, nfsd_net_id); |
212 | ||
213 | if (!list_empty(&nn->nfsd_serv->sv_permsocks)) | |
59db4a0c BF |
214 | return 0; |
215 | ||
9dd9845f | 216 | error = svc_create_xprt(nn->nfsd_serv, "udp", net, PF_INET, NFS_PORT, |
59db4a0c BF |
217 | SVC_SOCK_DEFAULTS); |
218 | if (error < 0) | |
219 | return error; | |
220 | ||
9dd9845f | 221 | error = svc_create_xprt(nn->nfsd_serv, "tcp", net, PF_INET, NFS_PORT, |
59db4a0c BF |
222 | SVC_SOCK_DEFAULTS); |
223 | if (error < 0) | |
224 | return error; | |
225 | ||
226 | return 0; | |
227 | } | |
228 | ||
/*
 * Number of outstanding nfsd_startup_generic() calls; the global state is
 * set up by the first one and torn down by the last nfsd_shutdown_generic().
 */
static int nfsd_users;
4ad9a344 | 230 | |
bda9cac1 SK |
231 | static int nfsd_startup_generic(int nrservs) |
232 | { | |
233 | int ret; | |
234 | ||
4539f149 | 235 | if (nfsd_users++) |
bda9cac1 SK |
236 | return 0; |
237 | ||
238 | /* | |
239 | * Readahead param cache - will no-op if it already exists. | |
240 | * (Note therefore results will be suboptimal if number of | |
241 | * threads is modified after nfsd start.) | |
242 | */ | |
243 | ret = nfsd_racache_init(2*nrservs); | |
244 | if (ret) | |
d9499a95 KM |
245 | goto dec_users; |
246 | ||
bda9cac1 SK |
247 | ret = nfs4_state_start(); |
248 | if (ret) | |
249 | goto out_racache; | |
250 | return 0; | |
251 | ||
252 | out_racache: | |
253 | nfsd_racache_shutdown(); | |
d9499a95 KM |
254 | dec_users: |
255 | nfsd_users--; | |
bda9cac1 SK |
256 | return ret; |
257 | } | |
258 | ||
259 | static void nfsd_shutdown_generic(void) | |
260 | { | |
4539f149 SK |
261 | if (--nfsd_users) |
262 | return; | |
263 | ||
bda9cac1 SK |
264 | nfs4_state_shutdown(); |
265 | nfsd_racache_shutdown(); | |
266 | } | |
267 | ||
8ef66714 KM |
268 | static bool nfsd_needs_lockd(void) |
269 | { | |
ff88825f | 270 | #if defined(CONFIG_NFSD_V3) |
8ef66714 | 271 | return (nfsd_versions[2] != NULL) || (nfsd_versions[3] != NULL); |
ff88825f KM |
272 | #else |
273 | return (nfsd_versions[2] != NULL); | |
274 | #endif | |
8ef66714 KM |
275 | } |
276 | ||
903d9bf0 | 277 | static int nfsd_startup_net(int nrservs, struct net *net) |
6ff50b3d | 278 | { |
2c2fe290 | 279 | struct nfsd_net *nn = net_generic(net, nfsd_net_id); |
6ff50b3d SK |
280 | int ret; |
281 | ||
2c2fe290 SK |
282 | if (nn->nfsd_net_up) |
283 | return 0; | |
284 | ||
903d9bf0 | 285 | ret = nfsd_startup_generic(nrservs); |
6ff50b3d SK |
286 | if (ret) |
287 | return ret; | |
903d9bf0 SK |
288 | ret = nfsd_init_socks(net); |
289 | if (ret) | |
290 | goto out_socks; | |
8ef66714 KM |
291 | |
292 | if (nfsd_needs_lockd() && !nn->lockd_up) { | |
293 | ret = lockd_up(net); | |
294 | if (ret) | |
295 | goto out_socks; | |
296 | nn->lockd_up = 1; | |
297 | } | |
298 | ||
6ff50b3d SK |
299 | ret = nfs4_state_start_net(net); |
300 | if (ret) | |
301 | goto out_lockd; | |
302 | ||
2c2fe290 | 303 | nn->nfsd_net_up = true; |
6ff50b3d SK |
304 | return 0; |
305 | ||
306 | out_lockd: | |
8ef66714 KM |
307 | if (nn->lockd_up) { |
308 | lockd_down(net); | |
309 | nn->lockd_up = 0; | |
310 | } | |
903d9bf0 | 311 | out_socks: |
bda9cac1 | 312 | nfsd_shutdown_generic(); |
4ad9a344 JL |
313 | return ret; |
314 | } | |
315 | ||
6ff50b3d SK |
316 | static void nfsd_shutdown_net(struct net *net) |
317 | { | |
2c2fe290 SK |
318 | struct nfsd_net *nn = net_generic(net, nfsd_net_id); |
319 | ||
6ff50b3d | 320 | nfs4_state_shutdown_net(net); |
8ef66714 KM |
321 | if (nn->lockd_up) { |
322 | lockd_down(net); | |
323 | nn->lockd_up = 0; | |
324 | } | |
2c2fe290 | 325 | nn->nfsd_net_up = false; |
903d9bf0 | 326 | nfsd_shutdown_generic(); |
6ff50b3d SK |
327 | } |
328 | ||
36684996 SM |
329 | static int nfsd_inetaddr_event(struct notifier_block *this, unsigned long event, |
330 | void *ptr) | |
331 | { | |
332 | struct in_ifaddr *ifa = (struct in_ifaddr *)ptr; | |
333 | struct net_device *dev = ifa->ifa_dev->dev; | |
334 | struct net *net = dev_net(dev); | |
335 | struct nfsd_net *nn = net_generic(net, nfsd_net_id); | |
336 | struct sockaddr_in sin; | |
337 | ||
2317dc55 VA |
338 | if ((event != NETDEV_DOWN) || |
339 | !atomic_inc_not_zero(&nn->ntf_refcnt)) | |
36684996 SM |
340 | goto out; |
341 | ||
342 | if (nn->nfsd_serv) { | |
343 | dprintk("nfsd_inetaddr_event: removed %pI4\n", &ifa->ifa_local); | |
344 | sin.sin_family = AF_INET; | |
345 | sin.sin_addr.s_addr = ifa->ifa_local; | |
346 | svc_age_temp_xprts_now(nn->nfsd_serv, (struct sockaddr *)&sin); | |
347 | } | |
2317dc55 VA |
348 | atomic_dec(&nn->ntf_refcnt); |
349 | wake_up(&nn->ntf_wq); | |
36684996 SM |
350 | |
351 | out: | |
352 | return NOTIFY_DONE; | |
353 | } | |
354 | ||
355 | static struct notifier_block nfsd_inetaddr_notifier = { | |
356 | .notifier_call = nfsd_inetaddr_event, | |
357 | }; | |
358 | ||
359 | #if IS_ENABLED(CONFIG_IPV6) | |
360 | static int nfsd_inet6addr_event(struct notifier_block *this, | |
361 | unsigned long event, void *ptr) | |
362 | { | |
363 | struct inet6_ifaddr *ifa = (struct inet6_ifaddr *)ptr; | |
364 | struct net_device *dev = ifa->idev->dev; | |
365 | struct net *net = dev_net(dev); | |
366 | struct nfsd_net *nn = net_generic(net, nfsd_net_id); | |
367 | struct sockaddr_in6 sin6; | |
368 | ||
2317dc55 VA |
369 | if ((event != NETDEV_DOWN) || |
370 | !atomic_inc_not_zero(&nn->ntf_refcnt)) | |
36684996 SM |
371 | goto out; |
372 | ||
373 | if (nn->nfsd_serv) { | |
374 | dprintk("nfsd_inet6addr_event: removed %pI6\n", &ifa->addr); | |
375 | sin6.sin6_family = AF_INET6; | |
376 | sin6.sin6_addr = ifa->addr; | |
7b19824d SM |
377 | if (ipv6_addr_type(&sin6.sin6_addr) & IPV6_ADDR_LINKLOCAL) |
378 | sin6.sin6_scope_id = ifa->idev->dev->ifindex; | |
36684996 SM |
379 | svc_age_temp_xprts_now(nn->nfsd_serv, (struct sockaddr *)&sin6); |
380 | } | |
2317dc55 VA |
381 | atomic_dec(&nn->ntf_refcnt); |
382 | wake_up(&nn->ntf_wq); | |
36684996 SM |
383 | out: |
384 | return NOTIFY_DONE; | |
385 | } | |
386 | ||
387 | static struct notifier_block nfsd_inet6addr_notifier = { | |
388 | .notifier_call = nfsd_inet6addr_event, | |
389 | }; | |
390 | #endif | |
391 | ||
1eca45f8 VA |
392 | /* Only used under nfsd_mutex, so this atomic may be overkill: */ |
393 | static atomic_t nfsd_notifier_refcount = ATOMIC_INIT(0); | |
394 | ||
541e864f | 395 | static void nfsd_last_thread(struct svc_serv *serv, struct net *net) |
4ad9a344 | 396 | { |
903d9bf0 SK |
397 | struct nfsd_net *nn = net_generic(net, nfsd_net_id); |
398 | ||
2317dc55 | 399 | atomic_dec(&nn->ntf_refcnt); |
1eca45f8 VA |
400 | /* check if the notifier still has clients */ |
401 | if (atomic_dec_return(&nfsd_notifier_refcount) == 0) { | |
402 | unregister_inetaddr_notifier(&nfsd_inetaddr_notifier); | |
36684996 | 403 | #if IS_ENABLED(CONFIG_IPV6) |
1eca45f8 | 404 | unregister_inet6addr_notifier(&nfsd_inet6addr_notifier); |
36684996 | 405 | #endif |
1eca45f8 | 406 | } |
2317dc55 | 407 | wait_event(nn->ntf_wq, atomic_read(&nn->ntf_refcnt) == 0); |
1eca45f8 | 408 | |
4ad9a344 JL |
409 | /* |
410 | * write_ports can create the server without actually starting | |
411 | * any threads--if we get shut down before any threads are | |
412 | * started, then nfsd_last_thread will be run before any of this | |
691412b4 | 413 | * other initialization has been done except the rpcb information. |
4ad9a344 | 414 | */ |
691412b4 | 415 | svc_rpcb_cleanup(serv, net); |
903d9bf0 | 416 | if (!nn->nfsd_net_up) |
4ad9a344 | 417 | return; |
16d05870 | 418 | |
691412b4 | 419 | nfsd_shutdown_net(net); |
e096bbc6 JL |
420 | printk(KERN_WARNING "nfsd: last server has exited, flushing export " |
421 | "cache\n"); | |
b3853e0e | 422 | nfsd_export_flush(net); |
bc591ccf | 423 | } |
6658d3a7 N |
424 | |
425 | void nfsd_reset_versions(void) | |
426 | { | |
6658d3a7 N |
427 | int i; |
428 | ||
800a938f N |
429 | for (i = 0; i < NFSD_NRVERS; i++) |
430 | if (nfsd_vers(i, NFSD_TEST)) | |
431 | return; | |
6658d3a7 | 432 | |
800a938f N |
433 | for (i = 0; i < NFSD_NRVERS; i++) |
434 | if (i != 4) | |
435 | nfsd_vers(i, NFSD_SET); | |
436 | else { | |
437 | int minor = 0; | |
438 | while (nfsd_minorversion(minor, NFSD_SET) >= 0) | |
439 | minor++; | |
440 | } | |
6658d3a7 N |
441 | } |
442 | ||
c3d06f9c AA |
443 | /* |
444 | * Each session guarantees a negotiated per slot memory cache for replies | |
445 | * which in turn consumes memory beyond the v2/v3/v4.0 server. A dedicated | |
446 | * NFSv4.1 server might want to use more memory for a DRC than a machine | |
447 | * with mutiple services. | |
448 | * | |
449 | * Impose a hard limit on the number of pages for the DRC which varies | |
450 | * according to the machines free pages. This is of course only a default. | |
451 | * | |
452 | * For now this is a #defined shift which could be under admin control | |
453 | * in the future. | |
454 | */ | |
455 | static void set_max_drc(void) | |
456 | { | |
44d8660d | 457 | #define NFSD_DRC_SIZE_SHIFT 7 |
0c193054 AA |
458 | nfsd_drc_max_mem = (nr_free_buffer_pages() |
459 | >> NFSD_DRC_SIZE_SHIFT) * PAGE_SIZE; | |
460 | nfsd_drc_mem_used = 0; | |
4bd9b0f4 | 461 | spin_lock_init(&nfsd_drc_lock); |
697ce9be | 462 | dprintk("%s nfsd_drc_max_mem %lu \n", __func__, nfsd_drc_max_mem); |
c3d06f9c | 463 | } |
bedbdd8b | 464 | |
87b0fc7d | 465 | static int nfsd_get_default_max_blksize(void) |
02a375f0 | 466 | { |
87b0fc7d BF |
467 | struct sysinfo i; |
468 | unsigned long long target; | |
469 | unsigned long ret; | |
bedbdd8b | 470 | |
87b0fc7d | 471 | si_meminfo(&i); |
508f9227 | 472 | target = (i.totalram - i.totalhigh) << PAGE_SHIFT; |
87b0fc7d BF |
473 | /* |
474 | * Aim for 1/4096 of memory per thread This gives 1MB on 4Gig | |
475 | * machines, but only uses 32K on 128M machines. Bottom out at | |
476 | * 8K on 32M and smaller. Of course, this is only a default. | |
477 | */ | |
478 | target >>= 12; | |
479 | ||
480 | ret = NFSSVC_MAXBLKSIZE; | |
481 | while (ret > target && ret >= 8*1024*2) | |
482 | ret /= 2; | |
483 | return ret; | |
484 | } | |
485 | ||
afea5657 | 486 | static const struct svc_serv_ops nfsd_thread_sv_ops = { |
b9e13cdf JL |
487 | .svo_shutdown = nfsd_last_thread, |
488 | .svo_function = nfsd, | |
489 | .svo_enqueue_xprt = svc_xprt_do_enqueue, | |
598e2359 | 490 | .svo_setup = svc_set_num_threads, |
b9e13cdf | 491 | .svo_module = THIS_MODULE, |
ea126e74 JL |
492 | }; |
493 | ||
6777436b | 494 | int nfsd_create_serv(struct net *net) |
87b0fc7d | 495 | { |
9793f7c8 | 496 | int error; |
b9c0ef85 | 497 | struct nfsd_net *nn = net_generic(net, nfsd_net_id); |
9793f7c8 | 498 | |
bedbdd8b | 499 | WARN_ON(!mutex_is_locked(&nfsd_mutex)); |
9dd9845f SK |
500 | if (nn->nfsd_serv) { |
501 | svc_get(nn->nfsd_serv); | |
02a375f0 N |
502 | return 0; |
503 | } | |
87b0fc7d BF |
504 | if (nfsd_max_blksize == 0) |
505 | nfsd_max_blksize = nfsd_get_default_max_blksize(); | |
e844a7b9 | 506 | nfsd_reset_versions(); |
9dd9845f | 507 | nn->nfsd_serv = svc_create_pooled(&nfsd_program, nfsd_max_blksize, |
b9e13cdf | 508 | &nfsd_thread_sv_ops); |
9dd9845f | 509 | if (nn->nfsd_serv == NULL) |
628b3687 | 510 | return -ENOMEM; |
bedbdd8b | 511 | |
5b8db00b | 512 | nn->nfsd_serv->sv_maxconn = nn->max_connections; |
9dd9845f | 513 | error = svc_bind(nn->nfsd_serv, net); |
9793f7c8 | 514 | if (error < 0) { |
9dd9845f | 515 | svc_destroy(nn->nfsd_serv); |
9793f7c8 SK |
516 | return error; |
517 | } | |
518 | ||
628b3687 | 519 | set_max_drc(); |
1eca45f8 VA |
520 | /* check if the notifier is already set */ |
521 | if (atomic_inc_return(&nfsd_notifier_refcount) == 1) { | |
522 | register_inetaddr_notifier(&nfsd_inetaddr_notifier); | |
36684996 | 523 | #if IS_ENABLED(CONFIG_IPV6) |
1eca45f8 | 524 | register_inet6addr_notifier(&nfsd_inet6addr_notifier); |
36684996 | 525 | #endif |
1eca45f8 | 526 | } |
2317dc55 | 527 | atomic_inc(&nn->ntf_refcnt); |
256a89fa | 528 | ktime_get_real_ts64(&nn->nfssvc_boot); /* record boot time */ |
87b0fc7d | 529 | return 0; |
02a375f0 N |
530 | } |
531 | ||
9dd9845f | 532 | int nfsd_nrpools(struct net *net) |
eed2965a | 533 | { |
9dd9845f SK |
534 | struct nfsd_net *nn = net_generic(net, nfsd_net_id); |
535 | ||
536 | if (nn->nfsd_serv == NULL) | |
eed2965a GB |
537 | return 0; |
538 | else | |
9dd9845f | 539 | return nn->nfsd_serv->sv_nrpools; |
eed2965a GB |
540 | } |
541 | ||
9dd9845f | 542 | int nfsd_get_nrthreads(int n, int *nthreads, struct net *net) |
eed2965a GB |
543 | { |
544 | int i = 0; | |
9dd9845f | 545 | struct nfsd_net *nn = net_generic(net, nfsd_net_id); |
eed2965a | 546 | |
9dd9845f SK |
547 | if (nn->nfsd_serv != NULL) { |
548 | for (i = 0; i < nn->nfsd_serv->sv_nrpools && i < n; i++) | |
549 | nthreads[i] = nn->nfsd_serv->sv_pools[i].sp_nrthreads; | |
eed2965a GB |
550 | } |
551 | ||
552 | return 0; | |
553 | } | |
554 | ||
9dd9845f SK |
555 | void nfsd_destroy(struct net *net) |
556 | { | |
557 | struct nfsd_net *nn = net_generic(net, nfsd_net_id); | |
558 | int destroy = (nn->nfsd_serv->sv_nrthreads == 1); | |
559 | ||
560 | if (destroy) | |
561 | svc_shutdown_net(nn->nfsd_serv, net); | |
562 | svc_destroy(nn->nfsd_serv); | |
563 | if (destroy) | |
564 | nn->nfsd_serv = NULL; | |
565 | } | |
566 | ||
3938a0d5 | 567 | int nfsd_set_nrthreads(int n, int *nthreads, struct net *net) |
eed2965a GB |
568 | { |
569 | int i = 0; | |
570 | int tot = 0; | |
571 | int err = 0; | |
9dd9845f | 572 | struct nfsd_net *nn = net_generic(net, nfsd_net_id); |
eed2965a | 573 | |
bedbdd8b NB |
574 | WARN_ON(!mutex_is_locked(&nfsd_mutex)); |
575 | ||
9dd9845f | 576 | if (nn->nfsd_serv == NULL || n <= 0) |
eed2965a GB |
577 | return 0; |
578 | ||
9dd9845f SK |
579 | if (n > nn->nfsd_serv->sv_nrpools) |
580 | n = nn->nfsd_serv->sv_nrpools; | |
eed2965a GB |
581 | |
582 | /* enforce a global maximum number of threads */ | |
583 | tot = 0; | |
584 | for (i = 0; i < n; i++) { | |
3c7aa15d | 585 | nthreads[i] = min(nthreads[i], NFSD_MAXSERVS); |
eed2965a GB |
586 | tot += nthreads[i]; |
587 | } | |
588 | if (tot > NFSD_MAXSERVS) { | |
589 | /* total too large: scale down requested numbers */ | |
590 | for (i = 0; i < n && tot > 0; i++) { | |
591 | int new = nthreads[i] * NFSD_MAXSERVS / tot; | |
592 | tot -= (nthreads[i] - new); | |
593 | nthreads[i] = new; | |
594 | } | |
595 | for (i = 0; i < n && tot > 0; i++) { | |
596 | nthreads[i]--; | |
597 | tot--; | |
598 | } | |
599 | } | |
600 | ||
601 | /* | |
602 | * There must always be a thread in pool 0; the admin | |
603 | * can't shut down NFS completely using pool_threads. | |
604 | */ | |
605 | if (nthreads[0] == 0) | |
606 | nthreads[0] = 1; | |
607 | ||
608 | /* apply the new numbers */ | |
9dd9845f | 609 | svc_get(nn->nfsd_serv); |
eed2965a | 610 | for (i = 0; i < n; i++) { |
598e2359 JL |
611 | err = nn->nfsd_serv->sv_ops->svo_setup(nn->nfsd_serv, |
612 | &nn->nfsd_serv->sv_pools[i], nthreads[i]); | |
eed2965a GB |
613 | if (err) |
614 | break; | |
615 | } | |
19f7e2ca | 616 | nfsd_destroy(net); |
eed2965a GB |
617 | return err; |
618 | } | |
619 | ||
ac77efbe JL |
620 | /* |
621 | * Adjust the number of threads and return the new number of threads. | |
622 | * This is also the function that starts the server if necessary, if | |
623 | * this is the first time nrservs is nonzero. | |
624 | */ | |
1da177e4 | 625 | int |
d41a9417 | 626 | nfsd_svc(int nrservs, struct net *net) |
1da177e4 LT |
627 | { |
628 | int error; | |
774f8bbd | 629 | bool nfsd_up_before; |
9dd9845f | 630 | struct nfsd_net *nn = net_generic(net, nfsd_net_id); |
bedbdd8b NB |
631 | |
632 | mutex_lock(&nfsd_mutex); | |
6658d3a7 | 633 | dprintk("nfsd: creating service\n"); |
3c7aa15d KM |
634 | |
635 | nrservs = max(nrservs, 0); | |
636 | nrservs = min(nrservs, NFSD_MAXSERVS); | |
671e1fcf | 637 | error = 0; |
3c7aa15d | 638 | |
9dd9845f | 639 | if (nrservs == 0 && nn->nfsd_serv == NULL) |
671e1fcf N |
640 | goto out; |
641 | ||
6777436b | 642 | error = nfsd_create_serv(net); |
02a375f0 | 643 | if (error) |
774f8bbd BF |
644 | goto out; |
645 | ||
903d9bf0 | 646 | nfsd_up_before = nn->nfsd_net_up; |
774f8bbd | 647 | |
903d9bf0 | 648 | error = nfsd_startup_net(nrservs, net); |
af4718f3 BF |
649 | if (error) |
650 | goto out_destroy; | |
598e2359 JL |
651 | error = nn->nfsd_serv->sv_ops->svo_setup(nn->nfsd_serv, |
652 | NULL, nrservs); | |
774f8bbd BF |
653 | if (error) |
654 | goto out_shutdown; | |
9dd9845f | 655 | /* We are holding a reference to nn->nfsd_serv which |
af4718f3 BF |
656 | * we don't want to count in the return value, |
657 | * so subtract 1 | |
658 | */ | |
9dd9845f | 659 | error = nn->nfsd_serv->sv_nrthreads - 1; |
4ad9a344 | 660 | out_shutdown: |
774f8bbd | 661 | if (error < 0 && !nfsd_up_before) |
541e864f | 662 | nfsd_shutdown_net(net); |
774f8bbd | 663 | out_destroy: |
19f7e2ca | 664 | nfsd_destroy(net); /* Release server */ |
4ad9a344 | 665 | out: |
bedbdd8b | 666 | mutex_unlock(&nfsd_mutex); |
1da177e4 LT |
667 | return error; |
668 | } | |
669 | ||
1da177e4 LT |
670 | |
671 | /* | |
672 | * This is the NFS server kernel thread | |
673 | */ | |
9867d76c JL |
674 | static int |
675 | nfsd(void *vrqstp) | |
1da177e4 | 676 | { |
9867d76c | 677 | struct svc_rqst *rqstp = (struct svc_rqst *) vrqstp; |
88c47666 SK |
678 | struct svc_xprt *perm_sock = list_entry(rqstp->rq_server->sv_permsocks.next, typeof(struct svc_xprt), xpt_list); |
679 | struct net *net = perm_sock->xpt_net; | |
5b8db00b | 680 | struct nfsd_net *nn = net_generic(net, nfsd_net_id); |
5b444cc9 | 681 | int err; |
1da177e4 LT |
682 | |
683 | /* Lock module and set up kernel thread */ | |
bedbdd8b | 684 | mutex_lock(&nfsd_mutex); |
1da177e4 | 685 | |
9867d76c | 686 | /* At this point, the thread shares current->fs |
47057abd AG |
687 | * with the init process. We need to create files with the |
688 | * umask as defined by the client instead of init's umask. */ | |
3e93cd67 | 689 | if (unshare_fs_struct() < 0) { |
1da177e4 LT |
690 | printk("Unable to start nfsd thread: out of memory\n"); |
691 | goto out; | |
692 | } | |
3e93cd67 | 693 | |
1da177e4 LT |
694 | current->fs->umask = 0; |
695 | ||
9867d76c JL |
696 | /* |
697 | * thread is spawned with all signals set to SIG_IGN, re-enable | |
100766f8 | 698 | * the ones that will bring down the thread |
9867d76c | 699 | */ |
100766f8 JL |
700 | allow_signal(SIGKILL); |
701 | allow_signal(SIGHUP); | |
702 | allow_signal(SIGINT); | |
703 | allow_signal(SIGQUIT); | |
bedbdd8b | 704 | |
1da177e4 | 705 | nfsdstats.th_cnt++; |
bedbdd8b NB |
706 | mutex_unlock(&nfsd_mutex); |
707 | ||
83144186 | 708 | set_freezable(); |
1da177e4 LT |
709 | |
710 | /* | |
711 | * The main request loop | |
712 | */ | |
713 | for (;;) { | |
5b8db00b JL |
714 | /* Update sv_maxconn if it has changed */ |
715 | rqstp->rq_server->sv_maxconn = nn->max_connections; | |
716 | ||
1da177e4 LT |
717 | /* |
718 | * Find a socket with data available and call its | |
719 | * recvfrom routine. | |
720 | */ | |
6fb2b47f | 721 | while ((err = svc_recv(rqstp, 60*60*HZ)) == -EAGAIN) |
1da177e4 | 722 | ; |
9867d76c | 723 | if (err == -EINTR) |
1da177e4 | 724 | break; |
e0e81739 | 725 | validate_process_creds(); |
6fb2b47f | 726 | svc_process(rqstp); |
e0e81739 | 727 | validate_process_creds(); |
1da177e4 LT |
728 | } |
729 | ||
24e36663 | 730 | /* Clear signals before calling svc_exit_thread() */ |
9e416052 | 731 | flush_signals(current); |
1da177e4 | 732 | |
bedbdd8b | 733 | mutex_lock(&nfsd_mutex); |
1da177e4 LT |
734 | nfsdstats.th_cnt --; |
735 | ||
736 | out: | |
57c8b13e | 737 | rqstp->rq_server = NULL; |
786185b5 | 738 | |
1da177e4 LT |
739 | /* Release the thread */ |
740 | svc_exit_thread(rqstp); | |
741 | ||
88c47666 | 742 | nfsd_destroy(net); |
57c8b13e | 743 | |
1da177e4 | 744 | /* Release module */ |
bedbdd8b | 745 | mutex_unlock(&nfsd_mutex); |
1da177e4 | 746 | module_put_and_exit(0); |
9867d76c | 747 | return 0; |
1da177e4 LT |
748 | } |
749 | ||
32c1eb0c AA |
750 | static __be32 map_new_errors(u32 vers, __be32 nfserr) |
751 | { | |
752 | if (nfserr == nfserr_jukebox && vers == 2) | |
753 | return nfserr_dropit; | |
754 | if (nfserr == nfserr_wrongsec && vers < 4) | |
755 | return nfserr_acces; | |
756 | return nfserr; | |
757 | } | |
758 | ||
e6838a29 BF |
759 | /* |
760 | * A write procedure can have a large argument, and a read procedure can | |
761 | * have a large reply, but no NFSv2 or NFSv3 procedure has argument and | |
762 | * reply that can both be larger than a page. The xdr code has taken | |
763 | * advantage of this assumption to be a sloppy about bounds checking in | |
764 | * some cases. Pending a rewrite of the NFSv2/v3 xdr code to fix that | |
765 | * problem, we enforce these assumptions here: | |
766 | */ | |
767 | static bool nfs_request_too_big(struct svc_rqst *rqstp, | |
860bda29 | 768 | const struct svc_procedure *proc) |
e6838a29 BF |
769 | { |
770 | /* | |
771 | * The ACL code has more careful bounds-checking and is not | |
772 | * susceptible to this problem: | |
773 | */ | |
774 | if (rqstp->rq_prog != NFS_PROGRAM) | |
775 | return false; | |
776 | /* | |
777 | * Ditto NFSv4 (which can in theory have argument and reply both | |
778 | * more than a page): | |
779 | */ | |
780 | if (rqstp->rq_vers >= 4) | |
781 | return false; | |
782 | /* The reply will be small, we're OK: */ | |
783 | if (proc->pc_xdrressize > 0 && | |
784 | proc->pc_xdrressize < XDR_QUADLEN(PAGE_SIZE)) | |
785 | return false; | |
786 | ||
787 | return rqstp->rq_arg.len > PAGE_SIZE; | |
788 | } | |
789 | ||
1da177e4 | 790 | int |
c7afef1f | 791 | nfsd_dispatch(struct svc_rqst *rqstp, __be32 *statp) |
1da177e4 | 792 | { |
860bda29 | 793 | const struct svc_procedure *proc; |
ad451d38 AV |
794 | __be32 nfserr; |
795 | __be32 *nfserrp; | |
1da177e4 LT |
796 | |
797 | dprintk("nfsd_dispatch: vers %d proc %d\n", | |
798 | rqstp->rq_vers, rqstp->rq_proc); | |
799 | proc = rqstp->rq_procinfo; | |
800 | ||
e6838a29 BF |
801 | if (nfs_request_too_big(rqstp, proc)) { |
802 | dprintk("nfsd: NFSv%d argument too large\n", rqstp->rq_vers); | |
803 | *statp = rpc_garbage_args; | |
804 | return 1; | |
805 | } | |
1091006c BF |
806 | /* |
807 | * Give the xdr decoder a chance to change this if it wants | |
808 | * (necessary in the NFSv4.0 compound case) | |
809 | */ | |
810 | rqstp->rq_cachetype = proc->pc_cachetype; | |
811 | /* Decode arguments */ | |
026fec7e CH |
812 | if (proc->pc_decode && |
813 | !proc->pc_decode(rqstp, (__be32*)rqstp->rq_arg.head[0].iov_base)) { | |
1091006c BF |
814 | dprintk("nfsd: failed to decode arguments!\n"); |
815 | *statp = rpc_garbage_args; | |
816 | return 1; | |
817 | } | |
818 | ||
1da177e4 | 819 | /* Check whether we have this call in the cache. */ |
1091006c | 820 | switch (nfsd_cache_lookup(rqstp)) { |
1da177e4 LT |
821 | case RC_DROPIT: |
822 | return 0; | |
823 | case RC_REPLY: | |
824 | return 1; | |
825 | case RC_DOIT:; | |
826 | /* do it */ | |
827 | } | |
828 | ||
1da177e4 LT |
829 | /* need to grab the location to store the status, as |
830 | * nfsv4 does some encoding while processing | |
831 | */ | |
832 | nfserrp = rqstp->rq_res.head[0].iov_base | |
833 | + rqstp->rq_res.head[0].iov_len; | |
ad451d38 | 834 | rqstp->rq_res.head[0].iov_len += sizeof(__be32); |
1da177e4 LT |
835 | |
836 | /* Now call the procedure handler, and encode NFS status. */ | |
a6beb732 | 837 | nfserr = proc->pc_func(rqstp); |
32c1eb0c | 838 | nfserr = map_new_errors(rqstp->rq_vers, nfserr); |
78b65eb3 | 839 | if (nfserr == nfserr_dropit || test_bit(RQ_DROPME, &rqstp->rq_flags)) { |
45457e09 | 840 | dprintk("nfsd: Dropping request; may be revisited later\n"); |
1da177e4 LT |
841 | nfsd_cache_update(rqstp, RC_NOCACHE, NULL); |
842 | return 0; | |
843 | } | |
844 | ||
845 | if (rqstp->rq_proc != 0) | |
846 | *nfserrp++ = nfserr; | |
847 | ||
848 | /* Encode result. | |
849 | * For NFSv2, additional info is never returned in case of an error. | |
850 | */ | |
851 | if (!(nfserr && rqstp->rq_vers == 2)) { | |
63f8de37 | 852 | if (proc->pc_encode && !proc->pc_encode(rqstp, nfserrp)) { |
1da177e4 LT |
853 | /* Failed to encode result. Release cache entry */ |
854 | dprintk("nfsd: failed to encode result!\n"); | |
855 | nfsd_cache_update(rqstp, RC_NOCACHE, NULL); | |
856 | *statp = rpc_system_err; | |
857 | return 1; | |
858 | } | |
859 | } | |
860 | ||
861 | /* Store reply in cache. */ | |
57d276d7 | 862 | nfsd_cache_update(rqstp, rqstp->rq_cachetype, statp + 1); |
1da177e4 LT |
863 | return 1; |
864 | } | |
03cf6c9f GB |
865 | |
866 | int nfsd_pool_stats_open(struct inode *inode, struct file *file) | |
867 | { | |
ed2d8aed | 868 | int ret; |
11f77942 | 869 | struct nfsd_net *nn = net_generic(inode->i_sb->s_fs_info, nfsd_net_id); |
9dd9845f | 870 | |
ed2d8aed | 871 | mutex_lock(&nfsd_mutex); |
9dd9845f | 872 | if (nn->nfsd_serv == NULL) { |
ed2d8aed | 873 | mutex_unlock(&nfsd_mutex); |
03cf6c9f | 874 | return -ENODEV; |
ed2d8aed RY |
875 | } |
876 | /* bump up the psudo refcount while traversing */ | |
9dd9845f SK |
877 | svc_get(nn->nfsd_serv); |
878 | ret = svc_pool_stats_open(nn->nfsd_serv, file); | |
ed2d8aed RY |
879 | mutex_unlock(&nfsd_mutex); |
880 | return ret; | |
881 | } | |
882 | ||
883 | int nfsd_pool_stats_release(struct inode *inode, struct file *file) | |
884 | { | |
885 | int ret = seq_release(inode, file); | |
11f77942 | 886 | struct net *net = inode->i_sb->s_fs_info; |
786185b5 | 887 | |
ed2d8aed RY |
888 | mutex_lock(&nfsd_mutex); |
889 | /* this function really, really should have been called svc_put() */ | |
19f7e2ca | 890 | nfsd_destroy(net); |
ed2d8aed RY |
891 | mutex_unlock(&nfsd_mutex); |
892 | return ret; | |
03cf6c9f | 893 | } |