Loading...
1/*
2 * Syscall interface to knfsd.
3 *
4 * Copyright (C) 1995, 1996 Olaf Kirch <okir@monad.swb.de>
5 */
6
7#include <linux/slab.h>
8#include <linux/namei.h>
9#include <linux/ctype.h>
10
11#include <linux/sunrpc/svcsock.h>
12#include <linux/lockd/lockd.h>
13#include <linux/sunrpc/clnt.h>
14#include <linux/sunrpc/gss_api.h>
15#include <linux/sunrpc/gss_krb5_enctypes.h>
16#include <linux/sunrpc/rpc_pipe_fs.h>
17#include <linux/module.h>
18
19#include "idmap.h"
20#include "nfsd.h"
21#include "cache.h"
22#include "fault_inject.h"
23#include "netns.h"
24
25/*
26 * We have a single directory with several nodes in it.
27 */
enum {
	NFSD_Root = 1,			/* numbering starts at 1 */
	NFSD_List,			/* "exports" */
	NFSD_Export_features,		/* "export_features" */
	NFSD_Fh,			/* "filehandle" */
	NFSD_FO_UnlockIP,		/* "unlock_ip" */
	NFSD_FO_UnlockFS,		/* "unlock_filesystem" */
	NFSD_Threads,			/* "threads" */
	NFSD_Pool_Threads,		/* "pool_threads" */
	NFSD_Pool_Stats,		/* "pool_stats" */
	NFSD_Versions,			/* "versions" */
	NFSD_Ports,			/* "portlist" */
	NFSD_MaxBlkSize,		/* "max_block_size" */
	NFSD_SupportedEnctypes,		/* "supported_krb5_enctypes" */
	/*
	 * The NFSv4-only nodes MUST stay at the very end.  Otherwise a
	 * hole is left in nfsd_files[] with !CONFIG_NFSD_V4 and
	 * simple_fill_super() goes oops.
	 */
#ifdef CONFIG_NFSD_V4
	NFSD_Leasetime,			/* "nfsv4leasetime" */
	NFSD_Gracetime,			/* "nfsv4gracetime" */
	NFSD_RecoveryDir,		/* "nfsv4recoverydir" */
#endif
};
52
53/*
54 * write() for these nodes.
55 */
56static ssize_t write_filehandle(struct file *file, char *buf, size_t size);
57static ssize_t write_unlock_ip(struct file *file, char *buf, size_t size);
58static ssize_t write_unlock_fs(struct file *file, char *buf, size_t size);
59static ssize_t write_threads(struct file *file, char *buf, size_t size);
60static ssize_t write_pool_threads(struct file *file, char *buf, size_t size);
61static ssize_t write_versions(struct file *file, char *buf, size_t size);
62static ssize_t write_ports(struct file *file, char *buf, size_t size);
63static ssize_t write_maxblksize(struct file *file, char *buf, size_t size);
64#ifdef CONFIG_NFSD_V4
65static ssize_t write_leasetime(struct file *file, char *buf, size_t size);
66static ssize_t write_gracetime(struct file *file, char *buf, size_t size);
67static ssize_t write_recoverydir(struct file *file, char *buf, size_t size);
68#endif
69
70static ssize_t (*write_op[])(struct file *, char *, size_t) = {
71 [NFSD_Fh] = write_filehandle,
72 [NFSD_FO_UnlockIP] = write_unlock_ip,
73 [NFSD_FO_UnlockFS] = write_unlock_fs,
74 [NFSD_Threads] = write_threads,
75 [NFSD_Pool_Threads] = write_pool_threads,
76 [NFSD_Versions] = write_versions,
77 [NFSD_Ports] = write_ports,
78 [NFSD_MaxBlkSize] = write_maxblksize,
79#ifdef CONFIG_NFSD_V4
80 [NFSD_Leasetime] = write_leasetime,
81 [NFSD_Gracetime] = write_gracetime,
82 [NFSD_RecoveryDir] = write_recoverydir,
83#endif
84};
85
86static ssize_t nfsctl_transaction_write(struct file *file, const char __user *buf, size_t size, loff_t *pos)
87{
88 ino_t ino = file->f_path.dentry->d_inode->i_ino;
89 char *data;
90 ssize_t rv;
91
92 if (ino >= ARRAY_SIZE(write_op) || !write_op[ino])
93 return -EINVAL;
94
95 data = simple_transaction_get(file, buf, size);
96 if (IS_ERR(data))
97 return PTR_ERR(data);
98
99 rv = write_op[ino](file, data, size);
100 if (rv >= 0) {
101 simple_transaction_set(file, rv);
102 rv = size;
103 }
104 return rv;
105}
106
107static ssize_t nfsctl_transaction_read(struct file *file, char __user *buf, size_t size, loff_t *pos)
108{
109 if (! file->private_data) {
110 /* An attempt to read a transaction file without writing
111 * causes a 0-byte write so that the file can return
112 * state information
113 */
114 ssize_t rv = nfsctl_transaction_write(file, buf, 0, pos);
115 if (rv < 0)
116 return rv;
117 }
118 return simple_transaction_read(file, buf, size, pos);
119}
120
121static const struct file_operations transaction_ops = {
122 .write = nfsctl_transaction_write,
123 .read = nfsctl_transaction_read,
124 .release = simple_transaction_release,
125 .llseek = default_llseek,
126};
127
128static int exports_open(struct inode *inode, struct file *file)
129{
130 int err;
131 struct seq_file *seq;
132 struct nfsd_net *nn = net_generic(&init_net, nfsd_net_id);
133
134 err = seq_open(file, &nfs_exports_op);
135 if (err)
136 return err;
137
138 seq = file->private_data;
139 seq->private = nn->svc_export_cache;
140 return 0;
141}
142
143static const struct file_operations exports_operations = {
144 .open = exports_open,
145 .read = seq_read,
146 .llseek = seq_lseek,
147 .release = seq_release,
148 .owner = THIS_MODULE,
149};
150
151static int export_features_show(struct seq_file *m, void *v)
152{
153 seq_printf(m, "0x%x 0x%x\n", NFSEXP_ALLFLAGS, NFSEXP_SECINFO_FLAGS);
154 return 0;
155}
156
157static int export_features_open(struct inode *inode, struct file *file)
158{
159 return single_open(file, export_features_show, NULL);
160}
161
162static struct file_operations export_features_operations = {
163 .open = export_features_open,
164 .read = seq_read,
165 .llseek = seq_lseek,
166 .release = single_release,
167};
168
169#if defined(CONFIG_SUNRPC_GSS) || defined(CONFIG_SUNRPC_GSS_MODULE)
170static int supported_enctypes_show(struct seq_file *m, void *v)
171{
172 seq_printf(m, KRB5_SUPPORTED_ENCTYPES);
173 return 0;
174}
175
176static int supported_enctypes_open(struct inode *inode, struct file *file)
177{
178 return single_open(file, supported_enctypes_show, NULL);
179}
180
181static struct file_operations supported_enctypes_ops = {
182 .open = supported_enctypes_open,
183 .read = seq_read,
184 .llseek = seq_lseek,
185 .release = single_release,
186};
187#endif /* CONFIG_SUNRPC_GSS or CONFIG_SUNRPC_GSS_MODULE */
188
189extern int nfsd_pool_stats_open(struct inode *inode, struct file *file);
190extern int nfsd_pool_stats_release(struct inode *inode, struct file *file);
191
192static const struct file_operations pool_stats_operations = {
193 .open = nfsd_pool_stats_open,
194 .read = seq_read,
195 .llseek = seq_lseek,
196 .release = nfsd_pool_stats_release,
197 .owner = THIS_MODULE,
198};
199
200/*----------------------------------------------------------------------------*/
201/*
202 * payload - write methods
203 */
204
205
206/**
207 * write_unlock_ip - Release all locks used by a client
208 *
209 * Experimental.
210 *
211 * Input:
212 * buf: '\n'-terminated C string containing a
213 * presentation format IP address
214 * size: length of C string in @buf
215 * Output:
216 * On success: returns zero if all specified locks were released;
217 * returns one if one or more locks were not released
218 * On error: return code is negative errno value
219 */
220static ssize_t write_unlock_ip(struct file *file, char *buf, size_t size)
221{
222 struct sockaddr_storage address;
223 struct sockaddr *sap = (struct sockaddr *)&address;
224 size_t salen = sizeof(address);
225 char *fo_path;
226
227 /* sanity check */
228 if (size == 0)
229 return -EINVAL;
230
231 if (buf[size-1] != '\n')
232 return -EINVAL;
233
234 fo_path = buf;
235 if (qword_get(&buf, fo_path, size) < 0)
236 return -EINVAL;
237
238 if (rpc_pton(&init_net, fo_path, size, sap, salen) == 0)
239 return -EINVAL;
240
241 return nlmsvc_unlock_all_by_ip(sap);
242}
243
244/**
245 * write_unlock_fs - Release all locks on a local file system
246 *
247 * Experimental.
248 *
249 * Input:
250 * buf: '\n'-terminated C string containing the
251 * absolute pathname of a local file system
252 * size: length of C string in @buf
253 * Output:
254 * On success: returns zero if all specified locks were released;
255 * returns one if one or more locks were not released
256 * On error: return code is negative errno value
257 */
258static ssize_t write_unlock_fs(struct file *file, char *buf, size_t size)
259{
260 struct path path;
261 char *fo_path;
262 int error;
263
264 /* sanity check */
265 if (size == 0)
266 return -EINVAL;
267
268 if (buf[size-1] != '\n')
269 return -EINVAL;
270
271 fo_path = buf;
272 if (qword_get(&buf, fo_path, size) < 0)
273 return -EINVAL;
274
275 error = kern_path(fo_path, 0, &path);
276 if (error)
277 return error;
278
279 /*
280 * XXX: Needs better sanity checking. Otherwise we could end up
281 * releasing locks on the wrong file system.
282 *
283 * For example:
284 * 1. Does the path refer to a directory?
285 * 2. Is that directory a mount point, or
286 * 3. Is that directory the root of an exported file system?
287 */
288 error = nlmsvc_unlock_all_by_sb(path.dentry->d_sb);
289
290 path_put(&path);
291 return error;
292}
293
294/**
295 * write_filehandle - Get a variable-length NFS file handle by path
296 *
297 * On input, the buffer contains a '\n'-terminated C string comprised of
298 * three alphanumeric words separated by whitespace. The string may
299 * contain escape sequences.
300 *
301 * Input:
302 * buf:
303 * domain: client domain name
304 * path: export pathname
305 * maxsize: numeric maximum size of
306 * @buf
307 * size: length of C string in @buf
308 * Output:
309 * On success: passed-in buffer filled with '\n'-terminated C
310 * string containing a ASCII hex text version
311 * of the NFS file handle;
312 * return code is the size in bytes of the string
313 * On error: return code is negative errno value
314 */
315static ssize_t write_filehandle(struct file *file, char *buf, size_t size)
316{
317 char *dname, *path;
318 int uninitialized_var(maxsize);
319 char *mesg = buf;
320 int len;
321 struct auth_domain *dom;
322 struct knfsd_fh fh;
323
324 if (size == 0)
325 return -EINVAL;
326
327 if (buf[size-1] != '\n')
328 return -EINVAL;
329 buf[size-1] = 0;
330
331 dname = mesg;
332 len = qword_get(&mesg, dname, size);
333 if (len <= 0)
334 return -EINVAL;
335
336 path = dname+len+1;
337 len = qword_get(&mesg, path, size);
338 if (len <= 0)
339 return -EINVAL;
340
341 len = get_int(&mesg, &maxsize);
342 if (len)
343 return len;
344
345 if (maxsize < NFS_FHSIZE)
346 return -EINVAL;
347 if (maxsize > NFS3_FHSIZE)
348 maxsize = NFS3_FHSIZE;
349
350 if (qword_get(&mesg, mesg, size)>0)
351 return -EINVAL;
352
353 /* we have all the words, they are in buf.. */
354 dom = unix_domain_find(dname);
355 if (!dom)
356 return -ENOMEM;
357
358 len = exp_rootfh(&init_net, dom, path, &fh, maxsize);
359 auth_domain_put(dom);
360 if (len)
361 return len;
362
363 mesg = buf;
364 len = SIMPLE_TRANSACTION_LIMIT;
365 qword_addhex(&mesg, &len, (char*)&fh.fh_base, fh.fh_size);
366 mesg[-1] = '\n';
367 return mesg - buf;
368}
369
370/**
371 * write_threads - Start NFSD, or report the current number of running threads
372 *
373 * Input:
374 * buf: ignored
375 * size: zero
376 * Output:
377 * On success: passed-in buffer filled with '\n'-terminated C
378 * string numeric value representing the number of
379 * running NFSD threads;
380 * return code is the size in bytes of the string
381 * On error: return code is zero
382 *
383 * OR
384 *
385 * Input:
386 * buf: C string containing an unsigned
387 * integer value representing the
388 * number of NFSD threads to start
389 * size: non-zero length of C string in @buf
390 * Output:
391 * On success: NFS service is started;
392 * passed-in buffer filled with '\n'-terminated C
393 * string numeric value representing the number of
394 * running NFSD threads;
395 * return code is the size in bytes of the string
396 * On error: return code is zero or a negative errno value
397 */
398static ssize_t write_threads(struct file *file, char *buf, size_t size)
399{
400 char *mesg = buf;
401 int rv;
402 if (size > 0) {
403 int newthreads;
404 rv = get_int(&mesg, &newthreads);
405 if (rv)
406 return rv;
407 if (newthreads < 0)
408 return -EINVAL;
409 rv = nfsd_svc(NFS_PORT, newthreads);
410 if (rv < 0)
411 return rv;
412 } else
413 rv = nfsd_nrthreads();
414
415 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%d\n", rv);
416}
417
418/**
419 * write_pool_threads - Set or report the current number of threads per pool
420 *
421 * Input:
422 * buf: ignored
423 * size: zero
424 *
425 * OR
426 *
427 * Input:
428 * buf: C string containing whitespace-
429 * separated unsigned integer values
430 * representing the number of NFSD
431 * threads to start in each pool
432 * size: non-zero length of C string in @buf
433 * Output:
434 * On success: passed-in buffer filled with '\n'-terminated C
435 * string containing integer values representing the
436 * number of NFSD threads in each pool;
437 * return code is the size in bytes of the string
438 * On error: return code is zero or a negative errno value
439 */
440static ssize_t write_pool_threads(struct file *file, char *buf, size_t size)
441{
442 /* if size > 0, look for an array of number of threads per node
443 * and apply them then write out number of threads per node as reply
444 */
445 char *mesg = buf;
446 int i;
447 int rv;
448 int len;
449 int npools;
450 int *nthreads;
451
452 mutex_lock(&nfsd_mutex);
453 npools = nfsd_nrpools();
454 if (npools == 0) {
455 /*
456 * NFS is shut down. The admin can start it by
457 * writing to the threads file but NOT the pool_threads
458 * file, sorry. Report zero threads.
459 */
460 mutex_unlock(&nfsd_mutex);
461 strcpy(buf, "0\n");
462 return strlen(buf);
463 }
464
465 nthreads = kcalloc(npools, sizeof(int), GFP_KERNEL);
466 rv = -ENOMEM;
467 if (nthreads == NULL)
468 goto out_free;
469
470 if (size > 0) {
471 for (i = 0; i < npools; i++) {
472 rv = get_int(&mesg, &nthreads[i]);
473 if (rv == -ENOENT)
474 break; /* fewer numbers than pools */
475 if (rv)
476 goto out_free; /* syntax error */
477 rv = -EINVAL;
478 if (nthreads[i] < 0)
479 goto out_free;
480 }
481 rv = nfsd_set_nrthreads(i, nthreads);
482 if (rv)
483 goto out_free;
484 }
485
486 rv = nfsd_get_nrthreads(npools, nthreads);
487 if (rv)
488 goto out_free;
489
490 mesg = buf;
491 size = SIMPLE_TRANSACTION_LIMIT;
492 for (i = 0; i < npools && size > 0; i++) {
493 snprintf(mesg, size, "%d%c", nthreads[i], (i == npools-1 ? '\n' : ' '));
494 len = strlen(mesg);
495 size -= len;
496 mesg += len;
497 }
498 rv = mesg - buf;
499out_free:
500 kfree(nthreads);
501 mutex_unlock(&nfsd_mutex);
502 return rv;
503}
504
505static ssize_t __write_versions(struct file *file, char *buf, size_t size)
506{
507 char *mesg = buf;
508 char *vers, *minorp, sign;
509 int len, num, remaining;
510 unsigned minor;
511 ssize_t tlen = 0;
512 char *sep;
513
514 if (size>0) {
515 if (nfsd_serv)
516 /* Cannot change versions without updating
517 * nfsd_serv->sv_xdrsize, and reallocing
518 * rq_argp and rq_resp
519 */
520 return -EBUSY;
521 if (buf[size-1] != '\n')
522 return -EINVAL;
523 buf[size-1] = 0;
524
525 vers = mesg;
526 len = qword_get(&mesg, vers, size);
527 if (len <= 0) return -EINVAL;
528 do {
529 sign = *vers;
530 if (sign == '+' || sign == '-')
531 num = simple_strtol((vers+1), &minorp, 0);
532 else
533 num = simple_strtol(vers, &minorp, 0);
534 if (*minorp == '.') {
535 if (num < 4)
536 return -EINVAL;
537 minor = simple_strtoul(minorp+1, NULL, 0);
538 if (minor == 0)
539 return -EINVAL;
540 if (nfsd_minorversion(minor, sign == '-' ?
541 NFSD_CLEAR : NFSD_SET) < 0)
542 return -EINVAL;
543 goto next;
544 }
545 switch(num) {
546 case 2:
547 case 3:
548 case 4:
549 nfsd_vers(num, sign == '-' ? NFSD_CLEAR : NFSD_SET);
550 break;
551 default:
552 return -EINVAL;
553 }
554 next:
555 vers += len + 1;
556 } while ((len = qword_get(&mesg, vers, size)) > 0);
557 /* If all get turned off, turn them back on, as
558 * having no versions is BAD
559 */
560 nfsd_reset_versions();
561 }
562
563 /* Now write current state into reply buffer */
564 len = 0;
565 sep = "";
566 remaining = SIMPLE_TRANSACTION_LIMIT;
567 for (num=2 ; num <= 4 ; num++)
568 if (nfsd_vers(num, NFSD_AVAIL)) {
569 len = snprintf(buf, remaining, "%s%c%d", sep,
570 nfsd_vers(num, NFSD_TEST)?'+':'-',
571 num);
572 sep = " ";
573
574 if (len > remaining)
575 break;
576 remaining -= len;
577 buf += len;
578 tlen += len;
579 }
580 if (nfsd_vers(4, NFSD_AVAIL))
581 for (minor = 1; minor <= NFSD_SUPPORTED_MINOR_VERSION;
582 minor++) {
583 len = snprintf(buf, remaining, " %c4.%u",
584 (nfsd_vers(4, NFSD_TEST) &&
585 nfsd_minorversion(minor, NFSD_TEST)) ?
586 '+' : '-',
587 minor);
588
589 if (len > remaining)
590 break;
591 remaining -= len;
592 buf += len;
593 tlen += len;
594 }
595
596 len = snprintf(buf, remaining, "\n");
597 if (len > remaining)
598 return -EINVAL;
599 return tlen + len;
600}
601
602/**
603 * write_versions - Set or report the available NFS protocol versions
604 *
605 * Input:
606 * buf: ignored
607 * size: zero
608 * Output:
609 * On success: passed-in buffer filled with '\n'-terminated C
610 * string containing positive or negative integer
611 * values representing the current status of each
612 * protocol version;
613 * return code is the size in bytes of the string
614 * On error: return code is zero or a negative errno value
615 *
616 * OR
617 *
618 * Input:
619 * buf: C string containing whitespace-
620 * separated positive or negative
621 * integer values representing NFS
622 * protocol versions to enable ("+n")
623 * or disable ("-n")
624 * size: non-zero length of C string in @buf
625 * Output:
626 * On success: status of zero or more protocol versions has
627 * been updated; passed-in buffer filled with
628 * '\n'-terminated C string containing positive
629 * or negative integer values representing the
630 * current status of each protocol version;
631 * return code is the size in bytes of the string
632 * On error: return code is zero or a negative errno value
633 */
634static ssize_t write_versions(struct file *file, char *buf, size_t size)
635{
636 ssize_t rv;
637
638 mutex_lock(&nfsd_mutex);
639 rv = __write_versions(file, buf, size);
640 mutex_unlock(&nfsd_mutex);
641 return rv;
642}
643
644/*
645 * Zero-length write. Return a list of NFSD's current listener
646 * transports.
647 */
648static ssize_t __write_ports_names(char *buf)
649{
650 if (nfsd_serv == NULL)
651 return 0;
652 return svc_xprt_names(nfsd_serv, buf, SIMPLE_TRANSACTION_LIMIT);
653}
654
655/*
656 * A single 'fd' number was written, in which case it must be for
657 * a socket of a supported family/protocol, and we use it as an
658 * nfsd listener.
659 */
660static ssize_t __write_ports_addfd(char *buf)
661{
662 char *mesg = buf;
663 int fd, err;
664 struct net *net = &init_net;
665
666 err = get_int(&mesg, &fd);
667 if (err != 0 || fd < 0)
668 return -EINVAL;
669
670 err = nfsd_create_serv();
671 if (err != 0)
672 return err;
673
674 err = svc_addsock(nfsd_serv, fd, buf, SIMPLE_TRANSACTION_LIMIT);
675 if (err < 0) {
676 nfsd_destroy(net);
677 return err;
678 }
679
680 /* Decrease the count, but don't shut down the service */
681 nfsd_serv->sv_nrthreads--;
682 return err;
683}
684
685/*
686 * A '-' followed by the 'name' of a socket means we close the socket.
687 */
688static ssize_t __write_ports_delfd(char *buf)
689{
690 char *toclose;
691 int len = 0;
692
693 toclose = kstrdup(buf + 1, GFP_KERNEL);
694 if (toclose == NULL)
695 return -ENOMEM;
696
697 if (nfsd_serv != NULL)
698 len = svc_sock_names(nfsd_serv, buf,
699 SIMPLE_TRANSACTION_LIMIT, toclose);
700 kfree(toclose);
701 return len;
702}
703
704/*
705 * A transport listener is added by writing it's transport name and
706 * a port number.
707 */
708static ssize_t __write_ports_addxprt(char *buf)
709{
710 char transport[16];
711 struct svc_xprt *xprt;
712 int port, err;
713 struct net *net = &init_net;
714
715 if (sscanf(buf, "%15s %4u", transport, &port) != 2)
716 return -EINVAL;
717
718 if (port < 1 || port > USHRT_MAX)
719 return -EINVAL;
720
721 err = nfsd_create_serv();
722 if (err != 0)
723 return err;
724
725 err = svc_create_xprt(nfsd_serv, transport, net,
726 PF_INET, port, SVC_SOCK_ANONYMOUS);
727 if (err < 0)
728 goto out_err;
729
730 err = svc_create_xprt(nfsd_serv, transport, net,
731 PF_INET6, port, SVC_SOCK_ANONYMOUS);
732 if (err < 0 && err != -EAFNOSUPPORT)
733 goto out_close;
734
735 /* Decrease the count, but don't shut down the service */
736 nfsd_serv->sv_nrthreads--;
737 return 0;
738out_close:
739 xprt = svc_find_xprt(nfsd_serv, transport, net, PF_INET, port);
740 if (xprt != NULL) {
741 svc_close_xprt(xprt);
742 svc_xprt_put(xprt);
743 }
744out_err:
745 nfsd_destroy(net);
746 return err;
747}
748
749/*
750 * A transport listener is removed by writing a "-", it's transport
751 * name, and it's port number.
752 */
753static ssize_t __write_ports_delxprt(char *buf)
754{
755 struct svc_xprt *xprt;
756 char transport[16];
757 int port;
758
759 if (sscanf(&buf[1], "%15s %4u", transport, &port) != 2)
760 return -EINVAL;
761
762 if (port < 1 || port > USHRT_MAX || nfsd_serv == NULL)
763 return -EINVAL;
764
765 xprt = svc_find_xprt(nfsd_serv, transport, &init_net, AF_UNSPEC, port);
766 if (xprt == NULL)
767 return -ENOTCONN;
768
769 svc_close_xprt(xprt);
770 svc_xprt_put(xprt);
771 return 0;
772}
773
774static ssize_t __write_ports(struct file *file, char *buf, size_t size)
775{
776 if (size == 0)
777 return __write_ports_names(buf);
778
779 if (isdigit(buf[0]))
780 return __write_ports_addfd(buf);
781
782 if (buf[0] == '-' && isdigit(buf[1]))
783 return __write_ports_delfd(buf);
784
785 if (isalpha(buf[0]))
786 return __write_ports_addxprt(buf);
787
788 if (buf[0] == '-' && isalpha(buf[1]))
789 return __write_ports_delxprt(buf);
790
791 return -EINVAL;
792}
793
794/**
795 * write_ports - Pass a socket file descriptor or transport name to listen on
796 *
797 * Input:
798 * buf: ignored
799 * size: zero
800 * Output:
801 * On success: passed-in buffer filled with a '\n'-terminated C
802 * string containing a whitespace-separated list of
803 * named NFSD listeners;
804 * return code is the size in bytes of the string
805 * On error: return code is zero or a negative errno value
806 *
807 * OR
808 *
809 * Input:
810 * buf: C string containing an unsigned
811 * integer value representing a bound
812 * but unconnected socket that is to be
813 * used as an NFSD listener; listen(3)
814 * must be called for a SOCK_STREAM
815 * socket, otherwise it is ignored
816 * size: non-zero length of C string in @buf
817 * Output:
818 * On success: NFS service is started;
819 * passed-in buffer filled with a '\n'-terminated C
820 * string containing a unique alphanumeric name of
821 * the listener;
822 * return code is the size in bytes of the string
823 * On error: return code is a negative errno value
824 *
825 * OR
826 *
827 * Input:
828 * buf: C string containing a "-" followed
829 * by an integer value representing a
830 * previously passed in socket file
831 * descriptor
832 * size: non-zero length of C string in @buf
833 * Output:
834 * On success: NFS service no longer listens on that socket;
835 * passed-in buffer filled with a '\n'-terminated C
836 * string containing a unique name of the listener;
837 * return code is the size in bytes of the string
838 * On error: return code is a negative errno value
839 *
840 * OR
841 *
842 * Input:
843 * buf: C string containing a transport
844 * name and an unsigned integer value
845 * representing the port to listen on,
846 * separated by whitespace
847 * size: non-zero length of C string in @buf
848 * Output:
849 * On success: returns zero; NFS service is started
850 * On error: return code is a negative errno value
851 *
852 * OR
853 *
854 * Input:
855 * buf: C string containing a "-" followed
856 * by a transport name and an unsigned
857 * integer value representing the port
858 * to listen on, separated by whitespace
859 * size: non-zero length of C string in @buf
860 * Output:
861 * On success: returns zero; NFS service no longer listens
862 * on that transport
863 * On error: return code is a negative errno value
864 */
865static ssize_t write_ports(struct file *file, char *buf, size_t size)
866{
867 ssize_t rv;
868
869 mutex_lock(&nfsd_mutex);
870 rv = __write_ports(file, buf, size);
871 mutex_unlock(&nfsd_mutex);
872 return rv;
873}
874
875
876int nfsd_max_blksize;
877
878/**
879 * write_maxblksize - Set or report the current NFS blksize
880 *
881 * Input:
882 * buf: ignored
883 * size: zero
884 *
885 * OR
886 *
887 * Input:
888 * buf: C string containing an unsigned
889 * integer value representing the new
890 * NFS blksize
891 * size: non-zero length of C string in @buf
892 * Output:
893 * On success: passed-in buffer filled with '\n'-terminated C string
894 * containing numeric value of the current NFS blksize
895 * setting;
896 * return code is the size in bytes of the string
897 * On error: return code is zero or a negative errno value
898 */
899static ssize_t write_maxblksize(struct file *file, char *buf, size_t size)
900{
901 char *mesg = buf;
902 if (size > 0) {
903 int bsize;
904 int rv = get_int(&mesg, &bsize);
905 if (rv)
906 return rv;
907 /* force bsize into allowed range and
908 * required alignment.
909 */
910 if (bsize < 1024)
911 bsize = 1024;
912 if (bsize > NFSSVC_MAXBLKSIZE)
913 bsize = NFSSVC_MAXBLKSIZE;
914 bsize &= ~(1024-1);
915 mutex_lock(&nfsd_mutex);
916 if (nfsd_serv) {
917 mutex_unlock(&nfsd_mutex);
918 return -EBUSY;
919 }
920 nfsd_max_blksize = bsize;
921 mutex_unlock(&nfsd_mutex);
922 }
923
924 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%d\n",
925 nfsd_max_blksize);
926}
927
928#ifdef CONFIG_NFSD_V4
929static ssize_t __nfsd4_write_time(struct file *file, char *buf, size_t size, time_t *time)
930{
931 char *mesg = buf;
932 int rv, i;
933
934 if (size > 0) {
935 if (nfsd_serv)
936 return -EBUSY;
937 rv = get_int(&mesg, &i);
938 if (rv)
939 return rv;
940 /*
941 * Some sanity checking. We don't have a reason for
942 * these particular numbers, but problems with the
943 * extremes are:
944 * - Too short: the briefest network outage may
945 * cause clients to lose all their locks. Also,
946 * the frequent polling may be wasteful.
947 * - Too long: do you really want reboot recovery
948 * to take more than an hour? Or to make other
949 * clients wait an hour before being able to
950 * revoke a dead client's locks?
951 */
952 if (i < 10 || i > 3600)
953 return -EINVAL;
954 *time = i;
955 }
956
957 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%ld\n", *time);
958}
959
960static ssize_t nfsd4_write_time(struct file *file, char *buf, size_t size, time_t *time)
961{
962 ssize_t rv;
963
964 mutex_lock(&nfsd_mutex);
965 rv = __nfsd4_write_time(file, buf, size, time);
966 mutex_unlock(&nfsd_mutex);
967 return rv;
968}
969
970/**
971 * write_leasetime - Set or report the current NFSv4 lease time
972 *
973 * Input:
974 * buf: ignored
975 * size: zero
976 *
977 * OR
978 *
979 * Input:
980 * buf: C string containing an unsigned
981 * integer value representing the new
982 * NFSv4 lease expiry time
983 * size: non-zero length of C string in @buf
984 * Output:
985 * On success: passed-in buffer filled with '\n'-terminated C
986 * string containing unsigned integer value of the
987 * current lease expiry time;
988 * return code is the size in bytes of the string
989 * On error: return code is zero or a negative errno value
990 */
991static ssize_t write_leasetime(struct file *file, char *buf, size_t size)
992{
993 return nfsd4_write_time(file, buf, size, &nfsd4_lease);
994}
995
996/**
997 * write_gracetime - Set or report current NFSv4 grace period time
998 *
999 * As above, but sets the time of the NFSv4 grace period.
1000 *
1001 * Note this should never be set to less than the *previous*
1002 * lease-period time, but we don't try to enforce this. (In the common
1003 * case (a new boot), we don't know what the previous lease time was
1004 * anyway.)
1005 */
1006static ssize_t write_gracetime(struct file *file, char *buf, size_t size)
1007{
1008 return nfsd4_write_time(file, buf, size, &nfsd4_grace);
1009}
1010
1011extern char *nfs4_recoverydir(void);
1012
1013static ssize_t __write_recoverydir(struct file *file, char *buf, size_t size)
1014{
1015 char *mesg = buf;
1016 char *recdir;
1017 int len, status;
1018
1019 if (size > 0) {
1020 if (nfsd_serv)
1021 return -EBUSY;
1022 if (size > PATH_MAX || buf[size-1] != '\n')
1023 return -EINVAL;
1024 buf[size-1] = 0;
1025
1026 recdir = mesg;
1027 len = qword_get(&mesg, recdir, size);
1028 if (len <= 0)
1029 return -EINVAL;
1030
1031 status = nfs4_reset_recoverydir(recdir);
1032 if (status)
1033 return status;
1034 }
1035
1036 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%s\n",
1037 nfs4_recoverydir());
1038}
1039
1040/**
1041 * write_recoverydir - Set or report the pathname of the recovery directory
1042 *
1043 * Input:
1044 * buf: ignored
1045 * size: zero
1046 *
1047 * OR
1048 *
1049 * Input:
1050 * buf: C string containing the pathname
1051 * of the directory on a local file
1052 * system containing permanent NFSv4
1053 * recovery data
1054 * size: non-zero length of C string in @buf
1055 * Output:
1056 * On success: passed-in buffer filled with '\n'-terminated C string
1057 * containing the current recovery pathname setting;
1058 * return code is the size in bytes of the string
1059 * On error: return code is zero or a negative errno value
1060 */
1061static ssize_t write_recoverydir(struct file *file, char *buf, size_t size)
1062{
1063 ssize_t rv;
1064
1065 mutex_lock(&nfsd_mutex);
1066 rv = __write_recoverydir(file, buf, size);
1067 mutex_unlock(&nfsd_mutex);
1068 return rv;
1069}
1070
1071#endif
1072
1073/*----------------------------------------------------------------------------*/
1074/*
1075 * populating the filesystem.
1076 */
1077
1078static int nfsd_fill_super(struct super_block * sb, void * data, int silent)
1079{
1080 static struct tree_descr nfsd_files[] = {
1081 [NFSD_List] = {"exports", &exports_operations, S_IRUGO},
1082 [NFSD_Export_features] = {"export_features",
1083 &export_features_operations, S_IRUGO},
1084 [NFSD_FO_UnlockIP] = {"unlock_ip",
1085 &transaction_ops, S_IWUSR|S_IRUSR},
1086 [NFSD_FO_UnlockFS] = {"unlock_filesystem",
1087 &transaction_ops, S_IWUSR|S_IRUSR},
1088 [NFSD_Fh] = {"filehandle", &transaction_ops, S_IWUSR|S_IRUSR},
1089 [NFSD_Threads] = {"threads", &transaction_ops, S_IWUSR|S_IRUSR},
1090 [NFSD_Pool_Threads] = {"pool_threads", &transaction_ops, S_IWUSR|S_IRUSR},
1091 [NFSD_Pool_Stats] = {"pool_stats", &pool_stats_operations, S_IRUGO},
1092 [NFSD_Versions] = {"versions", &transaction_ops, S_IWUSR|S_IRUSR},
1093 [NFSD_Ports] = {"portlist", &transaction_ops, S_IWUSR|S_IRUGO},
1094 [NFSD_MaxBlkSize] = {"max_block_size", &transaction_ops, S_IWUSR|S_IRUGO},
1095#if defined(CONFIG_SUNRPC_GSS) || defined(CONFIG_SUNRPC_GSS_MODULE)
1096 [NFSD_SupportedEnctypes] = {"supported_krb5_enctypes", &supported_enctypes_ops, S_IRUGO},
1097#endif /* CONFIG_SUNRPC_GSS or CONFIG_SUNRPC_GSS_MODULE */
1098#ifdef CONFIG_NFSD_V4
1099 [NFSD_Leasetime] = {"nfsv4leasetime", &transaction_ops, S_IWUSR|S_IRUSR},
1100 [NFSD_Gracetime] = {"nfsv4gracetime", &transaction_ops, S_IWUSR|S_IRUSR},
1101 [NFSD_RecoveryDir] = {"nfsv4recoverydir", &transaction_ops, S_IWUSR|S_IRUSR},
1102#endif
1103 /* last one */ {""}
1104 };
1105 return simple_fill_super(sb, 0x6e667364, nfsd_files);
1106}
1107
1108static struct dentry *nfsd_mount(struct file_system_type *fs_type,
1109 int flags, const char *dev_name, void *data)
1110{
1111 return mount_single(fs_type, flags, data, nfsd_fill_super);
1112}
1113
1114static struct file_system_type nfsd_fs_type = {
1115 .owner = THIS_MODULE,
1116 .name = "nfsd",
1117 .mount = nfsd_mount,
1118 .kill_sb = kill_litter_super,
1119};
1120
#ifdef CONFIG_PROC_FS
/*
 * Create the "fs/nfs" proc directory and the "exports" file inside it.
 *
 * Returns 0 on success or -ENOMEM.  On failure nothing is left behind:
 * if the file cannot be created, the directory made just before is
 * removed again.
 */
static int create_proc_exports_entry(void)
{
	struct proc_dir_entry *entry;

	entry = proc_mkdir("fs/nfs", NULL);
	if (!entry)
		return -ENOMEM;
	entry = proc_create("exports", 0, entry, &exports_operations);
	if (!entry) {
		/* Don't leak the directory created above. */
		remove_proc_entry("fs/nfs", NULL);
		return -ENOMEM;
	}
	return 0;
}
#else /* CONFIG_PROC_FS */
/* Without procfs there is nothing to create. */
static int create_proc_exports_entry(void)
{
	return 0;
}
#endif
1140
1141int nfsd_net_id;
1142
1143static __net_init int nfsd_init_net(struct net *net)
1144{
1145 int retval;
1146
1147 retval = nfsd_export_init(net);
1148 if (retval)
1149 goto out_export_error;
1150 retval = nfsd_idmap_init(net);
1151 if (retval)
1152 goto out_idmap_error;
1153 return 0;
1154
1155out_idmap_error:
1156 nfsd_export_shutdown(net);
1157out_export_error:
1158 return retval;
1159}
1160
1161static __net_exit void nfsd_exit_net(struct net *net)
1162{
1163 nfsd_idmap_shutdown(net);
1164 nfsd_export_shutdown(net);
1165}
1166
1167static struct pernet_operations nfsd_net_ops = {
1168 .init = nfsd_init_net,
1169 .exit = nfsd_exit_net,
1170 .id = &nfsd_net_id,
1171 .size = sizeof(struct nfsd_net),
1172};
1173
1174static int __init init_nfsd(void)
1175{
1176 int retval;
1177 printk(KERN_INFO "Installing knfsd (copyright (C) 1996 okir@monad.swb.de).\n");
1178
1179 retval = register_cld_notifier();
1180 if (retval)
1181 return retval;
1182 retval = register_pernet_subsys(&nfsd_net_ops);
1183 if (retval < 0)
1184 goto out_unregister_notifier;
1185 retval = nfsd4_init_slabs();
1186 if (retval)
1187 goto out_unregister_pernet;
1188 nfs4_state_init();
1189 retval = nfsd_fault_inject_init(); /* nfsd fault injection controls */
1190 if (retval)
1191 goto out_free_slabs;
1192 nfsd_stat_init(); /* Statistics */
1193 retval = nfsd_reply_cache_init();
1194 if (retval)
1195 goto out_free_stat;
1196 nfsd_lockd_init(); /* lockd->nfsd callbacks */
1197 retval = create_proc_exports_entry();
1198 if (retval)
1199 goto out_free_lockd;
1200 retval = register_filesystem(&nfsd_fs_type);
1201 if (retval)
1202 goto out_free_all;
1203 return 0;
1204out_free_all:
1205 remove_proc_entry("fs/nfs/exports", NULL);
1206 remove_proc_entry("fs/nfs", NULL);
1207out_free_lockd:
1208 nfsd_lockd_shutdown();
1209 nfsd_reply_cache_shutdown();
1210out_free_stat:
1211 nfsd_stat_shutdown();
1212 nfsd_fault_inject_cleanup();
1213out_free_slabs:
1214 nfsd4_free_slabs();
1215out_unregister_pernet:
1216 unregister_pernet_subsys(&nfsd_net_ops);
1217out_unregister_notifier:
1218 unregister_cld_notifier();
1219 return retval;
1220}
1221
1222static void __exit exit_nfsd(void)
1223{
1224 nfsd_reply_cache_shutdown();
1225 remove_proc_entry("fs/nfs/exports", NULL);
1226 remove_proc_entry("fs/nfs", NULL);
1227 nfsd_stat_shutdown();
1228 nfsd_lockd_shutdown();
1229 nfsd4_free_slabs();
1230 nfsd_fault_inject_cleanup();
1231 unregister_filesystem(&nfsd_fs_type);
1232 unregister_pernet_subsys(&nfsd_net_ops);
1233 unregister_cld_notifier();
1234}
1235
1236MODULE_AUTHOR("Olaf Kirch <okir@monad.swb.de>");
1237MODULE_LICENSE("GPL");
1238module_init(init_nfsd)
1239module_exit(exit_nfsd)
1// SPDX-License-Identifier: GPL-2.0-only
2/*
3 * Syscall interface to knfsd.
4 *
5 * Copyright (C) 1995, 1996 Olaf Kirch <okir@monad.swb.de>
6 */
7
8#include <linux/slab.h>
9#include <linux/namei.h>
10#include <linux/ctype.h>
11#include <linux/fs_context.h>
12
13#include <linux/sunrpc/svcsock.h>
14#include <linux/lockd/lockd.h>
15#include <linux/sunrpc/addr.h>
16#include <linux/sunrpc/gss_api.h>
17#include <linux/sunrpc/gss_krb5_enctypes.h>
18#include <linux/sunrpc/rpc_pipe_fs.h>
19#include <linux/module.h>
20#include <linux/fsnotify.h>
21
22#include "idmap.h"
23#include "nfsd.h"
24#include "cache.h"
25#include "state.h"
26#include "netns.h"
27#include "pnfs.h"
28
29/*
30 * We have a single directory with several nodes in it.
31 */
enum {
	NFSD_Root = 1,
	NFSD_List,
	NFSD_Export_Stats,
	NFSD_Export_features,
	NFSD_Fh,
	NFSD_FO_UnlockIP,
	NFSD_FO_UnlockFS,
	NFSD_Threads,
	NFSD_Pool_Threads,
	NFSD_Pool_Stats,
	NFSD_Reply_Cache_Stats,
	NFSD_Versions,
	NFSD_Ports,
	NFSD_MaxBlkSize,
	NFSD_MaxConnections,
	NFSD_SupportedEnctypes,
	/*
	 * The NFSv4-only entries below MUST stay last. Otherwise a build
	 * with !CONFIG_NFSD_V4 leaves a hole in nfsd_files[] and
	 * simple_fill_super() goes oops.
	 */
#ifdef CONFIG_NFSD_V4
	NFSD_Leasetime,
	NFSD_Gracetime,
	NFSD_RecoveryDir,
	NFSD_V4EndGrace,
#endif
	NFSD_MaxReserved
};
61
62/*
63 * write() for these nodes.
64 */
65static ssize_t write_filehandle(struct file *file, char *buf, size_t size);
66static ssize_t write_unlock_ip(struct file *file, char *buf, size_t size);
67static ssize_t write_unlock_fs(struct file *file, char *buf, size_t size);
68static ssize_t write_threads(struct file *file, char *buf, size_t size);
69static ssize_t write_pool_threads(struct file *file, char *buf, size_t size);
70static ssize_t write_versions(struct file *file, char *buf, size_t size);
71static ssize_t write_ports(struct file *file, char *buf, size_t size);
72static ssize_t write_maxblksize(struct file *file, char *buf, size_t size);
73static ssize_t write_maxconn(struct file *file, char *buf, size_t size);
74#ifdef CONFIG_NFSD_V4
75static ssize_t write_leasetime(struct file *file, char *buf, size_t size);
76static ssize_t write_gracetime(struct file *file, char *buf, size_t size);
77static ssize_t write_recoverydir(struct file *file, char *buf, size_t size);
78static ssize_t write_v4_end_grace(struct file *file, char *buf, size_t size);
79#endif
80
81static ssize_t (*const write_op[])(struct file *, char *, size_t) = {
82 [NFSD_Fh] = write_filehandle,
83 [NFSD_FO_UnlockIP] = write_unlock_ip,
84 [NFSD_FO_UnlockFS] = write_unlock_fs,
85 [NFSD_Threads] = write_threads,
86 [NFSD_Pool_Threads] = write_pool_threads,
87 [NFSD_Versions] = write_versions,
88 [NFSD_Ports] = write_ports,
89 [NFSD_MaxBlkSize] = write_maxblksize,
90 [NFSD_MaxConnections] = write_maxconn,
91#ifdef CONFIG_NFSD_V4
92 [NFSD_Leasetime] = write_leasetime,
93 [NFSD_Gracetime] = write_gracetime,
94 [NFSD_RecoveryDir] = write_recoverydir,
95 [NFSD_V4EndGrace] = write_v4_end_grace,
96#endif
97};
98
99static ssize_t nfsctl_transaction_write(struct file *file, const char __user *buf, size_t size, loff_t *pos)
100{
101 ino_t ino = file_inode(file)->i_ino;
102 char *data;
103 ssize_t rv;
104
105 if (ino >= ARRAY_SIZE(write_op) || !write_op[ino])
106 return -EINVAL;
107
108 data = simple_transaction_get(file, buf, size);
109 if (IS_ERR(data))
110 return PTR_ERR(data);
111
112 rv = write_op[ino](file, data, size);
113 if (rv >= 0) {
114 simple_transaction_set(file, rv);
115 rv = size;
116 }
117 return rv;
118}
119
120static ssize_t nfsctl_transaction_read(struct file *file, char __user *buf, size_t size, loff_t *pos)
121{
122 if (! file->private_data) {
123 /* An attempt to read a transaction file without writing
124 * causes a 0-byte write so that the file can return
125 * state information
126 */
127 ssize_t rv = nfsctl_transaction_write(file, buf, 0, pos);
128 if (rv < 0)
129 return rv;
130 }
131 return simple_transaction_read(file, buf, size, pos);
132}
133
134static const struct file_operations transaction_ops = {
135 .write = nfsctl_transaction_write,
136 .read = nfsctl_transaction_read,
137 .release = simple_transaction_release,
138 .llseek = default_llseek,
139};
140
141static int exports_net_open(struct net *net, struct file *file)
142{
143 int err;
144 struct seq_file *seq;
145 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
146
147 err = seq_open(file, &nfs_exports_op);
148 if (err)
149 return err;
150
151 seq = file->private_data;
152 seq->private = nn->svc_export_cache;
153 return 0;
154}
155
156static int exports_proc_open(struct inode *inode, struct file *file)
157{
158 return exports_net_open(current->nsproxy->net_ns, file);
159}
160
161static const struct proc_ops exports_proc_ops = {
162 .proc_open = exports_proc_open,
163 .proc_read = seq_read,
164 .proc_lseek = seq_lseek,
165 .proc_release = seq_release,
166};
167
168static int exports_nfsd_open(struct inode *inode, struct file *file)
169{
170 return exports_net_open(inode->i_sb->s_fs_info, file);
171}
172
173static const struct file_operations exports_nfsd_operations = {
174 .open = exports_nfsd_open,
175 .read = seq_read,
176 .llseek = seq_lseek,
177 .release = seq_release,
178};
179
180static int export_features_show(struct seq_file *m, void *v)
181{
182 seq_printf(m, "0x%x 0x%x\n", NFSEXP_ALLFLAGS, NFSEXP_SECINFO_FLAGS);
183 return 0;
184}
185
186static int export_features_open(struct inode *inode, struct file *file)
187{
188 return single_open(file, export_features_show, NULL);
189}
190
191static const struct file_operations export_features_operations = {
192 .open = export_features_open,
193 .read = seq_read,
194 .llseek = seq_lseek,
195 .release = single_release,
196};
197
198#if defined(CONFIG_SUNRPC_GSS) || defined(CONFIG_SUNRPC_GSS_MODULE)
199static int supported_enctypes_show(struct seq_file *m, void *v)
200{
201 seq_printf(m, KRB5_SUPPORTED_ENCTYPES);
202 return 0;
203}
204
205static int supported_enctypes_open(struct inode *inode, struct file *file)
206{
207 return single_open(file, supported_enctypes_show, NULL);
208}
209
210static const struct file_operations supported_enctypes_ops = {
211 .open = supported_enctypes_open,
212 .read = seq_read,
213 .llseek = seq_lseek,
214 .release = single_release,
215};
216#endif /* CONFIG_SUNRPC_GSS or CONFIG_SUNRPC_GSS_MODULE */
217
218static const struct file_operations pool_stats_operations = {
219 .open = nfsd_pool_stats_open,
220 .read = seq_read,
221 .llseek = seq_lseek,
222 .release = nfsd_pool_stats_release,
223};
224
225static const struct file_operations reply_cache_stats_operations = {
226 .open = nfsd_reply_cache_stats_open,
227 .read = seq_read,
228 .llseek = seq_lseek,
229 .release = single_release,
230};
231
232/*----------------------------------------------------------------------------*/
233/*
234 * payload - write methods
235 */
236
237static inline struct net *netns(struct file *file)
238{
239 return file_inode(file)->i_sb->s_fs_info;
240}
241
242/*
243 * write_unlock_ip - Release all locks used by a client
244 *
245 * Experimental.
246 *
247 * Input:
248 * buf: '\n'-terminated C string containing a
249 * presentation format IP address
250 * size: length of C string in @buf
251 * Output:
252 * On success: returns zero if all specified locks were released;
253 * returns one if one or more locks were not released
254 * On error: return code is negative errno value
255 */
256static ssize_t write_unlock_ip(struct file *file, char *buf, size_t size)
257{
258 struct sockaddr_storage address;
259 struct sockaddr *sap = (struct sockaddr *)&address;
260 size_t salen = sizeof(address);
261 char *fo_path;
262 struct net *net = netns(file);
263
264 /* sanity check */
265 if (size == 0)
266 return -EINVAL;
267
268 if (buf[size-1] != '\n')
269 return -EINVAL;
270
271 fo_path = buf;
272 if (qword_get(&buf, fo_path, size) < 0)
273 return -EINVAL;
274
275 if (rpc_pton(net, fo_path, size, sap, salen) == 0)
276 return -EINVAL;
277
278 return nlmsvc_unlock_all_by_ip(sap);
279}
280
281/*
282 * write_unlock_fs - Release all locks on a local file system
283 *
284 * Experimental.
285 *
286 * Input:
287 * buf: '\n'-terminated C string containing the
288 * absolute pathname of a local file system
289 * size: length of C string in @buf
290 * Output:
291 * On success: returns zero if all specified locks were released;
292 * returns one if one or more locks were not released
293 * On error: return code is negative errno value
294 */
295static ssize_t write_unlock_fs(struct file *file, char *buf, size_t size)
296{
297 struct path path;
298 char *fo_path;
299 int error;
300
301 /* sanity check */
302 if (size == 0)
303 return -EINVAL;
304
305 if (buf[size-1] != '\n')
306 return -EINVAL;
307
308 fo_path = buf;
309 if (qword_get(&buf, fo_path, size) < 0)
310 return -EINVAL;
311
312 error = kern_path(fo_path, 0, &path);
313 if (error)
314 return error;
315
316 /*
317 * XXX: Needs better sanity checking. Otherwise we could end up
318 * releasing locks on the wrong file system.
319 *
320 * For example:
321 * 1. Does the path refer to a directory?
322 * 2. Is that directory a mount point, or
323 * 3. Is that directory the root of an exported file system?
324 */
325 error = nlmsvc_unlock_all_by_sb(path.dentry->d_sb);
326
327 path_put(&path);
328 return error;
329}
330
331/*
332 * write_filehandle - Get a variable-length NFS file handle by path
333 *
334 * On input, the buffer contains a '\n'-terminated C string comprised of
335 * three alphanumeric words separated by whitespace. The string may
336 * contain escape sequences.
337 *
338 * Input:
339 * buf:
340 * domain: client domain name
341 * path: export pathname
342 * maxsize: numeric maximum size of
343 * @buf
344 * size: length of C string in @buf
345 * Output:
346 * On success: passed-in buffer filled with '\n'-terminated C
347 * string containing a ASCII hex text version
348 * of the NFS file handle;
349 * return code is the size in bytes of the string
350 * On error: return code is negative errno value
351 */
352static ssize_t write_filehandle(struct file *file, char *buf, size_t size)
353{
354 char *dname, *path;
355 int maxsize;
356 char *mesg = buf;
357 int len;
358 struct auth_domain *dom;
359 struct knfsd_fh fh;
360
361 if (size == 0)
362 return -EINVAL;
363
364 if (buf[size-1] != '\n')
365 return -EINVAL;
366 buf[size-1] = 0;
367
368 dname = mesg;
369 len = qword_get(&mesg, dname, size);
370 if (len <= 0)
371 return -EINVAL;
372
373 path = dname+len+1;
374 len = qword_get(&mesg, path, size);
375 if (len <= 0)
376 return -EINVAL;
377
378 len = get_int(&mesg, &maxsize);
379 if (len)
380 return len;
381
382 if (maxsize < NFS_FHSIZE)
383 return -EINVAL;
384 maxsize = min(maxsize, NFS3_FHSIZE);
385
386 if (qword_get(&mesg, mesg, size)>0)
387 return -EINVAL;
388
389 /* we have all the words, they are in buf.. */
390 dom = unix_domain_find(dname);
391 if (!dom)
392 return -ENOMEM;
393
394 len = exp_rootfh(netns(file), dom, path, &fh, maxsize);
395 auth_domain_put(dom);
396 if (len)
397 return len;
398
399 mesg = buf;
400 len = SIMPLE_TRANSACTION_LIMIT;
401 qword_addhex(&mesg, &len, (char*)&fh.fh_base, fh.fh_size);
402 mesg[-1] = '\n';
403 return mesg - buf;
404}
405
406/*
407 * write_threads - Start NFSD, or report the current number of running threads
408 *
409 * Input:
410 * buf: ignored
411 * size: zero
412 * Output:
413 * On success: passed-in buffer filled with '\n'-terminated C
414 * string numeric value representing the number of
415 * running NFSD threads;
416 * return code is the size in bytes of the string
417 * On error: return code is zero
418 *
419 * OR
420 *
421 * Input:
422 * buf: C string containing an unsigned
423 * integer value representing the
424 * number of NFSD threads to start
425 * size: non-zero length of C string in @buf
426 * Output:
427 * On success: NFS service is started;
428 * passed-in buffer filled with '\n'-terminated C
429 * string numeric value representing the number of
430 * running NFSD threads;
431 * return code is the size in bytes of the string
432 * On error: return code is zero or a negative errno value
433 */
434static ssize_t write_threads(struct file *file, char *buf, size_t size)
435{
436 char *mesg = buf;
437 int rv;
438 struct net *net = netns(file);
439
440 if (size > 0) {
441 int newthreads;
442 rv = get_int(&mesg, &newthreads);
443 if (rv)
444 return rv;
445 if (newthreads < 0)
446 return -EINVAL;
447 rv = nfsd_svc(newthreads, net, file->f_cred);
448 if (rv < 0)
449 return rv;
450 } else
451 rv = nfsd_nrthreads(net);
452
453 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%d\n", rv);
454}
455
456/*
457 * write_pool_threads - Set or report the current number of threads per pool
458 *
459 * Input:
460 * buf: ignored
461 * size: zero
462 *
463 * OR
464 *
465 * Input:
466 * buf: C string containing whitespace-
467 * separated unsigned integer values
468 * representing the number of NFSD
469 * threads to start in each pool
470 * size: non-zero length of C string in @buf
471 * Output:
472 * On success: passed-in buffer filled with '\n'-terminated C
473 * string containing integer values representing the
474 * number of NFSD threads in each pool;
475 * return code is the size in bytes of the string
476 * On error: return code is zero or a negative errno value
477 */
478static ssize_t write_pool_threads(struct file *file, char *buf, size_t size)
479{
480 /* if size > 0, look for an array of number of threads per node
481 * and apply them then write out number of threads per node as reply
482 */
483 char *mesg = buf;
484 int i;
485 int rv;
486 int len;
487 int npools;
488 int *nthreads;
489 struct net *net = netns(file);
490
491 mutex_lock(&nfsd_mutex);
492 npools = nfsd_nrpools(net);
493 if (npools == 0) {
494 /*
495 * NFS is shut down. The admin can start it by
496 * writing to the threads file but NOT the pool_threads
497 * file, sorry. Report zero threads.
498 */
499 mutex_unlock(&nfsd_mutex);
500 strcpy(buf, "0\n");
501 return strlen(buf);
502 }
503
504 nthreads = kcalloc(npools, sizeof(int), GFP_KERNEL);
505 rv = -ENOMEM;
506 if (nthreads == NULL)
507 goto out_free;
508
509 if (size > 0) {
510 for (i = 0; i < npools; i++) {
511 rv = get_int(&mesg, &nthreads[i]);
512 if (rv == -ENOENT)
513 break; /* fewer numbers than pools */
514 if (rv)
515 goto out_free; /* syntax error */
516 rv = -EINVAL;
517 if (nthreads[i] < 0)
518 goto out_free;
519 }
520 rv = nfsd_set_nrthreads(i, nthreads, net);
521 if (rv)
522 goto out_free;
523 }
524
525 rv = nfsd_get_nrthreads(npools, nthreads, net);
526 if (rv)
527 goto out_free;
528
529 mesg = buf;
530 size = SIMPLE_TRANSACTION_LIMIT;
531 for (i = 0; i < npools && size > 0; i++) {
532 snprintf(mesg, size, "%d%c", nthreads[i], (i == npools-1 ? '\n' : ' '));
533 len = strlen(mesg);
534 size -= len;
535 mesg += len;
536 }
537 rv = mesg - buf;
538out_free:
539 kfree(nthreads);
540 mutex_unlock(&nfsd_mutex);
541 return rv;
542}
543
544static ssize_t
545nfsd_print_version_support(struct nfsd_net *nn, char *buf, int remaining,
546 const char *sep, unsigned vers, int minor)
547{
548 const char *format = minor < 0 ? "%s%c%u" : "%s%c%u.%u";
549 bool supported = !!nfsd_vers(nn, vers, NFSD_TEST);
550
551 if (vers == 4 && minor >= 0 &&
552 !nfsd_minorversion(nn, minor, NFSD_TEST))
553 supported = false;
554 if (minor == 0 && supported)
555 /*
556 * special case for backward compatability.
557 * +4.0 is never reported, it is implied by
558 * +4, unless -4.0 is present.
559 */
560 return 0;
561 return snprintf(buf, remaining, format, sep,
562 supported ? '+' : '-', vers, minor);
563}
564
565static ssize_t __write_versions(struct file *file, char *buf, size_t size)
566{
567 char *mesg = buf;
568 char *vers, *minorp, sign;
569 int len, num, remaining;
570 ssize_t tlen = 0;
571 char *sep;
572 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
573
574 if (size>0) {
575 if (nn->nfsd_serv)
576 /* Cannot change versions without updating
577 * nn->nfsd_serv->sv_xdrsize, and reallocing
578 * rq_argp and rq_resp
579 */
580 return -EBUSY;
581 if (buf[size-1] != '\n')
582 return -EINVAL;
583 buf[size-1] = 0;
584
585 vers = mesg;
586 len = qword_get(&mesg, vers, size);
587 if (len <= 0) return -EINVAL;
588 do {
589 enum vers_op cmd;
590 unsigned minor;
591 sign = *vers;
592 if (sign == '+' || sign == '-')
593 num = simple_strtol((vers+1), &minorp, 0);
594 else
595 num = simple_strtol(vers, &minorp, 0);
596 if (*minorp == '.') {
597 if (num != 4)
598 return -EINVAL;
599 if (kstrtouint(minorp+1, 0, &minor) < 0)
600 return -EINVAL;
601 }
602
603 cmd = sign == '-' ? NFSD_CLEAR : NFSD_SET;
604 switch(num) {
605 case 2:
606 case 3:
607 nfsd_vers(nn, num, cmd);
608 break;
609 case 4:
610 if (*minorp == '.') {
611 if (nfsd_minorversion(nn, minor, cmd) < 0)
612 return -EINVAL;
613 } else if ((cmd == NFSD_SET) != nfsd_vers(nn, num, NFSD_TEST)) {
614 /*
615 * Either we have +4 and no minors are enabled,
616 * or we have -4 and at least one minor is enabled.
617 * In either case, propagate 'cmd' to all minors.
618 */
619 minor = 0;
620 while (nfsd_minorversion(nn, minor, cmd) >= 0)
621 minor++;
622 }
623 break;
624 default:
625 return -EINVAL;
626 }
627 vers += len + 1;
628 } while ((len = qword_get(&mesg, vers, size)) > 0);
629 /* If all get turned off, turn them back on, as
630 * having no versions is BAD
631 */
632 nfsd_reset_versions(nn);
633 }
634
635 /* Now write current state into reply buffer */
636 len = 0;
637 sep = "";
638 remaining = SIMPLE_TRANSACTION_LIMIT;
639 for (num=2 ; num <= 4 ; num++) {
640 int minor;
641 if (!nfsd_vers(nn, num, NFSD_AVAIL))
642 continue;
643
644 minor = -1;
645 do {
646 len = nfsd_print_version_support(nn, buf, remaining,
647 sep, num, minor);
648 if (len >= remaining)
649 goto out;
650 remaining -= len;
651 buf += len;
652 tlen += len;
653 minor++;
654 if (len)
655 sep = " ";
656 } while (num == 4 && minor <= NFSD_SUPPORTED_MINOR_VERSION);
657 }
658out:
659 len = snprintf(buf, remaining, "\n");
660 if (len >= remaining)
661 return -EINVAL;
662 return tlen + len;
663}
664
665/*
666 * write_versions - Set or report the available NFS protocol versions
667 *
668 * Input:
669 * buf: ignored
670 * size: zero
671 * Output:
672 * On success: passed-in buffer filled with '\n'-terminated C
673 * string containing positive or negative integer
674 * values representing the current status of each
675 * protocol version;
676 * return code is the size in bytes of the string
677 * On error: return code is zero or a negative errno value
678 *
679 * OR
680 *
681 * Input:
682 * buf: C string containing whitespace-
683 * separated positive or negative
684 * integer values representing NFS
685 * protocol versions to enable ("+n")
686 * or disable ("-n")
687 * size: non-zero length of C string in @buf
688 * Output:
689 * On success: status of zero or more protocol versions has
690 * been updated; passed-in buffer filled with
691 * '\n'-terminated C string containing positive
692 * or negative integer values representing the
693 * current status of each protocol version;
694 * return code is the size in bytes of the string
695 * On error: return code is zero or a negative errno value
696 */
697static ssize_t write_versions(struct file *file, char *buf, size_t size)
698{
699 ssize_t rv;
700
701 mutex_lock(&nfsd_mutex);
702 rv = __write_versions(file, buf, size);
703 mutex_unlock(&nfsd_mutex);
704 return rv;
705}
706
707/*
708 * Zero-length write. Return a list of NFSD's current listener
709 * transports.
710 */
711static ssize_t __write_ports_names(char *buf, struct net *net)
712{
713 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
714
715 if (nn->nfsd_serv == NULL)
716 return 0;
717 return svc_xprt_names(nn->nfsd_serv, buf, SIMPLE_TRANSACTION_LIMIT);
718}
719
720/*
721 * A single 'fd' number was written, in which case it must be for
722 * a socket of a supported family/protocol, and we use it as an
723 * nfsd listener.
724 */
725static ssize_t __write_ports_addfd(char *buf, struct net *net, const struct cred *cred)
726{
727 char *mesg = buf;
728 int fd, err;
729 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
730
731 err = get_int(&mesg, &fd);
732 if (err != 0 || fd < 0)
733 return -EINVAL;
734
735 if (svc_alien_sock(net, fd)) {
736 printk(KERN_ERR "%s: socket net is different to NFSd's one\n", __func__);
737 return -EINVAL;
738 }
739
740 err = nfsd_create_serv(net);
741 if (err != 0)
742 return err;
743
744 err = svc_addsock(nn->nfsd_serv, fd, buf, SIMPLE_TRANSACTION_LIMIT, cred);
745 if (err < 0) {
746 nfsd_destroy(net);
747 return err;
748 }
749
750 /* Decrease the count, but don't shut down the service */
751 nn->nfsd_serv->sv_nrthreads--;
752 return err;
753}
754
755/*
756 * A transport listener is added by writing it's transport name and
757 * a port number.
758 */
759static ssize_t __write_ports_addxprt(char *buf, struct net *net, const struct cred *cred)
760{
761 char transport[16];
762 struct svc_xprt *xprt;
763 int port, err;
764 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
765
766 if (sscanf(buf, "%15s %5u", transport, &port) != 2)
767 return -EINVAL;
768
769 if (port < 1 || port > USHRT_MAX)
770 return -EINVAL;
771
772 err = nfsd_create_serv(net);
773 if (err != 0)
774 return err;
775
776 err = svc_create_xprt(nn->nfsd_serv, transport, net,
777 PF_INET, port, SVC_SOCK_ANONYMOUS, cred);
778 if (err < 0)
779 goto out_err;
780
781 err = svc_create_xprt(nn->nfsd_serv, transport, net,
782 PF_INET6, port, SVC_SOCK_ANONYMOUS, cred);
783 if (err < 0 && err != -EAFNOSUPPORT)
784 goto out_close;
785
786 /* Decrease the count, but don't shut down the service */
787 nn->nfsd_serv->sv_nrthreads--;
788 return 0;
789out_close:
790 xprt = svc_find_xprt(nn->nfsd_serv, transport, net, PF_INET, port);
791 if (xprt != NULL) {
792 svc_close_xprt(xprt);
793 svc_xprt_put(xprt);
794 }
795out_err:
796 if (!list_empty(&nn->nfsd_serv->sv_permsocks))
797 nn->nfsd_serv->sv_nrthreads--;
798 else
799 nfsd_destroy(net);
800 return err;
801}
802
803static ssize_t __write_ports(struct file *file, char *buf, size_t size,
804 struct net *net)
805{
806 if (size == 0)
807 return __write_ports_names(buf, net);
808
809 if (isdigit(buf[0]))
810 return __write_ports_addfd(buf, net, file->f_cred);
811
812 if (isalpha(buf[0]))
813 return __write_ports_addxprt(buf, net, file->f_cred);
814
815 return -EINVAL;
816}
817
818/*
819 * write_ports - Pass a socket file descriptor or transport name to listen on
820 *
821 * Input:
822 * buf: ignored
823 * size: zero
824 * Output:
825 * On success: passed-in buffer filled with a '\n'-terminated C
826 * string containing a whitespace-separated list of
827 * named NFSD listeners;
828 * return code is the size in bytes of the string
829 * On error: return code is zero or a negative errno value
830 *
831 * OR
832 *
833 * Input:
834 * buf: C string containing an unsigned
835 * integer value representing a bound
836 * but unconnected socket that is to be
837 * used as an NFSD listener; listen(3)
838 * must be called for a SOCK_STREAM
839 * socket, otherwise it is ignored
840 * size: non-zero length of C string in @buf
841 * Output:
842 * On success: NFS service is started;
843 * passed-in buffer filled with a '\n'-terminated C
844 * string containing a unique alphanumeric name of
845 * the listener;
846 * return code is the size in bytes of the string
847 * On error: return code is a negative errno value
848 *
849 * OR
850 *
851 * Input:
852 * buf: C string containing a transport
853 * name and an unsigned integer value
854 * representing the port to listen on,
855 * separated by whitespace
856 * size: non-zero length of C string in @buf
857 * Output:
858 * On success: returns zero; NFS service is started
859 * On error: return code is a negative errno value
860 */
861static ssize_t write_ports(struct file *file, char *buf, size_t size)
862{
863 ssize_t rv;
864
865 mutex_lock(&nfsd_mutex);
866 rv = __write_ports(file, buf, size, netns(file));
867 mutex_unlock(&nfsd_mutex);
868 return rv;
869}
870
871
872int nfsd_max_blksize;
873
874/*
875 * write_maxblksize - Set or report the current NFS blksize
876 *
877 * Input:
878 * buf: ignored
879 * size: zero
880 *
881 * OR
882 *
883 * Input:
884 * buf: C string containing an unsigned
885 * integer value representing the new
886 * NFS blksize
887 * size: non-zero length of C string in @buf
888 * Output:
889 * On success: passed-in buffer filled with '\n'-terminated C string
890 * containing numeric value of the current NFS blksize
891 * setting;
892 * return code is the size in bytes of the string
893 * On error: return code is zero or a negative errno value
894 */
895static ssize_t write_maxblksize(struct file *file, char *buf, size_t size)
896{
897 char *mesg = buf;
898 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
899
900 if (size > 0) {
901 int bsize;
902 int rv = get_int(&mesg, &bsize);
903 if (rv)
904 return rv;
905 /* force bsize into allowed range and
906 * required alignment.
907 */
908 bsize = max_t(int, bsize, 1024);
909 bsize = min_t(int, bsize, NFSSVC_MAXBLKSIZE);
910 bsize &= ~(1024-1);
911 mutex_lock(&nfsd_mutex);
912 if (nn->nfsd_serv) {
913 mutex_unlock(&nfsd_mutex);
914 return -EBUSY;
915 }
916 nfsd_max_blksize = bsize;
917 mutex_unlock(&nfsd_mutex);
918 }
919
920 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%d\n",
921 nfsd_max_blksize);
922}
923
924/*
925 * write_maxconn - Set or report the current max number of connections
926 *
927 * Input:
928 * buf: ignored
929 * size: zero
930 * OR
931 *
932 * Input:
933 * buf: C string containing an unsigned
934 * integer value representing the new
935 * number of max connections
936 * size: non-zero length of C string in @buf
937 * Output:
938 * On success: passed-in buffer filled with '\n'-terminated C string
939 * containing numeric value of max_connections setting
940 * for this net namespace;
941 * return code is the size in bytes of the string
942 * On error: return code is zero or a negative errno value
943 */
944static ssize_t write_maxconn(struct file *file, char *buf, size_t size)
945{
946 char *mesg = buf;
947 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
948 unsigned int maxconn = nn->max_connections;
949
950 if (size > 0) {
951 int rv = get_uint(&mesg, &maxconn);
952
953 if (rv)
954 return rv;
955 nn->max_connections = maxconn;
956 }
957
958 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%u\n", maxconn);
959}
960
961#ifdef CONFIG_NFSD_V4
962static ssize_t __nfsd4_write_time(struct file *file, char *buf, size_t size,
963 time64_t *time, struct nfsd_net *nn)
964{
965 char *mesg = buf;
966 int rv, i;
967
968 if (size > 0) {
969 if (nn->nfsd_serv)
970 return -EBUSY;
971 rv = get_int(&mesg, &i);
972 if (rv)
973 return rv;
974 /*
975 * Some sanity checking. We don't have a reason for
976 * these particular numbers, but problems with the
977 * extremes are:
978 * - Too short: the briefest network outage may
979 * cause clients to lose all their locks. Also,
980 * the frequent polling may be wasteful.
981 * - Too long: do you really want reboot recovery
982 * to take more than an hour? Or to make other
983 * clients wait an hour before being able to
984 * revoke a dead client's locks?
985 */
986 if (i < 10 || i > 3600)
987 return -EINVAL;
988 *time = i;
989 }
990
991 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%lld\n", *time);
992}
993
994static ssize_t nfsd4_write_time(struct file *file, char *buf, size_t size,
995 time64_t *time, struct nfsd_net *nn)
996{
997 ssize_t rv;
998
999 mutex_lock(&nfsd_mutex);
1000 rv = __nfsd4_write_time(file, buf, size, time, nn);
1001 mutex_unlock(&nfsd_mutex);
1002 return rv;
1003}
1004
1005/*
1006 * write_leasetime - Set or report the current NFSv4 lease time
1007 *
1008 * Input:
1009 * buf: ignored
1010 * size: zero
1011 *
1012 * OR
1013 *
1014 * Input:
1015 * buf: C string containing an unsigned
1016 * integer value representing the new
1017 * NFSv4 lease expiry time
1018 * size: non-zero length of C string in @buf
1019 * Output:
1020 * On success: passed-in buffer filled with '\n'-terminated C
1021 * string containing unsigned integer value of the
1022 * current lease expiry time;
1023 * return code is the size in bytes of the string
1024 * On error: return code is zero or a negative errno value
1025 */
1026static ssize_t write_leasetime(struct file *file, char *buf, size_t size)
1027{
1028 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1029 return nfsd4_write_time(file, buf, size, &nn->nfsd4_lease, nn);
1030}
1031
1032/*
1033 * write_gracetime - Set or report current NFSv4 grace period time
1034 *
1035 * As above, but sets the time of the NFSv4 grace period.
1036 *
1037 * Note this should never be set to less than the *previous*
1038 * lease-period time, but we don't try to enforce this. (In the common
1039 * case (a new boot), we don't know what the previous lease time was
1040 * anyway.)
1041 */
1042static ssize_t write_gracetime(struct file *file, char *buf, size_t size)
1043{
1044 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1045 return nfsd4_write_time(file, buf, size, &nn->nfsd4_grace, nn);
1046}
1047
1048static ssize_t __write_recoverydir(struct file *file, char *buf, size_t size,
1049 struct nfsd_net *nn)
1050{
1051 char *mesg = buf;
1052 char *recdir;
1053 int len, status;
1054
1055 if (size > 0) {
1056 if (nn->nfsd_serv)
1057 return -EBUSY;
1058 if (size > PATH_MAX || buf[size-1] != '\n')
1059 return -EINVAL;
1060 buf[size-1] = 0;
1061
1062 recdir = mesg;
1063 len = qword_get(&mesg, recdir, size);
1064 if (len <= 0)
1065 return -EINVAL;
1066
1067 status = nfs4_reset_recoverydir(recdir);
1068 if (status)
1069 return status;
1070 }
1071
1072 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%s\n",
1073 nfs4_recoverydir());
1074}
1075
1076/*
1077 * write_recoverydir - Set or report the pathname of the recovery directory
1078 *
1079 * Input:
1080 * buf: ignored
1081 * size: zero
1082 *
1083 * OR
1084 *
1085 * Input:
1086 * buf: C string containing the pathname
1087 * of the directory on a local file
1088 * system containing permanent NFSv4
1089 * recovery data
1090 * size: non-zero length of C string in @buf
1091 * Output:
1092 * On success: passed-in buffer filled with '\n'-terminated C string
1093 * containing the current recovery pathname setting;
1094 * return code is the size in bytes of the string
1095 * On error: return code is zero or a negative errno value
1096 */
1097static ssize_t write_recoverydir(struct file *file, char *buf, size_t size)
1098{
1099 ssize_t rv;
1100 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1101
1102 mutex_lock(&nfsd_mutex);
1103 rv = __write_recoverydir(file, buf, size, nn);
1104 mutex_unlock(&nfsd_mutex);
1105 return rv;
1106}
1107
1108/*
1109 * write_v4_end_grace - release grace period for nfsd's v4.x lock manager
1110 *
1111 * Input:
1112 * buf: ignored
1113 * size: zero
1114 * OR
1115 *
1116 * Input:
1117 * buf: any value
1118 * size: non-zero length of C string in @buf
1119 * Output:
1120 * passed-in buffer filled with "Y" or "N" with a newline
1121 * and NULL-terminated C string. This indicates whether
1122 * the grace period has ended in the current net
1123 * namespace. Return code is the size in bytes of the
1124 * string. Writing a string that starts with 'Y', 'y', or
1125 * '1' to the file will end the grace period for nfsd's v4
1126 * lock manager.
1127 */
1128static ssize_t write_v4_end_grace(struct file *file, char *buf, size_t size)
1129{
1130 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1131
1132 if (size > 0) {
1133 switch(buf[0]) {
1134 case 'Y':
1135 case 'y':
1136 case '1':
1137 if (!nn->nfsd_serv)
1138 return -EBUSY;
1139 nfsd4_end_grace(nn);
1140 break;
1141 default:
1142 return -EINVAL;
1143 }
1144 }
1145
1146 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%c\n",
1147 nn->grace_ended ? 'Y' : 'N');
1148}
1149
1150#endif
1151
1152/*----------------------------------------------------------------------------*/
1153/*
1154 * populating the filesystem.
1155 */
1156
1157/* Basically copying rpc_get_inode. */
1158static struct inode *nfsd_get_inode(struct super_block *sb, umode_t mode)
1159{
1160 struct inode *inode = new_inode(sb);
1161 if (!inode)
1162 return NULL;
1163 /* Following advice from simple_fill_super documentation: */
1164 inode->i_ino = iunique(sb, NFSD_MaxReserved);
1165 inode->i_mode = mode;
1166 inode->i_atime = inode->i_mtime = inode->i_ctime = current_time(inode);
1167 switch (mode & S_IFMT) {
1168 case S_IFDIR:
1169 inode->i_fop = &simple_dir_operations;
1170 inode->i_op = &simple_dir_inode_operations;
1171 inc_nlink(inode);
1172 break;
1173 default:
1174 break;
1175 }
1176 return inode;
1177}
1178
1179static int __nfsd_mkdir(struct inode *dir, struct dentry *dentry, umode_t mode, struct nfsdfs_client *ncl)
1180{
1181 struct inode *inode;
1182
1183 inode = nfsd_get_inode(dir->i_sb, mode);
1184 if (!inode)
1185 return -ENOMEM;
1186 if (ncl) {
1187 inode->i_private = ncl;
1188 kref_get(&ncl->cl_ref);
1189 }
1190 d_add(dentry, inode);
1191 inc_nlink(dir);
1192 fsnotify_mkdir(dir, dentry);
1193 return 0;
1194}
1195
1196static struct dentry *nfsd_mkdir(struct dentry *parent, struct nfsdfs_client *ncl, char *name)
1197{
1198 struct inode *dir = parent->d_inode;
1199 struct dentry *dentry;
1200 int ret = -ENOMEM;
1201
1202 inode_lock(dir);
1203 dentry = d_alloc_name(parent, name);
1204 if (!dentry)
1205 goto out_err;
1206 ret = __nfsd_mkdir(d_inode(parent), dentry, S_IFDIR | 0600, ncl);
1207 if (ret)
1208 goto out_err;
1209out:
1210 inode_unlock(dir);
1211 return dentry;
1212out_err:
1213 dput(dentry);
1214 dentry = ERR_PTR(ret);
1215 goto out;
1216}
1217
1218static void clear_ncl(struct inode *inode)
1219{
1220 struct nfsdfs_client *ncl = inode->i_private;
1221
1222 inode->i_private = NULL;
1223 kref_put(&ncl->cl_ref, ncl->cl_release);
1224}
1225
1226static struct nfsdfs_client *__get_nfsdfs_client(struct inode *inode)
1227{
1228 struct nfsdfs_client *nc = inode->i_private;
1229
1230 if (nc)
1231 kref_get(&nc->cl_ref);
1232 return nc;
1233}
1234
/*
 * Locked variant of __get_nfsdfs_client(): the lookup and reference grab
 * happen with @inode's lock held shared.
 */
struct nfsdfs_client *get_nfsdfs_client(struct inode *inode)
{
	struct nfsdfs_client *client;

	inode_lock_shared(inode);
	client = __get_nfsdfs_client(inode);
	inode_unlock_shared(inode);

	return client;
}
/*
 * Remove a single file @dentry from directory @dir, dropping the client
 * reference held by its inode first.  Derived from __rpc_unlink.
 */
static void nfsdfs_remove_file(struct inode *dir, struct dentry *dentry)
{
	int err;

	clear_ncl(d_inode(dentry));

	/* Hold our own reference across the unlink and d_delete(). */
	dget(dentry);
	err = simple_unlink(dir, dentry);
	d_delete(dentry);
	dput(dentry);

	WARN_ON_ONCE(err);
}
1256
1257static void nfsdfs_remove_files(struct dentry *root)
1258{
1259 struct dentry *dentry, *tmp;
1260
1261 list_for_each_entry_safe(dentry, tmp, &root->d_subdirs, d_child) {
1262 if (!simple_positive(dentry)) {
1263 WARN_ON_ONCE(1); /* I think this can't happen? */
1264 continue;
1265 }
1266 nfsdfs_remove_file(d_inode(root), dentry);
1267 }
1268}
1269
1270/* XXX: cut'n'paste from simple_fill_super; figure out if we could share
1271 * code instead. */
1272static int nfsdfs_create_files(struct dentry *root,
1273 const struct tree_descr *files,
1274 struct dentry **fdentries)
1275{
1276 struct inode *dir = d_inode(root);
1277 struct inode *inode;
1278 struct dentry *dentry;
1279 int i;
1280
1281 inode_lock(dir);
1282 for (i = 0; files->name && files->name[0]; i++, files++) {
1283 dentry = d_alloc_name(root, files->name);
1284 if (!dentry)
1285 goto out;
1286 inode = nfsd_get_inode(d_inode(root)->i_sb,
1287 S_IFREG | files->mode);
1288 if (!inode) {
1289 dput(dentry);
1290 goto out;
1291 }
1292 inode->i_fop = files->ops;
1293 inode->i_private = __get_nfsdfs_client(dir);
1294 d_add(dentry, inode);
1295 fsnotify_create(dir, dentry);
1296 if (fdentries)
1297 fdentries[i] = dentry;
1298 }
1299 inode_unlock(dir);
1300 return 0;
1301out:
1302 nfsdfs_remove_files(root);
1303 inode_unlock(dir);
1304 return -ENOMEM;
1305}
1306
1307/* on success, returns positive number unique to that client. */
1308struct dentry *nfsd_client_mkdir(struct nfsd_net *nn,
1309 struct nfsdfs_client *ncl, u32 id,
1310 const struct tree_descr *files,
1311 struct dentry **fdentries)
1312{
1313 struct dentry *dentry;
1314 char name[11];
1315 int ret;
1316
1317 sprintf(name, "%u", id);
1318
1319 dentry = nfsd_mkdir(nn->nfsd_client_dir, ncl, name);
1320 if (IS_ERR(dentry)) /* XXX: tossing errors? */
1321 return NULL;
1322 ret = nfsdfs_create_files(dentry, files, fdentries);
1323 if (ret) {
1324 nfsd_client_rmdir(dentry);
1325 return NULL;
1326 }
1327 return dentry;
1328}
1329
1330/* Taken from __rpc_rmdir: */
1331void nfsd_client_rmdir(struct dentry *dentry)
1332{
1333 struct inode *dir = d_inode(dentry->d_parent);
1334 struct inode *inode = d_inode(dentry);
1335 int ret;
1336
1337 inode_lock(dir);
1338 nfsdfs_remove_files(dentry);
1339 clear_ncl(inode);
1340 dget(dentry);
1341 ret = simple_rmdir(dir, dentry);
1342 WARN_ON_ONCE(ret);
1343 fsnotify_rmdir(dir, dentry);
1344 d_delete(dentry);
1345 dput(dentry);
1346 inode_unlock(dir);
1347}
1348
1349static int nfsd_fill_super(struct super_block *sb, struct fs_context *fc)
1350{
1351 struct nfsd_net *nn = net_generic(current->nsproxy->net_ns,
1352 nfsd_net_id);
1353 struct dentry *dentry;
1354 int ret;
1355
1356 static const struct tree_descr nfsd_files[] = {
1357 [NFSD_List] = {"exports", &exports_nfsd_operations, S_IRUGO},
1358 /* Per-export io stats use same ops as exports file */
1359 [NFSD_Export_Stats] = {"export_stats", &exports_nfsd_operations, S_IRUGO},
1360 [NFSD_Export_features] = {"export_features",
1361 &export_features_operations, S_IRUGO},
1362 [NFSD_FO_UnlockIP] = {"unlock_ip",
1363 &transaction_ops, S_IWUSR|S_IRUSR},
1364 [NFSD_FO_UnlockFS] = {"unlock_filesystem",
1365 &transaction_ops, S_IWUSR|S_IRUSR},
1366 [NFSD_Fh] = {"filehandle", &transaction_ops, S_IWUSR|S_IRUSR},
1367 [NFSD_Threads] = {"threads", &transaction_ops, S_IWUSR|S_IRUSR},
1368 [NFSD_Pool_Threads] = {"pool_threads", &transaction_ops, S_IWUSR|S_IRUSR},
1369 [NFSD_Pool_Stats] = {"pool_stats", &pool_stats_operations, S_IRUGO},
1370 [NFSD_Reply_Cache_Stats] = {"reply_cache_stats", &reply_cache_stats_operations, S_IRUGO},
1371 [NFSD_Versions] = {"versions", &transaction_ops, S_IWUSR|S_IRUSR},
1372 [NFSD_Ports] = {"portlist", &transaction_ops, S_IWUSR|S_IRUGO},
1373 [NFSD_MaxBlkSize] = {"max_block_size", &transaction_ops, S_IWUSR|S_IRUGO},
1374 [NFSD_MaxConnections] = {"max_connections", &transaction_ops, S_IWUSR|S_IRUGO},
1375#if defined(CONFIG_SUNRPC_GSS) || defined(CONFIG_SUNRPC_GSS_MODULE)
1376 [NFSD_SupportedEnctypes] = {"supported_krb5_enctypes", &supported_enctypes_ops, S_IRUGO},
1377#endif /* CONFIG_SUNRPC_GSS or CONFIG_SUNRPC_GSS_MODULE */
1378#ifdef CONFIG_NFSD_V4
1379 [NFSD_Leasetime] = {"nfsv4leasetime", &transaction_ops, S_IWUSR|S_IRUSR},
1380 [NFSD_Gracetime] = {"nfsv4gracetime", &transaction_ops, S_IWUSR|S_IRUSR},
1381 [NFSD_RecoveryDir] = {"nfsv4recoverydir", &transaction_ops, S_IWUSR|S_IRUSR},
1382 [NFSD_V4EndGrace] = {"v4_end_grace", &transaction_ops, S_IWUSR|S_IRUGO},
1383#endif
1384 /* last one */ {""}
1385 };
1386
1387 ret = simple_fill_super(sb, 0x6e667364, nfsd_files);
1388 if (ret)
1389 return ret;
1390 dentry = nfsd_mkdir(sb->s_root, NULL, "clients");
1391 if (IS_ERR(dentry))
1392 return PTR_ERR(dentry);
1393 nn->nfsd_client_dir = dentry;
1394 return 0;
1395}
1396
1397static int nfsd_fs_get_tree(struct fs_context *fc)
1398{
1399 return get_tree_keyed(fc, nfsd_fill_super, get_net(fc->net_ns));
1400}
1401
1402static void nfsd_fs_free_fc(struct fs_context *fc)
1403{
1404 if (fc->s_fs_info)
1405 put_net(fc->s_fs_info);
1406}
1407
1408static const struct fs_context_operations nfsd_fs_context_ops = {
1409 .free = nfsd_fs_free_fc,
1410 .get_tree = nfsd_fs_get_tree,
1411};
1412
1413static int nfsd_init_fs_context(struct fs_context *fc)
1414{
1415 put_user_ns(fc->user_ns);
1416 fc->user_ns = get_user_ns(fc->net_ns->user_ns);
1417 fc->ops = &nfsd_fs_context_ops;
1418 return 0;
1419}
1420
1421static void nfsd_umount(struct super_block *sb)
1422{
1423 struct net *net = sb->s_fs_info;
1424
1425 nfsd_shutdown_threads(net);
1426
1427 kill_litter_super(sb);
1428 put_net(net);
1429}
1430
1431static struct file_system_type nfsd_fs_type = {
1432 .owner = THIS_MODULE,
1433 .name = "nfsd",
1434 .init_fs_context = nfsd_init_fs_context,
1435 .kill_sb = nfsd_umount,
1436};
1437MODULE_ALIAS_FS("nfsd");
1438
#ifdef CONFIG_PROC_FS
/*
 * Create the proc directory "fs/nfs" and the "exports" entry inside it.
 * Returns 0 on success or -ENOMEM; the directory is removed again if the
 * entry cannot be created.
 */
static int create_proc_exports_entry(void)
{
	struct proc_dir_entry *nfs_dir;

	nfs_dir = proc_mkdir("fs/nfs", NULL);
	if (!nfs_dir)
		return -ENOMEM;

	if (proc_create("exports", 0, nfs_dir, &exports_proc_ops))
		return 0;

	remove_proc_entry("fs/nfs", NULL);
	return -ENOMEM;
}
#else /* CONFIG_PROC_FS */
/* Without procfs there is nothing to create. */
static int create_proc_exports_entry(void)
{
	return 0;
}
#endif
1460
1461unsigned int nfsd_net_id;
1462
1463static __net_init int nfsd_init_net(struct net *net)
1464{
1465 int retval;
1466 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1467
1468 retval = nfsd_export_init(net);
1469 if (retval)
1470 goto out_export_error;
1471 retval = nfsd_idmap_init(net);
1472 if (retval)
1473 goto out_idmap_error;
1474 nn->nfsd_versions = NULL;
1475 nn->nfsd4_minorversions = NULL;
1476 retval = nfsd_reply_cache_init(nn);
1477 if (retval)
1478 goto out_drc_error;
1479 nn->nfsd4_lease = 90; /* default lease time */
1480 nn->nfsd4_grace = 90;
1481 nn->somebody_reclaimed = false;
1482 nn->track_reclaim_completes = false;
1483 nn->clverifier_counter = prandom_u32();
1484 nn->clientid_base = prandom_u32();
1485 nn->clientid_counter = nn->clientid_base + 1;
1486 nn->s2s_cp_cl_id = nn->clientid_counter++;
1487
1488 atomic_set(&nn->ntf_refcnt, 0);
1489 init_waitqueue_head(&nn->ntf_wq);
1490 seqlock_init(&nn->boot_lock);
1491
1492 return 0;
1493
1494out_drc_error:
1495 nfsd_idmap_shutdown(net);
1496out_idmap_error:
1497 nfsd_export_shutdown(net);
1498out_export_error:
1499 return retval;
1500}
1501
1502static __net_exit void nfsd_exit_net(struct net *net)
1503{
1504 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1505
1506 nfsd_reply_cache_shutdown(nn);
1507 nfsd_idmap_shutdown(net);
1508 nfsd_export_shutdown(net);
1509 nfsd_netns_free_versions(net_generic(net, nfsd_net_id));
1510}
1511
1512static struct pernet_operations nfsd_net_ops = {
1513 .init = nfsd_init_net,
1514 .exit = nfsd_exit_net,
1515 .id = &nfsd_net_id,
1516 .size = sizeof(struct nfsd_net),
1517};
1518
1519static int __init init_nfsd(void)
1520{
1521 int retval;
1522 printk(KERN_INFO "Installing knfsd (copyright (C) 1996 okir@monad.swb.de).\n");
1523
1524 retval = register_cld_notifier();
1525 if (retval)
1526 return retval;
1527 retval = nfsd4_init_slabs();
1528 if (retval)
1529 goto out_unregister_notifier;
1530 retval = nfsd4_init_pnfs();
1531 if (retval)
1532 goto out_free_slabs;
1533 retval = nfsd_stat_init(); /* Statistics */
1534 if (retval)
1535 goto out_free_pnfs;
1536 retval = nfsd_drc_slab_create();
1537 if (retval)
1538 goto out_free_stat;
1539 nfsd_lockd_init(); /* lockd->nfsd callbacks */
1540 retval = create_proc_exports_entry();
1541 if (retval)
1542 goto out_free_lockd;
1543 retval = register_filesystem(&nfsd_fs_type);
1544 if (retval)
1545 goto out_free_exports;
1546 retval = register_pernet_subsys(&nfsd_net_ops);
1547 if (retval < 0)
1548 goto out_free_all;
1549 return 0;
1550out_free_all:
1551 unregister_filesystem(&nfsd_fs_type);
1552out_free_exports:
1553 remove_proc_entry("fs/nfs/exports", NULL);
1554 remove_proc_entry("fs/nfs", NULL);
1555out_free_lockd:
1556 nfsd_lockd_shutdown();
1557 nfsd_drc_slab_free();
1558out_free_stat:
1559 nfsd_stat_shutdown();
1560out_free_pnfs:
1561 nfsd4_exit_pnfs();
1562out_free_slabs:
1563 nfsd4_free_slabs();
1564out_unregister_notifier:
1565 unregister_cld_notifier();
1566 return retval;
1567}
1568
1569static void __exit exit_nfsd(void)
1570{
1571 unregister_pernet_subsys(&nfsd_net_ops);
1572 nfsd_drc_slab_free();
1573 remove_proc_entry("fs/nfs/exports", NULL);
1574 remove_proc_entry("fs/nfs", NULL);
1575 nfsd_stat_shutdown();
1576 nfsd_lockd_shutdown();
1577 nfsd4_free_slabs();
1578 nfsd4_exit_pnfs();
1579 unregister_filesystem(&nfsd_fs_type);
1580 unregister_cld_notifier();
1581}
1582
1583MODULE_AUTHOR("Olaf Kirch <okir@monad.swb.de>");
1584MODULE_LICENSE("GPL");
1585module_init(init_nfsd)
1586module_exit(exit_nfsd)