Loading...
1/*
2 * Syscall interface to knfsd.
3 *
4 * Copyright (C) 1995, 1996 Olaf Kirch <okir@monad.swb.de>
5 */
6
7#include <linux/slab.h>
8#include <linux/namei.h>
9#include <linux/ctype.h>
10
11#include <linux/sunrpc/svcsock.h>
12#include <linux/nfsd/syscall.h>
13#include <linux/lockd/lockd.h>
14#include <linux/sunrpc/clnt.h>
15#include <linux/sunrpc/gss_api.h>
16#include <linux/sunrpc/gss_krb5_enctypes.h>
17
18#include "idmap.h"
19#include "nfsd.h"
20#include "cache.h"
21
22/*
23 * We have a single directory with several nodes in it.
24 */
/*
 * Inode numbers of the nodes in the nfsd filesystem.  Each value is used
 * both as an index into nfsd_files[] and into write_op[].
 */
enum {
	NFSD_Root = 1,
	NFSD_List,			/* "exports" */
	NFSD_Export_features,		/* "export_features" */
	NFSD_Fh,			/* "filehandle" */
	NFSD_FO_UnlockIP,		/* "unlock_ip" */
	NFSD_FO_UnlockFS,		/* "unlock_filesystem" */
	NFSD_Threads,			/* "threads" */
	NFSD_Pool_Threads,		/* "pool_threads" */
	NFSD_Pool_Stats,		/* "pool_stats" */
	NFSD_Versions,			/* "versions" */
	NFSD_Ports,			/* "portlist" */
	NFSD_MaxBlkSize,		/* "max_block_size" */
	NFSD_SupportedEnctypes,		/* "supported_krb5_enctypes" */
	/*
	 * The NFSv4-only entries MUST stay at the end.  Otherwise a
	 * !CONFIG_NFSD_V4 build leaves a hole in nfsd_files[] and
	 * simple_fill_super() goes oops.
	 */
#ifdef CONFIG_NFSD_V4
	NFSD_Leasetime,			/* "nfsv4leasetime" */
	NFSD_Gracetime,			/* "nfsv4gracetime" */
	NFSD_RecoveryDir,		/* "nfsv4recoverydir" */
#endif
};
49
50/*
51 * write() for these nodes.
52 */
53static ssize_t write_filehandle(struct file *file, char *buf, size_t size);
54static ssize_t write_unlock_ip(struct file *file, char *buf, size_t size);
55static ssize_t write_unlock_fs(struct file *file, char *buf, size_t size);
56static ssize_t write_threads(struct file *file, char *buf, size_t size);
57static ssize_t write_pool_threads(struct file *file, char *buf, size_t size);
58static ssize_t write_versions(struct file *file, char *buf, size_t size);
59static ssize_t write_ports(struct file *file, char *buf, size_t size);
60static ssize_t write_maxblksize(struct file *file, char *buf, size_t size);
61#ifdef CONFIG_NFSD_V4
62static ssize_t write_leasetime(struct file *file, char *buf, size_t size);
63static ssize_t write_gracetime(struct file *file, char *buf, size_t size);
64static ssize_t write_recoverydir(struct file *file, char *buf, size_t size);
65#endif
66
67static ssize_t (*write_op[])(struct file *, char *, size_t) = {
68 [NFSD_Fh] = write_filehandle,
69 [NFSD_FO_UnlockIP] = write_unlock_ip,
70 [NFSD_FO_UnlockFS] = write_unlock_fs,
71 [NFSD_Threads] = write_threads,
72 [NFSD_Pool_Threads] = write_pool_threads,
73 [NFSD_Versions] = write_versions,
74 [NFSD_Ports] = write_ports,
75 [NFSD_MaxBlkSize] = write_maxblksize,
76#ifdef CONFIG_NFSD_V4
77 [NFSD_Leasetime] = write_leasetime,
78 [NFSD_Gracetime] = write_gracetime,
79 [NFSD_RecoveryDir] = write_recoverydir,
80#endif
81};
82
83static ssize_t nfsctl_transaction_write(struct file *file, const char __user *buf, size_t size, loff_t *pos)
84{
85 ino_t ino = file->f_path.dentry->d_inode->i_ino;
86 char *data;
87 ssize_t rv;
88
89 if (ino >= ARRAY_SIZE(write_op) || !write_op[ino])
90 return -EINVAL;
91
92 data = simple_transaction_get(file, buf, size);
93 if (IS_ERR(data))
94 return PTR_ERR(data);
95
96 rv = write_op[ino](file, data, size);
97 if (rv >= 0) {
98 simple_transaction_set(file, rv);
99 rv = size;
100 }
101 return rv;
102}
103
104static ssize_t nfsctl_transaction_read(struct file *file, char __user *buf, size_t size, loff_t *pos)
105{
106 if (! file->private_data) {
107 /* An attempt to read a transaction file without writing
108 * causes a 0-byte write so that the file can return
109 * state information
110 */
111 ssize_t rv = nfsctl_transaction_write(file, buf, 0, pos);
112 if (rv < 0)
113 return rv;
114 }
115 return simple_transaction_read(file, buf, size, pos);
116}
117
118static const struct file_operations transaction_ops = {
119 .write = nfsctl_transaction_write,
120 .read = nfsctl_transaction_read,
121 .release = simple_transaction_release,
122 .llseek = default_llseek,
123};
124
125static int exports_open(struct inode *inode, struct file *file)
126{
127 return seq_open(file, &nfs_exports_op);
128}
129
130static const struct file_operations exports_operations = {
131 .open = exports_open,
132 .read = seq_read,
133 .llseek = seq_lseek,
134 .release = seq_release,
135 .owner = THIS_MODULE,
136};
137
138static int export_features_show(struct seq_file *m, void *v)
139{
140 seq_printf(m, "0x%x 0x%x\n", NFSEXP_ALLFLAGS, NFSEXP_SECINFO_FLAGS);
141 return 0;
142}
143
144static int export_features_open(struct inode *inode, struct file *file)
145{
146 return single_open(file, export_features_show, NULL);
147}
148
149static struct file_operations export_features_operations = {
150 .open = export_features_open,
151 .read = seq_read,
152 .llseek = seq_lseek,
153 .release = single_release,
154};
155
156#if defined(CONFIG_SUNRPC_GSS) || defined(CONFIG_SUNRPC_GSS_MODULE)
157static int supported_enctypes_show(struct seq_file *m, void *v)
158{
159 seq_printf(m, KRB5_SUPPORTED_ENCTYPES);
160 return 0;
161}
162
163static int supported_enctypes_open(struct inode *inode, struct file *file)
164{
165 return single_open(file, supported_enctypes_show, NULL);
166}
167
168static struct file_operations supported_enctypes_ops = {
169 .open = supported_enctypes_open,
170 .read = seq_read,
171 .llseek = seq_lseek,
172 .release = single_release,
173};
174#endif /* CONFIG_SUNRPC_GSS or CONFIG_SUNRPC_GSS_MODULE */
175
176extern int nfsd_pool_stats_open(struct inode *inode, struct file *file);
177extern int nfsd_pool_stats_release(struct inode *inode, struct file *file);
178
179static const struct file_operations pool_stats_operations = {
180 .open = nfsd_pool_stats_open,
181 .read = seq_read,
182 .llseek = seq_lseek,
183 .release = nfsd_pool_stats_release,
184 .owner = THIS_MODULE,
185};
186
187/*----------------------------------------------------------------------------*/
188/*
189 * payload - write methods
190 */
191
192
193/**
194 * write_unlock_ip - Release all locks used by a client
195 *
196 * Experimental.
197 *
198 * Input:
199 * buf: '\n'-terminated C string containing a
200 * presentation format IP address
201 * size: length of C string in @buf
202 * Output:
203 * On success: returns zero if all specified locks were released;
204 * returns one if one or more locks were not released
205 * On error: return code is negative errno value
206 */
207static ssize_t write_unlock_ip(struct file *file, char *buf, size_t size)
208{
209 struct sockaddr_storage address;
210 struct sockaddr *sap = (struct sockaddr *)&address;
211 size_t salen = sizeof(address);
212 char *fo_path;
213
214 /* sanity check */
215 if (size == 0)
216 return -EINVAL;
217
218 if (buf[size-1] != '\n')
219 return -EINVAL;
220
221 fo_path = buf;
222 if (qword_get(&buf, fo_path, size) < 0)
223 return -EINVAL;
224
225 if (rpc_pton(fo_path, size, sap, salen) == 0)
226 return -EINVAL;
227
228 return nlmsvc_unlock_all_by_ip(sap);
229}
230
231/**
232 * write_unlock_fs - Release all locks on a local file system
233 *
234 * Experimental.
235 *
236 * Input:
237 * buf: '\n'-terminated C string containing the
238 * absolute pathname of a local file system
239 * size: length of C string in @buf
240 * Output:
241 * On success: returns zero if all specified locks were released;
242 * returns one if one or more locks were not released
243 * On error: return code is negative errno value
244 */
245static ssize_t write_unlock_fs(struct file *file, char *buf, size_t size)
246{
247 struct path path;
248 char *fo_path;
249 int error;
250
251 /* sanity check */
252 if (size == 0)
253 return -EINVAL;
254
255 if (buf[size-1] != '\n')
256 return -EINVAL;
257
258 fo_path = buf;
259 if (qword_get(&buf, fo_path, size) < 0)
260 return -EINVAL;
261
262 error = kern_path(fo_path, 0, &path);
263 if (error)
264 return error;
265
266 /*
267 * XXX: Needs better sanity checking. Otherwise we could end up
268 * releasing locks on the wrong file system.
269 *
270 * For example:
271 * 1. Does the path refer to a directory?
272 * 2. Is that directory a mount point, or
273 * 3. Is that directory the root of an exported file system?
274 */
275 error = nlmsvc_unlock_all_by_sb(path.mnt->mnt_sb);
276
277 path_put(&path);
278 return error;
279}
280
281/**
282 * write_filehandle - Get a variable-length NFS file handle by path
283 *
284 * On input, the buffer contains a '\n'-terminated C string comprised of
285 * three alphanumeric words separated by whitespace. The string may
286 * contain escape sequences.
287 *
288 * Input:
289 * buf:
290 * domain: client domain name
291 * path: export pathname
292 * maxsize: numeric maximum size of
293 * @buf
294 * size: length of C string in @buf
295 * Output:
296 * On success: passed-in buffer filled with '\n'-terminated C
297 * string containing a ASCII hex text version
298 * of the NFS file handle;
299 * return code is the size in bytes of the string
300 * On error: return code is negative errno value
301 */
302static ssize_t write_filehandle(struct file *file, char *buf, size_t size)
303{
304 char *dname, *path;
305 int uninitialized_var(maxsize);
306 char *mesg = buf;
307 int len;
308 struct auth_domain *dom;
309 struct knfsd_fh fh;
310
311 if (size == 0)
312 return -EINVAL;
313
314 if (buf[size-1] != '\n')
315 return -EINVAL;
316 buf[size-1] = 0;
317
318 dname = mesg;
319 len = qword_get(&mesg, dname, size);
320 if (len <= 0)
321 return -EINVAL;
322
323 path = dname+len+1;
324 len = qword_get(&mesg, path, size);
325 if (len <= 0)
326 return -EINVAL;
327
328 len = get_int(&mesg, &maxsize);
329 if (len)
330 return len;
331
332 if (maxsize < NFS_FHSIZE)
333 return -EINVAL;
334 if (maxsize > NFS3_FHSIZE)
335 maxsize = NFS3_FHSIZE;
336
337 if (qword_get(&mesg, mesg, size)>0)
338 return -EINVAL;
339
340 /* we have all the words, they are in buf.. */
341 dom = unix_domain_find(dname);
342 if (!dom)
343 return -ENOMEM;
344
345 len = exp_rootfh(dom, path, &fh, maxsize);
346 auth_domain_put(dom);
347 if (len)
348 return len;
349
350 mesg = buf;
351 len = SIMPLE_TRANSACTION_LIMIT;
352 qword_addhex(&mesg, &len, (char*)&fh.fh_base, fh.fh_size);
353 mesg[-1] = '\n';
354 return mesg - buf;
355}
356
357/**
358 * write_threads - Start NFSD, or report the current number of running threads
359 *
360 * Input:
361 * buf: ignored
362 * size: zero
363 * Output:
364 * On success: passed-in buffer filled with '\n'-terminated C
365 * string numeric value representing the number of
366 * running NFSD threads;
367 * return code is the size in bytes of the string
368 * On error: return code is zero
369 *
370 * OR
371 *
372 * Input:
373 * buf: C string containing an unsigned
374 * integer value representing the
375 * number of NFSD threads to start
376 * size: non-zero length of C string in @buf
377 * Output:
378 * On success: NFS service is started;
379 * passed-in buffer filled with '\n'-terminated C
380 * string numeric value representing the number of
381 * running NFSD threads;
382 * return code is the size in bytes of the string
383 * On error: return code is zero or a negative errno value
384 */
385static ssize_t write_threads(struct file *file, char *buf, size_t size)
386{
387 char *mesg = buf;
388 int rv;
389 if (size > 0) {
390 int newthreads;
391 rv = get_int(&mesg, &newthreads);
392 if (rv)
393 return rv;
394 if (newthreads < 0)
395 return -EINVAL;
396 rv = nfsd_svc(NFS_PORT, newthreads);
397 if (rv < 0)
398 return rv;
399 } else
400 rv = nfsd_nrthreads();
401
402 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%d\n", rv);
403}
404
405/**
406 * write_pool_threads - Set or report the current number of threads per pool
407 *
408 * Input:
409 * buf: ignored
410 * size: zero
411 *
412 * OR
413 *
414 * Input:
415 * buf: C string containing whitespace-
416 * separated unsigned integer values
417 * representing the number of NFSD
418 * threads to start in each pool
419 * size: non-zero length of C string in @buf
420 * Output:
421 * On success: passed-in buffer filled with '\n'-terminated C
422 * string containing integer values representing the
423 * number of NFSD threads in each pool;
424 * return code is the size in bytes of the string
425 * On error: return code is zero or a negative errno value
426 */
427static ssize_t write_pool_threads(struct file *file, char *buf, size_t size)
428{
429 /* if size > 0, look for an array of number of threads per node
430 * and apply them then write out number of threads per node as reply
431 */
432 char *mesg = buf;
433 int i;
434 int rv;
435 int len;
436 int npools;
437 int *nthreads;
438
439 mutex_lock(&nfsd_mutex);
440 npools = nfsd_nrpools();
441 if (npools == 0) {
442 /*
443 * NFS is shut down. The admin can start it by
444 * writing to the threads file but NOT the pool_threads
445 * file, sorry. Report zero threads.
446 */
447 mutex_unlock(&nfsd_mutex);
448 strcpy(buf, "0\n");
449 return strlen(buf);
450 }
451
452 nthreads = kcalloc(npools, sizeof(int), GFP_KERNEL);
453 rv = -ENOMEM;
454 if (nthreads == NULL)
455 goto out_free;
456
457 if (size > 0) {
458 for (i = 0; i < npools; i++) {
459 rv = get_int(&mesg, &nthreads[i]);
460 if (rv == -ENOENT)
461 break; /* fewer numbers than pools */
462 if (rv)
463 goto out_free; /* syntax error */
464 rv = -EINVAL;
465 if (nthreads[i] < 0)
466 goto out_free;
467 }
468 rv = nfsd_set_nrthreads(i, nthreads);
469 if (rv)
470 goto out_free;
471 }
472
473 rv = nfsd_get_nrthreads(npools, nthreads);
474 if (rv)
475 goto out_free;
476
477 mesg = buf;
478 size = SIMPLE_TRANSACTION_LIMIT;
479 for (i = 0; i < npools && size > 0; i++) {
480 snprintf(mesg, size, "%d%c", nthreads[i], (i == npools-1 ? '\n' : ' '));
481 len = strlen(mesg);
482 size -= len;
483 mesg += len;
484 }
485 rv = mesg - buf;
486out_free:
487 kfree(nthreads);
488 mutex_unlock(&nfsd_mutex);
489 return rv;
490}
491
492static ssize_t __write_versions(struct file *file, char *buf, size_t size)
493{
494 char *mesg = buf;
495 char *vers, *minorp, sign;
496 int len, num, remaining;
497 unsigned minor;
498 ssize_t tlen = 0;
499 char *sep;
500
501 if (size>0) {
502 if (nfsd_serv)
503 /* Cannot change versions without updating
504 * nfsd_serv->sv_xdrsize, and reallocing
505 * rq_argp and rq_resp
506 */
507 return -EBUSY;
508 if (buf[size-1] != '\n')
509 return -EINVAL;
510 buf[size-1] = 0;
511
512 vers = mesg;
513 len = qword_get(&mesg, vers, size);
514 if (len <= 0) return -EINVAL;
515 do {
516 sign = *vers;
517 if (sign == '+' || sign == '-')
518 num = simple_strtol((vers+1), &minorp, 0);
519 else
520 num = simple_strtol(vers, &minorp, 0);
521 if (*minorp == '.') {
522 if (num < 4)
523 return -EINVAL;
524 minor = simple_strtoul(minorp+1, NULL, 0);
525 if (minor == 0)
526 return -EINVAL;
527 if (nfsd_minorversion(minor, sign == '-' ?
528 NFSD_CLEAR : NFSD_SET) < 0)
529 return -EINVAL;
530 goto next;
531 }
532 switch(num) {
533 case 2:
534 case 3:
535 case 4:
536 nfsd_vers(num, sign == '-' ? NFSD_CLEAR : NFSD_SET);
537 break;
538 default:
539 return -EINVAL;
540 }
541 next:
542 vers += len + 1;
543 } while ((len = qword_get(&mesg, vers, size)) > 0);
544 /* If all get turned off, turn them back on, as
545 * having no versions is BAD
546 */
547 nfsd_reset_versions();
548 }
549
550 /* Now write current state into reply buffer */
551 len = 0;
552 sep = "";
553 remaining = SIMPLE_TRANSACTION_LIMIT;
554 for (num=2 ; num <= 4 ; num++)
555 if (nfsd_vers(num, NFSD_AVAIL)) {
556 len = snprintf(buf, remaining, "%s%c%d", sep,
557 nfsd_vers(num, NFSD_TEST)?'+':'-',
558 num);
559 sep = " ";
560
561 if (len > remaining)
562 break;
563 remaining -= len;
564 buf += len;
565 tlen += len;
566 }
567 if (nfsd_vers(4, NFSD_AVAIL))
568 for (minor = 1; minor <= NFSD_SUPPORTED_MINOR_VERSION;
569 minor++) {
570 len = snprintf(buf, remaining, " %c4.%u",
571 (nfsd_vers(4, NFSD_TEST) &&
572 nfsd_minorversion(minor, NFSD_TEST)) ?
573 '+' : '-',
574 minor);
575
576 if (len > remaining)
577 break;
578 remaining -= len;
579 buf += len;
580 tlen += len;
581 }
582
583 len = snprintf(buf, remaining, "\n");
584 if (len > remaining)
585 return -EINVAL;
586 return tlen + len;
587}
588
589/**
590 * write_versions - Set or report the available NFS protocol versions
591 *
592 * Input:
593 * buf: ignored
594 * size: zero
595 * Output:
596 * On success: passed-in buffer filled with '\n'-terminated C
597 * string containing positive or negative integer
598 * values representing the current status of each
599 * protocol version;
600 * return code is the size in bytes of the string
601 * On error: return code is zero or a negative errno value
602 *
603 * OR
604 *
605 * Input:
606 * buf: C string containing whitespace-
607 * separated positive or negative
608 * integer values representing NFS
609 * protocol versions to enable ("+n")
610 * or disable ("-n")
611 * size: non-zero length of C string in @buf
612 * Output:
613 * On success: status of zero or more protocol versions has
614 * been updated; passed-in buffer filled with
615 * '\n'-terminated C string containing positive
616 * or negative integer values representing the
617 * current status of each protocol version;
618 * return code is the size in bytes of the string
619 * On error: return code is zero or a negative errno value
620 */
621static ssize_t write_versions(struct file *file, char *buf, size_t size)
622{
623 ssize_t rv;
624
625 mutex_lock(&nfsd_mutex);
626 rv = __write_versions(file, buf, size);
627 mutex_unlock(&nfsd_mutex);
628 return rv;
629}
630
631/*
632 * Zero-length write. Return a list of NFSD's current listener
633 * transports.
634 */
635static ssize_t __write_ports_names(char *buf)
636{
637 if (nfsd_serv == NULL)
638 return 0;
639 return svc_xprt_names(nfsd_serv, buf, SIMPLE_TRANSACTION_LIMIT);
640}
641
642/*
643 * A single 'fd' number was written, in which case it must be for
644 * a socket of a supported family/protocol, and we use it as an
645 * nfsd listener.
646 */
647static ssize_t __write_ports_addfd(char *buf)
648{
649 char *mesg = buf;
650 int fd, err;
651
652 err = get_int(&mesg, &fd);
653 if (err != 0 || fd < 0)
654 return -EINVAL;
655
656 err = nfsd_create_serv();
657 if (err != 0)
658 return err;
659
660 err = svc_addsock(nfsd_serv, fd, buf, SIMPLE_TRANSACTION_LIMIT);
661 if (err < 0) {
662 svc_destroy(nfsd_serv);
663 return err;
664 }
665
666 /* Decrease the count, but don't shut down the service */
667 nfsd_serv->sv_nrthreads--;
668 return err;
669}
670
671/*
672 * A '-' followed by the 'name' of a socket means we close the socket.
673 */
674static ssize_t __write_ports_delfd(char *buf)
675{
676 char *toclose;
677 int len = 0;
678
679 toclose = kstrdup(buf + 1, GFP_KERNEL);
680 if (toclose == NULL)
681 return -ENOMEM;
682
683 if (nfsd_serv != NULL)
684 len = svc_sock_names(nfsd_serv, buf,
685 SIMPLE_TRANSACTION_LIMIT, toclose);
686 kfree(toclose);
687 return len;
688}
689
690/*
691 * A transport listener is added by writing it's transport name and
692 * a port number.
693 */
694static ssize_t __write_ports_addxprt(char *buf)
695{
696 char transport[16];
697 struct svc_xprt *xprt;
698 int port, err;
699
700 if (sscanf(buf, "%15s %4u", transport, &port) != 2)
701 return -EINVAL;
702
703 if (port < 1 || port > USHRT_MAX)
704 return -EINVAL;
705
706 err = nfsd_create_serv();
707 if (err != 0)
708 return err;
709
710 err = svc_create_xprt(nfsd_serv, transport, &init_net,
711 PF_INET, port, SVC_SOCK_ANONYMOUS);
712 if (err < 0)
713 goto out_err;
714
715 err = svc_create_xprt(nfsd_serv, transport, &init_net,
716 PF_INET6, port, SVC_SOCK_ANONYMOUS);
717 if (err < 0 && err != -EAFNOSUPPORT)
718 goto out_close;
719
720 /* Decrease the count, but don't shut down the service */
721 nfsd_serv->sv_nrthreads--;
722 return 0;
723out_close:
724 xprt = svc_find_xprt(nfsd_serv, transport, PF_INET, port);
725 if (xprt != NULL) {
726 svc_close_xprt(xprt);
727 svc_xprt_put(xprt);
728 }
729out_err:
730 svc_destroy(nfsd_serv);
731 return err;
732}
733
734/*
735 * A transport listener is removed by writing a "-", it's transport
736 * name, and it's port number.
737 */
738static ssize_t __write_ports_delxprt(char *buf)
739{
740 struct svc_xprt *xprt;
741 char transport[16];
742 int port;
743
744 if (sscanf(&buf[1], "%15s %4u", transport, &port) != 2)
745 return -EINVAL;
746
747 if (port < 1 || port > USHRT_MAX || nfsd_serv == NULL)
748 return -EINVAL;
749
750 xprt = svc_find_xprt(nfsd_serv, transport, AF_UNSPEC, port);
751 if (xprt == NULL)
752 return -ENOTCONN;
753
754 svc_close_xprt(xprt);
755 svc_xprt_put(xprt);
756 return 0;
757}
758
759static ssize_t __write_ports(struct file *file, char *buf, size_t size)
760{
761 if (size == 0)
762 return __write_ports_names(buf);
763
764 if (isdigit(buf[0]))
765 return __write_ports_addfd(buf);
766
767 if (buf[0] == '-' && isdigit(buf[1]))
768 return __write_ports_delfd(buf);
769
770 if (isalpha(buf[0]))
771 return __write_ports_addxprt(buf);
772
773 if (buf[0] == '-' && isalpha(buf[1]))
774 return __write_ports_delxprt(buf);
775
776 return -EINVAL;
777}
778
779/**
780 * write_ports - Pass a socket file descriptor or transport name to listen on
781 *
782 * Input:
783 * buf: ignored
784 * size: zero
785 * Output:
786 * On success: passed-in buffer filled with a '\n'-terminated C
787 * string containing a whitespace-separated list of
788 * named NFSD listeners;
789 * return code is the size in bytes of the string
790 * On error: return code is zero or a negative errno value
791 *
792 * OR
793 *
794 * Input:
795 * buf: C string containing an unsigned
796 * integer value representing a bound
797 * but unconnected socket that is to be
798 * used as an NFSD listener; listen(3)
799 * must be called for a SOCK_STREAM
800 * socket, otherwise it is ignored
801 * size: non-zero length of C string in @buf
802 * Output:
803 * On success: NFS service is started;
804 * passed-in buffer filled with a '\n'-terminated C
805 * string containing a unique alphanumeric name of
806 * the listener;
807 * return code is the size in bytes of the string
808 * On error: return code is a negative errno value
809 *
810 * OR
811 *
812 * Input:
813 * buf: C string containing a "-" followed
814 * by an integer value representing a
815 * previously passed in socket file
816 * descriptor
817 * size: non-zero length of C string in @buf
818 * Output:
819 * On success: NFS service no longer listens on that socket;
820 * passed-in buffer filled with a '\n'-terminated C
821 * string containing a unique name of the listener;
822 * return code is the size in bytes of the string
823 * On error: return code is a negative errno value
824 *
825 * OR
826 *
827 * Input:
828 * buf: C string containing a transport
829 * name and an unsigned integer value
830 * representing the port to listen on,
831 * separated by whitespace
832 * size: non-zero length of C string in @buf
833 * Output:
834 * On success: returns zero; NFS service is started
835 * On error: return code is a negative errno value
836 *
837 * OR
838 *
839 * Input:
840 * buf: C string containing a "-" followed
841 * by a transport name and an unsigned
842 * integer value representing the port
843 * to listen on, separated by whitespace
844 * size: non-zero length of C string in @buf
845 * Output:
846 * On success: returns zero; NFS service no longer listens
847 * on that transport
848 * On error: return code is a negative errno value
849 */
850static ssize_t write_ports(struct file *file, char *buf, size_t size)
851{
852 ssize_t rv;
853
854 mutex_lock(&nfsd_mutex);
855 rv = __write_ports(file, buf, size);
856 mutex_unlock(&nfsd_mutex);
857 return rv;
858}
859
860
861int nfsd_max_blksize;
862
863/**
864 * write_maxblksize - Set or report the current NFS blksize
865 *
866 * Input:
867 * buf: ignored
868 * size: zero
869 *
870 * OR
871 *
872 * Input:
873 * buf: C string containing an unsigned
874 * integer value representing the new
875 * NFS blksize
876 * size: non-zero length of C string in @buf
877 * Output:
878 * On success: passed-in buffer filled with '\n'-terminated C string
879 * containing numeric value of the current NFS blksize
880 * setting;
881 * return code is the size in bytes of the string
882 * On error: return code is zero or a negative errno value
883 */
884static ssize_t write_maxblksize(struct file *file, char *buf, size_t size)
885{
886 char *mesg = buf;
887 if (size > 0) {
888 int bsize;
889 int rv = get_int(&mesg, &bsize);
890 if (rv)
891 return rv;
892 /* force bsize into allowed range and
893 * required alignment.
894 */
895 if (bsize < 1024)
896 bsize = 1024;
897 if (bsize > NFSSVC_MAXBLKSIZE)
898 bsize = NFSSVC_MAXBLKSIZE;
899 bsize &= ~(1024-1);
900 mutex_lock(&nfsd_mutex);
901 if (nfsd_serv) {
902 mutex_unlock(&nfsd_mutex);
903 return -EBUSY;
904 }
905 nfsd_max_blksize = bsize;
906 mutex_unlock(&nfsd_mutex);
907 }
908
909 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%d\n",
910 nfsd_max_blksize);
911}
912
913#ifdef CONFIG_NFSD_V4
914static ssize_t __nfsd4_write_time(struct file *file, char *buf, size_t size, time_t *time)
915{
916 char *mesg = buf;
917 int rv, i;
918
919 if (size > 0) {
920 if (nfsd_serv)
921 return -EBUSY;
922 rv = get_int(&mesg, &i);
923 if (rv)
924 return rv;
925 /*
926 * Some sanity checking. We don't have a reason for
927 * these particular numbers, but problems with the
928 * extremes are:
929 * - Too short: the briefest network outage may
930 * cause clients to lose all their locks. Also,
931 * the frequent polling may be wasteful.
932 * - Too long: do you really want reboot recovery
933 * to take more than an hour? Or to make other
934 * clients wait an hour before being able to
935 * revoke a dead client's locks?
936 */
937 if (i < 10 || i > 3600)
938 return -EINVAL;
939 *time = i;
940 }
941
942 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%ld\n", *time);
943}
944
945static ssize_t nfsd4_write_time(struct file *file, char *buf, size_t size, time_t *time)
946{
947 ssize_t rv;
948
949 mutex_lock(&nfsd_mutex);
950 rv = __nfsd4_write_time(file, buf, size, time);
951 mutex_unlock(&nfsd_mutex);
952 return rv;
953}
954
955/**
956 * write_leasetime - Set or report the current NFSv4 lease time
957 *
958 * Input:
959 * buf: ignored
960 * size: zero
961 *
962 * OR
963 *
964 * Input:
965 * buf: C string containing an unsigned
966 * integer value representing the new
967 * NFSv4 lease expiry time
968 * size: non-zero length of C string in @buf
969 * Output:
970 * On success: passed-in buffer filled with '\n'-terminated C
971 * string containing unsigned integer value of the
972 * current lease expiry time;
973 * return code is the size in bytes of the string
974 * On error: return code is zero or a negative errno value
975 */
976static ssize_t write_leasetime(struct file *file, char *buf, size_t size)
977{
978 return nfsd4_write_time(file, buf, size, &nfsd4_lease);
979}
980
981/**
982 * write_gracetime - Set or report current NFSv4 grace period time
983 *
984 * As above, but sets the time of the NFSv4 grace period.
985 *
986 * Note this should never be set to less than the *previous*
987 * lease-period time, but we don't try to enforce this. (In the common
988 * case (a new boot), we don't know what the previous lease time was
989 * anyway.)
990 */
991static ssize_t write_gracetime(struct file *file, char *buf, size_t size)
992{
993 return nfsd4_write_time(file, buf, size, &nfsd4_grace);
994}
995
996extern char *nfs4_recoverydir(void);
997
998static ssize_t __write_recoverydir(struct file *file, char *buf, size_t size)
999{
1000 char *mesg = buf;
1001 char *recdir;
1002 int len, status;
1003
1004 if (size > 0) {
1005 if (nfsd_serv)
1006 return -EBUSY;
1007 if (size > PATH_MAX || buf[size-1] != '\n')
1008 return -EINVAL;
1009 buf[size-1] = 0;
1010
1011 recdir = mesg;
1012 len = qword_get(&mesg, recdir, size);
1013 if (len <= 0)
1014 return -EINVAL;
1015
1016 status = nfs4_reset_recoverydir(recdir);
1017 if (status)
1018 return status;
1019 }
1020
1021 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%s\n",
1022 nfs4_recoverydir());
1023}
1024
1025/**
1026 * write_recoverydir - Set or report the pathname of the recovery directory
1027 *
1028 * Input:
1029 * buf: ignored
1030 * size: zero
1031 *
1032 * OR
1033 *
1034 * Input:
1035 * buf: C string containing the pathname
1036 * of the directory on a local file
1037 * system containing permanent NFSv4
1038 * recovery data
1039 * size: non-zero length of C string in @buf
1040 * Output:
1041 * On success: passed-in buffer filled with '\n'-terminated C string
1042 * containing the current recovery pathname setting;
1043 * return code is the size in bytes of the string
1044 * On error: return code is zero or a negative errno value
1045 */
1046static ssize_t write_recoverydir(struct file *file, char *buf, size_t size)
1047{
1048 ssize_t rv;
1049
1050 mutex_lock(&nfsd_mutex);
1051 rv = __write_recoverydir(file, buf, size);
1052 mutex_unlock(&nfsd_mutex);
1053 return rv;
1054}
1055
1056#endif
1057
1058/*----------------------------------------------------------------------------*/
1059/*
1060 * populating the filesystem.
1061 */
1062
1063static int nfsd_fill_super(struct super_block * sb, void * data, int silent)
1064{
1065 static struct tree_descr nfsd_files[] = {
1066 [NFSD_List] = {"exports", &exports_operations, S_IRUGO},
1067 [NFSD_Export_features] = {"export_features",
1068 &export_features_operations, S_IRUGO},
1069 [NFSD_FO_UnlockIP] = {"unlock_ip",
1070 &transaction_ops, S_IWUSR|S_IRUSR},
1071 [NFSD_FO_UnlockFS] = {"unlock_filesystem",
1072 &transaction_ops, S_IWUSR|S_IRUSR},
1073 [NFSD_Fh] = {"filehandle", &transaction_ops, S_IWUSR|S_IRUSR},
1074 [NFSD_Threads] = {"threads", &transaction_ops, S_IWUSR|S_IRUSR},
1075 [NFSD_Pool_Threads] = {"pool_threads", &transaction_ops, S_IWUSR|S_IRUSR},
1076 [NFSD_Pool_Stats] = {"pool_stats", &pool_stats_operations, S_IRUGO},
1077 [NFSD_Versions] = {"versions", &transaction_ops, S_IWUSR|S_IRUSR},
1078 [NFSD_Ports] = {"portlist", &transaction_ops, S_IWUSR|S_IRUGO},
1079 [NFSD_MaxBlkSize] = {"max_block_size", &transaction_ops, S_IWUSR|S_IRUGO},
1080#if defined(CONFIG_SUNRPC_GSS) || defined(CONFIG_SUNRPC_GSS_MODULE)
1081 [NFSD_SupportedEnctypes] = {"supported_krb5_enctypes", &supported_enctypes_ops, S_IRUGO},
1082#endif /* CONFIG_SUNRPC_GSS or CONFIG_SUNRPC_GSS_MODULE */
1083#ifdef CONFIG_NFSD_V4
1084 [NFSD_Leasetime] = {"nfsv4leasetime", &transaction_ops, S_IWUSR|S_IRUSR},
1085 [NFSD_Gracetime] = {"nfsv4gracetime", &transaction_ops, S_IWUSR|S_IRUSR},
1086 [NFSD_RecoveryDir] = {"nfsv4recoverydir", &transaction_ops, S_IWUSR|S_IRUSR},
1087#endif
1088 /* last one */ {""}
1089 };
1090 return simple_fill_super(sb, 0x6e667364, nfsd_files);
1091}
1092
1093static struct dentry *nfsd_mount(struct file_system_type *fs_type,
1094 int flags, const char *dev_name, void *data)
1095{
1096 return mount_single(fs_type, flags, data, nfsd_fill_super);
1097}
1098
1099static struct file_system_type nfsd_fs_type = {
1100 .owner = THIS_MODULE,
1101 .name = "nfsd",
1102 .mount = nfsd_mount,
1103 .kill_sb = kill_litter_super,
1104};
1105
#ifdef CONFIG_PROC_FS
/*
 * Create the "fs/nfs" proc directory and the "exports" entry inside it.
 *
 * Returns 0 on success or -ENOMEM if either entry cannot be created.
 * If the "exports" entry fails, the directory created a moment earlier
 * is removed again so that nothing is left behind on the error path;
 * init_nfsd() does not clean up proc entries when this function fails.
 */
static int create_proc_exports_entry(void)
{
	struct proc_dir_entry *entry;

	entry = proc_mkdir("fs/nfs", NULL);
	if (!entry)
		return -ENOMEM;
	entry = proc_create("exports", 0, entry, &exports_operations);
	if (!entry) {
		remove_proc_entry("fs/nfs", NULL);
		return -ENOMEM;
	}
	return 0;
}
#else /* CONFIG_PROC_FS */
/* Without procfs there is nothing to create; always succeeds. */
static int create_proc_exports_entry(void)
{
	return 0;
}
#endif
1125
1126static int __init init_nfsd(void)
1127{
1128 int retval;
1129 printk(KERN_INFO "Installing knfsd (copyright (C) 1996 okir@monad.swb.de).\n");
1130
1131 retval = nfs4_state_init(); /* nfs4 locking state */
1132 if (retval)
1133 return retval;
1134 nfsd_stat_init(); /* Statistics */
1135 retval = nfsd_reply_cache_init();
1136 if (retval)
1137 goto out_free_stat;
1138 retval = nfsd_export_init();
1139 if (retval)
1140 goto out_free_cache;
1141 nfsd_lockd_init(); /* lockd->nfsd callbacks */
1142 retval = nfsd_idmap_init();
1143 if (retval)
1144 goto out_free_lockd;
1145 retval = create_proc_exports_entry();
1146 if (retval)
1147 goto out_free_idmap;
1148 retval = register_filesystem(&nfsd_fs_type);
1149 if (retval)
1150 goto out_free_all;
1151 return 0;
1152out_free_all:
1153 remove_proc_entry("fs/nfs/exports", NULL);
1154 remove_proc_entry("fs/nfs", NULL);
1155out_free_idmap:
1156 nfsd_idmap_shutdown();
1157out_free_lockd:
1158 nfsd_lockd_shutdown();
1159 nfsd_export_shutdown();
1160out_free_cache:
1161 nfsd_reply_cache_shutdown();
1162out_free_stat:
1163 nfsd_stat_shutdown();
1164 nfsd4_free_slabs();
1165 return retval;
1166}
1167
1168static void __exit exit_nfsd(void)
1169{
1170 nfsd_export_shutdown();
1171 nfsd_reply_cache_shutdown();
1172 remove_proc_entry("fs/nfs/exports", NULL);
1173 remove_proc_entry("fs/nfs", NULL);
1174 nfsd_stat_shutdown();
1175 nfsd_lockd_shutdown();
1176 nfsd_idmap_shutdown();
1177 nfsd4_free_slabs();
1178 unregister_filesystem(&nfsd_fs_type);
1179}
1180
1181MODULE_AUTHOR("Olaf Kirch <okir@monad.swb.de>");
1182MODULE_LICENSE("GPL");
1183module_init(init_nfsd)
1184module_exit(exit_nfsd)
1// SPDX-License-Identifier: GPL-2.0-only
2/*
3 * Syscall interface to knfsd.
4 *
5 * Copyright (C) 1995, 1996 Olaf Kirch <okir@monad.swb.de>
6 */
7
8#include <linux/slab.h>
9#include <linux/namei.h>
10#include <linux/ctype.h>
11#include <linux/fs_context.h>
12
13#include <linux/sunrpc/svcsock.h>
14#include <linux/lockd/lockd.h>
15#include <linux/sunrpc/addr.h>
16#include <linux/sunrpc/gss_api.h>
17#include <linux/sunrpc/gss_krb5_enctypes.h>
18#include <linux/sunrpc/rpc_pipe_fs.h>
19#include <linux/module.h>
20#include <linux/fsnotify.h>
21
22#include "idmap.h"
23#include "nfsd.h"
24#include "cache.h"
25#include "state.h"
26#include "netns.h"
27#include "pnfs.h"
28
/*
 * The nfsd filesystem is a single directory holding several nodes.
 * Each constant below identifies one node; the values are used as
 * indices into write_op[] (looked up by inode number), and
 * NFSD_MaxReserved marks the end of the reserved range.
 */
enum {
	NFSD_Root = 1,
	NFSD_List,
	NFSD_Export_features,
	NFSD_Fh,
	NFSD_FO_UnlockIP,
	NFSD_FO_UnlockFS,
	NFSD_Threads,
	NFSD_Pool_Threads,
	NFSD_Pool_Stats,
	NFSD_Reply_Cache_Stats,
	NFSD_Versions,
	NFSD_Ports,
	NFSD_MaxBlkSize,
	NFSD_MaxConnections,
	NFSD_SupportedEnctypes,
	/*
	 * The below MUST come last.  Otherwise we leave a hole in nfsd_files[]
	 * with !CONFIG_NFSD_V4 and simple_fill_super() goes oops
	 */
#ifdef CONFIG_NFSD_V4
	NFSD_Leasetime,
	NFSD_Gracetime,
	NFSD_RecoveryDir,
	NFSD_V4EndGrace,
#endif
	NFSD_MaxReserved
};
60
61/*
62 * write() for these nodes.
63 */
64static ssize_t write_filehandle(struct file *file, char *buf, size_t size);
65static ssize_t write_unlock_ip(struct file *file, char *buf, size_t size);
66static ssize_t write_unlock_fs(struct file *file, char *buf, size_t size);
67static ssize_t write_threads(struct file *file, char *buf, size_t size);
68static ssize_t write_pool_threads(struct file *file, char *buf, size_t size);
69static ssize_t write_versions(struct file *file, char *buf, size_t size);
70static ssize_t write_ports(struct file *file, char *buf, size_t size);
71static ssize_t write_maxblksize(struct file *file, char *buf, size_t size);
72static ssize_t write_maxconn(struct file *file, char *buf, size_t size);
73#ifdef CONFIG_NFSD_V4
74static ssize_t write_leasetime(struct file *file, char *buf, size_t size);
75static ssize_t write_gracetime(struct file *file, char *buf, size_t size);
76static ssize_t write_recoverydir(struct file *file, char *buf, size_t size);
77static ssize_t write_v4_end_grace(struct file *file, char *buf, size_t size);
78#endif
79
80static ssize_t (*const write_op[])(struct file *, char *, size_t) = {
81 [NFSD_Fh] = write_filehandle,
82 [NFSD_FO_UnlockIP] = write_unlock_ip,
83 [NFSD_FO_UnlockFS] = write_unlock_fs,
84 [NFSD_Threads] = write_threads,
85 [NFSD_Pool_Threads] = write_pool_threads,
86 [NFSD_Versions] = write_versions,
87 [NFSD_Ports] = write_ports,
88 [NFSD_MaxBlkSize] = write_maxblksize,
89 [NFSD_MaxConnections] = write_maxconn,
90#ifdef CONFIG_NFSD_V4
91 [NFSD_Leasetime] = write_leasetime,
92 [NFSD_Gracetime] = write_gracetime,
93 [NFSD_RecoveryDir] = write_recoverydir,
94 [NFSD_V4EndGrace] = write_v4_end_grace,
95#endif
96};
97
98static ssize_t nfsctl_transaction_write(struct file *file, const char __user *buf, size_t size, loff_t *pos)
99{
100 ino_t ino = file_inode(file)->i_ino;
101 char *data;
102 ssize_t rv;
103
104 if (ino >= ARRAY_SIZE(write_op) || !write_op[ino])
105 return -EINVAL;
106
107 data = simple_transaction_get(file, buf, size);
108 if (IS_ERR(data))
109 return PTR_ERR(data);
110
111 rv = write_op[ino](file, data, size);
112 if (rv >= 0) {
113 simple_transaction_set(file, rv);
114 rv = size;
115 }
116 return rv;
117}
118
119static ssize_t nfsctl_transaction_read(struct file *file, char __user *buf, size_t size, loff_t *pos)
120{
121 if (! file->private_data) {
122 /* An attempt to read a transaction file without writing
123 * causes a 0-byte write so that the file can return
124 * state information
125 */
126 ssize_t rv = nfsctl_transaction_write(file, buf, 0, pos);
127 if (rv < 0)
128 return rv;
129 }
130 return simple_transaction_read(file, buf, size, pos);
131}
132
133static const struct file_operations transaction_ops = {
134 .write = nfsctl_transaction_write,
135 .read = nfsctl_transaction_read,
136 .release = simple_transaction_release,
137 .llseek = default_llseek,
138};
139
140static int exports_net_open(struct net *net, struct file *file)
141{
142 int err;
143 struct seq_file *seq;
144 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
145
146 err = seq_open(file, &nfs_exports_op);
147 if (err)
148 return err;
149
150 seq = file->private_data;
151 seq->private = nn->svc_export_cache;
152 return 0;
153}
154
155static int exports_proc_open(struct inode *inode, struct file *file)
156{
157 return exports_net_open(current->nsproxy->net_ns, file);
158}
159
160static const struct file_operations exports_proc_operations = {
161 .open = exports_proc_open,
162 .read = seq_read,
163 .llseek = seq_lseek,
164 .release = seq_release,
165};
166
167static int exports_nfsd_open(struct inode *inode, struct file *file)
168{
169 return exports_net_open(inode->i_sb->s_fs_info, file);
170}
171
172static const struct file_operations exports_nfsd_operations = {
173 .open = exports_nfsd_open,
174 .read = seq_read,
175 .llseek = seq_lseek,
176 .release = seq_release,
177};
178
179static int export_features_show(struct seq_file *m, void *v)
180{
181 seq_printf(m, "0x%x 0x%x\n", NFSEXP_ALLFLAGS, NFSEXP_SECINFO_FLAGS);
182 return 0;
183}
184
185static int export_features_open(struct inode *inode, struct file *file)
186{
187 return single_open(file, export_features_show, NULL);
188}
189
190static const struct file_operations export_features_operations = {
191 .open = export_features_open,
192 .read = seq_read,
193 .llseek = seq_lseek,
194 .release = single_release,
195};
196
197#if defined(CONFIG_SUNRPC_GSS) || defined(CONFIG_SUNRPC_GSS_MODULE)
198static int supported_enctypes_show(struct seq_file *m, void *v)
199{
200 seq_printf(m, KRB5_SUPPORTED_ENCTYPES);
201 return 0;
202}
203
204static int supported_enctypes_open(struct inode *inode, struct file *file)
205{
206 return single_open(file, supported_enctypes_show, NULL);
207}
208
209static const struct file_operations supported_enctypes_ops = {
210 .open = supported_enctypes_open,
211 .read = seq_read,
212 .llseek = seq_lseek,
213 .release = single_release,
214};
215#endif /* CONFIG_SUNRPC_GSS or CONFIG_SUNRPC_GSS_MODULE */
216
217static const struct file_operations pool_stats_operations = {
218 .open = nfsd_pool_stats_open,
219 .read = seq_read,
220 .llseek = seq_lseek,
221 .release = nfsd_pool_stats_release,
222};
223
224static const struct file_operations reply_cache_stats_operations = {
225 .open = nfsd_reply_cache_stats_open,
226 .read = seq_read,
227 .llseek = seq_lseek,
228 .release = single_release,
229};
230
231/*----------------------------------------------------------------------------*/
232/*
233 * payload - write methods
234 */
235
236static inline struct net *netns(struct file *file)
237{
238 return file_inode(file)->i_sb->s_fs_info;
239}
240
241/**
242 * write_unlock_ip - Release all locks used by a client
243 *
244 * Experimental.
245 *
246 * Input:
247 * buf: '\n'-terminated C string containing a
248 * presentation format IP address
249 * size: length of C string in @buf
250 * Output:
251 * On success: returns zero if all specified locks were released;
252 * returns one if one or more locks were not released
253 * On error: return code is negative errno value
254 */
255static ssize_t write_unlock_ip(struct file *file, char *buf, size_t size)
256{
257 struct sockaddr_storage address;
258 struct sockaddr *sap = (struct sockaddr *)&address;
259 size_t salen = sizeof(address);
260 char *fo_path;
261 struct net *net = netns(file);
262
263 /* sanity check */
264 if (size == 0)
265 return -EINVAL;
266
267 if (buf[size-1] != '\n')
268 return -EINVAL;
269
270 fo_path = buf;
271 if (qword_get(&buf, fo_path, size) < 0)
272 return -EINVAL;
273
274 if (rpc_pton(net, fo_path, size, sap, salen) == 0)
275 return -EINVAL;
276
277 return nlmsvc_unlock_all_by_ip(sap);
278}
279
280/**
281 * write_unlock_fs - Release all locks on a local file system
282 *
283 * Experimental.
284 *
285 * Input:
286 * buf: '\n'-terminated C string containing the
287 * absolute pathname of a local file system
288 * size: length of C string in @buf
289 * Output:
290 * On success: returns zero if all specified locks were released;
291 * returns one if one or more locks were not released
292 * On error: return code is negative errno value
293 */
294static ssize_t write_unlock_fs(struct file *file, char *buf, size_t size)
295{
296 struct path path;
297 char *fo_path;
298 int error;
299
300 /* sanity check */
301 if (size == 0)
302 return -EINVAL;
303
304 if (buf[size-1] != '\n')
305 return -EINVAL;
306
307 fo_path = buf;
308 if (qword_get(&buf, fo_path, size) < 0)
309 return -EINVAL;
310
311 error = kern_path(fo_path, 0, &path);
312 if (error)
313 return error;
314
315 /*
316 * XXX: Needs better sanity checking. Otherwise we could end up
317 * releasing locks on the wrong file system.
318 *
319 * For example:
320 * 1. Does the path refer to a directory?
321 * 2. Is that directory a mount point, or
322 * 3. Is that directory the root of an exported file system?
323 */
324 error = nlmsvc_unlock_all_by_sb(path.dentry->d_sb);
325
326 path_put(&path);
327 return error;
328}
329
330/**
331 * write_filehandle - Get a variable-length NFS file handle by path
332 *
333 * On input, the buffer contains a '\n'-terminated C string comprised of
334 * three alphanumeric words separated by whitespace. The string may
335 * contain escape sequences.
336 *
337 * Input:
338 * buf:
339 * domain: client domain name
340 * path: export pathname
341 * maxsize: numeric maximum size of
342 * @buf
343 * size: length of C string in @buf
344 * Output:
345 * On success: passed-in buffer filled with '\n'-terminated C
346 * string containing a ASCII hex text version
347 * of the NFS file handle;
348 * return code is the size in bytes of the string
349 * On error: return code is negative errno value
350 */
351static ssize_t write_filehandle(struct file *file, char *buf, size_t size)
352{
353 char *dname, *path;
354 int uninitialized_var(maxsize);
355 char *mesg = buf;
356 int len;
357 struct auth_domain *dom;
358 struct knfsd_fh fh;
359
360 if (size == 0)
361 return -EINVAL;
362
363 if (buf[size-1] != '\n')
364 return -EINVAL;
365 buf[size-1] = 0;
366
367 dname = mesg;
368 len = qword_get(&mesg, dname, size);
369 if (len <= 0)
370 return -EINVAL;
371
372 path = dname+len+1;
373 len = qword_get(&mesg, path, size);
374 if (len <= 0)
375 return -EINVAL;
376
377 len = get_int(&mesg, &maxsize);
378 if (len)
379 return len;
380
381 if (maxsize < NFS_FHSIZE)
382 return -EINVAL;
383 maxsize = min(maxsize, NFS3_FHSIZE);
384
385 if (qword_get(&mesg, mesg, size)>0)
386 return -EINVAL;
387
388 /* we have all the words, they are in buf.. */
389 dom = unix_domain_find(dname);
390 if (!dom)
391 return -ENOMEM;
392
393 len = exp_rootfh(netns(file), dom, path, &fh, maxsize);
394 auth_domain_put(dom);
395 if (len)
396 return len;
397
398 mesg = buf;
399 len = SIMPLE_TRANSACTION_LIMIT;
400 qword_addhex(&mesg, &len, (char*)&fh.fh_base, fh.fh_size);
401 mesg[-1] = '\n';
402 return mesg - buf;
403}
404
405/**
406 * write_threads - Start NFSD, or report the current number of running threads
407 *
408 * Input:
409 * buf: ignored
410 * size: zero
411 * Output:
412 * On success: passed-in buffer filled with '\n'-terminated C
413 * string numeric value representing the number of
414 * running NFSD threads;
415 * return code is the size in bytes of the string
416 * On error: return code is zero
417 *
418 * OR
419 *
420 * Input:
421 * buf: C string containing an unsigned
422 * integer value representing the
423 * number of NFSD threads to start
424 * size: non-zero length of C string in @buf
425 * Output:
426 * On success: NFS service is started;
427 * passed-in buffer filled with '\n'-terminated C
428 * string numeric value representing the number of
429 * running NFSD threads;
430 * return code is the size in bytes of the string
431 * On error: return code is zero or a negative errno value
432 */
433static ssize_t write_threads(struct file *file, char *buf, size_t size)
434{
435 char *mesg = buf;
436 int rv;
437 struct net *net = netns(file);
438
439 if (size > 0) {
440 int newthreads;
441 rv = get_int(&mesg, &newthreads);
442 if (rv)
443 return rv;
444 if (newthreads < 0)
445 return -EINVAL;
446 rv = nfsd_svc(newthreads, net, file->f_cred);
447 if (rv < 0)
448 return rv;
449 } else
450 rv = nfsd_nrthreads(net);
451
452 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%d\n", rv);
453}
454
455/**
456 * write_pool_threads - Set or report the current number of threads per pool
457 *
458 * Input:
459 * buf: ignored
460 * size: zero
461 *
462 * OR
463 *
464 * Input:
465 * buf: C string containing whitespace-
466 * separated unsigned integer values
467 * representing the number of NFSD
468 * threads to start in each pool
469 * size: non-zero length of C string in @buf
470 * Output:
471 * On success: passed-in buffer filled with '\n'-terminated C
472 * string containing integer values representing the
473 * number of NFSD threads in each pool;
474 * return code is the size in bytes of the string
475 * On error: return code is zero or a negative errno value
476 */
477static ssize_t write_pool_threads(struct file *file, char *buf, size_t size)
478{
479 /* if size > 0, look for an array of number of threads per node
480 * and apply them then write out number of threads per node as reply
481 */
482 char *mesg = buf;
483 int i;
484 int rv;
485 int len;
486 int npools;
487 int *nthreads;
488 struct net *net = netns(file);
489
490 mutex_lock(&nfsd_mutex);
491 npools = nfsd_nrpools(net);
492 if (npools == 0) {
493 /*
494 * NFS is shut down. The admin can start it by
495 * writing to the threads file but NOT the pool_threads
496 * file, sorry. Report zero threads.
497 */
498 mutex_unlock(&nfsd_mutex);
499 strcpy(buf, "0\n");
500 return strlen(buf);
501 }
502
503 nthreads = kcalloc(npools, sizeof(int), GFP_KERNEL);
504 rv = -ENOMEM;
505 if (nthreads == NULL)
506 goto out_free;
507
508 if (size > 0) {
509 for (i = 0; i < npools; i++) {
510 rv = get_int(&mesg, &nthreads[i]);
511 if (rv == -ENOENT)
512 break; /* fewer numbers than pools */
513 if (rv)
514 goto out_free; /* syntax error */
515 rv = -EINVAL;
516 if (nthreads[i] < 0)
517 goto out_free;
518 }
519 rv = nfsd_set_nrthreads(i, nthreads, net);
520 if (rv)
521 goto out_free;
522 }
523
524 rv = nfsd_get_nrthreads(npools, nthreads, net);
525 if (rv)
526 goto out_free;
527
528 mesg = buf;
529 size = SIMPLE_TRANSACTION_LIMIT;
530 for (i = 0; i < npools && size > 0; i++) {
531 snprintf(mesg, size, "%d%c", nthreads[i], (i == npools-1 ? '\n' : ' '));
532 len = strlen(mesg);
533 size -= len;
534 mesg += len;
535 }
536 rv = mesg - buf;
537out_free:
538 kfree(nthreads);
539 mutex_unlock(&nfsd_mutex);
540 return rv;
541}
542
543static ssize_t
544nfsd_print_version_support(struct nfsd_net *nn, char *buf, int remaining,
545 const char *sep, unsigned vers, int minor)
546{
547 const char *format = minor < 0 ? "%s%c%u" : "%s%c%u.%u";
548 bool supported = !!nfsd_vers(nn, vers, NFSD_TEST);
549
550 if (vers == 4 && minor >= 0 &&
551 !nfsd_minorversion(nn, minor, NFSD_TEST))
552 supported = false;
553 if (minor == 0 && supported)
554 /*
555 * special case for backward compatability.
556 * +4.0 is never reported, it is implied by
557 * +4, unless -4.0 is present.
558 */
559 return 0;
560 return snprintf(buf, remaining, format, sep,
561 supported ? '+' : '-', vers, minor);
562}
563
564static ssize_t __write_versions(struct file *file, char *buf, size_t size)
565{
566 char *mesg = buf;
567 char *vers, *minorp, sign;
568 int len, num, remaining;
569 ssize_t tlen = 0;
570 char *sep;
571 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
572
573 if (size>0) {
574 if (nn->nfsd_serv)
575 /* Cannot change versions without updating
576 * nn->nfsd_serv->sv_xdrsize, and reallocing
577 * rq_argp and rq_resp
578 */
579 return -EBUSY;
580 if (buf[size-1] != '\n')
581 return -EINVAL;
582 buf[size-1] = 0;
583
584 vers = mesg;
585 len = qword_get(&mesg, vers, size);
586 if (len <= 0) return -EINVAL;
587 do {
588 enum vers_op cmd;
589 unsigned minor;
590 sign = *vers;
591 if (sign == '+' || sign == '-')
592 num = simple_strtol((vers+1), &minorp, 0);
593 else
594 num = simple_strtol(vers, &minorp, 0);
595 if (*minorp == '.') {
596 if (num != 4)
597 return -EINVAL;
598 if (kstrtouint(minorp+1, 0, &minor) < 0)
599 return -EINVAL;
600 }
601
602 cmd = sign == '-' ? NFSD_CLEAR : NFSD_SET;
603 switch(num) {
604 case 2:
605 case 3:
606 nfsd_vers(nn, num, cmd);
607 break;
608 case 4:
609 if (*minorp == '.') {
610 if (nfsd_minorversion(nn, minor, cmd) < 0)
611 return -EINVAL;
612 } else if ((cmd == NFSD_SET) != nfsd_vers(nn, num, NFSD_TEST)) {
613 /*
614 * Either we have +4 and no minors are enabled,
615 * or we have -4 and at least one minor is enabled.
616 * In either case, propagate 'cmd' to all minors.
617 */
618 minor = 0;
619 while (nfsd_minorversion(nn, minor, cmd) >= 0)
620 minor++;
621 }
622 break;
623 default:
624 return -EINVAL;
625 }
626 vers += len + 1;
627 } while ((len = qword_get(&mesg, vers, size)) > 0);
628 /* If all get turned off, turn them back on, as
629 * having no versions is BAD
630 */
631 nfsd_reset_versions(nn);
632 }
633
634 /* Now write current state into reply buffer */
635 len = 0;
636 sep = "";
637 remaining = SIMPLE_TRANSACTION_LIMIT;
638 for (num=2 ; num <= 4 ; num++) {
639 int minor;
640 if (!nfsd_vers(nn, num, NFSD_AVAIL))
641 continue;
642
643 minor = -1;
644 do {
645 len = nfsd_print_version_support(nn, buf, remaining,
646 sep, num, minor);
647 if (len >= remaining)
648 goto out;
649 remaining -= len;
650 buf += len;
651 tlen += len;
652 minor++;
653 if (len)
654 sep = " ";
655 } while (num == 4 && minor <= NFSD_SUPPORTED_MINOR_VERSION);
656 }
657out:
658 len = snprintf(buf, remaining, "\n");
659 if (len >= remaining)
660 return -EINVAL;
661 return tlen + len;
662}
663
664/**
665 * write_versions - Set or report the available NFS protocol versions
666 *
667 * Input:
668 * buf: ignored
669 * size: zero
670 * Output:
671 * On success: passed-in buffer filled with '\n'-terminated C
672 * string containing positive or negative integer
673 * values representing the current status of each
674 * protocol version;
675 * return code is the size in bytes of the string
676 * On error: return code is zero or a negative errno value
677 *
678 * OR
679 *
680 * Input:
681 * buf: C string containing whitespace-
682 * separated positive or negative
683 * integer values representing NFS
684 * protocol versions to enable ("+n")
685 * or disable ("-n")
686 * size: non-zero length of C string in @buf
687 * Output:
688 * On success: status of zero or more protocol versions has
689 * been updated; passed-in buffer filled with
690 * '\n'-terminated C string containing positive
691 * or negative integer values representing the
692 * current status of each protocol version;
693 * return code is the size in bytes of the string
694 * On error: return code is zero or a negative errno value
695 */
696static ssize_t write_versions(struct file *file, char *buf, size_t size)
697{
698 ssize_t rv;
699
700 mutex_lock(&nfsd_mutex);
701 rv = __write_versions(file, buf, size);
702 mutex_unlock(&nfsd_mutex);
703 return rv;
704}
705
706/*
707 * Zero-length write. Return a list of NFSD's current listener
708 * transports.
709 */
710static ssize_t __write_ports_names(char *buf, struct net *net)
711{
712 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
713
714 if (nn->nfsd_serv == NULL)
715 return 0;
716 return svc_xprt_names(nn->nfsd_serv, buf, SIMPLE_TRANSACTION_LIMIT);
717}
718
719/*
720 * A single 'fd' number was written, in which case it must be for
721 * a socket of a supported family/protocol, and we use it as an
722 * nfsd listener.
723 */
724static ssize_t __write_ports_addfd(char *buf, struct net *net, const struct cred *cred)
725{
726 char *mesg = buf;
727 int fd, err;
728 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
729
730 err = get_int(&mesg, &fd);
731 if (err != 0 || fd < 0)
732 return -EINVAL;
733
734 if (svc_alien_sock(net, fd)) {
735 printk(KERN_ERR "%s: socket net is different to NFSd's one\n", __func__);
736 return -EINVAL;
737 }
738
739 err = nfsd_create_serv(net);
740 if (err != 0)
741 return err;
742
743 err = svc_addsock(nn->nfsd_serv, fd, buf, SIMPLE_TRANSACTION_LIMIT, cred);
744 if (err < 0) {
745 nfsd_destroy(net);
746 return err;
747 }
748
749 /* Decrease the count, but don't shut down the service */
750 nn->nfsd_serv->sv_nrthreads--;
751 return err;
752}
753
754/*
755 * A transport listener is added by writing it's transport name and
756 * a port number.
757 */
758static ssize_t __write_ports_addxprt(char *buf, struct net *net, const struct cred *cred)
759{
760 char transport[16];
761 struct svc_xprt *xprt;
762 int port, err;
763 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
764
765 if (sscanf(buf, "%15s %5u", transport, &port) != 2)
766 return -EINVAL;
767
768 if (port < 1 || port > USHRT_MAX)
769 return -EINVAL;
770
771 err = nfsd_create_serv(net);
772 if (err != 0)
773 return err;
774
775 err = svc_create_xprt(nn->nfsd_serv, transport, net,
776 PF_INET, port, SVC_SOCK_ANONYMOUS, cred);
777 if (err < 0)
778 goto out_err;
779
780 err = svc_create_xprt(nn->nfsd_serv, transport, net,
781 PF_INET6, port, SVC_SOCK_ANONYMOUS, cred);
782 if (err < 0 && err != -EAFNOSUPPORT)
783 goto out_close;
784
785 /* Decrease the count, but don't shut down the service */
786 nn->nfsd_serv->sv_nrthreads--;
787 return 0;
788out_close:
789 xprt = svc_find_xprt(nn->nfsd_serv, transport, net, PF_INET, port);
790 if (xprt != NULL) {
791 svc_close_xprt(xprt);
792 svc_xprt_put(xprt);
793 }
794out_err:
795 nfsd_destroy(net);
796 return err;
797}
798
799static ssize_t __write_ports(struct file *file, char *buf, size_t size,
800 struct net *net)
801{
802 if (size == 0)
803 return __write_ports_names(buf, net);
804
805 if (isdigit(buf[0]))
806 return __write_ports_addfd(buf, net, file->f_cred);
807
808 if (isalpha(buf[0]))
809 return __write_ports_addxprt(buf, net, file->f_cred);
810
811 return -EINVAL;
812}
813
814/**
815 * write_ports - Pass a socket file descriptor or transport name to listen on
816 *
817 * Input:
818 * buf: ignored
819 * size: zero
820 * Output:
821 * On success: passed-in buffer filled with a '\n'-terminated C
822 * string containing a whitespace-separated list of
823 * named NFSD listeners;
824 * return code is the size in bytes of the string
825 * On error: return code is zero or a negative errno value
826 *
827 * OR
828 *
829 * Input:
830 * buf: C string containing an unsigned
831 * integer value representing a bound
832 * but unconnected socket that is to be
833 * used as an NFSD listener; listen(3)
834 * must be called for a SOCK_STREAM
835 * socket, otherwise it is ignored
836 * size: non-zero length of C string in @buf
837 * Output:
838 * On success: NFS service is started;
839 * passed-in buffer filled with a '\n'-terminated C
840 * string containing a unique alphanumeric name of
841 * the listener;
842 * return code is the size in bytes of the string
843 * On error: return code is a negative errno value
844 *
845 * OR
846 *
847 * Input:
848 * buf: C string containing a transport
849 * name and an unsigned integer value
850 * representing the port to listen on,
851 * separated by whitespace
852 * size: non-zero length of C string in @buf
853 * Output:
854 * On success: returns zero; NFS service is started
855 * On error: return code is a negative errno value
856 */
857static ssize_t write_ports(struct file *file, char *buf, size_t size)
858{
859 ssize_t rv;
860
861 mutex_lock(&nfsd_mutex);
862 rv = __write_ports(file, buf, size, netns(file));
863 mutex_unlock(&nfsd_mutex);
864 return rv;
865}
866
867
868int nfsd_max_blksize;
869
870/**
871 * write_maxblksize - Set or report the current NFS blksize
872 *
873 * Input:
874 * buf: ignored
875 * size: zero
876 *
877 * OR
878 *
879 * Input:
880 * buf: C string containing an unsigned
881 * integer value representing the new
882 * NFS blksize
883 * size: non-zero length of C string in @buf
884 * Output:
885 * On success: passed-in buffer filled with '\n'-terminated C string
886 * containing numeric value of the current NFS blksize
887 * setting;
888 * return code is the size in bytes of the string
889 * On error: return code is zero or a negative errno value
890 */
891static ssize_t write_maxblksize(struct file *file, char *buf, size_t size)
892{
893 char *mesg = buf;
894 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
895
896 if (size > 0) {
897 int bsize;
898 int rv = get_int(&mesg, &bsize);
899 if (rv)
900 return rv;
901 /* force bsize into allowed range and
902 * required alignment.
903 */
904 bsize = max_t(int, bsize, 1024);
905 bsize = min_t(int, bsize, NFSSVC_MAXBLKSIZE);
906 bsize &= ~(1024-1);
907 mutex_lock(&nfsd_mutex);
908 if (nn->nfsd_serv) {
909 mutex_unlock(&nfsd_mutex);
910 return -EBUSY;
911 }
912 nfsd_max_blksize = bsize;
913 mutex_unlock(&nfsd_mutex);
914 }
915
916 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%d\n",
917 nfsd_max_blksize);
918}
919
920/**
921 * write_maxconn - Set or report the current max number of connections
922 *
923 * Input:
924 * buf: ignored
925 * size: zero
926 * OR
927 *
928 * Input:
929 * buf: C string containing an unsigned
930 * integer value representing the new
931 * number of max connections
932 * size: non-zero length of C string in @buf
933 * Output:
934 * On success: passed-in buffer filled with '\n'-terminated C string
935 * containing numeric value of max_connections setting
936 * for this net namespace;
937 * return code is the size in bytes of the string
938 * On error: return code is zero or a negative errno value
939 */
940static ssize_t write_maxconn(struct file *file, char *buf, size_t size)
941{
942 char *mesg = buf;
943 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
944 unsigned int maxconn = nn->max_connections;
945
946 if (size > 0) {
947 int rv = get_uint(&mesg, &maxconn);
948
949 if (rv)
950 return rv;
951 nn->max_connections = maxconn;
952 }
953
954 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%u\n", maxconn);
955}
956
957#ifdef CONFIG_NFSD_V4
958static ssize_t __nfsd4_write_time(struct file *file, char *buf, size_t size,
959 time_t *time, struct nfsd_net *nn)
960{
961 char *mesg = buf;
962 int rv, i;
963
964 if (size > 0) {
965 if (nn->nfsd_serv)
966 return -EBUSY;
967 rv = get_int(&mesg, &i);
968 if (rv)
969 return rv;
970 /*
971 * Some sanity checking. We don't have a reason for
972 * these particular numbers, but problems with the
973 * extremes are:
974 * - Too short: the briefest network outage may
975 * cause clients to lose all their locks. Also,
976 * the frequent polling may be wasteful.
977 * - Too long: do you really want reboot recovery
978 * to take more than an hour? Or to make other
979 * clients wait an hour before being able to
980 * revoke a dead client's locks?
981 */
982 if (i < 10 || i > 3600)
983 return -EINVAL;
984 *time = i;
985 }
986
987 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%ld\n", *time);
988}
989
990static ssize_t nfsd4_write_time(struct file *file, char *buf, size_t size,
991 time_t *time, struct nfsd_net *nn)
992{
993 ssize_t rv;
994
995 mutex_lock(&nfsd_mutex);
996 rv = __nfsd4_write_time(file, buf, size, time, nn);
997 mutex_unlock(&nfsd_mutex);
998 return rv;
999}
1000
1001/**
1002 * write_leasetime - Set or report the current NFSv4 lease time
1003 *
1004 * Input:
1005 * buf: ignored
1006 * size: zero
1007 *
1008 * OR
1009 *
1010 * Input:
1011 * buf: C string containing an unsigned
1012 * integer value representing the new
1013 * NFSv4 lease expiry time
1014 * size: non-zero length of C string in @buf
1015 * Output:
1016 * On success: passed-in buffer filled with '\n'-terminated C
1017 * string containing unsigned integer value of the
1018 * current lease expiry time;
1019 * return code is the size in bytes of the string
1020 * On error: return code is zero or a negative errno value
1021 */
1022static ssize_t write_leasetime(struct file *file, char *buf, size_t size)
1023{
1024 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1025 return nfsd4_write_time(file, buf, size, &nn->nfsd4_lease, nn);
1026}
1027
1028/**
1029 * write_gracetime - Set or report current NFSv4 grace period time
1030 *
1031 * As above, but sets the time of the NFSv4 grace period.
1032 *
1033 * Note this should never be set to less than the *previous*
1034 * lease-period time, but we don't try to enforce this. (In the common
1035 * case (a new boot), we don't know what the previous lease time was
1036 * anyway.)
1037 */
1038static ssize_t write_gracetime(struct file *file, char *buf, size_t size)
1039{
1040 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1041 return nfsd4_write_time(file, buf, size, &nn->nfsd4_grace, nn);
1042}
1043
1044static ssize_t __write_recoverydir(struct file *file, char *buf, size_t size,
1045 struct nfsd_net *nn)
1046{
1047 char *mesg = buf;
1048 char *recdir;
1049 int len, status;
1050
1051 if (size > 0) {
1052 if (nn->nfsd_serv)
1053 return -EBUSY;
1054 if (size > PATH_MAX || buf[size-1] != '\n')
1055 return -EINVAL;
1056 buf[size-1] = 0;
1057
1058 recdir = mesg;
1059 len = qword_get(&mesg, recdir, size);
1060 if (len <= 0)
1061 return -EINVAL;
1062
1063 status = nfs4_reset_recoverydir(recdir);
1064 if (status)
1065 return status;
1066 }
1067
1068 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%s\n",
1069 nfs4_recoverydir());
1070}
1071
1072/**
1073 * write_recoverydir - Set or report the pathname of the recovery directory
1074 *
1075 * Input:
1076 * buf: ignored
1077 * size: zero
1078 *
1079 * OR
1080 *
1081 * Input:
1082 * buf: C string containing the pathname
1083 * of the directory on a local file
1084 * system containing permanent NFSv4
1085 * recovery data
1086 * size: non-zero length of C string in @buf
1087 * Output:
1088 * On success: passed-in buffer filled with '\n'-terminated C string
1089 * containing the current recovery pathname setting;
1090 * return code is the size in bytes of the string
1091 * On error: return code is zero or a negative errno value
1092 */
1093static ssize_t write_recoverydir(struct file *file, char *buf, size_t size)
1094{
1095 ssize_t rv;
1096 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1097
1098 mutex_lock(&nfsd_mutex);
1099 rv = __write_recoverydir(file, buf, size, nn);
1100 mutex_unlock(&nfsd_mutex);
1101 return rv;
1102}
1103
1104/**
1105 * write_v4_end_grace - release grace period for nfsd's v4.x lock manager
1106 *
1107 * Input:
1108 * buf: ignored
1109 * size: zero
1110 * OR
1111 *
1112 * Input:
1113 * buf: any value
1114 * size: non-zero length of C string in @buf
1115 * Output:
1116 * passed-in buffer filled with "Y" or "N" with a newline
1117 * and NULL-terminated C string. This indicates whether
1118 * the grace period has ended in the current net
1119 * namespace. Return code is the size in bytes of the
1120 * string. Writing a string that starts with 'Y', 'y', or
1121 * '1' to the file will end the grace period for nfsd's v4
1122 * lock manager.
1123 */
1124static ssize_t write_v4_end_grace(struct file *file, char *buf, size_t size)
1125{
1126 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1127
1128 if (size > 0) {
1129 switch(buf[0]) {
1130 case 'Y':
1131 case 'y':
1132 case '1':
1133 if (!nn->nfsd_serv)
1134 return -EBUSY;
1135 nfsd4_end_grace(nn);
1136 break;
1137 default:
1138 return -EINVAL;
1139 }
1140 }
1141
1142 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%c\n",
1143 nn->grace_ended ? 'Y' : 'N');
1144}
1145
1146#endif
1147
1148/*----------------------------------------------------------------------------*/
1149/*
1150 * populating the filesystem.
1151 */
1152
1153/* Basically copying rpc_get_inode. */
1154static struct inode *nfsd_get_inode(struct super_block *sb, umode_t mode)
1155{
1156 struct inode *inode = new_inode(sb);
1157 if (!inode)
1158 return NULL;
1159 /* Following advice from simple_fill_super documentation: */
1160 inode->i_ino = iunique(sb, NFSD_MaxReserved);
1161 inode->i_mode = mode;
1162 inode->i_atime = inode->i_mtime = inode->i_ctime = current_time(inode);
1163 switch (mode & S_IFMT) {
1164 case S_IFDIR:
1165 inode->i_fop = &simple_dir_operations;
1166 inode->i_op = &simple_dir_inode_operations;
1167 inc_nlink(inode);
1168 default:
1169 break;
1170 }
1171 return inode;
1172}
1173
1174static int __nfsd_mkdir(struct inode *dir, struct dentry *dentry, umode_t mode, struct nfsdfs_client *ncl)
1175{
1176 struct inode *inode;
1177
1178 inode = nfsd_get_inode(dir->i_sb, mode);
1179 if (!inode)
1180 return -ENOMEM;
1181 if (ncl) {
1182 inode->i_private = ncl;
1183 kref_get(&ncl->cl_ref);
1184 }
1185 d_add(dentry, inode);
1186 inc_nlink(dir);
1187 fsnotify_mkdir(dir, dentry);
1188 return 0;
1189}
1190
1191static struct dentry *nfsd_mkdir(struct dentry *parent, struct nfsdfs_client *ncl, char *name)
1192{
1193 struct inode *dir = parent->d_inode;
1194 struct dentry *dentry;
1195 int ret = -ENOMEM;
1196
1197 inode_lock(dir);
1198 dentry = d_alloc_name(parent, name);
1199 if (!dentry)
1200 goto out_err;
1201 ret = __nfsd_mkdir(d_inode(parent), dentry, S_IFDIR | 0600, ncl);
1202 if (ret)
1203 goto out_err;
1204out:
1205 inode_unlock(dir);
1206 return dentry;
1207out_err:
1208 dput(dentry);
1209 dentry = ERR_PTR(ret);
1210 goto out;
1211}
1212
1213static void clear_ncl(struct inode *inode)
1214{
1215 struct nfsdfs_client *ncl = inode->i_private;
1216
1217 inode->i_private = NULL;
1218 kref_put(&ncl->cl_ref, ncl->cl_release);
1219}
1220
1221static struct nfsdfs_client *__get_nfsdfs_client(struct inode *inode)
1222{
1223 struct nfsdfs_client *nc = inode->i_private;
1224
1225 if (nc)
1226 kref_get(&nc->cl_ref);
1227 return nc;
1228}
1229
/*
 * Locked variant of __get_nfsdfs_client(): looks up the client attached
 * to @inode while holding the inode lock shared.  Returns the client with
 * an extra reference, or NULL.
 */
struct nfsdfs_client *get_nfsdfs_client(struct inode *inode)
{
	struct nfsdfs_client *client;

	inode_lock_shared(inode);
	client = __get_nfsdfs_client(inode);
	inode_unlock_shared(inode);

	return client;
}

/*
 * Remove a single file @dentry from directory @dir, dropping the client
 * reference held by the file's inode first.  A failing simple_unlink()
 * only triggers a one-time warning.  (from __rpc_unlink)
 */
static void nfsdfs_remove_file(struct inode *dir, struct dentry *dentry)
{
	int err;

	clear_ncl(d_inode(dentry));

	/* Hold the dentry across unlink + delete. */
	dget(dentry);
	err = simple_unlink(dir, dentry);
	d_delete(dentry);
	dput(dentry);

	WARN_ON_ONCE(err);
}
1251
1252static void nfsdfs_remove_files(struct dentry *root)
1253{
1254 struct dentry *dentry, *tmp;
1255
1256 list_for_each_entry_safe(dentry, tmp, &root->d_subdirs, d_child) {
1257 if (!simple_positive(dentry)) {
1258 WARN_ON_ONCE(1); /* I think this can't happen? */
1259 continue;
1260 }
1261 nfsdfs_remove_file(d_inode(root), dentry);
1262 }
1263}
1264
1265/* XXX: cut'n'paste from simple_fill_super; figure out if we could share
1266 * code instead. */
1267static int nfsdfs_create_files(struct dentry *root,
1268 const struct tree_descr *files)
1269{
1270 struct inode *dir = d_inode(root);
1271 struct inode *inode;
1272 struct dentry *dentry;
1273 int i;
1274
1275 inode_lock(dir);
1276 for (i = 0; files->name && files->name[0]; i++, files++) {
1277 if (!files->name)
1278 continue;
1279 dentry = d_alloc_name(root, files->name);
1280 if (!dentry)
1281 goto out;
1282 inode = nfsd_get_inode(d_inode(root)->i_sb,
1283 S_IFREG | files->mode);
1284 if (!inode) {
1285 dput(dentry);
1286 goto out;
1287 }
1288 inode->i_fop = files->ops;
1289 inode->i_private = __get_nfsdfs_client(dir);
1290 d_add(dentry, inode);
1291 fsnotify_create(dir, dentry);
1292 }
1293 inode_unlock(dir);
1294 return 0;
1295out:
1296 nfsdfs_remove_files(root);
1297 inode_unlock(dir);
1298 return -ENOMEM;
1299}
1300
1301/* on success, returns positive number unique to that client. */
1302struct dentry *nfsd_client_mkdir(struct nfsd_net *nn,
1303 struct nfsdfs_client *ncl, u32 id,
1304 const struct tree_descr *files)
1305{
1306 struct dentry *dentry;
1307 char name[11];
1308 int ret;
1309
1310 sprintf(name, "%u", id);
1311
1312 dentry = nfsd_mkdir(nn->nfsd_client_dir, ncl, name);
1313 if (IS_ERR(dentry)) /* XXX: tossing errors? */
1314 return NULL;
1315 ret = nfsdfs_create_files(dentry, files);
1316 if (ret) {
1317 nfsd_client_rmdir(dentry);
1318 return NULL;
1319 }
1320 return dentry;
1321}
1322
1323/* Taken from __rpc_rmdir: */
1324void nfsd_client_rmdir(struct dentry *dentry)
1325{
1326 struct inode *dir = d_inode(dentry->d_parent);
1327 struct inode *inode = d_inode(dentry);
1328 int ret;
1329
1330 inode_lock(dir);
1331 nfsdfs_remove_files(dentry);
1332 clear_ncl(inode);
1333 dget(dentry);
1334 ret = simple_rmdir(dir, dentry);
1335 WARN_ON_ONCE(ret);
1336 d_delete(dentry);
1337 inode_unlock(dir);
1338}
1339
1340static int nfsd_fill_super(struct super_block *sb, struct fs_context *fc)
1341{
1342 struct nfsd_net *nn = net_generic(current->nsproxy->net_ns,
1343 nfsd_net_id);
1344 struct dentry *dentry;
1345 int ret;
1346
1347 static const struct tree_descr nfsd_files[] = {
1348 [NFSD_List] = {"exports", &exports_nfsd_operations, S_IRUGO},
1349 [NFSD_Export_features] = {"export_features",
1350 &export_features_operations, S_IRUGO},
1351 [NFSD_FO_UnlockIP] = {"unlock_ip",
1352 &transaction_ops, S_IWUSR|S_IRUSR},
1353 [NFSD_FO_UnlockFS] = {"unlock_filesystem",
1354 &transaction_ops, S_IWUSR|S_IRUSR},
1355 [NFSD_Fh] = {"filehandle", &transaction_ops, S_IWUSR|S_IRUSR},
1356 [NFSD_Threads] = {"threads", &transaction_ops, S_IWUSR|S_IRUSR},
1357 [NFSD_Pool_Threads] = {"pool_threads", &transaction_ops, S_IWUSR|S_IRUSR},
1358 [NFSD_Pool_Stats] = {"pool_stats", &pool_stats_operations, S_IRUGO},
1359 [NFSD_Reply_Cache_Stats] = {"reply_cache_stats", &reply_cache_stats_operations, S_IRUGO},
1360 [NFSD_Versions] = {"versions", &transaction_ops, S_IWUSR|S_IRUSR},
1361 [NFSD_Ports] = {"portlist", &transaction_ops, S_IWUSR|S_IRUGO},
1362 [NFSD_MaxBlkSize] = {"max_block_size", &transaction_ops, S_IWUSR|S_IRUGO},
1363 [NFSD_MaxConnections] = {"max_connections", &transaction_ops, S_IWUSR|S_IRUGO},
1364#if defined(CONFIG_SUNRPC_GSS) || defined(CONFIG_SUNRPC_GSS_MODULE)
1365 [NFSD_SupportedEnctypes] = {"supported_krb5_enctypes", &supported_enctypes_ops, S_IRUGO},
1366#endif /* CONFIG_SUNRPC_GSS or CONFIG_SUNRPC_GSS_MODULE */
1367#ifdef CONFIG_NFSD_V4
1368 [NFSD_Leasetime] = {"nfsv4leasetime", &transaction_ops, S_IWUSR|S_IRUSR},
1369 [NFSD_Gracetime] = {"nfsv4gracetime", &transaction_ops, S_IWUSR|S_IRUSR},
1370 [NFSD_RecoveryDir] = {"nfsv4recoverydir", &transaction_ops, S_IWUSR|S_IRUSR},
1371 [NFSD_V4EndGrace] = {"v4_end_grace", &transaction_ops, S_IWUSR|S_IRUGO},
1372#endif
1373 /* last one */ {""}
1374 };
1375
1376 ret = simple_fill_super(sb, 0x6e667364, nfsd_files);
1377 if (ret)
1378 return ret;
1379 dentry = nfsd_mkdir(sb->s_root, NULL, "clients");
1380 if (IS_ERR(dentry))
1381 return PTR_ERR(dentry);
1382 nn->nfsd_client_dir = dentry;
1383 return 0;
1384}
1385
1386static int nfsd_fs_get_tree(struct fs_context *fc)
1387{
1388 return get_tree_keyed(fc, nfsd_fill_super, get_net(fc->net_ns));
1389}
1390
1391static void nfsd_fs_free_fc(struct fs_context *fc)
1392{
1393 if (fc->s_fs_info)
1394 put_net(fc->s_fs_info);
1395}
1396
1397static const struct fs_context_operations nfsd_fs_context_ops = {
1398 .free = nfsd_fs_free_fc,
1399 .get_tree = nfsd_fs_get_tree,
1400};
1401
1402static int nfsd_init_fs_context(struct fs_context *fc)
1403{
1404 put_user_ns(fc->user_ns);
1405 fc->user_ns = get_user_ns(fc->net_ns->user_ns);
1406 fc->ops = &nfsd_fs_context_ops;
1407 return 0;
1408}
1409
1410static void nfsd_umount(struct super_block *sb)
1411{
1412 struct net *net = sb->s_fs_info;
1413
1414 kill_litter_super(sb);
1415 put_net(net);
1416}
1417
1418static struct file_system_type nfsd_fs_type = {
1419 .owner = THIS_MODULE,
1420 .name = "nfsd",
1421 .init_fs_context = nfsd_init_fs_context,
1422 .kill_sb = nfsd_umount,
1423};
1424MODULE_ALIAS_FS("nfsd");
1425
#ifdef CONFIG_PROC_FS
/*
 * Create /proc/fs/nfs and the "exports" file inside it.
 *
 * Returns 0 on success or -ENOMEM if either entry cannot be created; in
 * the latter case the directory is removed again.
 */
static int create_proc_exports_entry(void)
{
	struct proc_dir_entry *nfs_dir;
	struct proc_dir_entry *exports;

	nfs_dir = proc_mkdir("fs/nfs", NULL);
	if (nfs_dir == NULL)
		return -ENOMEM;

	exports = proc_create("exports", 0, nfs_dir,
			      &exports_proc_operations);
	if (exports != NULL)
		return 0;

	remove_proc_entry("fs/nfs", NULL);
	return -ENOMEM;
}
#else /* CONFIG_PROC_FS */
/* Without procfs there is nothing to create; always succeeds. */
static int create_proc_exports_entry(void)
{
	return 0;
}
#endif
1448
/* Key passed to net_generic() to find a namespace's struct nfsd_net. */
unsigned int nfsd_net_id;
1450
1451static __net_init int nfsd_init_net(struct net *net)
1452{
1453 int retval;
1454 struct vfsmount *mnt;
1455 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1456
1457 retval = nfsd_export_init(net);
1458 if (retval)
1459 goto out_export_error;
1460 retval = nfsd_idmap_init(net);
1461 if (retval)
1462 goto out_idmap_error;
1463 nn->nfsd_versions = NULL;
1464 nn->nfsd4_minorversions = NULL;
1465 retval = nfsd_reply_cache_init(nn);
1466 if (retval)
1467 goto out_drc_error;
1468 nn->nfsd4_lease = 90; /* default lease time */
1469 nn->nfsd4_grace = 90;
1470 nn->somebody_reclaimed = false;
1471 nn->track_reclaim_completes = false;
1472 nn->clverifier_counter = prandom_u32();
1473 nn->clientid_base = prandom_u32();
1474 nn->clientid_counter = nn->clientid_base + 1;
1475 nn->s2s_cp_cl_id = nn->clientid_counter++;
1476
1477 atomic_set(&nn->ntf_refcnt, 0);
1478 init_waitqueue_head(&nn->ntf_wq);
1479 seqlock_init(&nn->boot_lock);
1480
1481 mnt = vfs_kern_mount(&nfsd_fs_type, SB_KERNMOUNT, "nfsd", NULL);
1482 if (IS_ERR(mnt)) {
1483 retval = PTR_ERR(mnt);
1484 goto out_mount_err;
1485 }
1486 nn->nfsd_mnt = mnt;
1487 return 0;
1488
1489out_mount_err:
1490 nfsd_reply_cache_shutdown(nn);
1491out_drc_error:
1492 nfsd_idmap_shutdown(net);
1493out_idmap_error:
1494 nfsd_export_shutdown(net);
1495out_export_error:
1496 return retval;
1497}
1498
1499static __net_exit void nfsd_exit_net(struct net *net)
1500{
1501 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1502
1503 mntput(nn->nfsd_mnt);
1504 nfsd_reply_cache_shutdown(nn);
1505 nfsd_idmap_shutdown(net);
1506 nfsd_export_shutdown(net);
1507 nfsd_netns_free_versions(net_generic(net, nfsd_net_id));
1508}
1509
1510static struct pernet_operations nfsd_net_ops = {
1511 .init = nfsd_init_net,
1512 .exit = nfsd_exit_net,
1513 .id = &nfsd_net_id,
1514 .size = sizeof(struct nfsd_net),
1515};
1516
1517static int __init init_nfsd(void)
1518{
1519 int retval;
1520 printk(KERN_INFO "Installing knfsd (copyright (C) 1996 okir@monad.swb.de).\n");
1521
1522 retval = register_pernet_subsys(&nfsd_net_ops);
1523 if (retval < 0)
1524 return retval;
1525 retval = register_cld_notifier();
1526 if (retval)
1527 goto out_unregister_pernet;
1528 retval = nfsd4_init_slabs();
1529 if (retval)
1530 goto out_unregister_notifier;
1531 retval = nfsd4_init_pnfs();
1532 if (retval)
1533 goto out_free_slabs;
1534 nfsd_fault_inject_init(); /* nfsd fault injection controls */
1535 nfsd_stat_init(); /* Statistics */
1536 nfsd_lockd_init(); /* lockd->nfsd callbacks */
1537 retval = create_proc_exports_entry();
1538 if (retval)
1539 goto out_free_lockd;
1540 retval = register_filesystem(&nfsd_fs_type);
1541 if (retval)
1542 goto out_free_all;
1543 return 0;
1544out_free_all:
1545 remove_proc_entry("fs/nfs/exports", NULL);
1546 remove_proc_entry("fs/nfs", NULL);
1547out_free_lockd:
1548 nfsd_lockd_shutdown();
1549 nfsd_stat_shutdown();
1550 nfsd_fault_inject_cleanup();
1551 nfsd4_exit_pnfs();
1552out_free_slabs:
1553 nfsd4_free_slabs();
1554out_unregister_notifier:
1555 unregister_cld_notifier();
1556out_unregister_pernet:
1557 unregister_pernet_subsys(&nfsd_net_ops);
1558 return retval;
1559}
1560
1561static void __exit exit_nfsd(void)
1562{
1563 remove_proc_entry("fs/nfs/exports", NULL);
1564 remove_proc_entry("fs/nfs", NULL);
1565 nfsd_stat_shutdown();
1566 nfsd_lockd_shutdown();
1567 nfsd4_free_slabs();
1568 nfsd4_exit_pnfs();
1569 nfsd_fault_inject_cleanup();
1570 unregister_filesystem(&nfsd_fs_type);
1571 unregister_cld_notifier();
1572 unregister_pernet_subsys(&nfsd_net_ops);
1573}
1574
1575MODULE_AUTHOR("Olaf Kirch <okir@monad.swb.de>");
1576MODULE_LICENSE("GPL");
1577module_init(init_nfsd)
1578module_exit(exit_nfsd)