Loading...
1/*
2 * Syscall interface to knfsd.
3 *
4 * Copyright (C) 1995, 1996 Olaf Kirch <okir@monad.swb.de>
5 */
6
7#include <linux/slab.h>
8#include <linux/namei.h>
9#include <linux/ctype.h>
10
11#include <linux/sunrpc/svcsock.h>
12#include <linux/lockd/lockd.h>
13#include <linux/sunrpc/addr.h>
14#include <linux/sunrpc/gss_api.h>
15#include <linux/sunrpc/gss_krb5_enctypes.h>
16#include <linux/sunrpc/rpc_pipe_fs.h>
17#include <linux/module.h>
18
19#include "idmap.h"
20#include "nfsd.h"
21#include "cache.h"
22#include "state.h"
23#include "netns.h"
24#include "pnfs.h"
25
/*
 * We have a single directory with several nodes in it.
 *
 * Each enumerator below is used as an index into write_op[] and into
 * the nfsd_files[] table that nfsd_fill_super() passes to
 * simple_fill_super().  nfsctl_transaction_write() selects a node's
 * handler by indexing write_op[] with the inode number of the open file.
 */
enum {
	NFSD_Root = 1,
	NFSD_List,
	NFSD_Export_features,
	NFSD_Fh,
	NFSD_FO_UnlockIP,
	NFSD_FO_UnlockFS,
	NFSD_Threads,
	NFSD_Pool_Threads,
	NFSD_Pool_Stats,
	NFSD_Reply_Cache_Stats,
	NFSD_Versions,
	NFSD_Ports,
	NFSD_MaxBlkSize,
	NFSD_MaxConnections,
	NFSD_SupportedEnctypes,
	/*
	 * The below MUST come last.  Otherwise we leave a hole in nfsd_files[]
	 * with !CONFIG_NFSD_V4 and simple_fill_super() goes oops
	 */
#ifdef CONFIG_NFSD_V4
	NFSD_Leasetime,
	NFSD_Gracetime,
	NFSD_RecoveryDir,
	NFSD_V4EndGrace,
#endif
};
56
/*
 * write() for these nodes.
 *
 * Forward declarations: the handlers are defined further down, but the
 * write_op[] dispatch table that references them comes first.  Every
 * handler receives the open file, a kernel buffer holding the written
 * data, and the number of bytes written.
 */
static ssize_t write_filehandle(struct file *file, char *buf, size_t size);
static ssize_t write_unlock_ip(struct file *file, char *buf, size_t size);
static ssize_t write_unlock_fs(struct file *file, char *buf, size_t size);
static ssize_t write_threads(struct file *file, char *buf, size_t size);
static ssize_t write_pool_threads(struct file *file, char *buf, size_t size);
static ssize_t write_versions(struct file *file, char *buf, size_t size);
static ssize_t write_ports(struct file *file, char *buf, size_t size);
static ssize_t write_maxblksize(struct file *file, char *buf, size_t size);
static ssize_t write_maxconn(struct file *file, char *buf, size_t size);
#ifdef CONFIG_NFSD_V4
static ssize_t write_leasetime(struct file *file, char *buf, size_t size);
static ssize_t write_gracetime(struct file *file, char *buf, size_t size);
static ssize_t write_recoverydir(struct file *file, char *buf, size_t size);
static ssize_t write_v4_end_grace(struct file *file, char *buf, size_t size);
#endif
75
76static ssize_t (*write_op[])(struct file *, char *, size_t) = {
77 [NFSD_Fh] = write_filehandle,
78 [NFSD_FO_UnlockIP] = write_unlock_ip,
79 [NFSD_FO_UnlockFS] = write_unlock_fs,
80 [NFSD_Threads] = write_threads,
81 [NFSD_Pool_Threads] = write_pool_threads,
82 [NFSD_Versions] = write_versions,
83 [NFSD_Ports] = write_ports,
84 [NFSD_MaxBlkSize] = write_maxblksize,
85 [NFSD_MaxConnections] = write_maxconn,
86#ifdef CONFIG_NFSD_V4
87 [NFSD_Leasetime] = write_leasetime,
88 [NFSD_Gracetime] = write_gracetime,
89 [NFSD_RecoveryDir] = write_recoverydir,
90 [NFSD_V4EndGrace] = write_v4_end_grace,
91#endif
92};
93
94static ssize_t nfsctl_transaction_write(struct file *file, const char __user *buf, size_t size, loff_t *pos)
95{
96 ino_t ino = file_inode(file)->i_ino;
97 char *data;
98 ssize_t rv;
99
100 if (ino >= ARRAY_SIZE(write_op) || !write_op[ino])
101 return -EINVAL;
102
103 data = simple_transaction_get(file, buf, size);
104 if (IS_ERR(data))
105 return PTR_ERR(data);
106
107 rv = write_op[ino](file, data, size);
108 if (rv >= 0) {
109 simple_transaction_set(file, rv);
110 rv = size;
111 }
112 return rv;
113}
114
115static ssize_t nfsctl_transaction_read(struct file *file, char __user *buf, size_t size, loff_t *pos)
116{
117 if (! file->private_data) {
118 /* An attempt to read a transaction file without writing
119 * causes a 0-byte write so that the file can return
120 * state information
121 */
122 ssize_t rv = nfsctl_transaction_write(file, buf, 0, pos);
123 if (rv < 0)
124 return rv;
125 }
126 return simple_transaction_read(file, buf, size, pos);
127}
128
129static const struct file_operations transaction_ops = {
130 .write = nfsctl_transaction_write,
131 .read = nfsctl_transaction_read,
132 .release = simple_transaction_release,
133 .llseek = default_llseek,
134};
135
136static int exports_net_open(struct net *net, struct file *file)
137{
138 int err;
139 struct seq_file *seq;
140 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
141
142 err = seq_open(file, &nfs_exports_op);
143 if (err)
144 return err;
145
146 seq = file->private_data;
147 seq->private = nn->svc_export_cache;
148 return 0;
149}
150
151static int exports_proc_open(struct inode *inode, struct file *file)
152{
153 return exports_net_open(current->nsproxy->net_ns, file);
154}
155
156static const struct file_operations exports_proc_operations = {
157 .open = exports_proc_open,
158 .read = seq_read,
159 .llseek = seq_lseek,
160 .release = seq_release,
161 .owner = THIS_MODULE,
162};
163
164static int exports_nfsd_open(struct inode *inode, struct file *file)
165{
166 return exports_net_open(inode->i_sb->s_fs_info, file);
167}
168
169static const struct file_operations exports_nfsd_operations = {
170 .open = exports_nfsd_open,
171 .read = seq_read,
172 .llseek = seq_lseek,
173 .release = seq_release,
174 .owner = THIS_MODULE,
175};
176
177static int export_features_show(struct seq_file *m, void *v)
178{
179 seq_printf(m, "0x%x 0x%x\n", NFSEXP_ALLFLAGS, NFSEXP_SECINFO_FLAGS);
180 return 0;
181}
182
183static int export_features_open(struct inode *inode, struct file *file)
184{
185 return single_open(file, export_features_show, NULL);
186}
187
188static const struct file_operations export_features_operations = {
189 .open = export_features_open,
190 .read = seq_read,
191 .llseek = seq_lseek,
192 .release = single_release,
193};
194
195#if defined(CONFIG_SUNRPC_GSS) || defined(CONFIG_SUNRPC_GSS_MODULE)
196static int supported_enctypes_show(struct seq_file *m, void *v)
197{
198 seq_printf(m, KRB5_SUPPORTED_ENCTYPES);
199 return 0;
200}
201
202static int supported_enctypes_open(struct inode *inode, struct file *file)
203{
204 return single_open(file, supported_enctypes_show, NULL);
205}
206
207static const struct file_operations supported_enctypes_ops = {
208 .open = supported_enctypes_open,
209 .read = seq_read,
210 .llseek = seq_lseek,
211 .release = single_release,
212};
213#endif /* CONFIG_SUNRPC_GSS or CONFIG_SUNRPC_GSS_MODULE */
214
215static const struct file_operations pool_stats_operations = {
216 .open = nfsd_pool_stats_open,
217 .read = seq_read,
218 .llseek = seq_lseek,
219 .release = nfsd_pool_stats_release,
220 .owner = THIS_MODULE,
221};
222
223static struct file_operations reply_cache_stats_operations = {
224 .open = nfsd_reply_cache_stats_open,
225 .read = seq_read,
226 .llseek = seq_lseek,
227 .release = single_release,
228};
229
230/*----------------------------------------------------------------------------*/
231/*
232 * payload - write methods
233 */
234
235static inline struct net *netns(struct file *file)
236{
237 return file_inode(file)->i_sb->s_fs_info;
238}
239
240/**
241 * write_unlock_ip - Release all locks used by a client
242 *
243 * Experimental.
244 *
245 * Input:
246 * buf: '\n'-terminated C string containing a
247 * presentation format IP address
248 * size: length of C string in @buf
249 * Output:
250 * On success: returns zero if all specified locks were released;
251 * returns one if one or more locks were not released
252 * On error: return code is negative errno value
253 */
254static ssize_t write_unlock_ip(struct file *file, char *buf, size_t size)
255{
256 struct sockaddr_storage address;
257 struct sockaddr *sap = (struct sockaddr *)&address;
258 size_t salen = sizeof(address);
259 char *fo_path;
260 struct net *net = netns(file);
261
262 /* sanity check */
263 if (size == 0)
264 return -EINVAL;
265
266 if (buf[size-1] != '\n')
267 return -EINVAL;
268
269 fo_path = buf;
270 if (qword_get(&buf, fo_path, size) < 0)
271 return -EINVAL;
272
273 if (rpc_pton(net, fo_path, size, sap, salen) == 0)
274 return -EINVAL;
275
276 return nlmsvc_unlock_all_by_ip(sap);
277}
278
279/**
280 * write_unlock_fs - Release all locks on a local file system
281 *
282 * Experimental.
283 *
284 * Input:
285 * buf: '\n'-terminated C string containing the
286 * absolute pathname of a local file system
287 * size: length of C string in @buf
288 * Output:
289 * On success: returns zero if all specified locks were released;
290 * returns one if one or more locks were not released
291 * On error: return code is negative errno value
292 */
293static ssize_t write_unlock_fs(struct file *file, char *buf, size_t size)
294{
295 struct path path;
296 char *fo_path;
297 int error;
298
299 /* sanity check */
300 if (size == 0)
301 return -EINVAL;
302
303 if (buf[size-1] != '\n')
304 return -EINVAL;
305
306 fo_path = buf;
307 if (qword_get(&buf, fo_path, size) < 0)
308 return -EINVAL;
309
310 error = kern_path(fo_path, 0, &path);
311 if (error)
312 return error;
313
314 /*
315 * XXX: Needs better sanity checking. Otherwise we could end up
316 * releasing locks on the wrong file system.
317 *
318 * For example:
319 * 1. Does the path refer to a directory?
320 * 2. Is that directory a mount point, or
321 * 3. Is that directory the root of an exported file system?
322 */
323 error = nlmsvc_unlock_all_by_sb(path.dentry->d_sb);
324
325 path_put(&path);
326 return error;
327}
328
329/**
330 * write_filehandle - Get a variable-length NFS file handle by path
331 *
332 * On input, the buffer contains a '\n'-terminated C string comprised of
333 * three alphanumeric words separated by whitespace. The string may
334 * contain escape sequences.
335 *
336 * Input:
337 * buf:
338 * domain: client domain name
339 * path: export pathname
340 * maxsize: numeric maximum size of
341 * @buf
342 * size: length of C string in @buf
343 * Output:
344 * On success: passed-in buffer filled with '\n'-terminated C
345 * string containing a ASCII hex text version
346 * of the NFS file handle;
347 * return code is the size in bytes of the string
348 * On error: return code is negative errno value
349 */
350static ssize_t write_filehandle(struct file *file, char *buf, size_t size)
351{
352 char *dname, *path;
353 int uninitialized_var(maxsize);
354 char *mesg = buf;
355 int len;
356 struct auth_domain *dom;
357 struct knfsd_fh fh;
358
359 if (size == 0)
360 return -EINVAL;
361
362 if (buf[size-1] != '\n')
363 return -EINVAL;
364 buf[size-1] = 0;
365
366 dname = mesg;
367 len = qword_get(&mesg, dname, size);
368 if (len <= 0)
369 return -EINVAL;
370
371 path = dname+len+1;
372 len = qword_get(&mesg, path, size);
373 if (len <= 0)
374 return -EINVAL;
375
376 len = get_int(&mesg, &maxsize);
377 if (len)
378 return len;
379
380 if (maxsize < NFS_FHSIZE)
381 return -EINVAL;
382 maxsize = min(maxsize, NFS3_FHSIZE);
383
384 if (qword_get(&mesg, mesg, size)>0)
385 return -EINVAL;
386
387 /* we have all the words, they are in buf.. */
388 dom = unix_domain_find(dname);
389 if (!dom)
390 return -ENOMEM;
391
392 len = exp_rootfh(netns(file), dom, path, &fh, maxsize);
393 auth_domain_put(dom);
394 if (len)
395 return len;
396
397 mesg = buf;
398 len = SIMPLE_TRANSACTION_LIMIT;
399 qword_addhex(&mesg, &len, (char*)&fh.fh_base, fh.fh_size);
400 mesg[-1] = '\n';
401 return mesg - buf;
402}
403
404/**
405 * write_threads - Start NFSD, or report the current number of running threads
406 *
407 * Input:
408 * buf: ignored
409 * size: zero
410 * Output:
411 * On success: passed-in buffer filled with '\n'-terminated C
412 * string numeric value representing the number of
413 * running NFSD threads;
414 * return code is the size in bytes of the string
415 * On error: return code is zero
416 *
417 * OR
418 *
419 * Input:
420 * buf: C string containing an unsigned
421 * integer value representing the
422 * number of NFSD threads to start
423 * size: non-zero length of C string in @buf
424 * Output:
425 * On success: NFS service is started;
426 * passed-in buffer filled with '\n'-terminated C
427 * string numeric value representing the number of
428 * running NFSD threads;
429 * return code is the size in bytes of the string
430 * On error: return code is zero or a negative errno value
431 */
432static ssize_t write_threads(struct file *file, char *buf, size_t size)
433{
434 char *mesg = buf;
435 int rv;
436 struct net *net = netns(file);
437
438 if (size > 0) {
439 int newthreads;
440 rv = get_int(&mesg, &newthreads);
441 if (rv)
442 return rv;
443 if (newthreads < 0)
444 return -EINVAL;
445 rv = nfsd_svc(newthreads, net);
446 if (rv < 0)
447 return rv;
448 } else
449 rv = nfsd_nrthreads(net);
450
451 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%d\n", rv);
452}
453
454/**
455 * write_pool_threads - Set or report the current number of threads per pool
456 *
457 * Input:
458 * buf: ignored
459 * size: zero
460 *
461 * OR
462 *
463 * Input:
464 * buf: C string containing whitespace-
465 * separated unsigned integer values
466 * representing the number of NFSD
467 * threads to start in each pool
468 * size: non-zero length of C string in @buf
469 * Output:
470 * On success: passed-in buffer filled with '\n'-terminated C
471 * string containing integer values representing the
472 * number of NFSD threads in each pool;
473 * return code is the size in bytes of the string
474 * On error: return code is zero or a negative errno value
475 */
476static ssize_t write_pool_threads(struct file *file, char *buf, size_t size)
477{
478 /* if size > 0, look for an array of number of threads per node
479 * and apply them then write out number of threads per node as reply
480 */
481 char *mesg = buf;
482 int i;
483 int rv;
484 int len;
485 int npools;
486 int *nthreads;
487 struct net *net = netns(file);
488
489 mutex_lock(&nfsd_mutex);
490 npools = nfsd_nrpools(net);
491 if (npools == 0) {
492 /*
493 * NFS is shut down. The admin can start it by
494 * writing to the threads file but NOT the pool_threads
495 * file, sorry. Report zero threads.
496 */
497 mutex_unlock(&nfsd_mutex);
498 strcpy(buf, "0\n");
499 return strlen(buf);
500 }
501
502 nthreads = kcalloc(npools, sizeof(int), GFP_KERNEL);
503 rv = -ENOMEM;
504 if (nthreads == NULL)
505 goto out_free;
506
507 if (size > 0) {
508 for (i = 0; i < npools; i++) {
509 rv = get_int(&mesg, &nthreads[i]);
510 if (rv == -ENOENT)
511 break; /* fewer numbers than pools */
512 if (rv)
513 goto out_free; /* syntax error */
514 rv = -EINVAL;
515 if (nthreads[i] < 0)
516 goto out_free;
517 }
518 rv = nfsd_set_nrthreads(i, nthreads, net);
519 if (rv)
520 goto out_free;
521 }
522
523 rv = nfsd_get_nrthreads(npools, nthreads, net);
524 if (rv)
525 goto out_free;
526
527 mesg = buf;
528 size = SIMPLE_TRANSACTION_LIMIT;
529 for (i = 0; i < npools && size > 0; i++) {
530 snprintf(mesg, size, "%d%c", nthreads[i], (i == npools-1 ? '\n' : ' '));
531 len = strlen(mesg);
532 size -= len;
533 mesg += len;
534 }
535 rv = mesg - buf;
536out_free:
537 kfree(nthreads);
538 mutex_unlock(&nfsd_mutex);
539 return rv;
540}
541
542static ssize_t __write_versions(struct file *file, char *buf, size_t size)
543{
544 char *mesg = buf;
545 char *vers, *minorp, sign;
546 int len, num, remaining;
547 unsigned minor;
548 ssize_t tlen = 0;
549 char *sep;
550 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
551
552 if (size>0) {
553 if (nn->nfsd_serv)
554 /* Cannot change versions without updating
555 * nn->nfsd_serv->sv_xdrsize, and reallocing
556 * rq_argp and rq_resp
557 */
558 return -EBUSY;
559 if (buf[size-1] != '\n')
560 return -EINVAL;
561 buf[size-1] = 0;
562
563 vers = mesg;
564 len = qword_get(&mesg, vers, size);
565 if (len <= 0) return -EINVAL;
566 do {
567 sign = *vers;
568 if (sign == '+' || sign == '-')
569 num = simple_strtol((vers+1), &minorp, 0);
570 else
571 num = simple_strtol(vers, &minorp, 0);
572 if (*minorp == '.') {
573 if (num != 4)
574 return -EINVAL;
575 minor = simple_strtoul(minorp+1, NULL, 0);
576 if (minor == 0)
577 return -EINVAL;
578 if (nfsd_minorversion(minor, sign == '-' ?
579 NFSD_CLEAR : NFSD_SET) < 0)
580 return -EINVAL;
581 goto next;
582 }
583 switch(num) {
584 case 2:
585 case 3:
586 case 4:
587 nfsd_vers(num, sign == '-' ? NFSD_CLEAR : NFSD_SET);
588 break;
589 default:
590 return -EINVAL;
591 }
592 next:
593 vers += len + 1;
594 } while ((len = qword_get(&mesg, vers, size)) > 0);
595 /* If all get turned off, turn them back on, as
596 * having no versions is BAD
597 */
598 nfsd_reset_versions();
599 }
600
601 /* Now write current state into reply buffer */
602 len = 0;
603 sep = "";
604 remaining = SIMPLE_TRANSACTION_LIMIT;
605 for (num=2 ; num <= 4 ; num++)
606 if (nfsd_vers(num, NFSD_AVAIL)) {
607 len = snprintf(buf, remaining, "%s%c%d", sep,
608 nfsd_vers(num, NFSD_TEST)?'+':'-',
609 num);
610 sep = " ";
611
612 if (len >= remaining)
613 break;
614 remaining -= len;
615 buf += len;
616 tlen += len;
617 }
618 if (nfsd_vers(4, NFSD_AVAIL))
619 for (minor = 1; minor <= NFSD_SUPPORTED_MINOR_VERSION;
620 minor++) {
621 len = snprintf(buf, remaining, " %c4.%u",
622 (nfsd_vers(4, NFSD_TEST) &&
623 nfsd_minorversion(minor, NFSD_TEST)) ?
624 '+' : '-',
625 minor);
626
627 if (len >= remaining)
628 break;
629 remaining -= len;
630 buf += len;
631 tlen += len;
632 }
633
634 len = snprintf(buf, remaining, "\n");
635 if (len >= remaining)
636 return -EINVAL;
637 return tlen + len;
638}
639
640/**
641 * write_versions - Set or report the available NFS protocol versions
642 *
643 * Input:
644 * buf: ignored
645 * size: zero
646 * Output:
647 * On success: passed-in buffer filled with '\n'-terminated C
648 * string containing positive or negative integer
649 * values representing the current status of each
650 * protocol version;
651 * return code is the size in bytes of the string
652 * On error: return code is zero or a negative errno value
653 *
654 * OR
655 *
656 * Input:
657 * buf: C string containing whitespace-
658 * separated positive or negative
659 * integer values representing NFS
660 * protocol versions to enable ("+n")
661 * or disable ("-n")
662 * size: non-zero length of C string in @buf
663 * Output:
664 * On success: status of zero or more protocol versions has
665 * been updated; passed-in buffer filled with
666 * '\n'-terminated C string containing positive
667 * or negative integer values representing the
668 * current status of each protocol version;
669 * return code is the size in bytes of the string
670 * On error: return code is zero or a negative errno value
671 */
672static ssize_t write_versions(struct file *file, char *buf, size_t size)
673{
674 ssize_t rv;
675
676 mutex_lock(&nfsd_mutex);
677 rv = __write_versions(file, buf, size);
678 mutex_unlock(&nfsd_mutex);
679 return rv;
680}
681
682/*
683 * Zero-length write. Return a list of NFSD's current listener
684 * transports.
685 */
686static ssize_t __write_ports_names(char *buf, struct net *net)
687{
688 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
689
690 if (nn->nfsd_serv == NULL)
691 return 0;
692 return svc_xprt_names(nn->nfsd_serv, buf, SIMPLE_TRANSACTION_LIMIT);
693}
694
695/*
696 * A single 'fd' number was written, in which case it must be for
697 * a socket of a supported family/protocol, and we use it as an
698 * nfsd listener.
699 */
700static ssize_t __write_ports_addfd(char *buf, struct net *net)
701{
702 char *mesg = buf;
703 int fd, err;
704 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
705
706 err = get_int(&mesg, &fd);
707 if (err != 0 || fd < 0)
708 return -EINVAL;
709
710 if (svc_alien_sock(net, fd)) {
711 printk(KERN_ERR "%s: socket net is different to NFSd's one\n", __func__);
712 return -EINVAL;
713 }
714
715 err = nfsd_create_serv(net);
716 if (err != 0)
717 return err;
718
719 err = svc_addsock(nn->nfsd_serv, fd, buf, SIMPLE_TRANSACTION_LIMIT);
720 if (err < 0) {
721 nfsd_destroy(net);
722 return err;
723 }
724
725 /* Decrease the count, but don't shut down the service */
726 nn->nfsd_serv->sv_nrthreads--;
727 return err;
728}
729
730/*
731 * A transport listener is added by writing it's transport name and
732 * a port number.
733 */
734static ssize_t __write_ports_addxprt(char *buf, struct net *net)
735{
736 char transport[16];
737 struct svc_xprt *xprt;
738 int port, err;
739 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
740
741 if (sscanf(buf, "%15s %5u", transport, &port) != 2)
742 return -EINVAL;
743
744 if (port < 1 || port > USHRT_MAX)
745 return -EINVAL;
746
747 err = nfsd_create_serv(net);
748 if (err != 0)
749 return err;
750
751 err = svc_create_xprt(nn->nfsd_serv, transport, net,
752 PF_INET, port, SVC_SOCK_ANONYMOUS);
753 if (err < 0)
754 goto out_err;
755
756 err = svc_create_xprt(nn->nfsd_serv, transport, net,
757 PF_INET6, port, SVC_SOCK_ANONYMOUS);
758 if (err < 0 && err != -EAFNOSUPPORT)
759 goto out_close;
760
761 /* Decrease the count, but don't shut down the service */
762 nn->nfsd_serv->sv_nrthreads--;
763 return 0;
764out_close:
765 xprt = svc_find_xprt(nn->nfsd_serv, transport, net, PF_INET, port);
766 if (xprt != NULL) {
767 svc_close_xprt(xprt);
768 svc_xprt_put(xprt);
769 }
770out_err:
771 nfsd_destroy(net);
772 return err;
773}
774
775static ssize_t __write_ports(struct file *file, char *buf, size_t size,
776 struct net *net)
777{
778 if (size == 0)
779 return __write_ports_names(buf, net);
780
781 if (isdigit(buf[0]))
782 return __write_ports_addfd(buf, net);
783
784 if (isalpha(buf[0]))
785 return __write_ports_addxprt(buf, net);
786
787 return -EINVAL;
788}
789
790/**
791 * write_ports - Pass a socket file descriptor or transport name to listen on
792 *
793 * Input:
794 * buf: ignored
795 * size: zero
796 * Output:
797 * On success: passed-in buffer filled with a '\n'-terminated C
798 * string containing a whitespace-separated list of
799 * named NFSD listeners;
800 * return code is the size in bytes of the string
801 * On error: return code is zero or a negative errno value
802 *
803 * OR
804 *
805 * Input:
806 * buf: C string containing an unsigned
807 * integer value representing a bound
808 * but unconnected socket that is to be
809 * used as an NFSD listener; listen(3)
810 * must be called for a SOCK_STREAM
811 * socket, otherwise it is ignored
812 * size: non-zero length of C string in @buf
813 * Output:
814 * On success: NFS service is started;
815 * passed-in buffer filled with a '\n'-terminated C
816 * string containing a unique alphanumeric name of
817 * the listener;
818 * return code is the size in bytes of the string
819 * On error: return code is a negative errno value
820 *
821 * OR
822 *
823 * Input:
824 * buf: C string containing a transport
825 * name and an unsigned integer value
826 * representing the port to listen on,
827 * separated by whitespace
828 * size: non-zero length of C string in @buf
829 * Output:
830 * On success: returns zero; NFS service is started
831 * On error: return code is a negative errno value
832 */
833static ssize_t write_ports(struct file *file, char *buf, size_t size)
834{
835 ssize_t rv;
836
837 mutex_lock(&nfsd_mutex);
838 rv = __write_ports(file, buf, size, netns(file));
839 mutex_unlock(&nfsd_mutex);
840 return rv;
841}
842
843
/*
 * Current NFS block size setting.  write_maxblksize() reports it and,
 * while no server exists, sets it to a multiple of 1024 clamped to the
 * range 1024..NFSSVC_MAXBLKSIZE.
 */
int nfsd_max_blksize;
845
846/**
847 * write_maxblksize - Set or report the current NFS blksize
848 *
849 * Input:
850 * buf: ignored
851 * size: zero
852 *
853 * OR
854 *
855 * Input:
856 * buf: C string containing an unsigned
857 * integer value representing the new
858 * NFS blksize
859 * size: non-zero length of C string in @buf
860 * Output:
861 * On success: passed-in buffer filled with '\n'-terminated C string
862 * containing numeric value of the current NFS blksize
863 * setting;
864 * return code is the size in bytes of the string
865 * On error: return code is zero or a negative errno value
866 */
867static ssize_t write_maxblksize(struct file *file, char *buf, size_t size)
868{
869 char *mesg = buf;
870 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
871
872 if (size > 0) {
873 int bsize;
874 int rv = get_int(&mesg, &bsize);
875 if (rv)
876 return rv;
877 /* force bsize into allowed range and
878 * required alignment.
879 */
880 bsize = max_t(int, bsize, 1024);
881 bsize = min_t(int, bsize, NFSSVC_MAXBLKSIZE);
882 bsize &= ~(1024-1);
883 mutex_lock(&nfsd_mutex);
884 if (nn->nfsd_serv) {
885 mutex_unlock(&nfsd_mutex);
886 return -EBUSY;
887 }
888 nfsd_max_blksize = bsize;
889 mutex_unlock(&nfsd_mutex);
890 }
891
892 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%d\n",
893 nfsd_max_blksize);
894}
895
896/**
897 * write_maxconn - Set or report the current max number of connections
898 *
899 * Input:
900 * buf: ignored
901 * size: zero
902 * OR
903 *
904 * Input:
905 * buf: C string containing an unsigned
906 * integer value representing the new
907 * number of max connections
908 * size: non-zero length of C string in @buf
909 * Output:
910 * On success: passed-in buffer filled with '\n'-terminated C string
911 * containing numeric value of max_connections setting
912 * for this net namespace;
913 * return code is the size in bytes of the string
914 * On error: return code is zero or a negative errno value
915 */
916static ssize_t write_maxconn(struct file *file, char *buf, size_t size)
917{
918 char *mesg = buf;
919 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
920 unsigned int maxconn = nn->max_connections;
921
922 if (size > 0) {
923 int rv = get_uint(&mesg, &maxconn);
924
925 if (rv)
926 return rv;
927 nn->max_connections = maxconn;
928 }
929
930 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%u\n", maxconn);
931}
932
933#ifdef CONFIG_NFSD_V4
934static ssize_t __nfsd4_write_time(struct file *file, char *buf, size_t size,
935 time_t *time, struct nfsd_net *nn)
936{
937 char *mesg = buf;
938 int rv, i;
939
940 if (size > 0) {
941 if (nn->nfsd_serv)
942 return -EBUSY;
943 rv = get_int(&mesg, &i);
944 if (rv)
945 return rv;
946 /*
947 * Some sanity checking. We don't have a reason for
948 * these particular numbers, but problems with the
949 * extremes are:
950 * - Too short: the briefest network outage may
951 * cause clients to lose all their locks. Also,
952 * the frequent polling may be wasteful.
953 * - Too long: do you really want reboot recovery
954 * to take more than an hour? Or to make other
955 * clients wait an hour before being able to
956 * revoke a dead client's locks?
957 */
958 if (i < 10 || i > 3600)
959 return -EINVAL;
960 *time = i;
961 }
962
963 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%ld\n", *time);
964}
965
966static ssize_t nfsd4_write_time(struct file *file, char *buf, size_t size,
967 time_t *time, struct nfsd_net *nn)
968{
969 ssize_t rv;
970
971 mutex_lock(&nfsd_mutex);
972 rv = __nfsd4_write_time(file, buf, size, time, nn);
973 mutex_unlock(&nfsd_mutex);
974 return rv;
975}
976
977/**
978 * write_leasetime - Set or report the current NFSv4 lease time
979 *
980 * Input:
981 * buf: ignored
982 * size: zero
983 *
984 * OR
985 *
986 * Input:
987 * buf: C string containing an unsigned
988 * integer value representing the new
989 * NFSv4 lease expiry time
990 * size: non-zero length of C string in @buf
991 * Output:
992 * On success: passed-in buffer filled with '\n'-terminated C
993 * string containing unsigned integer value of the
994 * current lease expiry time;
995 * return code is the size in bytes of the string
996 * On error: return code is zero or a negative errno value
997 */
998static ssize_t write_leasetime(struct file *file, char *buf, size_t size)
999{
1000 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1001 return nfsd4_write_time(file, buf, size, &nn->nfsd4_lease, nn);
1002}
1003
1004/**
1005 * write_gracetime - Set or report current NFSv4 grace period time
1006 *
1007 * As above, but sets the time of the NFSv4 grace period.
1008 *
1009 * Note this should never be set to less than the *previous*
1010 * lease-period time, but we don't try to enforce this. (In the common
1011 * case (a new boot), we don't know what the previous lease time was
1012 * anyway.)
1013 */
1014static ssize_t write_gracetime(struct file *file, char *buf, size_t size)
1015{
1016 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1017 return nfsd4_write_time(file, buf, size, &nn->nfsd4_grace, nn);
1018}
1019
1020static ssize_t __write_recoverydir(struct file *file, char *buf, size_t size,
1021 struct nfsd_net *nn)
1022{
1023 char *mesg = buf;
1024 char *recdir;
1025 int len, status;
1026
1027 if (size > 0) {
1028 if (nn->nfsd_serv)
1029 return -EBUSY;
1030 if (size > PATH_MAX || buf[size-1] != '\n')
1031 return -EINVAL;
1032 buf[size-1] = 0;
1033
1034 recdir = mesg;
1035 len = qword_get(&mesg, recdir, size);
1036 if (len <= 0)
1037 return -EINVAL;
1038
1039 status = nfs4_reset_recoverydir(recdir);
1040 if (status)
1041 return status;
1042 }
1043
1044 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%s\n",
1045 nfs4_recoverydir());
1046}
1047
1048/**
1049 * write_recoverydir - Set or report the pathname of the recovery directory
1050 *
1051 * Input:
1052 * buf: ignored
1053 * size: zero
1054 *
1055 * OR
1056 *
1057 * Input:
1058 * buf: C string containing the pathname
1059 * of the directory on a local file
1060 * system containing permanent NFSv4
1061 * recovery data
1062 * size: non-zero length of C string in @buf
1063 * Output:
1064 * On success: passed-in buffer filled with '\n'-terminated C string
1065 * containing the current recovery pathname setting;
1066 * return code is the size in bytes of the string
1067 * On error: return code is zero or a negative errno value
1068 */
1069static ssize_t write_recoverydir(struct file *file, char *buf, size_t size)
1070{
1071 ssize_t rv;
1072 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1073
1074 mutex_lock(&nfsd_mutex);
1075 rv = __write_recoverydir(file, buf, size, nn);
1076 mutex_unlock(&nfsd_mutex);
1077 return rv;
1078}
1079
1080/**
1081 * write_v4_end_grace - release grace period for nfsd's v4.x lock manager
1082 *
1083 * Input:
1084 * buf: ignored
1085 * size: zero
1086 * OR
1087 *
1088 * Input:
1089 * buf: any value
1090 * size: non-zero length of C string in @buf
1091 * Output:
1092 * passed-in buffer filled with "Y" or "N" with a newline
1093 * and NULL-terminated C string. This indicates whether
1094 * the grace period has ended in the current net
1095 * namespace. Return code is the size in bytes of the
1096 * string. Writing a string that starts with 'Y', 'y', or
1097 * '1' to the file will end the grace period for nfsd's v4
1098 * lock manager.
1099 */
1100static ssize_t write_v4_end_grace(struct file *file, char *buf, size_t size)
1101{
1102 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1103
1104 if (size > 0) {
1105 switch(buf[0]) {
1106 case 'Y':
1107 case 'y':
1108 case '1':
1109 nfsd4_end_grace(nn);
1110 break;
1111 default:
1112 return -EINVAL;
1113 }
1114 }
1115
1116 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%c\n",
1117 nn->grace_ended ? 'Y' : 'N');
1118}
1119
1120#endif
1121
1122/*----------------------------------------------------------------------------*/
1123/*
1124 * populating the filesystem.
1125 */
1126
1127static int nfsd_fill_super(struct super_block * sb, void * data, int silent)
1128{
1129 static struct tree_descr nfsd_files[] = {
1130 [NFSD_List] = {"exports", &exports_nfsd_operations, S_IRUGO},
1131 [NFSD_Export_features] = {"export_features",
1132 &export_features_operations, S_IRUGO},
1133 [NFSD_FO_UnlockIP] = {"unlock_ip",
1134 &transaction_ops, S_IWUSR|S_IRUSR},
1135 [NFSD_FO_UnlockFS] = {"unlock_filesystem",
1136 &transaction_ops, S_IWUSR|S_IRUSR},
1137 [NFSD_Fh] = {"filehandle", &transaction_ops, S_IWUSR|S_IRUSR},
1138 [NFSD_Threads] = {"threads", &transaction_ops, S_IWUSR|S_IRUSR},
1139 [NFSD_Pool_Threads] = {"pool_threads", &transaction_ops, S_IWUSR|S_IRUSR},
1140 [NFSD_Pool_Stats] = {"pool_stats", &pool_stats_operations, S_IRUGO},
1141 [NFSD_Reply_Cache_Stats] = {"reply_cache_stats", &reply_cache_stats_operations, S_IRUGO},
1142 [NFSD_Versions] = {"versions", &transaction_ops, S_IWUSR|S_IRUSR},
1143 [NFSD_Ports] = {"portlist", &transaction_ops, S_IWUSR|S_IRUGO},
1144 [NFSD_MaxBlkSize] = {"max_block_size", &transaction_ops, S_IWUSR|S_IRUGO},
1145 [NFSD_MaxConnections] = {"max_connections", &transaction_ops, S_IWUSR|S_IRUGO},
1146#if defined(CONFIG_SUNRPC_GSS) || defined(CONFIG_SUNRPC_GSS_MODULE)
1147 [NFSD_SupportedEnctypes] = {"supported_krb5_enctypes", &supported_enctypes_ops, S_IRUGO},
1148#endif /* CONFIG_SUNRPC_GSS or CONFIG_SUNRPC_GSS_MODULE */
1149#ifdef CONFIG_NFSD_V4
1150 [NFSD_Leasetime] = {"nfsv4leasetime", &transaction_ops, S_IWUSR|S_IRUSR},
1151 [NFSD_Gracetime] = {"nfsv4gracetime", &transaction_ops, S_IWUSR|S_IRUSR},
1152 [NFSD_RecoveryDir] = {"nfsv4recoverydir", &transaction_ops, S_IWUSR|S_IRUSR},
1153 [NFSD_V4EndGrace] = {"v4_end_grace", &transaction_ops, S_IWUSR|S_IRUGO},
1154#endif
1155 /* last one */ {""}
1156 };
1157 struct net *net = data;
1158 int ret;
1159
1160 ret = simple_fill_super(sb, 0x6e667364, nfsd_files);
1161 if (ret)
1162 return ret;
1163 sb->s_fs_info = get_net(net);
1164 return 0;
1165}
1166
1167static struct dentry *nfsd_mount(struct file_system_type *fs_type,
1168 int flags, const char *dev_name, void *data)
1169{
1170 return mount_ns(fs_type, flags, current->nsproxy->net_ns, nfsd_fill_super);
1171}
1172
1173static void nfsd_umount(struct super_block *sb)
1174{
1175 struct net *net = sb->s_fs_info;
1176
1177 kill_litter_super(sb);
1178 put_net(net);
1179}
1180
/*
 * The "nfsd" control filesystem: mounted through nfsd_mount() and torn
 * down through nfsd_umount().
 */
static struct file_system_type nfsd_fs_type = {
	.owner		= THIS_MODULE,
	.name		= "nfsd",
	.mount		= nfsd_mount,
	.kill_sb	= nfsd_umount,
};
MODULE_ALIAS_FS("nfsd");
1188
#ifdef CONFIG_PROC_FS
/*
 * Create the "fs/nfs" proc directory and the "exports" file inside it.
 * Returns zero on success or -ENOMEM if either entry cannot be created.
 */
static int create_proc_exports_entry(void)
{
	struct proc_dir_entry *dir;
	struct proc_dir_entry *exports;

	dir = proc_mkdir("fs/nfs", NULL);
	if (dir == NULL)
		return -ENOMEM;

	exports = proc_create("exports", 0, dir, &exports_proc_operations);
	if (exports != NULL)
		return 0;

	/* Remove the directory again so a failure leaves nothing behind. */
	remove_proc_entry("fs/nfs", NULL);
	return -ENOMEM;
}
#else /* CONFIG_PROC_FS */
/* Without procfs there is nothing to create. */
static int create_proc_exports_entry(void)
{
	return 0;
}
#endif
1211
/* Per-net-namespace id; registered through nfsd_net_ops and used with net_generic(). */
int nfsd_net_id;
1213
1214static __net_init int nfsd_init_net(struct net *net)
1215{
1216 int retval;
1217 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1218
1219 retval = nfsd_export_init(net);
1220 if (retval)
1221 goto out_export_error;
1222 retval = nfsd_idmap_init(net);
1223 if (retval)
1224 goto out_idmap_error;
1225 nn->nfsd4_lease = 90; /* default lease time */
1226 nn->nfsd4_grace = 90;
1227 return 0;
1228
1229out_idmap_error:
1230 nfsd_export_shutdown(net);
1231out_export_error:
1232 return retval;
1233}
1234
/*
 * Per-namespace destructor: undo nfsd_init_net() in reverse order
 * (idmap first, then exports).
 */
static __net_exit void nfsd_exit_net(struct net *net)
{
	nfsd_idmap_shutdown(net);
	nfsd_export_shutdown(net);
}
1240
/*
 * Per-net-namespace hooks.  .id and .size request a struct nfsd_net per
 * namespace, reachable through net_generic(net, nfsd_net_id).
 */
static struct pernet_operations nfsd_net_ops = {
	.init = nfsd_init_net,
	.exit = nfsd_exit_net,
	.id   = &nfsd_net_id,
	.size = sizeof(struct nfsd_net),
};
1247
/*
 * Module initialisation.  Each subsystem is brought up in turn; on
 * failure the labels below unwind everything that was already set up,
 * in reverse order, and the error is returned.  The filesystem type is
 * registered last.
 */
static int __init init_nfsd(void)
{
	int retval;
	printk(KERN_INFO "Installing knfsd (copyright (C) 1996 okir@monad.swb.de).\n");

	retval = register_pernet_subsys(&nfsd_net_ops);
	if (retval < 0)
		return retval;
	retval = register_cld_notifier();
	if (retval)
		goto out_unregister_pernet;
	retval = nfsd4_init_slabs();
	if (retval)
		goto out_unregister_notifier;
	retval = nfsd4_init_pnfs();
	if (retval)
		goto out_free_slabs;
	retval = nfsd_fault_inject_init(); /* nfsd fault injection controls */
	if (retval)
		goto out_exit_pnfs;
	nfsd_stat_init();	/* Statistics */
	retval = nfsd_reply_cache_init();
	if (retval)
		goto out_free_stat;
	nfsd_lockd_init();	/* lockd->nfsd callbacks */
	retval = create_proc_exports_entry();
	if (retval)
		goto out_free_lockd;
	retval = register_filesystem(&nfsd_fs_type);
	if (retval)
		goto out_free_all;
	return 0;
	/* Error unwinding: each label undoes the steps completed before it. */
out_free_all:
	remove_proc_entry("fs/nfs/exports", NULL);
	remove_proc_entry("fs/nfs", NULL);
out_free_lockd:
	nfsd_lockd_shutdown();
	nfsd_reply_cache_shutdown();
out_free_stat:
	nfsd_stat_shutdown();
	nfsd_fault_inject_cleanup();
out_exit_pnfs:
	nfsd4_exit_pnfs();
out_free_slabs:
	nfsd4_free_slabs();
out_unregister_notifier:
	unregister_cld_notifier();
out_unregister_pernet:
	unregister_pernet_subsys(&nfsd_net_ops);
	return retval;
}
1299
/*
 * Module teardown: release everything init_nfsd() set up.  The per-net
 * operations are unregistered last.
 */
static void __exit exit_nfsd(void)
{
	nfsd_reply_cache_shutdown();
	remove_proc_entry("fs/nfs/exports", NULL);
	remove_proc_entry("fs/nfs", NULL);
	nfsd_stat_shutdown();
	nfsd_lockd_shutdown();
	nfsd4_free_slabs();
	nfsd4_exit_pnfs();
	nfsd_fault_inject_cleanup();
	unregister_filesystem(&nfsd_fs_type);
	unregister_cld_notifier();
	unregister_pernet_subsys(&nfsd_net_ops);
}
1314
1315MODULE_AUTHOR("Olaf Kirch <okir@monad.swb.de>");
1316MODULE_LICENSE("GPL");
1317module_init(init_nfsd)
1318module_exit(exit_nfsd)
1// SPDX-License-Identifier: GPL-2.0-only
2/*
3 * Syscall interface to knfsd.
4 *
5 * Copyright (C) 1995, 1996 Olaf Kirch <okir@monad.swb.de>
6 */
7
8#include <linux/slab.h>
9#include <linux/namei.h>
10#include <linux/ctype.h>
11#include <linux/fs_context.h>
12
13#include <linux/sunrpc/svcsock.h>
14#include <linux/lockd/lockd.h>
15#include <linux/sunrpc/addr.h>
16#include <linux/sunrpc/gss_api.h>
17#include <linux/sunrpc/gss_krb5_enctypes.h>
18#include <linux/sunrpc/rpc_pipe_fs.h>
19#include <linux/module.h>
20#include <linux/fsnotify.h>
21
22#include "idmap.h"
23#include "nfsd.h"
24#include "cache.h"
25#include "state.h"
26#include "netns.h"
27#include "pnfs.h"
28
29/*
30 * We have a single directory with several nodes in it.
31 */
/*
 * Identifiers for the control nodes.  The values serve as inode numbers:
 * nfsctl_transaction_write() indexes write_op[] with the inode number.
 */
enum {
	NFSD_Root = 1,
	NFSD_List,
	NFSD_Export_Stats,
	NFSD_Export_features,
	NFSD_Fh,
	NFSD_FO_UnlockIP,
	NFSD_FO_UnlockFS,
	NFSD_Threads,
	NFSD_Pool_Threads,
	NFSD_Pool_Stats,
	NFSD_Reply_Cache_Stats,
	NFSD_Versions,
	NFSD_Ports,
	NFSD_MaxBlkSize,
	NFSD_MaxConnections,
	NFSD_SupportedEnctypes,
	/*
	 * The below MUST come last.  Otherwise we leave a hole in nfsd_files[]
	 * with !CONFIG_NFSD_V4 and simple_fill_super() goes oops
	 */
#ifdef CONFIG_NFSD_V4
	NFSD_Leasetime,
	NFSD_Gracetime,
	NFSD_RecoveryDir,
	NFSD_V4EndGrace,
#endif
	/* One past the last identifier defined above. */
	NFSD_MaxReserved
};
61
62/*
63 * write() for these nodes.
64 */
/* Forward declarations so the write_op[] table can reference the handlers. */
static ssize_t write_filehandle(struct file *file, char *buf, size_t size);
static ssize_t write_unlock_ip(struct file *file, char *buf, size_t size);
static ssize_t write_unlock_fs(struct file *file, char *buf, size_t size);
static ssize_t write_threads(struct file *file, char *buf, size_t size);
static ssize_t write_pool_threads(struct file *file, char *buf, size_t size);
static ssize_t write_versions(struct file *file, char *buf, size_t size);
static ssize_t write_ports(struct file *file, char *buf, size_t size);
static ssize_t write_maxblksize(struct file *file, char *buf, size_t size);
static ssize_t write_maxconn(struct file *file, char *buf, size_t size);
#ifdef CONFIG_NFSD_V4
static ssize_t write_leasetime(struct file *file, char *buf, size_t size);
static ssize_t write_gracetime(struct file *file, char *buf, size_t size);
static ssize_t write_recoverydir(struct file *file, char *buf, size_t size);
static ssize_t write_v4_end_grace(struct file *file, char *buf, size_t size);
#endif
80
/*
 * Dispatch table for transaction files, indexed by inode number.
 * Slots left unset are NULL and make nfsctl_transaction_write() fail
 * with -EINVAL.
 */
static ssize_t (*const write_op[])(struct file *, char *, size_t) = {
	[NFSD_Fh] = write_filehandle,
	[NFSD_FO_UnlockIP] = write_unlock_ip,
	[NFSD_FO_UnlockFS] = write_unlock_fs,
	[NFSD_Threads] = write_threads,
	[NFSD_Pool_Threads] = write_pool_threads,
	[NFSD_Versions] = write_versions,
	[NFSD_Ports] = write_ports,
	[NFSD_MaxBlkSize] = write_maxblksize,
	[NFSD_MaxConnections] = write_maxconn,
#ifdef CONFIG_NFSD_V4
	[NFSD_Leasetime] = write_leasetime,
	[NFSD_Gracetime] = write_gracetime,
	[NFSD_RecoveryDir] = write_recoverydir,
	[NFSD_V4EndGrace] = write_v4_end_grace,
#endif
};
98
99static ssize_t nfsctl_transaction_write(struct file *file, const char __user *buf, size_t size, loff_t *pos)
100{
101 ino_t ino = file_inode(file)->i_ino;
102 char *data;
103 ssize_t rv;
104
105 if (ino >= ARRAY_SIZE(write_op) || !write_op[ino])
106 return -EINVAL;
107
108 data = simple_transaction_get(file, buf, size);
109 if (IS_ERR(data))
110 return PTR_ERR(data);
111
112 rv = write_op[ino](file, data, size);
113 if (rv >= 0) {
114 simple_transaction_set(file, rv);
115 rv = size;
116 }
117 return rv;
118}
119
120static ssize_t nfsctl_transaction_read(struct file *file, char __user *buf, size_t size, loff_t *pos)
121{
122 if (! file->private_data) {
123 /* An attempt to read a transaction file without writing
124 * causes a 0-byte write so that the file can return
125 * state information
126 */
127 ssize_t rv = nfsctl_transaction_write(file, buf, 0, pos);
128 if (rv < 0)
129 return rv;
130 }
131 return simple_transaction_read(file, buf, size, pos);
132}
133
/* File operations shared by every write-then-read control node. */
static const struct file_operations transaction_ops = {
	.write		= nfsctl_transaction_write,
	.read		= nfsctl_transaction_read,
	.release	= simple_transaction_release,
	.llseek		= default_llseek,
};
140
141static int exports_net_open(struct net *net, struct file *file)
142{
143 int err;
144 struct seq_file *seq;
145 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
146
147 err = seq_open(file, &nfs_exports_op);
148 if (err)
149 return err;
150
151 seq = file->private_data;
152 seq->private = nn->svc_export_cache;
153 return 0;
154}
155
156static int exports_proc_open(struct inode *inode, struct file *file)
157{
158 return exports_net_open(current->nsproxy->net_ns, file);
159}
160
/* procfs operations for the exports listing (seq_file based). */
static const struct proc_ops exports_proc_ops = {
	.proc_open	= exports_proc_open,
	.proc_read	= seq_read,
	.proc_lseek	= seq_lseek,
	.proc_release	= seq_release,
};
167
168static int exports_nfsd_open(struct inode *inode, struct file *file)
169{
170 return exports_net_open(inode->i_sb->s_fs_info, file);
171}
172
/* File operations for the "exports" node inside the nfsd filesystem. */
static const struct file_operations exports_nfsd_operations = {
	.open		= exports_nfsd_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= seq_release,
};
179
/* Emit the NFSEXP_ALLFLAGS and NFSEXP_SECINFO_FLAGS masks as two hex words. */
static int export_features_show(struct seq_file *m, void *v)
{
	seq_printf(m, "0x%x 0x%x\n", NFSEXP_ALLFLAGS, NFSEXP_SECINFO_FLAGS);
	return 0;
}
185
/* Open handler: single-record seq_file backed by export_features_show(). */
static int export_features_open(struct inode *inode, struct file *file)
{
	return single_open(file, export_features_show, NULL);
}
190
/* File operations for the read-only export-features node. */
static const struct file_operations export_features_operations = {
	.open		= export_features_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= single_release,
};
197
#if defined(CONFIG_SUNRPC_GSS) || defined(CONFIG_SUNRPC_GSS_MODULE)
/*
 * Emit the KRB5_SUPPORTED_ENCTYPES string verbatim.
 *
 * seq_puts() is used rather than seq_printf() because the text is data,
 * not a format: it must never be interpreted for '%' conversions.
 */
static int supported_enctypes_show(struct seq_file *m, void *v)
{
	seq_puts(m, KRB5_SUPPORTED_ENCTYPES);
	return 0;
}

/* Open handler: single-record seq_file backed by supported_enctypes_show(). */
static int supported_enctypes_open(struct inode *inode, struct file *file)
{
	return single_open(file, supported_enctypes_show, NULL);
}

/* File operations for the read-only supported-enctypes node. */
static const struct file_operations supported_enctypes_ops = {
	.open		= supported_enctypes_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= single_release,
};
#endif /* CONFIG_SUNRPC_GSS or CONFIG_SUNRPC_GSS_MODULE */
217
/* File operations for the read-only pool statistics node. */
static const struct file_operations pool_stats_operations = {
	.open		= nfsd_pool_stats_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= nfsd_pool_stats_release,
};
224
/* File operations for the read-only reply-cache statistics node. */
static const struct file_operations reply_cache_stats_operations = {
	.open		= nfsd_reply_cache_stats_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= single_release,
};
231
232/*----------------------------------------------------------------------------*/
233/*
234 * payload - write methods
235 */
236
237static inline struct net *netns(struct file *file)
238{
239 return file_inode(file)->i_sb->s_fs_info;
240}
241
242/*
243 * write_unlock_ip - Release all locks used by a client
244 *
245 * Experimental.
246 *
247 * Input:
248 * buf: '\n'-terminated C string containing a
249 * presentation format IP address
250 * size: length of C string in @buf
251 * Output:
252 * On success: returns zero if all specified locks were released;
253 * returns one if one or more locks were not released
254 * On error: return code is negative errno value
255 */
256static ssize_t write_unlock_ip(struct file *file, char *buf, size_t size)
257{
258 struct sockaddr_storage address;
259 struct sockaddr *sap = (struct sockaddr *)&address;
260 size_t salen = sizeof(address);
261 char *fo_path;
262 struct net *net = netns(file);
263
264 /* sanity check */
265 if (size == 0)
266 return -EINVAL;
267
268 if (buf[size-1] != '\n')
269 return -EINVAL;
270
271 fo_path = buf;
272 if (qword_get(&buf, fo_path, size) < 0)
273 return -EINVAL;
274
275 if (rpc_pton(net, fo_path, size, sap, salen) == 0)
276 return -EINVAL;
277
278 return nlmsvc_unlock_all_by_ip(sap);
279}
280
281/*
282 * write_unlock_fs - Release all locks on a local file system
283 *
284 * Experimental.
285 *
286 * Input:
287 * buf: '\n'-terminated C string containing the
288 * absolute pathname of a local file system
289 * size: length of C string in @buf
290 * Output:
291 * On success: returns zero if all specified locks were released;
292 * returns one if one or more locks were not released
293 * On error: return code is negative errno value
294 */
295static ssize_t write_unlock_fs(struct file *file, char *buf, size_t size)
296{
297 struct path path;
298 char *fo_path;
299 int error;
300
301 /* sanity check */
302 if (size == 0)
303 return -EINVAL;
304
305 if (buf[size-1] != '\n')
306 return -EINVAL;
307
308 fo_path = buf;
309 if (qword_get(&buf, fo_path, size) < 0)
310 return -EINVAL;
311
312 error = kern_path(fo_path, 0, &path);
313 if (error)
314 return error;
315
316 /*
317 * XXX: Needs better sanity checking. Otherwise we could end up
318 * releasing locks on the wrong file system.
319 *
320 * For example:
321 * 1. Does the path refer to a directory?
322 * 2. Is that directory a mount point, or
323 * 3. Is that directory the root of an exported file system?
324 */
325 error = nlmsvc_unlock_all_by_sb(path.dentry->d_sb);
326
327 path_put(&path);
328 return error;
329}
330
331/*
332 * write_filehandle - Get a variable-length NFS file handle by path
333 *
334 * On input, the buffer contains a '\n'-terminated C string comprised of
335 * three alphanumeric words separated by whitespace. The string may
336 * contain escape sequences.
337 *
338 * Input:
339 * buf:
340 * domain: client domain name
341 * path: export pathname
342 * maxsize: numeric maximum size of
343 * @buf
344 * size: length of C string in @buf
345 * Output:
346 * On success: passed-in buffer filled with '\n'-terminated C
 *			string containing an ASCII hex text version
348 * of the NFS file handle;
349 * return code is the size in bytes of the string
350 * On error: return code is negative errno value
351 */
static ssize_t write_filehandle(struct file *file, char *buf, size_t size)
{
	char *dname, *path;
	int maxsize;
	char *mesg = buf;
	int len;
	struct auth_domain *dom;
	struct knfsd_fh fh;

	if (size == 0)
		return -EINVAL;

	/* Require a trailing newline and turn it into the string terminator. */
	if (buf[size-1] != '\n')
		return -EINVAL;
	buf[size-1] = 0;

	/* First word: the client domain name, extracted over the input buffer. */
	dname = mesg;
	len = qword_get(&mesg, dname, size);
	if (len <= 0)
		return -EINVAL;

	/* Second word: the export path, stored just past the first word. */
	path = dname+len+1;
	len = qword_get(&mesg, path, size);
	if (len <= 0)
		return -EINVAL;

	/* Third word: the caller's maximum file handle size. */
	len = get_int(&mesg, &maxsize);
	if (len)
		return len;

	/* Must hold at least NFS_FHSIZE; anything above NFS3_FHSIZE is capped. */
	if (maxsize < NFS_FHSIZE)
		return -EINVAL;
	maxsize = min(maxsize, NFS3_FHSIZE);

	/* A fourth word is a syntax error. */
	if (qword_get(&mesg, mesg, size)>0)
		return -EINVAL;

	/* we have all the words, they are in buf.. */
	dom = unix_domain_find(dname);
	if (!dom)
		return -ENOMEM;

	len = exp_rootfh(netns(file), dom, path, &fh, maxsize);
	auth_domain_put(dom);
	if (len)
		return len;

	/* Write the handle back into buf as hex text. */
	mesg = buf;
	len = SIMPLE_TRANSACTION_LIMIT;
	qword_addhex(&mesg, &len, (char*)&fh.fh_base, fh.fh_size);
	/* Replace the last character written (presumably a separator) with a newline. */
	mesg[-1] = '\n';
	return mesg - buf;
}
405
406/*
407 * write_threads - Start NFSD, or report the current number of running threads
408 *
409 * Input:
410 * buf: ignored
411 * size: zero
412 * Output:
413 * On success: passed-in buffer filled with '\n'-terminated C
414 * string numeric value representing the number of
415 * running NFSD threads;
416 * return code is the size in bytes of the string
417 * On error: return code is zero
418 *
419 * OR
420 *
421 * Input:
422 * buf: C string containing an unsigned
423 * integer value representing the
424 * number of NFSD threads to start
425 * size: non-zero length of C string in @buf
426 * Output:
427 * On success: NFS service is started;
428 * passed-in buffer filled with '\n'-terminated C
429 * string numeric value representing the number of
430 * running NFSD threads;
431 * return code is the size in bytes of the string
432 * On error: return code is zero or a negative errno value
433 */
434static ssize_t write_threads(struct file *file, char *buf, size_t size)
435{
436 char *mesg = buf;
437 int rv;
438 struct net *net = netns(file);
439
440 if (size > 0) {
441 int newthreads;
442 rv = get_int(&mesg, &newthreads);
443 if (rv)
444 return rv;
445 if (newthreads < 0)
446 return -EINVAL;
447 rv = nfsd_svc(newthreads, net, file->f_cred);
448 if (rv < 0)
449 return rv;
450 } else
451 rv = nfsd_nrthreads(net);
452
453 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%d\n", rv);
454}
455
456/*
457 * write_pool_threads - Set or report the current number of threads per pool
458 *
459 * Input:
460 * buf: ignored
461 * size: zero
462 *
463 * OR
464 *
465 * Input:
466 * buf: C string containing whitespace-
467 * separated unsigned integer values
468 * representing the number of NFSD
469 * threads to start in each pool
470 * size: non-zero length of C string in @buf
471 * Output:
472 * On success: passed-in buffer filled with '\n'-terminated C
473 * string containing integer values representing the
474 * number of NFSD threads in each pool;
475 * return code is the size in bytes of the string
476 * On error: return code is zero or a negative errno value
477 */
static ssize_t write_pool_threads(struct file *file, char *buf, size_t size)
{
	/* if size > 0,  look for an array of number of threads per node
	 * and apply them  then write out number of threads per node as reply
	 */
	char *mesg = buf;
	int i;
	int rv;
	int len;
	int npools;
	int *nthreads;
	struct net *net = netns(file);

	/* nfsd_mutex is held from here until the function returns. */
	mutex_lock(&nfsd_mutex);
	npools = nfsd_nrpools(net);
	if (npools == 0) {
		/*
		 * NFS is shut down.  The admin can start it by
		 * writing to the threads file but NOT the pool_threads
		 * file, sorry.  Report zero threads.
		 */
		mutex_unlock(&nfsd_mutex);
		strcpy(buf, "0\n");
		return strlen(buf);
	}

	/* One slot per pool, zero-initialised. */
	nthreads = kcalloc(npools, sizeof(int), GFP_KERNEL);
	rv = -ENOMEM;
	if (nthreads == NULL)
		goto out_free;

	if (size > 0) {
		/* Parse up to npools non-negative integers from the request. */
		for (i = 0; i < npools; i++) {
			rv = get_int(&mesg, &nthreads[i]);
			if (rv == -ENOENT)
				break;		/* fewer numbers than pools */
			if (rv)
				goto out_free;	/* syntax error */
			rv = -EINVAL;
			if (nthreads[i] < 0)
				goto out_free;
		}
		/* i is the number of values actually supplied. */
		rv = nfsd_set_nrthreads(i, nthreads, net);
		if (rv)
			goto out_free;
	}

	/* Read back the per-pool counts and format them as the reply. */
	rv = nfsd_get_nrthreads(npools, nthreads, net);
	if (rv)
		goto out_free;

	mesg = buf;
	size = SIMPLE_TRANSACTION_LIMIT;
	for (i = 0; i < npools && size > 0; i++) {
		/* Space-separated values; the last one ends with a newline. */
		snprintf(mesg, size, "%d%c", nthreads[i], (i == npools-1 ? '\n' : ' '));
		len = strlen(mesg);
		size -= len;
		mesg += len;
	}
	rv = mesg - buf;
out_free:
	/* Common exit: kfree() accepts NULL, so the allocation-failure path is safe. */
	kfree(nthreads);
	mutex_unlock(&nfsd_mutex);
	return rv;
}
543
544static ssize_t
545nfsd_print_version_support(struct nfsd_net *nn, char *buf, int remaining,
546 const char *sep, unsigned vers, int minor)
547{
548 const char *format = minor < 0 ? "%s%c%u" : "%s%c%u.%u";
549 bool supported = !!nfsd_vers(nn, vers, NFSD_TEST);
550
551 if (vers == 4 && minor >= 0 &&
552 !nfsd_minorversion(nn, minor, NFSD_TEST))
553 supported = false;
554 if (minor == 0 && supported)
555 /*
556 * special case for backward compatability.
557 * +4.0 is never reported, it is implied by
558 * +4, unless -4.0 is present.
559 */
560 return 0;
561 return snprintf(buf, remaining, format, sep,
562 supported ? '+' : '-', vers, minor);
563}
564
/*
 * Parse an optional list of "+N", "-N", "+4.M" or "-4.M" words and apply
 * them, then write the resulting version state into @buf.  write_versions()
 * calls this with nfsd_mutex held.  Returns the reply length or a negative
 * errno.
 */
static ssize_t __write_versions(struct file *file, char *buf, size_t size)
{
	char *mesg = buf;
	char *vers, *minorp, sign;
	int len, num, remaining;
	ssize_t tlen = 0;
	char *sep;
	struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);

	if (size>0) {
		if (nn->nfsd_serv)
			/* Cannot change versions without updating
			 * nn->nfsd_serv->sv_xdrsize, and reallocing
			 * rq_argp and rq_resp
			 */
			return -EBUSY;
		/* Require a trailing newline and turn it into the terminator. */
		if (buf[size-1] != '\n')
			return -EINVAL;
		buf[size-1] = 0;

		vers = mesg;
		len = qword_get(&mesg, vers, size);
		if (len <= 0) return -EINVAL;
		do {
			enum vers_op cmd;
			unsigned minor;
			/* An optional leading sign; anything else is treated as "+". */
			sign = *vers;
			if (sign == '+' || sign == '-')
				num = simple_strtol((vers+1), &minorp, 0);
			else
				num = simple_strtol(vers, &minorp, 0);
			/* A ".M" suffix is only accepted on major version 4. */
			if (*minorp == '.') {
				if (num != 4)
					return -EINVAL;
				if (kstrtouint(minorp+1, 0, &minor) < 0)
					return -EINVAL;
			}

			cmd = sign == '-' ? NFSD_CLEAR : NFSD_SET;
			switch(num) {
			case 2:
			case 3:
				nfsd_vers(nn, num, cmd);
				break;
			case 4:
				if (*minorp == '.') {
					if (nfsd_minorversion(nn, minor, cmd) < 0)
						return -EINVAL;
				} else if ((cmd == NFSD_SET) != nfsd_vers(nn, num, NFSD_TEST)) {
					/*
					 * Either we have +4 and no minors are enabled,
					 * or we have -4 and at least one minor is enabled.
					 * In either case, propagate 'cmd' to all minors.
					 */
					minor = 0;
					while (nfsd_minorversion(nn, minor, cmd) >= 0)
						minor++;
				}
				break;
			default:
				return -EINVAL;
			}
			/* Step past this word and its terminator to the next slot. */
			vers += len + 1;
		} while ((len = qword_get(&mesg, vers, size)) > 0);
		/* If all get turned off, turn them back on, as
		 * having no versions is BAD
		 */
		nfsd_reset_versions(nn);
	}

	/* Now write current state into reply buffer */
	len = 0;
	sep = "";
	remaining = SIMPLE_TRANSACTION_LIMIT;
	for (num=2 ; num <= 4 ; num++) {
		int minor;
		if (!nfsd_vers(nn, num, NFSD_AVAIL))
			continue;

		/* minor == -1 prints the major token; v4 then walks its minors. */
		minor = -1;
		do {
			len = nfsd_print_version_support(nn, buf, remaining,
					sep, num, minor);
			/* Token did not fit: stop and just terminate the reply. */
			if (len >= remaining)
				goto out;
			remaining -= len;
			buf += len;
			tlen += len;
			minor++;
			/* Separate tokens with a space once one has been emitted. */
			if (len)
				sep = " ";
		} while (num == 4 && minor <= NFSD_SUPPORTED_MINOR_VERSION);
	}
out:
	len = snprintf(buf, remaining, "\n");
	if (len >= remaining)
		return -EINVAL;
	return tlen + len;
}
664
665/*
666 * write_versions - Set or report the available NFS protocol versions
667 *
668 * Input:
669 * buf: ignored
670 * size: zero
671 * Output:
672 * On success: passed-in buffer filled with '\n'-terminated C
673 * string containing positive or negative integer
674 * values representing the current status of each
675 * protocol version;
676 * return code is the size in bytes of the string
677 * On error: return code is zero or a negative errno value
678 *
679 * OR
680 *
681 * Input:
682 * buf: C string containing whitespace-
683 * separated positive or negative
684 * integer values representing NFS
685 * protocol versions to enable ("+n")
686 * or disable ("-n")
687 * size: non-zero length of C string in @buf
688 * Output:
689 * On success: status of zero or more protocol versions has
690 * been updated; passed-in buffer filled with
691 * '\n'-terminated C string containing positive
692 * or negative integer values representing the
693 * current status of each protocol version;
694 * return code is the size in bytes of the string
695 * On error: return code is zero or a negative errno value
696 */
static ssize_t write_versions(struct file *file, char *buf, size_t size)
{
	ssize_t rv;

	/* Run the parse/apply/report step with nfsd_mutex held. */
	mutex_lock(&nfsd_mutex);
	rv = __write_versions(file, buf, size);
	mutex_unlock(&nfsd_mutex);
	return rv;
}
706
707/*
708 * Zero-length write. Return a list of NFSD's current listener
709 * transports.
710 */
711static ssize_t __write_ports_names(char *buf, struct net *net)
712{
713 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
714
715 if (nn->nfsd_serv == NULL)
716 return 0;
717 return svc_xprt_names(nn->nfsd_serv, buf, SIMPLE_TRANSACTION_LIMIT);
718}
719
720/*
721 * A single 'fd' number was written, in which case it must be for
722 * a socket of a supported family/protocol, and we use it as an
723 * nfsd listener.
724 */
725static ssize_t __write_ports_addfd(char *buf, struct net *net, const struct cred *cred)
726{
727 char *mesg = buf;
728 int fd, err;
729 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
730
731 err = get_int(&mesg, &fd);
732 if (err != 0 || fd < 0)
733 return -EINVAL;
734
735 if (svc_alien_sock(net, fd)) {
736 printk(KERN_ERR "%s: socket net is different to NFSd's one\n", __func__);
737 return -EINVAL;
738 }
739
740 err = nfsd_create_serv(net);
741 if (err != 0)
742 return err;
743
744 err = svc_addsock(nn->nfsd_serv, fd, buf, SIMPLE_TRANSACTION_LIMIT, cred);
745 if (err < 0) {
746 nfsd_destroy(net);
747 return err;
748 }
749
750 /* Decrease the count, but don't shut down the service */
751 nn->nfsd_serv->sv_nrthreads--;
752 return err;
753}
754
755/*
 * A transport listener is added by writing its transport name and
757 * a port number.
758 */
759static ssize_t __write_ports_addxprt(char *buf, struct net *net, const struct cred *cred)
760{
761 char transport[16];
762 struct svc_xprt *xprt;
763 int port, err;
764 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
765
766 if (sscanf(buf, "%15s %5u", transport, &port) != 2)
767 return -EINVAL;
768
769 if (port < 1 || port > USHRT_MAX)
770 return -EINVAL;
771
772 err = nfsd_create_serv(net);
773 if (err != 0)
774 return err;
775
776 err = svc_create_xprt(nn->nfsd_serv, transport, net,
777 PF_INET, port, SVC_SOCK_ANONYMOUS, cred);
778 if (err < 0)
779 goto out_err;
780
781 err = svc_create_xprt(nn->nfsd_serv, transport, net,
782 PF_INET6, port, SVC_SOCK_ANONYMOUS, cred);
783 if (err < 0 && err != -EAFNOSUPPORT)
784 goto out_close;
785
786 /* Decrease the count, but don't shut down the service */
787 nn->nfsd_serv->sv_nrthreads--;
788 return 0;
789out_close:
790 xprt = svc_find_xprt(nn->nfsd_serv, transport, net, PF_INET, port);
791 if (xprt != NULL) {
792 svc_close_xprt(xprt);
793 svc_xprt_put(xprt);
794 }
795out_err:
796 if (!list_empty(&nn->nfsd_serv->sv_permsocks))
797 nn->nfsd_serv->sv_nrthreads--;
798 else
799 nfsd_destroy(net);
800 return err;
801}
802
803static ssize_t __write_ports(struct file *file, char *buf, size_t size,
804 struct net *net)
805{
806 if (size == 0)
807 return __write_ports_names(buf, net);
808
809 if (isdigit(buf[0]))
810 return __write_ports_addfd(buf, net, file->f_cred);
811
812 if (isalpha(buf[0]))
813 return __write_ports_addxprt(buf, net, file->f_cred);
814
815 return -EINVAL;
816}
817
818/*
819 * write_ports - Pass a socket file descriptor or transport name to listen on
820 *
821 * Input:
822 * buf: ignored
823 * size: zero
824 * Output:
825 * On success: passed-in buffer filled with a '\n'-terminated C
826 * string containing a whitespace-separated list of
827 * named NFSD listeners;
828 * return code is the size in bytes of the string
829 * On error: return code is zero or a negative errno value
830 *
831 * OR
832 *
833 * Input:
834 * buf: C string containing an unsigned
835 * integer value representing a bound
836 * but unconnected socket that is to be
837 * used as an NFSD listener; listen(3)
838 * must be called for a SOCK_STREAM
839 * socket, otherwise it is ignored
840 * size: non-zero length of C string in @buf
841 * Output:
842 * On success: NFS service is started;
843 * passed-in buffer filled with a '\n'-terminated C
844 * string containing a unique alphanumeric name of
845 * the listener;
846 * return code is the size in bytes of the string
847 * On error: return code is a negative errno value
848 *
849 * OR
850 *
851 * Input:
852 * buf: C string containing a transport
853 * name and an unsigned integer value
854 * representing the port to listen on,
855 * separated by whitespace
856 * size: non-zero length of C string in @buf
857 * Output:
858 * On success: returns zero; NFS service is started
859 * On error: return code is a negative errno value
860 */
static ssize_t write_ports(struct file *file, char *buf, size_t size)
{
	ssize_t rv;

	/* Run the request with nfsd_mutex held. */
	mutex_lock(&nfsd_mutex);
	rv = __write_ports(file, buf, size, netns(file));
	mutex_unlock(&nfsd_mutex);
	return rv;
}
870
871
/* Current NFS block size limit; set and reported by write_maxblksize(). */
int nfsd_max_blksize;
873
874/*
875 * write_maxblksize - Set or report the current NFS blksize
876 *
877 * Input:
878 * buf: ignored
879 * size: zero
880 *
881 * OR
882 *
883 * Input:
884 * buf: C string containing an unsigned
885 * integer value representing the new
886 * NFS blksize
887 * size: non-zero length of C string in @buf
888 * Output:
889 * On success: passed-in buffer filled with '\n'-terminated C string
890 * containing numeric value of the current NFS blksize
891 * setting;
892 * return code is the size in bytes of the string
893 * On error: return code is zero or a negative errno value
894 */
895static ssize_t write_maxblksize(struct file *file, char *buf, size_t size)
896{
897 char *mesg = buf;
898 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
899
900 if (size > 0) {
901 int bsize;
902 int rv = get_int(&mesg, &bsize);
903 if (rv)
904 return rv;
905 /* force bsize into allowed range and
906 * required alignment.
907 */
908 bsize = max_t(int, bsize, 1024);
909 bsize = min_t(int, bsize, NFSSVC_MAXBLKSIZE);
910 bsize &= ~(1024-1);
911 mutex_lock(&nfsd_mutex);
912 if (nn->nfsd_serv) {
913 mutex_unlock(&nfsd_mutex);
914 return -EBUSY;
915 }
916 nfsd_max_blksize = bsize;
917 mutex_unlock(&nfsd_mutex);
918 }
919
920 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%d\n",
921 nfsd_max_blksize);
922}
923
924/*
925 * write_maxconn - Set or report the current max number of connections
926 *
927 * Input:
928 * buf: ignored
929 * size: zero
930 * OR
931 *
932 * Input:
933 * buf: C string containing an unsigned
934 * integer value representing the new
935 * number of max connections
936 * size: non-zero length of C string in @buf
937 * Output:
938 * On success: passed-in buffer filled with '\n'-terminated C string
939 * containing numeric value of max_connections setting
940 * for this net namespace;
941 * return code is the size in bytes of the string
942 * On error: return code is zero or a negative errno value
943 */
944static ssize_t write_maxconn(struct file *file, char *buf, size_t size)
945{
946 char *mesg = buf;
947 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
948 unsigned int maxconn = nn->max_connections;
949
950 if (size > 0) {
951 int rv = get_uint(&mesg, &maxconn);
952
953 if (rv)
954 return rv;
955 nn->max_connections = maxconn;
956 }
957
958 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%u\n", maxconn);
959}
960
961#ifdef CONFIG_NFSD_V4
962static ssize_t __nfsd4_write_time(struct file *file, char *buf, size_t size,
963 time64_t *time, struct nfsd_net *nn)
964{
965 char *mesg = buf;
966 int rv, i;
967
968 if (size > 0) {
969 if (nn->nfsd_serv)
970 return -EBUSY;
971 rv = get_int(&mesg, &i);
972 if (rv)
973 return rv;
974 /*
975 * Some sanity checking. We don't have a reason for
976 * these particular numbers, but problems with the
977 * extremes are:
978 * - Too short: the briefest network outage may
979 * cause clients to lose all their locks. Also,
980 * the frequent polling may be wasteful.
981 * - Too long: do you really want reboot recovery
982 * to take more than an hour? Or to make other
983 * clients wait an hour before being able to
984 * revoke a dead client's locks?
985 */
986 if (i < 10 || i > 3600)
987 return -EINVAL;
988 *time = i;
989 }
990
991 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%lld\n", *time);
992}
993
994static ssize_t nfsd4_write_time(struct file *file, char *buf, size_t size,
995 time64_t *time, struct nfsd_net *nn)
996{
997 ssize_t rv;
998
999 mutex_lock(&nfsd_mutex);
1000 rv = __nfsd4_write_time(file, buf, size, time, nn);
1001 mutex_unlock(&nfsd_mutex);
1002 return rv;
1003}
1004
1005/*
1006 * write_leasetime - Set or report the current NFSv4 lease time
1007 *
1008 * Input:
1009 * buf: ignored
1010 * size: zero
1011 *
1012 * OR
1013 *
1014 * Input:
1015 * buf: C string containing an unsigned
1016 * integer value representing the new
1017 * NFSv4 lease expiry time
1018 * size: non-zero length of C string in @buf
1019 * Output:
1020 * On success: passed-in buffer filled with '\n'-terminated C
1021 * string containing unsigned integer value of the
1022 * current lease expiry time;
1023 * return code is the size in bytes of the string
1024 * On error: return code is zero or a negative errno value
1025 */
1026static ssize_t write_leasetime(struct file *file, char *buf, size_t size)
1027{
1028 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1029 return nfsd4_write_time(file, buf, size, &nn->nfsd4_lease, nn);
1030}
1031
1032/*
1033 * write_gracetime - Set or report current NFSv4 grace period time
1034 *
1035 * As above, but sets the time of the NFSv4 grace period.
1036 *
1037 * Note this should never be set to less than the *previous*
1038 * lease-period time, but we don't try to enforce this. (In the common
1039 * case (a new boot), we don't know what the previous lease time was
1040 * anyway.)
1041 */
1042static ssize_t write_gracetime(struct file *file, char *buf, size_t size)
1043{
1044 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1045 return nfsd4_write_time(file, buf, size, &nn->nfsd4_grace, nn);
1046}
1047
1048static ssize_t __write_recoverydir(struct file *file, char *buf, size_t size,
1049 struct nfsd_net *nn)
1050{
1051 char *mesg = buf;
1052 char *recdir;
1053 int len, status;
1054
1055 if (size > 0) {
1056 if (nn->nfsd_serv)
1057 return -EBUSY;
1058 if (size > PATH_MAX || buf[size-1] != '\n')
1059 return -EINVAL;
1060 buf[size-1] = 0;
1061
1062 recdir = mesg;
1063 len = qword_get(&mesg, recdir, size);
1064 if (len <= 0)
1065 return -EINVAL;
1066
1067 status = nfs4_reset_recoverydir(recdir);
1068 if (status)
1069 return status;
1070 }
1071
1072 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%s\n",
1073 nfs4_recoverydir());
1074}
1075
1076/*
1077 * write_recoverydir - Set or report the pathname of the recovery directory
1078 *
1079 * Input:
1080 * buf: ignored
1081 * size: zero
1082 *
1083 * OR
1084 *
1085 * Input:
1086 * buf: C string containing the pathname
1087 * of the directory on a local file
1088 * system containing permanent NFSv4
1089 * recovery data
1090 * size: non-zero length of C string in @buf
1091 * Output:
1092 * On success: passed-in buffer filled with '\n'-terminated C string
1093 * containing the current recovery pathname setting;
1094 * return code is the size in bytes of the string
1095 * On error: return code is zero or a negative errno value
1096 */
1097static ssize_t write_recoverydir(struct file *file, char *buf, size_t size)
1098{
1099 ssize_t rv;
1100 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1101
1102 mutex_lock(&nfsd_mutex);
1103 rv = __write_recoverydir(file, buf, size, nn);
1104 mutex_unlock(&nfsd_mutex);
1105 return rv;
1106}
1107
1108/*
1109 * write_v4_end_grace - release grace period for nfsd's v4.x lock manager
1110 *
1111 * Input:
1112 * buf: ignored
1113 * size: zero
1114 * OR
1115 *
1116 * Input:
1117 * buf: any value
1118 * size: non-zero length of C string in @buf
1119 * Output:
1120 * passed-in buffer filled with "Y" or "N" with a newline
1121 * and NULL-terminated C string. This indicates whether
1122 * the grace period has ended in the current net
1123 * namespace. Return code is the size in bytes of the
1124 * string. Writing a string that starts with 'Y', 'y', or
1125 * '1' to the file will end the grace period for nfsd's v4
1126 * lock manager.
1127 */
1128static ssize_t write_v4_end_grace(struct file *file, char *buf, size_t size)
1129{
1130 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1131
1132 if (size > 0) {
1133 switch(buf[0]) {
1134 case 'Y':
1135 case 'y':
1136 case '1':
1137 if (!nn->nfsd_serv)
1138 return -EBUSY;
1139 nfsd4_end_grace(nn);
1140 break;
1141 default:
1142 return -EINVAL;
1143 }
1144 }
1145
1146 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%c\n",
1147 nn->grace_ended ? 'Y' : 'N');
1148}
1149
1150#endif
1151
1152/*----------------------------------------------------------------------------*/
1153/*
1154 * populating the filesystem.
1155 */
1156
1157/* Basically copying rpc_get_inode. */
1158static struct inode *nfsd_get_inode(struct super_block *sb, umode_t mode)
1159{
1160 struct inode *inode = new_inode(sb);
1161 if (!inode)
1162 return NULL;
1163 /* Following advice from simple_fill_super documentation: */
1164 inode->i_ino = iunique(sb, NFSD_MaxReserved);
1165 inode->i_mode = mode;
1166 inode->i_atime = inode->i_mtime = inode->i_ctime = current_time(inode);
1167 switch (mode & S_IFMT) {
1168 case S_IFDIR:
1169 inode->i_fop = &simple_dir_operations;
1170 inode->i_op = &simple_dir_inode_operations;
1171 inc_nlink(inode);
1172 break;
1173 default:
1174 break;
1175 }
1176 return inode;
1177}
1178
1179static int __nfsd_mkdir(struct inode *dir, struct dentry *dentry, umode_t mode, struct nfsdfs_client *ncl)
1180{
1181 struct inode *inode;
1182
1183 inode = nfsd_get_inode(dir->i_sb, mode);
1184 if (!inode)
1185 return -ENOMEM;
1186 if (ncl) {
1187 inode->i_private = ncl;
1188 kref_get(&ncl->cl_ref);
1189 }
1190 d_add(dentry, inode);
1191 inc_nlink(dir);
1192 fsnotify_mkdir(dir, dentry);
1193 return 0;
1194}
1195
1196static struct dentry *nfsd_mkdir(struct dentry *parent, struct nfsdfs_client *ncl, char *name)
1197{
1198 struct inode *dir = parent->d_inode;
1199 struct dentry *dentry;
1200 int ret = -ENOMEM;
1201
1202 inode_lock(dir);
1203 dentry = d_alloc_name(parent, name);
1204 if (!dentry)
1205 goto out_err;
1206 ret = __nfsd_mkdir(d_inode(parent), dentry, S_IFDIR | 0600, ncl);
1207 if (ret)
1208 goto out_err;
1209out:
1210 inode_unlock(dir);
1211 return dentry;
1212out_err:
1213 dput(dentry);
1214 dentry = ERR_PTR(ret);
1215 goto out;
1216}
1217
1218static void clear_ncl(struct inode *inode)
1219{
1220 struct nfsdfs_client *ncl = inode->i_private;
1221
1222 inode->i_private = NULL;
1223 kref_put(&ncl->cl_ref, ncl->cl_release);
1224}
1225
1226static struct nfsdfs_client *__get_nfsdfs_client(struct inode *inode)
1227{
1228 struct nfsdfs_client *nc = inode->i_private;
1229
1230 if (nc)
1231 kref_get(&nc->cl_ref);
1232 return nc;
1233}
1234
/*
 * Look up and take a reference on the client attached to @inode, holding
 * the inode lock shared during the lookup.  Returns NULL when no client
 * is attached.
 */
struct nfsdfs_client *get_nfsdfs_client(struct inode *inode)
{
	struct nfsdfs_client *client;

	inode_lock_shared(inode);
	client = __get_nfsdfs_client(inode);
	inode_unlock_shared(inode);

	return client;
}
/*
 * Remove one file from @dir (adapted from __rpc_unlink): release the
 * client reference held through the file's inode, then unlink and
 * delete the dentry.  A failing simple_unlink() triggers a one-time
 * warning.
 */
static void nfsdfs_remove_file(struct inode *dir, struct dentry *dentry)
{
	int err;

	clear_ncl(d_inode(dentry));

	/* Keep our own reference on the dentry across unlink and delete. */
	dget(dentry);
	err = simple_unlink(dir, dentry);
	d_delete(dentry);
	dput(dentry);

	WARN_ON_ONCE(err);
}
1256
1257static void nfsdfs_remove_files(struct dentry *root)
1258{
1259 struct dentry *dentry, *tmp;
1260
1261 list_for_each_entry_safe(dentry, tmp, &root->d_subdirs, d_child) {
1262 if (!simple_positive(dentry)) {
1263 WARN_ON_ONCE(1); /* I think this can't happen? */
1264 continue;
1265 }
1266 nfsdfs_remove_file(d_inode(root), dentry);
1267 }
1268}
1269
1270/* XXX: cut'n'paste from simple_fill_super; figure out if we could share
1271 * code instead. */
1272static int nfsdfs_create_files(struct dentry *root,
1273 const struct tree_descr *files,
1274 struct dentry **fdentries)
1275{
1276 struct inode *dir = d_inode(root);
1277 struct inode *inode;
1278 struct dentry *dentry;
1279 int i;
1280
1281 inode_lock(dir);
1282 for (i = 0; files->name && files->name[0]; i++, files++) {
1283 dentry = d_alloc_name(root, files->name);
1284 if (!dentry)
1285 goto out;
1286 inode = nfsd_get_inode(d_inode(root)->i_sb,
1287 S_IFREG | files->mode);
1288 if (!inode) {
1289 dput(dentry);
1290 goto out;
1291 }
1292 inode->i_fop = files->ops;
1293 inode->i_private = __get_nfsdfs_client(dir);
1294 d_add(dentry, inode);
1295 fsnotify_create(dir, dentry);
1296 if (fdentries)
1297 fdentries[i] = dentry;
1298 }
1299 inode_unlock(dir);
1300 return 0;
1301out:
1302 nfsdfs_remove_files(root);
1303 inode_unlock(dir);
1304 return -ENOMEM;
1305}
1306
1307/* on success, returns positive number unique to that client. */
1308struct dentry *nfsd_client_mkdir(struct nfsd_net *nn,
1309 struct nfsdfs_client *ncl, u32 id,
1310 const struct tree_descr *files,
1311 struct dentry **fdentries)
1312{
1313 struct dentry *dentry;
1314 char name[11];
1315 int ret;
1316
1317 sprintf(name, "%u", id);
1318
1319 dentry = nfsd_mkdir(nn->nfsd_client_dir, ncl, name);
1320 if (IS_ERR(dentry)) /* XXX: tossing errors? */
1321 return NULL;
1322 ret = nfsdfs_create_files(dentry, files, fdentries);
1323 if (ret) {
1324 nfsd_client_rmdir(dentry);
1325 return NULL;
1326 }
1327 return dentry;
1328}
1329
1330/* Taken from __rpc_rmdir: */
1331void nfsd_client_rmdir(struct dentry *dentry)
1332{
1333 struct inode *dir = d_inode(dentry->d_parent);
1334 struct inode *inode = d_inode(dentry);
1335 int ret;
1336
1337 inode_lock(dir);
1338 nfsdfs_remove_files(dentry);
1339 clear_ncl(inode);
1340 dget(dentry);
1341 ret = simple_rmdir(dir, dentry);
1342 WARN_ON_ONCE(ret);
1343 fsnotify_rmdir(dir, dentry);
1344 d_delete(dentry);
1345 dput(dentry);
1346 inode_unlock(dir);
1347}
1348
1349static int nfsd_fill_super(struct super_block *sb, struct fs_context *fc)
1350{
1351 struct nfsd_net *nn = net_generic(current->nsproxy->net_ns,
1352 nfsd_net_id);
1353 struct dentry *dentry;
1354 int ret;
1355
1356 static const struct tree_descr nfsd_files[] = {
1357 [NFSD_List] = {"exports", &exports_nfsd_operations, S_IRUGO},
1358 /* Per-export io stats use same ops as exports file */
1359 [NFSD_Export_Stats] = {"export_stats", &exports_nfsd_operations, S_IRUGO},
1360 [NFSD_Export_features] = {"export_features",
1361 &export_features_operations, S_IRUGO},
1362 [NFSD_FO_UnlockIP] = {"unlock_ip",
1363 &transaction_ops, S_IWUSR|S_IRUSR},
1364 [NFSD_FO_UnlockFS] = {"unlock_filesystem",
1365 &transaction_ops, S_IWUSR|S_IRUSR},
1366 [NFSD_Fh] = {"filehandle", &transaction_ops, S_IWUSR|S_IRUSR},
1367 [NFSD_Threads] = {"threads", &transaction_ops, S_IWUSR|S_IRUSR},
1368 [NFSD_Pool_Threads] = {"pool_threads", &transaction_ops, S_IWUSR|S_IRUSR},
1369 [NFSD_Pool_Stats] = {"pool_stats", &pool_stats_operations, S_IRUGO},
1370 [NFSD_Reply_Cache_Stats] = {"reply_cache_stats", &reply_cache_stats_operations, S_IRUGO},
1371 [NFSD_Versions] = {"versions", &transaction_ops, S_IWUSR|S_IRUSR},
1372 [NFSD_Ports] = {"portlist", &transaction_ops, S_IWUSR|S_IRUGO},
1373 [NFSD_MaxBlkSize] = {"max_block_size", &transaction_ops, S_IWUSR|S_IRUGO},
1374 [NFSD_MaxConnections] = {"max_connections", &transaction_ops, S_IWUSR|S_IRUGO},
1375#if defined(CONFIG_SUNRPC_GSS) || defined(CONFIG_SUNRPC_GSS_MODULE)
1376 [NFSD_SupportedEnctypes] = {"supported_krb5_enctypes", &supported_enctypes_ops, S_IRUGO},
1377#endif /* CONFIG_SUNRPC_GSS or CONFIG_SUNRPC_GSS_MODULE */
1378#ifdef CONFIG_NFSD_V4
1379 [NFSD_Leasetime] = {"nfsv4leasetime", &transaction_ops, S_IWUSR|S_IRUSR},
1380 [NFSD_Gracetime] = {"nfsv4gracetime", &transaction_ops, S_IWUSR|S_IRUSR},
1381 [NFSD_RecoveryDir] = {"nfsv4recoverydir", &transaction_ops, S_IWUSR|S_IRUSR},
1382 [NFSD_V4EndGrace] = {"v4_end_grace", &transaction_ops, S_IWUSR|S_IRUGO},
1383#endif
1384 /* last one */ {""}
1385 };
1386
1387 ret = simple_fill_super(sb, 0x6e667364, nfsd_files);
1388 if (ret)
1389 return ret;
1390 dentry = nfsd_mkdir(sb->s_root, NULL, "clients");
1391 if (IS_ERR(dentry))
1392 return PTR_ERR(dentry);
1393 nn->nfsd_client_dir = dentry;
1394 return 0;
1395}
1396
1397static int nfsd_fs_get_tree(struct fs_context *fc)
1398{
1399 return get_tree_keyed(fc, nfsd_fill_super, get_net(fc->net_ns));
1400}
1401
1402static void nfsd_fs_free_fc(struct fs_context *fc)
1403{
1404 if (fc->s_fs_info)
1405 put_net(fc->s_fs_info);
1406}
1407
1408static const struct fs_context_operations nfsd_fs_context_ops = {
1409 .free = nfsd_fs_free_fc,
1410 .get_tree = nfsd_fs_get_tree,
1411};
1412
1413static int nfsd_init_fs_context(struct fs_context *fc)
1414{
1415 put_user_ns(fc->user_ns);
1416 fc->user_ns = get_user_ns(fc->net_ns->user_ns);
1417 fc->ops = &nfsd_fs_context_ops;
1418 return 0;
1419}
1420
1421static void nfsd_umount(struct super_block *sb)
1422{
1423 struct net *net = sb->s_fs_info;
1424
1425 nfsd_shutdown_threads(net);
1426
1427 kill_litter_super(sb);
1428 put_net(net);
1429}
1430
1431static struct file_system_type nfsd_fs_type = {
1432 .owner = THIS_MODULE,
1433 .name = "nfsd",
1434 .init_fs_context = nfsd_init_fs_context,
1435 .kill_sb = nfsd_umount,
1436};
1437MODULE_ALIAS_FS("nfsd");
1438
#ifdef CONFIG_PROC_FS
/*
 * Create the "fs/nfs" proc directory and its "exports" entry.
 *
 * Returns 0 on success or -ENOMEM if either step fails; the directory is
 * removed again when only the second step fails.
 */
static int create_proc_exports_entry(void)
{
	struct proc_dir_entry *nfs_dir;

	nfs_dir = proc_mkdir("fs/nfs", NULL);
	if (!nfs_dir)
		return -ENOMEM;

	if (proc_create("exports", 0, nfs_dir, &exports_proc_ops))
		return 0;

	remove_proc_entry("fs/nfs", NULL);
	return -ENOMEM;
}
#else /* CONFIG_PROC_FS */
/* Without procfs there is nothing to create; always succeeds. */
static int create_proc_exports_entry(void)
{
	return 0;
}
#endif
1460
/*
 * Id under which nfsd's per-net-namespace data is looked up with
 * net_generic(); its address is handed to the pernet core through
 * nfsd_net_ops.id (presumably assigned when those ops are registered).
 */
unsigned int nfsd_net_id;
1462
1463static __net_init int nfsd_init_net(struct net *net)
1464{
1465 int retval;
1466 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1467
1468 retval = nfsd_export_init(net);
1469 if (retval)
1470 goto out_export_error;
1471 retval = nfsd_idmap_init(net);
1472 if (retval)
1473 goto out_idmap_error;
1474 nn->nfsd_versions = NULL;
1475 nn->nfsd4_minorversions = NULL;
1476 retval = nfsd_reply_cache_init(nn);
1477 if (retval)
1478 goto out_drc_error;
1479 nn->nfsd4_lease = 90; /* default lease time */
1480 nn->nfsd4_grace = 90;
1481 nn->somebody_reclaimed = false;
1482 nn->track_reclaim_completes = false;
1483 nn->clverifier_counter = prandom_u32();
1484 nn->clientid_base = prandom_u32();
1485 nn->clientid_counter = nn->clientid_base + 1;
1486 nn->s2s_cp_cl_id = nn->clientid_counter++;
1487
1488 atomic_set(&nn->ntf_refcnt, 0);
1489 init_waitqueue_head(&nn->ntf_wq);
1490 seqlock_init(&nn->boot_lock);
1491
1492 return 0;
1493
1494out_drc_error:
1495 nfsd_idmap_shutdown(net);
1496out_idmap_error:
1497 nfsd_export_shutdown(net);
1498out_export_error:
1499 return retval;
1500}
1501
1502static __net_exit void nfsd_exit_net(struct net *net)
1503{
1504 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1505
1506 nfsd_reply_cache_shutdown(nn);
1507 nfsd_idmap_shutdown(net);
1508 nfsd_export_shutdown(net);
1509 nfsd_netns_free_versions(net_generic(net, nfsd_net_id));
1510}
1511
1512static struct pernet_operations nfsd_net_ops = {
1513 .init = nfsd_init_net,
1514 .exit = nfsd_exit_net,
1515 .id = &nfsd_net_id,
1516 .size = sizeof(struct nfsd_net),
1517};
1518
1519static int __init init_nfsd(void)
1520{
1521 int retval;
1522 printk(KERN_INFO "Installing knfsd (copyright (C) 1996 okir@monad.swb.de).\n");
1523
1524 retval = register_cld_notifier();
1525 if (retval)
1526 return retval;
1527 retval = nfsd4_init_slabs();
1528 if (retval)
1529 goto out_unregister_notifier;
1530 retval = nfsd4_init_pnfs();
1531 if (retval)
1532 goto out_free_slabs;
1533 retval = nfsd_stat_init(); /* Statistics */
1534 if (retval)
1535 goto out_free_pnfs;
1536 retval = nfsd_drc_slab_create();
1537 if (retval)
1538 goto out_free_stat;
1539 nfsd_lockd_init(); /* lockd->nfsd callbacks */
1540 retval = create_proc_exports_entry();
1541 if (retval)
1542 goto out_free_lockd;
1543 retval = register_filesystem(&nfsd_fs_type);
1544 if (retval)
1545 goto out_free_exports;
1546 retval = register_pernet_subsys(&nfsd_net_ops);
1547 if (retval < 0)
1548 goto out_free_all;
1549 return 0;
1550out_free_all:
1551 unregister_filesystem(&nfsd_fs_type);
1552out_free_exports:
1553 remove_proc_entry("fs/nfs/exports", NULL);
1554 remove_proc_entry("fs/nfs", NULL);
1555out_free_lockd:
1556 nfsd_lockd_shutdown();
1557 nfsd_drc_slab_free();
1558out_free_stat:
1559 nfsd_stat_shutdown();
1560out_free_pnfs:
1561 nfsd4_exit_pnfs();
1562out_free_slabs:
1563 nfsd4_free_slabs();
1564out_unregister_notifier:
1565 unregister_cld_notifier();
1566 return retval;
1567}
1568
/*
 * Module exit: release what init_nfsd() set up.  The per-net operations
 * are unregistered first; the filesystem type and the cld notifier go
 * last.
 */
static void __exit exit_nfsd(void)
{
	unregister_pernet_subsys(&nfsd_net_ops);
	nfsd_drc_slab_free();
	remove_proc_entry("fs/nfs/exports", NULL);
	remove_proc_entry("fs/nfs", NULL);
	nfsd_stat_shutdown();
	nfsd_lockd_shutdown();
	nfsd4_free_slabs();
	nfsd4_exit_pnfs();
	unregister_filesystem(&nfsd_fs_type);
	unregister_cld_notifier();
}
1582
/* Module metadata, and init_nfsd()/exit_nfsd() as the module entry and exit points. */
MODULE_AUTHOR("Olaf Kirch <okir@monad.swb.de>");
MODULE_LICENSE("GPL");
module_init(init_nfsd)
module_exit(exit_nfsd)