Loading...
1/*
2 * Syscall interface to knfsd.
3 *
4 * Copyright (C) 1995, 1996 Olaf Kirch <okir@monad.swb.de>
5 */
6
7#include <linux/slab.h>
8#include <linux/namei.h>
9#include <linux/ctype.h>
10
11#include <linux/sunrpc/svcsock.h>
12#include <linux/lockd/lockd.h>
13#include <linux/sunrpc/addr.h>
14#include <linux/sunrpc/gss_api.h>
15#include <linux/sunrpc/gss_krb5_enctypes.h>
16#include <linux/sunrpc/rpc_pipe_fs.h>
17#include <linux/module.h>
18
19#include "idmap.h"
20#include "nfsd.h"
21#include "cache.h"
22#include "state.h"
23#include "netns.h"
24#include "pnfs.h"
25
/*
 * We have a single directory with several nodes in it.
 *
 * The enumerators below are used as indices into write_op[] and into the
 * nfsd_files[] table in nfsd_fill_super().  nfsctl_transaction_write()
 * indexes write_op[] with the inode number of the file being written, so
 * the numbering starts at 1 and the order of the entries matters.
 * NOTE(review): presumably simple_fill_super() hands out inode numbers
 * that equal the nfsd_files[] index -- confirm against libfs.
 */
enum {
	NFSD_Root = 1,
	NFSD_List,
	NFSD_Export_features,
	NFSD_Fh,
	NFSD_FO_UnlockIP,
	NFSD_FO_UnlockFS,
	NFSD_Threads,
	NFSD_Pool_Threads,
	NFSD_Pool_Stats,
	NFSD_Reply_Cache_Stats,
	NFSD_Versions,
	NFSD_Ports,
	NFSD_MaxBlkSize,
	NFSD_MaxConnections,
	NFSD_SupportedEnctypes,
	/*
	 * The below MUST come last.  Otherwise we leave a hole in nfsd_files[]
	 * with !CONFIG_NFSD_V4 and simple_fill_super() goes oops
	 */
#ifdef CONFIG_NFSD_V4
	NFSD_Leasetime,
	NFSD_Gracetime,
	NFSD_RecoveryDir,
	NFSD_V4EndGrace,
#endif
};
56
/*
 * write() for these nodes.
 *
 * Every handler takes the open file, the buffer returned by
 * simple_transaction_get() and the number of bytes the caller wrote.
 * A non-negative return value is handed to simple_transaction_set() by
 * nfsctl_transaction_write(); a negative value is returned to the caller
 * as an error.
 */
static ssize_t write_filehandle(struct file *file, char *buf, size_t size);
static ssize_t write_unlock_ip(struct file *file, char *buf, size_t size);
static ssize_t write_unlock_fs(struct file *file, char *buf, size_t size);
static ssize_t write_threads(struct file *file, char *buf, size_t size);
static ssize_t write_pool_threads(struct file *file, char *buf, size_t size);
static ssize_t write_versions(struct file *file, char *buf, size_t size);
static ssize_t write_ports(struct file *file, char *buf, size_t size);
static ssize_t write_maxblksize(struct file *file, char *buf, size_t size);
static ssize_t write_maxconn(struct file *file, char *buf, size_t size);
#ifdef CONFIG_NFSD_V4
static ssize_t write_leasetime(struct file *file, char *buf, size_t size);
static ssize_t write_gracetime(struct file *file, char *buf, size_t size);
static ssize_t write_recoverydir(struct file *file, char *buf, size_t size);
static ssize_t write_v4_end_grace(struct file *file, char *buf, size_t size);
#endif
75
/*
 * Dispatch table from node id (NFSD_* enumerator) to its write handler.
 * Slots that are not listed here stay NULL; nfsctl_transaction_write()
 * rejects writes to those nodes with -EINVAL.
 */
static ssize_t (*write_op[])(struct file *, char *, size_t) = {
	[NFSD_Fh] = write_filehandle,
	[NFSD_FO_UnlockIP] = write_unlock_ip,
	[NFSD_FO_UnlockFS] = write_unlock_fs,
	[NFSD_Threads] = write_threads,
	[NFSD_Pool_Threads] = write_pool_threads,
	[NFSD_Versions] = write_versions,
	[NFSD_Ports] = write_ports,
	[NFSD_MaxBlkSize] = write_maxblksize,
	[NFSD_MaxConnections] = write_maxconn,
#ifdef CONFIG_NFSD_V4
	[NFSD_Leasetime] = write_leasetime,
	[NFSD_Gracetime] = write_gracetime,
	[NFSD_RecoveryDir] = write_recoverydir,
	[NFSD_V4EndGrace] = write_v4_end_grace,
#endif
};
93
94static ssize_t nfsctl_transaction_write(struct file *file, const char __user *buf, size_t size, loff_t *pos)
95{
96 ino_t ino = file_inode(file)->i_ino;
97 char *data;
98 ssize_t rv;
99
100 if (ino >= ARRAY_SIZE(write_op) || !write_op[ino])
101 return -EINVAL;
102
103 data = simple_transaction_get(file, buf, size);
104 if (IS_ERR(data))
105 return PTR_ERR(data);
106
107 rv = write_op[ino](file, data, size);
108 if (rv >= 0) {
109 simple_transaction_set(file, rv);
110 rv = size;
111 }
112 return rv;
113}
114
115static ssize_t nfsctl_transaction_read(struct file *file, char __user *buf, size_t size, loff_t *pos)
116{
117 if (! file->private_data) {
118 /* An attempt to read a transaction file without writing
119 * causes a 0-byte write so that the file can return
120 * state information
121 */
122 ssize_t rv = nfsctl_transaction_write(file, buf, 0, pos);
123 if (rv < 0)
124 return rv;
125 }
126 return simple_transaction_read(file, buf, size, pos);
127}
128
129static const struct file_operations transaction_ops = {
130 .write = nfsctl_transaction_write,
131 .read = nfsctl_transaction_read,
132 .release = simple_transaction_release,
133 .llseek = default_llseek,
134};
135
136static int exports_net_open(struct net *net, struct file *file)
137{
138 int err;
139 struct seq_file *seq;
140 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
141
142 err = seq_open(file, &nfs_exports_op);
143 if (err)
144 return err;
145
146 seq = file->private_data;
147 seq->private = nn->svc_export_cache;
148 return 0;
149}
150
151static int exports_proc_open(struct inode *inode, struct file *file)
152{
153 return exports_net_open(current->nsproxy->net_ns, file);
154}
155
156static const struct file_operations exports_proc_operations = {
157 .open = exports_proc_open,
158 .read = seq_read,
159 .llseek = seq_lseek,
160 .release = seq_release,
161 .owner = THIS_MODULE,
162};
163
164static int exports_nfsd_open(struct inode *inode, struct file *file)
165{
166 return exports_net_open(inode->i_sb->s_fs_info, file);
167}
168
169static const struct file_operations exports_nfsd_operations = {
170 .open = exports_nfsd_open,
171 .read = seq_read,
172 .llseek = seq_lseek,
173 .release = seq_release,
174 .owner = THIS_MODULE,
175};
176
177static int export_features_show(struct seq_file *m, void *v)
178{
179 seq_printf(m, "0x%x 0x%x\n", NFSEXP_ALLFLAGS, NFSEXP_SECINFO_FLAGS);
180 return 0;
181}
182
183static int export_features_open(struct inode *inode, struct file *file)
184{
185 return single_open(file, export_features_show, NULL);
186}
187
188static const struct file_operations export_features_operations = {
189 .open = export_features_open,
190 .read = seq_read,
191 .llseek = seq_lseek,
192 .release = single_release,
193};
194
195#if defined(CONFIG_SUNRPC_GSS) || defined(CONFIG_SUNRPC_GSS_MODULE)
196static int supported_enctypes_show(struct seq_file *m, void *v)
197{
198 seq_printf(m, KRB5_SUPPORTED_ENCTYPES);
199 return 0;
200}
201
202static int supported_enctypes_open(struct inode *inode, struct file *file)
203{
204 return single_open(file, supported_enctypes_show, NULL);
205}
206
207static const struct file_operations supported_enctypes_ops = {
208 .open = supported_enctypes_open,
209 .read = seq_read,
210 .llseek = seq_lseek,
211 .release = single_release,
212};
213#endif /* CONFIG_SUNRPC_GSS or CONFIG_SUNRPC_GSS_MODULE */
214
215static const struct file_operations pool_stats_operations = {
216 .open = nfsd_pool_stats_open,
217 .read = seq_read,
218 .llseek = seq_lseek,
219 .release = nfsd_pool_stats_release,
220 .owner = THIS_MODULE,
221};
222
223static struct file_operations reply_cache_stats_operations = {
224 .open = nfsd_reply_cache_stats_open,
225 .read = seq_read,
226 .llseek = seq_lseek,
227 .release = single_release,
228};
229
230/*----------------------------------------------------------------------------*/
231/*
232 * payload - write methods
233 */
234
235static inline struct net *netns(struct file *file)
236{
237 return file_inode(file)->i_sb->s_fs_info;
238}
239
240/**
241 * write_unlock_ip - Release all locks used by a client
242 *
243 * Experimental.
244 *
245 * Input:
246 * buf: '\n'-terminated C string containing a
247 * presentation format IP address
248 * size: length of C string in @buf
249 * Output:
250 * On success: returns zero if all specified locks were released;
251 * returns one if one or more locks were not released
252 * On error: return code is negative errno value
253 */
254static ssize_t write_unlock_ip(struct file *file, char *buf, size_t size)
255{
256 struct sockaddr_storage address;
257 struct sockaddr *sap = (struct sockaddr *)&address;
258 size_t salen = sizeof(address);
259 char *fo_path;
260 struct net *net = netns(file);
261
262 /* sanity check */
263 if (size == 0)
264 return -EINVAL;
265
266 if (buf[size-1] != '\n')
267 return -EINVAL;
268
269 fo_path = buf;
270 if (qword_get(&buf, fo_path, size) < 0)
271 return -EINVAL;
272
273 if (rpc_pton(net, fo_path, size, sap, salen) == 0)
274 return -EINVAL;
275
276 return nlmsvc_unlock_all_by_ip(sap);
277}
278
279/**
280 * write_unlock_fs - Release all locks on a local file system
281 *
282 * Experimental.
283 *
284 * Input:
285 * buf: '\n'-terminated C string containing the
286 * absolute pathname of a local file system
287 * size: length of C string in @buf
288 * Output:
289 * On success: returns zero if all specified locks were released;
290 * returns one if one or more locks were not released
291 * On error: return code is negative errno value
292 */
293static ssize_t write_unlock_fs(struct file *file, char *buf, size_t size)
294{
295 struct path path;
296 char *fo_path;
297 int error;
298
299 /* sanity check */
300 if (size == 0)
301 return -EINVAL;
302
303 if (buf[size-1] != '\n')
304 return -EINVAL;
305
306 fo_path = buf;
307 if (qword_get(&buf, fo_path, size) < 0)
308 return -EINVAL;
309
310 error = kern_path(fo_path, 0, &path);
311 if (error)
312 return error;
313
314 /*
315 * XXX: Needs better sanity checking. Otherwise we could end up
316 * releasing locks on the wrong file system.
317 *
318 * For example:
319 * 1. Does the path refer to a directory?
320 * 2. Is that directory a mount point, or
321 * 3. Is that directory the root of an exported file system?
322 */
323 error = nlmsvc_unlock_all_by_sb(path.dentry->d_sb);
324
325 path_put(&path);
326 return error;
327}
328
329/**
330 * write_filehandle - Get a variable-length NFS file handle by path
331 *
332 * On input, the buffer contains a '\n'-terminated C string comprised of
333 * three alphanumeric words separated by whitespace. The string may
334 * contain escape sequences.
335 *
336 * Input:
337 * buf:
338 * domain: client domain name
339 * path: export pathname
340 * maxsize: numeric maximum size of
341 * @buf
342 * size: length of C string in @buf
343 * Output:
344 * On success: passed-in buffer filled with '\n'-terminated C
345 * string containing a ASCII hex text version
346 * of the NFS file handle;
347 * return code is the size in bytes of the string
348 * On error: return code is negative errno value
349 */
350static ssize_t write_filehandle(struct file *file, char *buf, size_t size)
351{
352 char *dname, *path;
353 int uninitialized_var(maxsize);
354 char *mesg = buf;
355 int len;
356 struct auth_domain *dom;
357 struct knfsd_fh fh;
358
359 if (size == 0)
360 return -EINVAL;
361
362 if (buf[size-1] != '\n')
363 return -EINVAL;
364 buf[size-1] = 0;
365
366 dname = mesg;
367 len = qword_get(&mesg, dname, size);
368 if (len <= 0)
369 return -EINVAL;
370
371 path = dname+len+1;
372 len = qword_get(&mesg, path, size);
373 if (len <= 0)
374 return -EINVAL;
375
376 len = get_int(&mesg, &maxsize);
377 if (len)
378 return len;
379
380 if (maxsize < NFS_FHSIZE)
381 return -EINVAL;
382 maxsize = min(maxsize, NFS3_FHSIZE);
383
384 if (qword_get(&mesg, mesg, size)>0)
385 return -EINVAL;
386
387 /* we have all the words, they are in buf.. */
388 dom = unix_domain_find(dname);
389 if (!dom)
390 return -ENOMEM;
391
392 len = exp_rootfh(netns(file), dom, path, &fh, maxsize);
393 auth_domain_put(dom);
394 if (len)
395 return len;
396
397 mesg = buf;
398 len = SIMPLE_TRANSACTION_LIMIT;
399 qword_addhex(&mesg, &len, (char*)&fh.fh_base, fh.fh_size);
400 mesg[-1] = '\n';
401 return mesg - buf;
402}
403
404/**
405 * write_threads - Start NFSD, or report the current number of running threads
406 *
407 * Input:
408 * buf: ignored
409 * size: zero
410 * Output:
411 * On success: passed-in buffer filled with '\n'-terminated C
412 * string numeric value representing the number of
413 * running NFSD threads;
414 * return code is the size in bytes of the string
415 * On error: return code is zero
416 *
417 * OR
418 *
419 * Input:
420 * buf: C string containing an unsigned
421 * integer value representing the
422 * number of NFSD threads to start
423 * size: non-zero length of C string in @buf
424 * Output:
425 * On success: NFS service is started;
426 * passed-in buffer filled with '\n'-terminated C
427 * string numeric value representing the number of
428 * running NFSD threads;
429 * return code is the size in bytes of the string
430 * On error: return code is zero or a negative errno value
431 */
432static ssize_t write_threads(struct file *file, char *buf, size_t size)
433{
434 char *mesg = buf;
435 int rv;
436 struct net *net = netns(file);
437
438 if (size > 0) {
439 int newthreads;
440 rv = get_int(&mesg, &newthreads);
441 if (rv)
442 return rv;
443 if (newthreads < 0)
444 return -EINVAL;
445 rv = nfsd_svc(newthreads, net);
446 if (rv < 0)
447 return rv;
448 } else
449 rv = nfsd_nrthreads(net);
450
451 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%d\n", rv);
452}
453
454/**
455 * write_pool_threads - Set or report the current number of threads per pool
456 *
457 * Input:
458 * buf: ignored
459 * size: zero
460 *
461 * OR
462 *
463 * Input:
464 * buf: C string containing whitespace-
465 * separated unsigned integer values
466 * representing the number of NFSD
467 * threads to start in each pool
468 * size: non-zero length of C string in @buf
469 * Output:
470 * On success: passed-in buffer filled with '\n'-terminated C
471 * string containing integer values representing the
472 * number of NFSD threads in each pool;
473 * return code is the size in bytes of the string
474 * On error: return code is zero or a negative errno value
475 */
476static ssize_t write_pool_threads(struct file *file, char *buf, size_t size)
477{
478 /* if size > 0, look for an array of number of threads per node
479 * and apply them then write out number of threads per node as reply
480 */
481 char *mesg = buf;
482 int i;
483 int rv;
484 int len;
485 int npools;
486 int *nthreads;
487 struct net *net = netns(file);
488
489 mutex_lock(&nfsd_mutex);
490 npools = nfsd_nrpools(net);
491 if (npools == 0) {
492 /*
493 * NFS is shut down. The admin can start it by
494 * writing to the threads file but NOT the pool_threads
495 * file, sorry. Report zero threads.
496 */
497 mutex_unlock(&nfsd_mutex);
498 strcpy(buf, "0\n");
499 return strlen(buf);
500 }
501
502 nthreads = kcalloc(npools, sizeof(int), GFP_KERNEL);
503 rv = -ENOMEM;
504 if (nthreads == NULL)
505 goto out_free;
506
507 if (size > 0) {
508 for (i = 0; i < npools; i++) {
509 rv = get_int(&mesg, &nthreads[i]);
510 if (rv == -ENOENT)
511 break; /* fewer numbers than pools */
512 if (rv)
513 goto out_free; /* syntax error */
514 rv = -EINVAL;
515 if (nthreads[i] < 0)
516 goto out_free;
517 }
518 rv = nfsd_set_nrthreads(i, nthreads, net);
519 if (rv)
520 goto out_free;
521 }
522
523 rv = nfsd_get_nrthreads(npools, nthreads, net);
524 if (rv)
525 goto out_free;
526
527 mesg = buf;
528 size = SIMPLE_TRANSACTION_LIMIT;
529 for (i = 0; i < npools && size > 0; i++) {
530 snprintf(mesg, size, "%d%c", nthreads[i], (i == npools-1 ? '\n' : ' '));
531 len = strlen(mesg);
532 size -= len;
533 mesg += len;
534 }
535 rv = mesg - buf;
536out_free:
537 kfree(nthreads);
538 mutex_unlock(&nfsd_mutex);
539 return rv;
540}
541
542static ssize_t __write_versions(struct file *file, char *buf, size_t size)
543{
544 char *mesg = buf;
545 char *vers, *minorp, sign;
546 int len, num, remaining;
547 unsigned minor;
548 ssize_t tlen = 0;
549 char *sep;
550 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
551
552 if (size>0) {
553 if (nn->nfsd_serv)
554 /* Cannot change versions without updating
555 * nn->nfsd_serv->sv_xdrsize, and reallocing
556 * rq_argp and rq_resp
557 */
558 return -EBUSY;
559 if (buf[size-1] != '\n')
560 return -EINVAL;
561 buf[size-1] = 0;
562
563 vers = mesg;
564 len = qword_get(&mesg, vers, size);
565 if (len <= 0) return -EINVAL;
566 do {
567 sign = *vers;
568 if (sign == '+' || sign == '-')
569 num = simple_strtol((vers+1), &minorp, 0);
570 else
571 num = simple_strtol(vers, &minorp, 0);
572 if (*minorp == '.') {
573 if (num != 4)
574 return -EINVAL;
575 minor = simple_strtoul(minorp+1, NULL, 0);
576 if (minor == 0)
577 return -EINVAL;
578 if (nfsd_minorversion(minor, sign == '-' ?
579 NFSD_CLEAR : NFSD_SET) < 0)
580 return -EINVAL;
581 goto next;
582 }
583 switch(num) {
584 case 2:
585 case 3:
586 case 4:
587 nfsd_vers(num, sign == '-' ? NFSD_CLEAR : NFSD_SET);
588 break;
589 default:
590 return -EINVAL;
591 }
592 next:
593 vers += len + 1;
594 } while ((len = qword_get(&mesg, vers, size)) > 0);
595 /* If all get turned off, turn them back on, as
596 * having no versions is BAD
597 */
598 nfsd_reset_versions();
599 }
600
601 /* Now write current state into reply buffer */
602 len = 0;
603 sep = "";
604 remaining = SIMPLE_TRANSACTION_LIMIT;
605 for (num=2 ; num <= 4 ; num++)
606 if (nfsd_vers(num, NFSD_AVAIL)) {
607 len = snprintf(buf, remaining, "%s%c%d", sep,
608 nfsd_vers(num, NFSD_TEST)?'+':'-',
609 num);
610 sep = " ";
611
612 if (len >= remaining)
613 break;
614 remaining -= len;
615 buf += len;
616 tlen += len;
617 }
618 if (nfsd_vers(4, NFSD_AVAIL))
619 for (minor = 1; minor <= NFSD_SUPPORTED_MINOR_VERSION;
620 minor++) {
621 len = snprintf(buf, remaining, " %c4.%u",
622 (nfsd_vers(4, NFSD_TEST) &&
623 nfsd_minorversion(minor, NFSD_TEST)) ?
624 '+' : '-',
625 minor);
626
627 if (len >= remaining)
628 break;
629 remaining -= len;
630 buf += len;
631 tlen += len;
632 }
633
634 len = snprintf(buf, remaining, "\n");
635 if (len >= remaining)
636 return -EINVAL;
637 return tlen + len;
638}
639
640/**
641 * write_versions - Set or report the available NFS protocol versions
642 *
643 * Input:
644 * buf: ignored
645 * size: zero
646 * Output:
647 * On success: passed-in buffer filled with '\n'-terminated C
648 * string containing positive or negative integer
649 * values representing the current status of each
650 * protocol version;
651 * return code is the size in bytes of the string
652 * On error: return code is zero or a negative errno value
653 *
654 * OR
655 *
656 * Input:
657 * buf: C string containing whitespace-
658 * separated positive or negative
659 * integer values representing NFS
660 * protocol versions to enable ("+n")
661 * or disable ("-n")
662 * size: non-zero length of C string in @buf
663 * Output:
664 * On success: status of zero or more protocol versions has
665 * been updated; passed-in buffer filled with
666 * '\n'-terminated C string containing positive
667 * or negative integer values representing the
668 * current status of each protocol version;
669 * return code is the size in bytes of the string
670 * On error: return code is zero or a negative errno value
671 */
672static ssize_t write_versions(struct file *file, char *buf, size_t size)
673{
674 ssize_t rv;
675
676 mutex_lock(&nfsd_mutex);
677 rv = __write_versions(file, buf, size);
678 mutex_unlock(&nfsd_mutex);
679 return rv;
680}
681
682/*
683 * Zero-length write. Return a list of NFSD's current listener
684 * transports.
685 */
686static ssize_t __write_ports_names(char *buf, struct net *net)
687{
688 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
689
690 if (nn->nfsd_serv == NULL)
691 return 0;
692 return svc_xprt_names(nn->nfsd_serv, buf, SIMPLE_TRANSACTION_LIMIT);
693}
694
695/*
696 * A single 'fd' number was written, in which case it must be for
697 * a socket of a supported family/protocol, and we use it as an
698 * nfsd listener.
699 */
700static ssize_t __write_ports_addfd(char *buf, struct net *net)
701{
702 char *mesg = buf;
703 int fd, err;
704 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
705
706 err = get_int(&mesg, &fd);
707 if (err != 0 || fd < 0)
708 return -EINVAL;
709
710 if (svc_alien_sock(net, fd)) {
711 printk(KERN_ERR "%s: socket net is different to NFSd's one\n", __func__);
712 return -EINVAL;
713 }
714
715 err = nfsd_create_serv(net);
716 if (err != 0)
717 return err;
718
719 err = svc_addsock(nn->nfsd_serv, fd, buf, SIMPLE_TRANSACTION_LIMIT);
720 if (err < 0) {
721 nfsd_destroy(net);
722 return err;
723 }
724
725 /* Decrease the count, but don't shut down the service */
726 nn->nfsd_serv->sv_nrthreads--;
727 return err;
728}
729
730/*
731 * A transport listener is added by writing it's transport name and
732 * a port number.
733 */
734static ssize_t __write_ports_addxprt(char *buf, struct net *net)
735{
736 char transport[16];
737 struct svc_xprt *xprt;
738 int port, err;
739 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
740
741 if (sscanf(buf, "%15s %5u", transport, &port) != 2)
742 return -EINVAL;
743
744 if (port < 1 || port > USHRT_MAX)
745 return -EINVAL;
746
747 err = nfsd_create_serv(net);
748 if (err != 0)
749 return err;
750
751 err = svc_create_xprt(nn->nfsd_serv, transport, net,
752 PF_INET, port, SVC_SOCK_ANONYMOUS);
753 if (err < 0)
754 goto out_err;
755
756 err = svc_create_xprt(nn->nfsd_serv, transport, net,
757 PF_INET6, port, SVC_SOCK_ANONYMOUS);
758 if (err < 0 && err != -EAFNOSUPPORT)
759 goto out_close;
760
761 /* Decrease the count, but don't shut down the service */
762 nn->nfsd_serv->sv_nrthreads--;
763 return 0;
764out_close:
765 xprt = svc_find_xprt(nn->nfsd_serv, transport, net, PF_INET, port);
766 if (xprt != NULL) {
767 svc_close_xprt(xprt);
768 svc_xprt_put(xprt);
769 }
770out_err:
771 nfsd_destroy(net);
772 return err;
773}
774
775static ssize_t __write_ports(struct file *file, char *buf, size_t size,
776 struct net *net)
777{
778 if (size == 0)
779 return __write_ports_names(buf, net);
780
781 if (isdigit(buf[0]))
782 return __write_ports_addfd(buf, net);
783
784 if (isalpha(buf[0]))
785 return __write_ports_addxprt(buf, net);
786
787 return -EINVAL;
788}
789
790/**
791 * write_ports - Pass a socket file descriptor or transport name to listen on
792 *
793 * Input:
794 * buf: ignored
795 * size: zero
796 * Output:
797 * On success: passed-in buffer filled with a '\n'-terminated C
798 * string containing a whitespace-separated list of
799 * named NFSD listeners;
800 * return code is the size in bytes of the string
801 * On error: return code is zero or a negative errno value
802 *
803 * OR
804 *
805 * Input:
806 * buf: C string containing an unsigned
807 * integer value representing a bound
808 * but unconnected socket that is to be
809 * used as an NFSD listener; listen(3)
810 * must be called for a SOCK_STREAM
811 * socket, otherwise it is ignored
812 * size: non-zero length of C string in @buf
813 * Output:
814 * On success: NFS service is started;
815 * passed-in buffer filled with a '\n'-terminated C
816 * string containing a unique alphanumeric name of
817 * the listener;
818 * return code is the size in bytes of the string
819 * On error: return code is a negative errno value
820 *
821 * OR
822 *
823 * Input:
824 * buf: C string containing a transport
825 * name and an unsigned integer value
826 * representing the port to listen on,
827 * separated by whitespace
828 * size: non-zero length of C string in @buf
829 * Output:
830 * On success: returns zero; NFS service is started
831 * On error: return code is a negative errno value
832 */
833static ssize_t write_ports(struct file *file, char *buf, size_t size)
834{
835 ssize_t rv;
836
837 mutex_lock(&nfsd_mutex);
838 rv = __write_ports(file, buf, size, netns(file));
839 mutex_unlock(&nfsd_mutex);
840 return rv;
841}
842
843
/*
 * Current NFS block size setting.  Updated by write_maxblksize() while
 * holding nfsd_mutex and reported back through the same node.
 * NOTE(review): not static, so presumably also read outside this file.
 */
int nfsd_max_blksize;
845
846/**
847 * write_maxblksize - Set or report the current NFS blksize
848 *
849 * Input:
850 * buf: ignored
851 * size: zero
852 *
853 * OR
854 *
855 * Input:
856 * buf: C string containing an unsigned
857 * integer value representing the new
858 * NFS blksize
859 * size: non-zero length of C string in @buf
860 * Output:
861 * On success: passed-in buffer filled with '\n'-terminated C string
862 * containing numeric value of the current NFS blksize
863 * setting;
864 * return code is the size in bytes of the string
865 * On error: return code is zero or a negative errno value
866 */
867static ssize_t write_maxblksize(struct file *file, char *buf, size_t size)
868{
869 char *mesg = buf;
870 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
871
872 if (size > 0) {
873 int bsize;
874 int rv = get_int(&mesg, &bsize);
875 if (rv)
876 return rv;
877 /* force bsize into allowed range and
878 * required alignment.
879 */
880 bsize = max_t(int, bsize, 1024);
881 bsize = min_t(int, bsize, NFSSVC_MAXBLKSIZE);
882 bsize &= ~(1024-1);
883 mutex_lock(&nfsd_mutex);
884 if (nn->nfsd_serv) {
885 mutex_unlock(&nfsd_mutex);
886 return -EBUSY;
887 }
888 nfsd_max_blksize = bsize;
889 mutex_unlock(&nfsd_mutex);
890 }
891
892 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%d\n",
893 nfsd_max_blksize);
894}
895
896/**
897 * write_maxconn - Set or report the current max number of connections
898 *
899 * Input:
900 * buf: ignored
901 * size: zero
902 * OR
903 *
904 * Input:
905 * buf: C string containing an unsigned
906 * integer value representing the new
907 * number of max connections
908 * size: non-zero length of C string in @buf
909 * Output:
910 * On success: passed-in buffer filled with '\n'-terminated C string
911 * containing numeric value of max_connections setting
912 * for this net namespace;
913 * return code is the size in bytes of the string
914 * On error: return code is zero or a negative errno value
915 */
916static ssize_t write_maxconn(struct file *file, char *buf, size_t size)
917{
918 char *mesg = buf;
919 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
920 unsigned int maxconn = nn->max_connections;
921
922 if (size > 0) {
923 int rv = get_uint(&mesg, &maxconn);
924
925 if (rv)
926 return rv;
927 nn->max_connections = maxconn;
928 }
929
930 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%u\n", maxconn);
931}
932
933#ifdef CONFIG_NFSD_V4
934static ssize_t __nfsd4_write_time(struct file *file, char *buf, size_t size,
935 time_t *time, struct nfsd_net *nn)
936{
937 char *mesg = buf;
938 int rv, i;
939
940 if (size > 0) {
941 if (nn->nfsd_serv)
942 return -EBUSY;
943 rv = get_int(&mesg, &i);
944 if (rv)
945 return rv;
946 /*
947 * Some sanity checking. We don't have a reason for
948 * these particular numbers, but problems with the
949 * extremes are:
950 * - Too short: the briefest network outage may
951 * cause clients to lose all their locks. Also,
952 * the frequent polling may be wasteful.
953 * - Too long: do you really want reboot recovery
954 * to take more than an hour? Or to make other
955 * clients wait an hour before being able to
956 * revoke a dead client's locks?
957 */
958 if (i < 10 || i > 3600)
959 return -EINVAL;
960 *time = i;
961 }
962
963 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%ld\n", *time);
964}
965
966static ssize_t nfsd4_write_time(struct file *file, char *buf, size_t size,
967 time_t *time, struct nfsd_net *nn)
968{
969 ssize_t rv;
970
971 mutex_lock(&nfsd_mutex);
972 rv = __nfsd4_write_time(file, buf, size, time, nn);
973 mutex_unlock(&nfsd_mutex);
974 return rv;
975}
976
977/**
978 * write_leasetime - Set or report the current NFSv4 lease time
979 *
980 * Input:
981 * buf: ignored
982 * size: zero
983 *
984 * OR
985 *
986 * Input:
987 * buf: C string containing an unsigned
988 * integer value representing the new
989 * NFSv4 lease expiry time
990 * size: non-zero length of C string in @buf
991 * Output:
992 * On success: passed-in buffer filled with '\n'-terminated C
993 * string containing unsigned integer value of the
994 * current lease expiry time;
995 * return code is the size in bytes of the string
996 * On error: return code is zero or a negative errno value
997 */
998static ssize_t write_leasetime(struct file *file, char *buf, size_t size)
999{
1000 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1001 return nfsd4_write_time(file, buf, size, &nn->nfsd4_lease, nn);
1002}
1003
1004/**
1005 * write_gracetime - Set or report current NFSv4 grace period time
1006 *
1007 * As above, but sets the time of the NFSv4 grace period.
1008 *
1009 * Note this should never be set to less than the *previous*
1010 * lease-period time, but we don't try to enforce this. (In the common
1011 * case (a new boot), we don't know what the previous lease time was
1012 * anyway.)
1013 */
1014static ssize_t write_gracetime(struct file *file, char *buf, size_t size)
1015{
1016 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1017 return nfsd4_write_time(file, buf, size, &nn->nfsd4_grace, nn);
1018}
1019
1020static ssize_t __write_recoverydir(struct file *file, char *buf, size_t size,
1021 struct nfsd_net *nn)
1022{
1023 char *mesg = buf;
1024 char *recdir;
1025 int len, status;
1026
1027 if (size > 0) {
1028 if (nn->nfsd_serv)
1029 return -EBUSY;
1030 if (size > PATH_MAX || buf[size-1] != '\n')
1031 return -EINVAL;
1032 buf[size-1] = 0;
1033
1034 recdir = mesg;
1035 len = qword_get(&mesg, recdir, size);
1036 if (len <= 0)
1037 return -EINVAL;
1038
1039 status = nfs4_reset_recoverydir(recdir);
1040 if (status)
1041 return status;
1042 }
1043
1044 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%s\n",
1045 nfs4_recoverydir());
1046}
1047
1048/**
1049 * write_recoverydir - Set or report the pathname of the recovery directory
1050 *
1051 * Input:
1052 * buf: ignored
1053 * size: zero
1054 *
1055 * OR
1056 *
1057 * Input:
1058 * buf: C string containing the pathname
1059 * of the directory on a local file
1060 * system containing permanent NFSv4
1061 * recovery data
1062 * size: non-zero length of C string in @buf
1063 * Output:
1064 * On success: passed-in buffer filled with '\n'-terminated C string
1065 * containing the current recovery pathname setting;
1066 * return code is the size in bytes of the string
1067 * On error: return code is zero or a negative errno value
1068 */
1069static ssize_t write_recoverydir(struct file *file, char *buf, size_t size)
1070{
1071 ssize_t rv;
1072 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1073
1074 mutex_lock(&nfsd_mutex);
1075 rv = __write_recoverydir(file, buf, size, nn);
1076 mutex_unlock(&nfsd_mutex);
1077 return rv;
1078}
1079
1080/**
1081 * write_v4_end_grace - release grace period for nfsd's v4.x lock manager
1082 *
1083 * Input:
1084 * buf: ignored
1085 * size: zero
1086 * OR
1087 *
1088 * Input:
1089 * buf: any value
1090 * size: non-zero length of C string in @buf
1091 * Output:
1092 * passed-in buffer filled with "Y" or "N" with a newline
1093 * and NULL-terminated C string. This indicates whether
1094 * the grace period has ended in the current net
1095 * namespace. Return code is the size in bytes of the
1096 * string. Writing a string that starts with 'Y', 'y', or
1097 * '1' to the file will end the grace period for nfsd's v4
1098 * lock manager.
1099 */
1100static ssize_t write_v4_end_grace(struct file *file, char *buf, size_t size)
1101{
1102 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1103
1104 if (size > 0) {
1105 switch(buf[0]) {
1106 case 'Y':
1107 case 'y':
1108 case '1':
1109 nfsd4_end_grace(nn);
1110 break;
1111 default:
1112 return -EINVAL;
1113 }
1114 }
1115
1116 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%c\n",
1117 nn->grace_ended ? 'Y' : 'N');
1118}
1119
1120#endif
1121
1122/*----------------------------------------------------------------------------*/
1123/*
1124 * populating the filesystem.
1125 */
1126
/*
 * Fill a new nfsd superblock.
 *
 * Populates @sb with the control files described by nfsd_files[] and then
 * stores the network namespace passed in @data, with a reference taken via
 * get_net(), in sb->s_fs_info.
 *
 * Returns 0 on success or the error reported by simple_fill_super().
 */
static int nfsd_fill_super(struct super_block * sb, void * data, int silent)
{
	/*
	 * One entry per control file, placed at the slot named by its
	 * NFSD_* enum value; the empty name marks the end of the table.
	 */
	static struct tree_descr nfsd_files[] = {
		[NFSD_List] = {"exports", &exports_nfsd_operations, S_IRUGO},
		[NFSD_Export_features] = {"export_features",
					&export_features_operations, S_IRUGO},
		[NFSD_FO_UnlockIP] = {"unlock_ip",
					&transaction_ops, S_IWUSR|S_IRUSR},
		[NFSD_FO_UnlockFS] = {"unlock_filesystem",
					&transaction_ops, S_IWUSR|S_IRUSR},
		[NFSD_Fh] = {"filehandle", &transaction_ops, S_IWUSR|S_IRUSR},
		[NFSD_Threads] = {"threads", &transaction_ops, S_IWUSR|S_IRUSR},
		[NFSD_Pool_Threads] = {"pool_threads", &transaction_ops, S_IWUSR|S_IRUSR},
		[NFSD_Pool_Stats] = {"pool_stats", &pool_stats_operations, S_IRUGO},
		[NFSD_Reply_Cache_Stats] = {"reply_cache_stats", &reply_cache_stats_operations, S_IRUGO},
		[NFSD_Versions] = {"versions", &transaction_ops, S_IWUSR|S_IRUSR},
		[NFSD_Ports] = {"portlist", &transaction_ops, S_IWUSR|S_IRUGO},
		[NFSD_MaxBlkSize] = {"max_block_size", &transaction_ops, S_IWUSR|S_IRUGO},
		[NFSD_MaxConnections] = {"max_connections", &transaction_ops, S_IWUSR|S_IRUGO},
#if defined(CONFIG_SUNRPC_GSS) || defined(CONFIG_SUNRPC_GSS_MODULE)
		[NFSD_SupportedEnctypes] = {"supported_krb5_enctypes", &supported_enctypes_ops, S_IRUGO},
#endif /* CONFIG_SUNRPC_GSS or CONFIG_SUNRPC_GSS_MODULE */
#ifdef CONFIG_NFSD_V4
		[NFSD_Leasetime] = {"nfsv4leasetime", &transaction_ops, S_IWUSR|S_IRUSR},
		[NFSD_Gracetime] = {"nfsv4gracetime", &transaction_ops, S_IWUSR|S_IRUSR},
		[NFSD_RecoveryDir] = {"nfsv4recoverydir", &transaction_ops, S_IWUSR|S_IRUSR},
		[NFSD_V4EndGrace] = {"v4_end_grace", &transaction_ops, S_IWUSR|S_IRUGO},
#endif
		/* last one */ {""}
	};
	struct net *net = data;
	int ret;

	/* 0x6e667364 is the filesystem magic: the ASCII bytes "nfsd". */
	ret = simple_fill_super(sb, 0x6e667364, nfsd_files);
	if (ret)
		return ret;
	/* The reference taken here is dropped by put_net() in nfsd_umount(). */
	sb->s_fs_info = get_net(net);
	return 0;
}
1166
1167static struct dentry *nfsd_mount(struct file_system_type *fs_type,
1168 int flags, const char *dev_name, void *data)
1169{
1170 return mount_ns(fs_type, flags, current->nsproxy->net_ns, nfsd_fill_super);
1171}
1172
1173static void nfsd_umount(struct super_block *sb)
1174{
1175 struct net *net = sb->s_fs_info;
1176
1177 kill_litter_super(sb);
1178 put_net(net);
1179}
1180
/*
 * Filesystem type descriptor for the "nfsd" control filesystem; it is
 * registered in init_nfsd() and unregistered in exit_nfsd().
 */
static struct file_system_type nfsd_fs_type = {
	.owner		= THIS_MODULE,
	.name		= "nfsd",
	.mount		= nfsd_mount,
	.kill_sb	= nfsd_umount,
};
MODULE_ALIAS_FS("nfsd");
1188
#ifdef CONFIG_PROC_FS
/*
 * Create the "fs/nfs" proc directory and an "exports" file inside it.
 *
 * Returns 0 on success or -ENOMEM if either entry cannot be created; the
 * directory is removed again when creating the file fails.
 */
static int create_proc_exports_entry(void)
{
	struct proc_dir_entry *dir;
	struct proc_dir_entry *exports;

	dir = proc_mkdir("fs/nfs", NULL);
	if (dir == NULL)
		return -ENOMEM;

	exports = proc_create("exports", 0, dir, &exports_proc_operations);
	if (exports != NULL)
		return 0;

	remove_proc_entry("fs/nfs", NULL);
	return -ENOMEM;
}
#else /* CONFIG_PROC_FS */
/* Without procfs there is nothing to create. */
static int create_proc_exports_entry(void)
{
	return 0;
}
#endif
1211
/*
 * Per-network-namespace data id: filled in through nfsd_net_ops.id and
 * passed to net_generic() to look up a namespace's struct nfsd_net.
 */
int nfsd_net_id;
1213
1214static __net_init int nfsd_init_net(struct net *net)
1215{
1216 int retval;
1217 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1218
1219 retval = nfsd_export_init(net);
1220 if (retval)
1221 goto out_export_error;
1222 retval = nfsd_idmap_init(net);
1223 if (retval)
1224 goto out_idmap_error;
1225 nn->nfsd4_lease = 90; /* default lease time */
1226 nn->nfsd4_grace = 90;
1227 return 0;
1228
1229out_idmap_error:
1230 nfsd_export_shutdown(net);
1231out_export_error:
1232 return retval;
1233}
1234
/*
 * Per-namespace teardown: undo nfsd_init_net() in reverse order
 * (idmap first, then exports).
 */
static __net_exit void nfsd_exit_net(struct net *net)
{
	nfsd_idmap_shutdown(net);
	nfsd_export_shutdown(net);
}
1240
/*
 * Per-network-namespace operations registered by init_nfsd(): the init and
 * exit hooks above, plus the id and size of the struct nfsd_net area.
 */
static struct pernet_operations nfsd_net_ops = {
	.init = nfsd_init_net,
	.exit = nfsd_exit_net,
	.id   = &nfsd_net_id,
	.size = sizeof(struct nfsd_net),
};
1247
/*
 * Module initialisation: bring up each nfsd subsystem in turn and finally
 * register the "nfsd" filesystem.
 *
 * If a step fails, the steps already completed are undone in reverse order
 * by falling through the out_* labels, and the error is returned.
 */
static int __init init_nfsd(void)
{
	int retval;
	printk(KERN_INFO "Installing knfsd (copyright (C) 1996 okir@monad.swb.de).\n");

	retval = register_pernet_subsys(&nfsd_net_ops);
	if (retval < 0)
		return retval;
	retval = register_cld_notifier();
	if (retval)
		goto out_unregister_pernet;
	retval = nfsd4_init_slabs();
	if (retval)
		goto out_unregister_notifier;
	retval = nfsd4_init_pnfs();
	if (retval)
		goto out_free_slabs;
	retval = nfsd_fault_inject_init(); /* nfsd fault injection controls */
	if (retval)
		goto out_exit_pnfs;
	nfsd_stat_init();	/* Statistics */
	retval = nfsd_reply_cache_init();
	if (retval)
		goto out_free_stat;
	nfsd_lockd_init();	/* lockd->nfsd callbacks */
	retval = create_proc_exports_entry();
	if (retval)
		goto out_free_lockd;
	retval = register_filesystem(&nfsd_fs_type);
	if (retval)
		goto out_free_all;
	return 0;
out_free_all:
	remove_proc_entry("fs/nfs/exports", NULL);
	remove_proc_entry("fs/nfs", NULL);
out_free_lockd:
	/* Undoes both nfsd_lockd_init() and nfsd_reply_cache_init(). */
	nfsd_lockd_shutdown();
	nfsd_reply_cache_shutdown();
out_free_stat:
	/* Undoes both nfsd_stat_init() and nfsd_fault_inject_init(). */
	nfsd_stat_shutdown();
	nfsd_fault_inject_cleanup();
out_exit_pnfs:
	nfsd4_exit_pnfs();
out_free_slabs:
	nfsd4_free_slabs();
out_unregister_notifier:
	unregister_cld_notifier();
out_unregister_pernet:
	unregister_pernet_subsys(&nfsd_net_ops);
	return retval;
}
1299
/*
 * Module exit: shut down everything init_nfsd() set up, ending with the
 * filesystem, the cld notifier and the per-namespace operations.
 */
static void __exit exit_nfsd(void)
{
	nfsd_reply_cache_shutdown();
	remove_proc_entry("fs/nfs/exports", NULL);
	remove_proc_entry("fs/nfs", NULL);
	nfsd_stat_shutdown();
	nfsd_lockd_shutdown();
	nfsd4_free_slabs();
	nfsd4_exit_pnfs();
	nfsd_fault_inject_cleanup();
	unregister_filesystem(&nfsd_fs_type);
	unregister_cld_notifier();
	unregister_pernet_subsys(&nfsd_net_ops);
}
1314
/* Module metadata and entry/exit points. */
MODULE_AUTHOR("Olaf Kirch <okir@monad.swb.de>");
MODULE_LICENSE("GPL");
module_init(init_nfsd)
module_exit(exit_nfsd)
1// SPDX-License-Identifier: GPL-2.0-only
2/*
3 * Syscall interface to knfsd.
4 *
5 * Copyright (C) 1995, 1996 Olaf Kirch <okir@monad.swb.de>
6 */
7
8#include <linux/slab.h>
9#include <linux/namei.h>
10#include <linux/ctype.h>
11#include <linux/fs_context.h>
12
13#include <linux/sunrpc/svcsock.h>
14#include <linux/lockd/lockd.h>
15#include <linux/sunrpc/addr.h>
16#include <linux/sunrpc/gss_api.h>
17#include <linux/sunrpc/gss_krb5_enctypes.h>
18#include <linux/sunrpc/rpc_pipe_fs.h>
19#include <linux/module.h>
20#include <linux/fsnotify.h>
21
22#include "idmap.h"
23#include "nfsd.h"
24#include "cache.h"
25#include "state.h"
26#include "netns.h"
27#include "pnfs.h"
28
29/*
30 * We have a single directory with several nodes in it.
31 */
/*
 * Identifiers for the control files. nfsctl_transaction_write() uses a
 * file's inode number as an index into write_op[], which is laid out with
 * these same values.
 */
enum {
	NFSD_Root = 1,
	NFSD_List,
	NFSD_Export_features,
	NFSD_Fh,
	NFSD_FO_UnlockIP,
	NFSD_FO_UnlockFS,
	NFSD_Threads,
	NFSD_Pool_Threads,
	NFSD_Pool_Stats,
	NFSD_Reply_Cache_Stats,
	NFSD_Versions,
	NFSD_Ports,
	NFSD_MaxBlkSize,
	NFSD_MaxConnections,
	NFSD_SupportedEnctypes,
	/*
	 * The below MUST come last.  Otherwise we leave a hole in nfsd_files[]
	 * with !CONFIG_NFSD_V4 and simple_fill_super() goes oops
	 */
#ifdef CONFIG_NFSD_V4
	NFSD_Leasetime,
	NFSD_Gracetime,
	NFSD_RecoveryDir,
	NFSD_V4EndGrace,
#endif
	/* One past the last identifier above; its users are not in this section. */
	NFSD_MaxReserved
};
60
/*
 * write() for these nodes.
 *
 * Each handler is reached through write_op[] and receives the transaction
 * buffer together with the number of bytes written. It returns the length
 * of the reply it left in the buffer, or a negative errno.
 */
static ssize_t write_filehandle(struct file *file, char *buf, size_t size);
static ssize_t write_unlock_ip(struct file *file, char *buf, size_t size);
static ssize_t write_unlock_fs(struct file *file, char *buf, size_t size);
static ssize_t write_threads(struct file *file, char *buf, size_t size);
static ssize_t write_pool_threads(struct file *file, char *buf, size_t size);
static ssize_t write_versions(struct file *file, char *buf, size_t size);
static ssize_t write_ports(struct file *file, char *buf, size_t size);
static ssize_t write_maxblksize(struct file *file, char *buf, size_t size);
static ssize_t write_maxconn(struct file *file, char *buf, size_t size);
#ifdef CONFIG_NFSD_V4
static ssize_t write_leasetime(struct file *file, char *buf, size_t size);
static ssize_t write_gracetime(struct file *file, char *buf, size_t size);
static ssize_t write_recoverydir(struct file *file, char *buf, size_t size);
static ssize_t write_v4_end_grace(struct file *file, char *buf, size_t size);
#endif
79
/*
 * Dispatch table from NFSD_* file identifier to write handler. Slots with
 * no handler stay NULL and are rejected by nfsctl_transaction_write().
 */
static ssize_t (*const write_op[])(struct file *, char *, size_t) = {
	[NFSD_Fh] = write_filehandle,
	[NFSD_FO_UnlockIP] = write_unlock_ip,
	[NFSD_FO_UnlockFS] = write_unlock_fs,
	[NFSD_Threads] = write_threads,
	[NFSD_Pool_Threads] = write_pool_threads,
	[NFSD_Versions] = write_versions,
	[NFSD_Ports] = write_ports,
	[NFSD_MaxBlkSize] = write_maxblksize,
	[NFSD_MaxConnections] = write_maxconn,
#ifdef CONFIG_NFSD_V4
	[NFSD_Leasetime] = write_leasetime,
	[NFSD_Gracetime] = write_gracetime,
	[NFSD_RecoveryDir] = write_recoverydir,
	[NFSD_V4EndGrace] = write_v4_end_grace,
#endif
};
97
98static ssize_t nfsctl_transaction_write(struct file *file, const char __user *buf, size_t size, loff_t *pos)
99{
100 ino_t ino = file_inode(file)->i_ino;
101 char *data;
102 ssize_t rv;
103
104 if (ino >= ARRAY_SIZE(write_op) || !write_op[ino])
105 return -EINVAL;
106
107 data = simple_transaction_get(file, buf, size);
108 if (IS_ERR(data))
109 return PTR_ERR(data);
110
111 rv = write_op[ino](file, data, size);
112 if (rv >= 0) {
113 simple_transaction_set(file, rv);
114 rv = size;
115 }
116 return rv;
117}
118
119static ssize_t nfsctl_transaction_read(struct file *file, char __user *buf, size_t size, loff_t *pos)
120{
121 if (! file->private_data) {
122 /* An attempt to read a transaction file without writing
123 * causes a 0-byte write so that the file can return
124 * state information
125 */
126 ssize_t rv = nfsctl_transaction_write(file, buf, 0, pos);
127 if (rv < 0)
128 return rv;
129 }
130 return simple_transaction_read(file, buf, size, pos);
131}
132
/*
 * File operations shared by all write-then-read control files: writes are
 * dispatched to the per-file handler, reads return the handler's reply.
 */
static const struct file_operations transaction_ops = {
	.write		= nfsctl_transaction_write,
	.read		= nfsctl_transaction_read,
	.release	= simple_transaction_release,
	.llseek		= default_llseek,
};
139
140static int exports_net_open(struct net *net, struct file *file)
141{
142 int err;
143 struct seq_file *seq;
144 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
145
146 err = seq_open(file, &nfs_exports_op);
147 if (err)
148 return err;
149
150 seq = file->private_data;
151 seq->private = nn->svc_export_cache;
152 return 0;
153}
154
155static int exports_proc_open(struct inode *inode, struct file *file)
156{
157 return exports_net_open(current->nsproxy->net_ns, file);
158}
159
/* seq_file operations for the exports list, opened via exports_proc_open(). */
static const struct file_operations exports_proc_operations = {
	.open		= exports_proc_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= seq_release,
};
166
167static int exports_nfsd_open(struct inode *inode, struct file *file)
168{
169 return exports_net_open(inode->i_sb->s_fs_info, file);
170}
171
/* seq_file operations for the exports list, opened via exports_nfsd_open(). */
static const struct file_operations exports_nfsd_operations = {
	.open		= exports_nfsd_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= seq_release,
};
178
179static int export_features_show(struct seq_file *m, void *v)
180{
181 seq_printf(m, "0x%x 0x%x\n", NFSEXP_ALLFLAGS, NFSEXP_SECINFO_FLAGS);
182 return 0;
183}
184
185static int export_features_open(struct inode *inode, struct file *file)
186{
187 return single_open(file, export_features_show, NULL);
188}
189
/* Read-only single-record seq_file operations for the export features file. */
static const struct file_operations export_features_operations = {
	.open		= export_features_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= single_release,
};
196
197#if defined(CONFIG_SUNRPC_GSS) || defined(CONFIG_SUNRPC_GSS_MODULE)
198static int supported_enctypes_show(struct seq_file *m, void *v)
199{
200 seq_printf(m, KRB5_SUPPORTED_ENCTYPES);
201 return 0;
202}
203
204static int supported_enctypes_open(struct inode *inode, struct file *file)
205{
206 return single_open(file, supported_enctypes_show, NULL);
207}
208
/* Read-only single-record seq_file operations for the supported enctypes file. */
static const struct file_operations supported_enctypes_ops = {
	.open		= supported_enctypes_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= single_release,
};
215#endif /* CONFIG_SUNRPC_GSS or CONFIG_SUNRPC_GSS_MODULE */
216
/*
 * seq_file operations for the pool statistics file; the open and release
 * callbacks are defined outside this section.
 */
static const struct file_operations pool_stats_operations = {
	.open		= nfsd_pool_stats_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= nfsd_pool_stats_release,
};
223
/*
 * seq_file operations for the reply cache statistics file; the open
 * callback is defined outside this section.
 */
static const struct file_operations reply_cache_stats_operations = {
	.open		= nfsd_reply_cache_stats_open,
	.read		= seq_read,
	.llseek		= seq_lseek,
	.release	= single_release,
};
230
231/*----------------------------------------------------------------------------*/
232/*
233 * payload - write methods
234 */
235
236static inline struct net *netns(struct file *file)
237{
238 return file_inode(file)->i_sb->s_fs_info;
239}
240
241/**
242 * write_unlock_ip - Release all locks used by a client
243 *
244 * Experimental.
245 *
246 * Input:
247 * buf: '\n'-terminated C string containing a
248 * presentation format IP address
249 * size: length of C string in @buf
250 * Output:
251 * On success: returns zero if all specified locks were released;
252 * returns one if one or more locks were not released
253 * On error: return code is negative errno value
254 */
255static ssize_t write_unlock_ip(struct file *file, char *buf, size_t size)
256{
257 struct sockaddr_storage address;
258 struct sockaddr *sap = (struct sockaddr *)&address;
259 size_t salen = sizeof(address);
260 char *fo_path;
261 struct net *net = netns(file);
262
263 /* sanity check */
264 if (size == 0)
265 return -EINVAL;
266
267 if (buf[size-1] != '\n')
268 return -EINVAL;
269
270 fo_path = buf;
271 if (qword_get(&buf, fo_path, size) < 0)
272 return -EINVAL;
273
274 if (rpc_pton(net, fo_path, size, sap, salen) == 0)
275 return -EINVAL;
276
277 return nlmsvc_unlock_all_by_ip(sap);
278}
279
280/**
281 * write_unlock_fs - Release all locks on a local file system
282 *
283 * Experimental.
284 *
285 * Input:
286 * buf: '\n'-terminated C string containing the
287 * absolute pathname of a local file system
288 * size: length of C string in @buf
289 * Output:
290 * On success: returns zero if all specified locks were released;
291 * returns one if one or more locks were not released
292 * On error: return code is negative errno value
293 */
294static ssize_t write_unlock_fs(struct file *file, char *buf, size_t size)
295{
296 struct path path;
297 char *fo_path;
298 int error;
299
300 /* sanity check */
301 if (size == 0)
302 return -EINVAL;
303
304 if (buf[size-1] != '\n')
305 return -EINVAL;
306
307 fo_path = buf;
308 if (qword_get(&buf, fo_path, size) < 0)
309 return -EINVAL;
310
311 error = kern_path(fo_path, 0, &path);
312 if (error)
313 return error;
314
315 /*
316 * XXX: Needs better sanity checking. Otherwise we could end up
317 * releasing locks on the wrong file system.
318 *
319 * For example:
320 * 1. Does the path refer to a directory?
321 * 2. Is that directory a mount point, or
322 * 3. Is that directory the root of an exported file system?
323 */
324 error = nlmsvc_unlock_all_by_sb(path.dentry->d_sb);
325
326 path_put(&path);
327 return error;
328}
329
330/**
331 * write_filehandle - Get a variable-length NFS file handle by path
332 *
333 * On input, the buffer contains a '\n'-terminated C string comprised of
334 * three alphanumeric words separated by whitespace. The string may
335 * contain escape sequences.
336 *
337 * Input:
338 * buf:
339 * domain: client domain name
340 * path: export pathname
341 * maxsize: numeric maximum size of
342 * @buf
343 * size: length of C string in @buf
344 * Output:
 *	On success:	passed-in buffer filled with '\n'-terminated C
 *			string containing an ASCII hex text version
 *			of the NFS file handle;
348 * return code is the size in bytes of the string
349 * On error: return code is negative errno value
350 */
static ssize_t write_filehandle(struct file *file, char *buf, size_t size)
{
	char *dname, *path;
	int uninitialized_var(maxsize);
	char *mesg = buf;
	int len;
	struct auth_domain *dom;
	struct knfsd_fh fh;

	if (size == 0)
		return -EINVAL;

	/* Require the trailing newline, then turn it into a NUL terminator. */
	if (buf[size-1] != '\n')
		return -EINVAL;
	buf[size-1] = 0;

	/*
	 * The words are extracted in place, back to front in the same
	 * buffer: the domain name lands at the start of buf.
	 * NOTE(review): assumes qword_get() returns the extracted word's
	 * length and NUL-terminates it -- confirm against its definition.
	 */
	dname = mesg;
	len = qword_get(&mesg, dname, size);
	if (len <= 0)
		return -EINVAL;

	/* The path is stored just past the domain name and its terminator. */
	path = dname+len+1;
	len = qword_get(&mesg, path, size);
	if (len <= 0)
		return -EINVAL;

	len = get_int(&mesg, &maxsize);
	if (len)
		return len;

	/* Refuse sizes below NFS_FHSIZE and cap the request at NFS3_FHSIZE. */
	if (maxsize < NFS_FHSIZE)
		return -EINVAL;
	maxsize = min(maxsize, NFS3_FHSIZE);

	/* Anything left after the three expected words is an error. */
	if (qword_get(&mesg, mesg, size)>0)
		return -EINVAL;

	/* we have all the words, they are in buf.. */
	dom = unix_domain_find(dname);
	if (!dom)
		return -ENOMEM;

	len = exp_rootfh(netns(file), dom, path, &fh, maxsize);
	auth_domain_put(dom);
	if (len)
		return len;

	/* Reuse buf for the reply: the file handle as hex text. */
	mesg = buf;
	len = SIMPLE_TRANSACTION_LIMIT;
	qword_addhex(&mesg, &len, (char*)&fh.fh_base, fh.fh_size);
	/*
	 * NOTE(review): presumably qword_addhex() leaves a separator as the
	 * last byte written; it is overwritten with the newline here.
	 */
	mesg[-1] = '\n';
	return mesg - buf;
}
404
405/**
406 * write_threads - Start NFSD, or report the current number of running threads
407 *
408 * Input:
409 * buf: ignored
410 * size: zero
411 * Output:
412 * On success: passed-in buffer filled with '\n'-terminated C
413 * string numeric value representing the number of
414 * running NFSD threads;
415 * return code is the size in bytes of the string
416 * On error: return code is zero
417 *
418 * OR
419 *
420 * Input:
421 * buf: C string containing an unsigned
422 * integer value representing the
423 * number of NFSD threads to start
424 * size: non-zero length of C string in @buf
425 * Output:
426 * On success: NFS service is started;
427 * passed-in buffer filled with '\n'-terminated C
428 * string numeric value representing the number of
429 * running NFSD threads;
430 * return code is the size in bytes of the string
431 * On error: return code is zero or a negative errno value
432 */
433static ssize_t write_threads(struct file *file, char *buf, size_t size)
434{
435 char *mesg = buf;
436 int rv;
437 struct net *net = netns(file);
438
439 if (size > 0) {
440 int newthreads;
441 rv = get_int(&mesg, &newthreads);
442 if (rv)
443 return rv;
444 if (newthreads < 0)
445 return -EINVAL;
446 rv = nfsd_svc(newthreads, net, file->f_cred);
447 if (rv < 0)
448 return rv;
449 } else
450 rv = nfsd_nrthreads(net);
451
452 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%d\n", rv);
453}
454
455/**
456 * write_pool_threads - Set or report the current number of threads per pool
457 *
458 * Input:
459 * buf: ignored
460 * size: zero
461 *
462 * OR
463 *
464 * Input:
465 * buf: C string containing whitespace-
466 * separated unsigned integer values
467 * representing the number of NFSD
468 * threads to start in each pool
469 * size: non-zero length of C string in @buf
470 * Output:
471 * On success: passed-in buffer filled with '\n'-terminated C
472 * string containing integer values representing the
473 * number of NFSD threads in each pool;
474 * return code is the size in bytes of the string
475 * On error: return code is zero or a negative errno value
476 */
static ssize_t write_pool_threads(struct file *file, char *buf, size_t size)
{
	/* if size > 0, look for an array of number of threads per node
	 * and apply them  then write out number of threads per node as reply
	 */
	char *mesg = buf;
	int i;
	int rv;
	int len;
	int npools;
	int *nthreads;
	struct net *net = netns(file);

	/* nfsd_mutex is held from here until the function returns. */
	mutex_lock(&nfsd_mutex);
	npools = nfsd_nrpools(net);
	if (npools == 0) {
		/*
		 * NFS is shut down.  The admin can start it by
		 * writing to the threads file but NOT the pool_threads
		 * file, sorry.  Report zero threads.
		 */
		mutex_unlock(&nfsd_mutex);
		strcpy(buf, "0\n");
		return strlen(buf);
	}

	/* One zero-initialised slot per pool. */
	nthreads = kcalloc(npools, sizeof(int), GFP_KERNEL);
	rv = -ENOMEM;
	if (nthreads == NULL)
		goto out_free;

	if (size > 0) {
		for (i = 0; i < npools; i++) {
			rv = get_int(&mesg, &nthreads[i]);
			if (rv == -ENOENT)
				break;		/* fewer numbers than pools */
			if (rv)
				goto out_free;	/* syntax error */
			rv = -EINVAL;
			if (nthreads[i] < 0)
				goto out_free;
		}
		/* Only the first i values, those actually parsed, are applied. */
		rv = nfsd_set_nrthreads(i, nthreads, net);
		if (rv)
			goto out_free;
	}

	/* Read the per-pool counts back for the reply. */
	rv = nfsd_get_nrthreads(npools, nthreads, net);
	if (rv)
		goto out_free;

	/* Format the counts space-separated, ending the last with a newline. */
	mesg = buf;
	size = SIMPLE_TRANSACTION_LIMIT;
	for (i = 0; i < npools && size > 0; i++) {
		snprintf(mesg, size, "%d%c", nthreads[i], (i == npools-1 ? '\n' : ' '));
		len = strlen(mesg);
		size -= len;
		mesg += len;
	}
	rv = mesg - buf;
out_free:
	/* Shared exit for success and failure; nthreads may be NULL here. */
	kfree(nthreads);
	mutex_unlock(&nfsd_mutex);
	return rv;
}
542
543static ssize_t
544nfsd_print_version_support(struct nfsd_net *nn, char *buf, int remaining,
545 const char *sep, unsigned vers, int minor)
546{
547 const char *format = minor < 0 ? "%s%c%u" : "%s%c%u.%u";
548 bool supported = !!nfsd_vers(nn, vers, NFSD_TEST);
549
550 if (vers == 4 && minor >= 0 &&
551 !nfsd_minorversion(nn, minor, NFSD_TEST))
552 supported = false;
553 if (minor == 0 && supported)
554 /*
555 * special case for backward compatability.
556 * +4.0 is never reported, it is implied by
557 * +4, unless -4.0 is present.
558 */
559 return 0;
560 return snprintf(buf, remaining, format, sep,
561 supported ? '+' : '-', vers, minor);
562}
563
/*
 * Worker for write_versions(), which calls it with nfsd_mutex held.
 *
 * With @size > 0, parse whitespace-separated "[+-]N[.M]" tokens from @buf
 * and apply them. In every case, finish by writing the current version
 * state into @buf. Returns the reply length or a negative errno.
 */
static ssize_t __write_versions(struct file *file, char *buf, size_t size)
{
	char *mesg = buf;
	char *vers, *minorp, sign;
	int len, num, remaining;
	ssize_t tlen = 0;
	char *sep;
	struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);

	if (size>0) {
		if (nn->nfsd_serv)
			/* Cannot change versions without updating
			 * nn->nfsd_serv->sv_xdrsize, and reallocing
			 * rq_argp and rq_resp
			 */
			return -EBUSY;
		/* Require the trailing newline, then turn it into a NUL. */
		if (buf[size-1] != '\n')
			return -EINVAL;
		buf[size-1] = 0;

		vers = mesg;
		len = qword_get(&mesg, vers, size);
		if (len <= 0) return -EINVAL;
		do {
			enum vers_op cmd;
			unsigned minor;
			/* An optional leading sign; no sign is treated like '+'. */
			sign = *vers;
			if (sign == '+' || sign == '-')
				num = simple_strtol((vers+1), &minorp, 0);
			else
				num = simple_strtol(vers, &minorp, 0);
			/* A ".M" suffix is only accepted on major version 4. */
			if (*minorp == '.') {
				if (num != 4)
					return -EINVAL;
				if (kstrtouint(minorp+1, 0, &minor) < 0)
					return -EINVAL;
			}

			cmd = sign == '-' ? NFSD_CLEAR : NFSD_SET;
			switch(num) {
			case 2:
			case 3:
				nfsd_vers(nn, num, cmd);
				break;
			case 4:
				if (*minorp == '.') {
					if (nfsd_minorversion(nn, minor, cmd) < 0)
						return -EINVAL;
				} else if ((cmd == NFSD_SET) != nfsd_vers(nn, num, NFSD_TEST)) {
					/*
					 * Either we have +4 and no minors are enabled,
					 * or we have -4 and at least one minor is enabled.
					 * In either case, propagate 'cmd' to all minors.
					 */
					minor = 0;
					while (nfsd_minorversion(nn, minor, cmd) >= 0)
						minor++;
				}
				break;
			default:
				return -EINVAL;
			}
			/* The next word is extracted just past this one. */
			vers += len + 1;
		} while ((len = qword_get(&mesg, vers, size)) > 0);
		/* If all get turned off, turn them back on, as
		 * having no versions is BAD
		 */
		nfsd_reset_versions(nn);
	}

	/* Now write current state into reply buffer */
	len = 0;
	sep = "";
	remaining = SIMPLE_TRANSACTION_LIMIT;
	for (num=2 ; num <= 4 ; num++) {
		int minor;
		if (!nfsd_vers(nn, num, NFSD_AVAIL))
			continue;

		/* minor == -1 prints the major version; v4 then lists each minor. */
		minor = -1;
		do {
			len = nfsd_print_version_support(nn, buf, remaining,
					sep, num, minor);
			/* Stop emitting once a token no longer fits. */
			if (len >= remaining)
				goto out;
			remaining -= len;
			buf += len;
			tlen += len;
			minor++;
			/* Separate tokens with a space once one has been written. */
			if (len)
				sep = " ";
		} while (num == 4 && minor <= NFSD_SUPPORTED_MINOR_VERSION);
	}
out:
	len = snprintf(buf, remaining, "\n");
	if (len >= remaining)
		return -EINVAL;
	return tlen + len;
}
663
664/**
665 * write_versions - Set or report the available NFS protocol versions
666 *
667 * Input:
668 * buf: ignored
669 * size: zero
670 * Output:
671 * On success: passed-in buffer filled with '\n'-terminated C
672 * string containing positive or negative integer
673 * values representing the current status of each
674 * protocol version;
675 * return code is the size in bytes of the string
676 * On error: return code is zero or a negative errno value
677 *
678 * OR
679 *
680 * Input:
681 * buf: C string containing whitespace-
682 * separated positive or negative
683 * integer values representing NFS
684 * protocol versions to enable ("+n")
685 * or disable ("-n")
686 * size: non-zero length of C string in @buf
687 * Output:
688 * On success: status of zero or more protocol versions has
689 * been updated; passed-in buffer filled with
690 * '\n'-terminated C string containing positive
691 * or negative integer values representing the
692 * current status of each protocol version;
693 * return code is the size in bytes of the string
694 * On error: return code is zero or a negative errno value
695 */
696static ssize_t write_versions(struct file *file, char *buf, size_t size)
697{
698 ssize_t rv;
699
700 mutex_lock(&nfsd_mutex);
701 rv = __write_versions(file, buf, size);
702 mutex_unlock(&nfsd_mutex);
703 return rv;
704}
705
706/*
707 * Zero-length write. Return a list of NFSD's current listener
708 * transports.
709 */
710static ssize_t __write_ports_names(char *buf, struct net *net)
711{
712 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
713
714 if (nn->nfsd_serv == NULL)
715 return 0;
716 return svc_xprt_names(nn->nfsd_serv, buf, SIMPLE_TRANSACTION_LIMIT);
717}
718
719/*
720 * A single 'fd' number was written, in which case it must be for
721 * a socket of a supported family/protocol, and we use it as an
722 * nfsd listener.
723 */
724static ssize_t __write_ports_addfd(char *buf, struct net *net, const struct cred *cred)
725{
726 char *mesg = buf;
727 int fd, err;
728 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
729
730 err = get_int(&mesg, &fd);
731 if (err != 0 || fd < 0)
732 return -EINVAL;
733
734 if (svc_alien_sock(net, fd)) {
735 printk(KERN_ERR "%s: socket net is different to NFSd's one\n", __func__);
736 return -EINVAL;
737 }
738
739 err = nfsd_create_serv(net);
740 if (err != 0)
741 return err;
742
743 err = svc_addsock(nn->nfsd_serv, fd, buf, SIMPLE_TRANSACTION_LIMIT, cred);
744 if (err < 0) {
745 nfsd_destroy(net);
746 return err;
747 }
748
749 /* Decrease the count, but don't shut down the service */
750 nn->nfsd_serv->sv_nrthreads--;
751 return err;
752}
753
754/*
755 * A transport listener is added by writing it's transport name and
756 * a port number.
757 */
758static ssize_t __write_ports_addxprt(char *buf, struct net *net, const struct cred *cred)
759{
760 char transport[16];
761 struct svc_xprt *xprt;
762 int port, err;
763 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
764
765 if (sscanf(buf, "%15s %5u", transport, &port) != 2)
766 return -EINVAL;
767
768 if (port < 1 || port > USHRT_MAX)
769 return -EINVAL;
770
771 err = nfsd_create_serv(net);
772 if (err != 0)
773 return err;
774
775 err = svc_create_xprt(nn->nfsd_serv, transport, net,
776 PF_INET, port, SVC_SOCK_ANONYMOUS, cred);
777 if (err < 0)
778 goto out_err;
779
780 err = svc_create_xprt(nn->nfsd_serv, transport, net,
781 PF_INET6, port, SVC_SOCK_ANONYMOUS, cred);
782 if (err < 0 && err != -EAFNOSUPPORT)
783 goto out_close;
784
785 /* Decrease the count, but don't shut down the service */
786 nn->nfsd_serv->sv_nrthreads--;
787 return 0;
788out_close:
789 xprt = svc_find_xprt(nn->nfsd_serv, transport, net, PF_INET, port);
790 if (xprt != NULL) {
791 svc_close_xprt(xprt);
792 svc_xprt_put(xprt);
793 }
794out_err:
795 nfsd_destroy(net);
796 return err;
797}
798
799static ssize_t __write_ports(struct file *file, char *buf, size_t size,
800 struct net *net)
801{
802 if (size == 0)
803 return __write_ports_names(buf, net);
804
805 if (isdigit(buf[0]))
806 return __write_ports_addfd(buf, net, file->f_cred);
807
808 if (isalpha(buf[0]))
809 return __write_ports_addxprt(buf, net, file->f_cred);
810
811 return -EINVAL;
812}
813
814/**
815 * write_ports - Pass a socket file descriptor or transport name to listen on
816 *
817 * Input:
818 * buf: ignored
819 * size: zero
820 * Output:
821 * On success: passed-in buffer filled with a '\n'-terminated C
822 * string containing a whitespace-separated list of
823 * named NFSD listeners;
824 * return code is the size in bytes of the string
825 * On error: return code is zero or a negative errno value
826 *
827 * OR
828 *
829 * Input:
830 * buf: C string containing an unsigned
831 * integer value representing a bound
832 * but unconnected socket that is to be
833 * used as an NFSD listener; listen(3)
834 * must be called for a SOCK_STREAM
835 * socket, otherwise it is ignored
836 * size: non-zero length of C string in @buf
837 * Output:
838 * On success: NFS service is started;
839 * passed-in buffer filled with a '\n'-terminated C
840 * string containing a unique alphanumeric name of
841 * the listener;
842 * return code is the size in bytes of the string
843 * On error: return code is a negative errno value
844 *
845 * OR
846 *
847 * Input:
848 * buf: C string containing a transport
849 * name and an unsigned integer value
850 * representing the port to listen on,
851 * separated by whitespace
852 * size: non-zero length of C string in @buf
853 * Output:
854 * On success: returns zero; NFS service is started
855 * On error: return code is a negative errno value
856 */
857static ssize_t write_ports(struct file *file, char *buf, size_t size)
858{
859 ssize_t rv;
860
861 mutex_lock(&nfsd_mutex);
862 rv = __write_ports(file, buf, size, netns(file));
863 mutex_unlock(&nfsd_mutex);
864 return rv;
865}
866
867
/*
 * Current maximum block size. write_maxblksize() sets it under nfsd_mutex
 * after clamping the value to [1024, NFSSVC_MAXBLKSIZE] and rounding it
 * down to a multiple of 1024.
 */
int nfsd_max_blksize;
869
870/**
871 * write_maxblksize - Set or report the current NFS blksize
872 *
873 * Input:
874 * buf: ignored
875 * size: zero
876 *
877 * OR
878 *
879 * Input:
880 * buf: C string containing an unsigned
881 * integer value representing the new
882 * NFS blksize
883 * size: non-zero length of C string in @buf
884 * Output:
885 * On success: passed-in buffer filled with '\n'-terminated C string
886 * containing numeric value of the current NFS blksize
887 * setting;
888 * return code is the size in bytes of the string
889 * On error: return code is zero or a negative errno value
890 */
891static ssize_t write_maxblksize(struct file *file, char *buf, size_t size)
892{
893 char *mesg = buf;
894 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
895
896 if (size > 0) {
897 int bsize;
898 int rv = get_int(&mesg, &bsize);
899 if (rv)
900 return rv;
901 /* force bsize into allowed range and
902 * required alignment.
903 */
904 bsize = max_t(int, bsize, 1024);
905 bsize = min_t(int, bsize, NFSSVC_MAXBLKSIZE);
906 bsize &= ~(1024-1);
907 mutex_lock(&nfsd_mutex);
908 if (nn->nfsd_serv) {
909 mutex_unlock(&nfsd_mutex);
910 return -EBUSY;
911 }
912 nfsd_max_blksize = bsize;
913 mutex_unlock(&nfsd_mutex);
914 }
915
916 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%d\n",
917 nfsd_max_blksize);
918}
919
920/**
921 * write_maxconn - Set or report the current max number of connections
922 *
923 * Input:
924 * buf: ignored
925 * size: zero
926 * OR
927 *
928 * Input:
929 * buf: C string containing an unsigned
930 * integer value representing the new
931 * number of max connections
932 * size: non-zero length of C string in @buf
933 * Output:
934 * On success: passed-in buffer filled with '\n'-terminated C string
935 * containing numeric value of max_connections setting
936 * for this net namespace;
937 * return code is the size in bytes of the string
938 * On error: return code is zero or a negative errno value
939 */
940static ssize_t write_maxconn(struct file *file, char *buf, size_t size)
941{
942 char *mesg = buf;
943 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
944 unsigned int maxconn = nn->max_connections;
945
946 if (size > 0) {
947 int rv = get_uint(&mesg, &maxconn);
948
949 if (rv)
950 return rv;
951 nn->max_connections = maxconn;
952 }
953
954 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%u\n", maxconn);
955}
956
957#ifdef CONFIG_NFSD_V4
958static ssize_t __nfsd4_write_time(struct file *file, char *buf, size_t size,
959 time_t *time, struct nfsd_net *nn)
960{
961 char *mesg = buf;
962 int rv, i;
963
964 if (size > 0) {
965 if (nn->nfsd_serv)
966 return -EBUSY;
967 rv = get_int(&mesg, &i);
968 if (rv)
969 return rv;
970 /*
971 * Some sanity checking. We don't have a reason for
972 * these particular numbers, but problems with the
973 * extremes are:
974 * - Too short: the briefest network outage may
975 * cause clients to lose all their locks. Also,
976 * the frequent polling may be wasteful.
977 * - Too long: do you really want reboot recovery
978 * to take more than an hour? Or to make other
979 * clients wait an hour before being able to
980 * revoke a dead client's locks?
981 */
982 if (i < 10 || i > 3600)
983 return -EINVAL;
984 *time = i;
985 }
986
987 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%ld\n", *time);
988}
989
990static ssize_t nfsd4_write_time(struct file *file, char *buf, size_t size,
991 time_t *time, struct nfsd_net *nn)
992{
993 ssize_t rv;
994
995 mutex_lock(&nfsd_mutex);
996 rv = __nfsd4_write_time(file, buf, size, time, nn);
997 mutex_unlock(&nfsd_mutex);
998 return rv;
999}
1000
1001/**
1002 * write_leasetime - Set or report the current NFSv4 lease time
1003 *
1004 * Input:
1005 * buf: ignored
1006 * size: zero
1007 *
1008 * OR
1009 *
1010 * Input:
1011 * buf: C string containing an unsigned
1012 * integer value representing the new
1013 * NFSv4 lease expiry time
1014 * size: non-zero length of C string in @buf
1015 * Output:
1016 * On success: passed-in buffer filled with '\n'-terminated C
1017 * string containing unsigned integer value of the
1018 * current lease expiry time;
1019 * return code is the size in bytes of the string
1020 * On error: return code is zero or a negative errno value
1021 */
1022static ssize_t write_leasetime(struct file *file, char *buf, size_t size)
1023{
1024 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1025 return nfsd4_write_time(file, buf, size, &nn->nfsd4_lease, nn);
1026}
1027
1028/**
1029 * write_gracetime - Set or report current NFSv4 grace period time
1030 *
1031 * As above, but sets the time of the NFSv4 grace period.
1032 *
1033 * Note this should never be set to less than the *previous*
1034 * lease-period time, but we don't try to enforce this. (In the common
1035 * case (a new boot), we don't know what the previous lease time was
1036 * anyway.)
1037 */
1038static ssize_t write_gracetime(struct file *file, char *buf, size_t size)
1039{
1040 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1041 return nfsd4_write_time(file, buf, size, &nn->nfsd4_grace, nn);
1042}
1043
1044static ssize_t __write_recoverydir(struct file *file, char *buf, size_t size,
1045 struct nfsd_net *nn)
1046{
1047 char *mesg = buf;
1048 char *recdir;
1049 int len, status;
1050
1051 if (size > 0) {
1052 if (nn->nfsd_serv)
1053 return -EBUSY;
1054 if (size > PATH_MAX || buf[size-1] != '\n')
1055 return -EINVAL;
1056 buf[size-1] = 0;
1057
1058 recdir = mesg;
1059 len = qword_get(&mesg, recdir, size);
1060 if (len <= 0)
1061 return -EINVAL;
1062
1063 status = nfs4_reset_recoverydir(recdir);
1064 if (status)
1065 return status;
1066 }
1067
1068 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%s\n",
1069 nfs4_recoverydir());
1070}
1071
1072/**
1073 * write_recoverydir - Set or report the pathname of the recovery directory
1074 *
1075 * Input:
1076 * buf: ignored
1077 * size: zero
1078 *
1079 * OR
1080 *
1081 * Input:
1082 * buf: C string containing the pathname
1083 * of the directory on a local file
1084 * system containing permanent NFSv4
1085 * recovery data
1086 * size: non-zero length of C string in @buf
1087 * Output:
1088 * On success: passed-in buffer filled with '\n'-terminated C string
1089 * containing the current recovery pathname setting;
1090 * return code is the size in bytes of the string
1091 * On error: return code is zero or a negative errno value
1092 */
1093static ssize_t write_recoverydir(struct file *file, char *buf, size_t size)
1094{
1095 ssize_t rv;
1096 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1097
1098 mutex_lock(&nfsd_mutex);
1099 rv = __write_recoverydir(file, buf, size, nn);
1100 mutex_unlock(&nfsd_mutex);
1101 return rv;
1102}
1103
1104/**
1105 * write_v4_end_grace - release grace period for nfsd's v4.x lock manager
1106 *
1107 * Input:
1108 * buf: ignored
1109 * size: zero
1110 * OR
1111 *
1112 * Input:
1113 * buf: any value
1114 * size: non-zero length of C string in @buf
1115 * Output:
1116 * passed-in buffer filled with "Y" or "N" with a newline
1117 * and NULL-terminated C string. This indicates whether
1118 * the grace period has ended in the current net
1119 * namespace. Return code is the size in bytes of the
1120 * string. Writing a string that starts with 'Y', 'y', or
1121 * '1' to the file will end the grace period for nfsd's v4
1122 * lock manager.
1123 */
1124static ssize_t write_v4_end_grace(struct file *file, char *buf, size_t size)
1125{
1126 struct nfsd_net *nn = net_generic(netns(file), nfsd_net_id);
1127
1128 if (size > 0) {
1129 switch(buf[0]) {
1130 case 'Y':
1131 case 'y':
1132 case '1':
1133 if (!nn->nfsd_serv)
1134 return -EBUSY;
1135 nfsd4_end_grace(nn);
1136 break;
1137 default:
1138 return -EINVAL;
1139 }
1140 }
1141
1142 return scnprintf(buf, SIMPLE_TRANSACTION_LIMIT, "%c\n",
1143 nn->grace_ended ? 'Y' : 'N');
1144}
1145
1146#endif
1147
1148/*----------------------------------------------------------------------------*/
1149/*
1150 * populating the filesystem.
1151 */
1152
1153/* Basically copying rpc_get_inode. */
1154static struct inode *nfsd_get_inode(struct super_block *sb, umode_t mode)
1155{
1156 struct inode *inode = new_inode(sb);
1157 if (!inode)
1158 return NULL;
1159 /* Following advice from simple_fill_super documentation: */
1160 inode->i_ino = iunique(sb, NFSD_MaxReserved);
1161 inode->i_mode = mode;
1162 inode->i_atime = inode->i_mtime = inode->i_ctime = current_time(inode);
1163 switch (mode & S_IFMT) {
1164 case S_IFDIR:
1165 inode->i_fop = &simple_dir_operations;
1166 inode->i_op = &simple_dir_inode_operations;
1167 inc_nlink(inode);
1168 default:
1169 break;
1170 }
1171 return inode;
1172}
1173
1174static int __nfsd_mkdir(struct inode *dir, struct dentry *dentry, umode_t mode, struct nfsdfs_client *ncl)
1175{
1176 struct inode *inode;
1177
1178 inode = nfsd_get_inode(dir->i_sb, mode);
1179 if (!inode)
1180 return -ENOMEM;
1181 if (ncl) {
1182 inode->i_private = ncl;
1183 kref_get(&ncl->cl_ref);
1184 }
1185 d_add(dentry, inode);
1186 inc_nlink(dir);
1187 fsnotify_mkdir(dir, dentry);
1188 return 0;
1189}
1190
1191static struct dentry *nfsd_mkdir(struct dentry *parent, struct nfsdfs_client *ncl, char *name)
1192{
1193 struct inode *dir = parent->d_inode;
1194 struct dentry *dentry;
1195 int ret = -ENOMEM;
1196
1197 inode_lock(dir);
1198 dentry = d_alloc_name(parent, name);
1199 if (!dentry)
1200 goto out_err;
1201 ret = __nfsd_mkdir(d_inode(parent), dentry, S_IFDIR | 0600, ncl);
1202 if (ret)
1203 goto out_err;
1204out:
1205 inode_unlock(dir);
1206 return dentry;
1207out_err:
1208 dput(dentry);
1209 dentry = ERR_PTR(ret);
1210 goto out;
1211}
1212
1213static void clear_ncl(struct inode *inode)
1214{
1215 struct nfsdfs_client *ncl = inode->i_private;
1216
1217 inode->i_private = NULL;
1218 kref_put(&ncl->cl_ref, ncl->cl_release);
1219}
1220
1221static struct nfsdfs_client *__get_nfsdfs_client(struct inode *inode)
1222{
1223 struct nfsdfs_client *nc = inode->i_private;
1224
1225 if (nc)
1226 kref_get(&nc->cl_ref);
1227 return nc;
1228}
1229
/*
 * Locked variant of __get_nfsdfs_client(): the lookup is done with @inode's
 * lock held in shared mode.  Returns a referenced client or NULL.
 */
struct nfsdfs_client *get_nfsdfs_client(struct inode *inode)
{
	struct nfsdfs_client *client;

	inode_lock_shared(inode);
	client = __get_nfsdfs_client(inode);
	inode_unlock_shared(inode);

	return client;
}
/*
 * Remove one file from directory @dir (from __rpc_unlink).
 *
 * The client reference held by the file's inode is dropped first; the
 * dentry is then pinned across simple_unlink()/d_delete() and released
 * afterwards.  A failing simple_unlink() only triggers a one-time warning.
 */
static void nfsdfs_remove_file(struct inode *dir, struct dentry *dentry)
{
	int err;

	clear_ncl(d_inode(dentry));

	dget(dentry);
	err = simple_unlink(dir, dentry);
	d_delete(dentry);
	dput(dentry);

	WARN_ON_ONCE(err);
}
1251
1252static void nfsdfs_remove_files(struct dentry *root)
1253{
1254 struct dentry *dentry, *tmp;
1255
1256 list_for_each_entry_safe(dentry, tmp, &root->d_subdirs, d_child) {
1257 if (!simple_positive(dentry)) {
1258 WARN_ON_ONCE(1); /* I think this can't happen? */
1259 continue;
1260 }
1261 nfsdfs_remove_file(d_inode(root), dentry);
1262 }
1263}
1264
1265/* XXX: cut'n'paste from simple_fill_super; figure out if we could share
1266 * code instead. */
1267static int nfsdfs_create_files(struct dentry *root,
1268 const struct tree_descr *files)
1269{
1270 struct inode *dir = d_inode(root);
1271 struct inode *inode;
1272 struct dentry *dentry;
1273 int i;
1274
1275 inode_lock(dir);
1276 for (i = 0; files->name && files->name[0]; i++, files++) {
1277 if (!files->name)
1278 continue;
1279 dentry = d_alloc_name(root, files->name);
1280 if (!dentry)
1281 goto out;
1282 inode = nfsd_get_inode(d_inode(root)->i_sb,
1283 S_IFREG | files->mode);
1284 if (!inode) {
1285 dput(dentry);
1286 goto out;
1287 }
1288 inode->i_fop = files->ops;
1289 inode->i_private = __get_nfsdfs_client(dir);
1290 d_add(dentry, inode);
1291 fsnotify_create(dir, dentry);
1292 }
1293 inode_unlock(dir);
1294 return 0;
1295out:
1296 nfsdfs_remove_files(root);
1297 inode_unlock(dir);
1298 return -ENOMEM;
1299}
1300
1301/* on success, returns positive number unique to that client. */
1302struct dentry *nfsd_client_mkdir(struct nfsd_net *nn,
1303 struct nfsdfs_client *ncl, u32 id,
1304 const struct tree_descr *files)
1305{
1306 struct dentry *dentry;
1307 char name[11];
1308 int ret;
1309
1310 sprintf(name, "%u", id);
1311
1312 dentry = nfsd_mkdir(nn->nfsd_client_dir, ncl, name);
1313 if (IS_ERR(dentry)) /* XXX: tossing errors? */
1314 return NULL;
1315 ret = nfsdfs_create_files(dentry, files);
1316 if (ret) {
1317 nfsd_client_rmdir(dentry);
1318 return NULL;
1319 }
1320 return dentry;
1321}
1322
1323/* Taken from __rpc_rmdir: */
1324void nfsd_client_rmdir(struct dentry *dentry)
1325{
1326 struct inode *dir = d_inode(dentry->d_parent);
1327 struct inode *inode = d_inode(dentry);
1328 int ret;
1329
1330 inode_lock(dir);
1331 nfsdfs_remove_files(dentry);
1332 clear_ncl(inode);
1333 dget(dentry);
1334 ret = simple_rmdir(dir, dentry);
1335 WARN_ON_ONCE(ret);
1336 d_delete(dentry);
1337 inode_unlock(dir);
1338}
1339
1340static int nfsd_fill_super(struct super_block *sb, struct fs_context *fc)
1341{
1342 struct nfsd_net *nn = net_generic(current->nsproxy->net_ns,
1343 nfsd_net_id);
1344 struct dentry *dentry;
1345 int ret;
1346
1347 static const struct tree_descr nfsd_files[] = {
1348 [NFSD_List] = {"exports", &exports_nfsd_operations, S_IRUGO},
1349 [NFSD_Export_features] = {"export_features",
1350 &export_features_operations, S_IRUGO},
1351 [NFSD_FO_UnlockIP] = {"unlock_ip",
1352 &transaction_ops, S_IWUSR|S_IRUSR},
1353 [NFSD_FO_UnlockFS] = {"unlock_filesystem",
1354 &transaction_ops, S_IWUSR|S_IRUSR},
1355 [NFSD_Fh] = {"filehandle", &transaction_ops, S_IWUSR|S_IRUSR},
1356 [NFSD_Threads] = {"threads", &transaction_ops, S_IWUSR|S_IRUSR},
1357 [NFSD_Pool_Threads] = {"pool_threads", &transaction_ops, S_IWUSR|S_IRUSR},
1358 [NFSD_Pool_Stats] = {"pool_stats", &pool_stats_operations, S_IRUGO},
1359 [NFSD_Reply_Cache_Stats] = {"reply_cache_stats", &reply_cache_stats_operations, S_IRUGO},
1360 [NFSD_Versions] = {"versions", &transaction_ops, S_IWUSR|S_IRUSR},
1361 [NFSD_Ports] = {"portlist", &transaction_ops, S_IWUSR|S_IRUGO},
1362 [NFSD_MaxBlkSize] = {"max_block_size", &transaction_ops, S_IWUSR|S_IRUGO},
1363 [NFSD_MaxConnections] = {"max_connections", &transaction_ops, S_IWUSR|S_IRUGO},
1364#if defined(CONFIG_SUNRPC_GSS) || defined(CONFIG_SUNRPC_GSS_MODULE)
1365 [NFSD_SupportedEnctypes] = {"supported_krb5_enctypes", &supported_enctypes_ops, S_IRUGO},
1366#endif /* CONFIG_SUNRPC_GSS or CONFIG_SUNRPC_GSS_MODULE */
1367#ifdef CONFIG_NFSD_V4
1368 [NFSD_Leasetime] = {"nfsv4leasetime", &transaction_ops, S_IWUSR|S_IRUSR},
1369 [NFSD_Gracetime] = {"nfsv4gracetime", &transaction_ops, S_IWUSR|S_IRUSR},
1370 [NFSD_RecoveryDir] = {"nfsv4recoverydir", &transaction_ops, S_IWUSR|S_IRUSR},
1371 [NFSD_V4EndGrace] = {"v4_end_grace", &transaction_ops, S_IWUSR|S_IRUGO},
1372#endif
1373 /* last one */ {""}
1374 };
1375
1376 ret = simple_fill_super(sb, 0x6e667364, nfsd_files);
1377 if (ret)
1378 return ret;
1379 dentry = nfsd_mkdir(sb->s_root, NULL, "clients");
1380 if (IS_ERR(dentry))
1381 return PTR_ERR(dentry);
1382 nn->nfsd_client_dir = dentry;
1383 return 0;
1384}
1385
1386static int nfsd_fs_get_tree(struct fs_context *fc)
1387{
1388 return get_tree_keyed(fc, nfsd_fill_super, get_net(fc->net_ns));
1389}
1390
1391static void nfsd_fs_free_fc(struct fs_context *fc)
1392{
1393 if (fc->s_fs_info)
1394 put_net(fc->s_fs_info);
1395}
1396
1397static const struct fs_context_operations nfsd_fs_context_ops = {
1398 .free = nfsd_fs_free_fc,
1399 .get_tree = nfsd_fs_get_tree,
1400};
1401
1402static int nfsd_init_fs_context(struct fs_context *fc)
1403{
1404 put_user_ns(fc->user_ns);
1405 fc->user_ns = get_user_ns(fc->net_ns->user_ns);
1406 fc->ops = &nfsd_fs_context_ops;
1407 return 0;
1408}
1409
1410static void nfsd_umount(struct super_block *sb)
1411{
1412 struct net *net = sb->s_fs_info;
1413
1414 kill_litter_super(sb);
1415 put_net(net);
1416}
1417
1418static struct file_system_type nfsd_fs_type = {
1419 .owner = THIS_MODULE,
1420 .name = "nfsd",
1421 .init_fs_context = nfsd_init_fs_context,
1422 .kill_sb = nfsd_umount,
1423};
1424MODULE_ALIAS_FS("nfsd");
1425
#ifdef CONFIG_PROC_FS
/*
 * Create the "fs/nfs" proc directory and the "exports" entry inside it.
 * Returns 0 on success or -ENOMEM; on failure to create "exports" the
 * directory is removed again.
 */
static int create_proc_exports_entry(void)
{
	struct proc_dir_entry *dir;
	struct proc_dir_entry *exports;

	dir = proc_mkdir("fs/nfs", NULL);
	if (!dir)
		return -ENOMEM;

	exports = proc_create("exports", 0, dir, &exports_proc_operations);
	if (exports)
		return 0;

	remove_proc_entry("fs/nfs", NULL);
	return -ENOMEM;
}
#else /* CONFIG_PROC_FS */
/* Without procfs there is nothing to create. */
static int create_proc_exports_entry(void)
{
	return 0;
}
#endif
1448
/*
 * Per-net-namespace id of nfsd: its address is handed to the pernet
 * subsystem through nfsd_net_ops.id, and its value is passed to
 * net_generic() to find a namespace's struct nfsd_net.
 */
unsigned int nfsd_net_id;
1450
1451static __net_init int nfsd_init_net(struct net *net)
1452{
1453 int retval;
1454 struct vfsmount *mnt;
1455 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1456
1457 retval = nfsd_export_init(net);
1458 if (retval)
1459 goto out_export_error;
1460 retval = nfsd_idmap_init(net);
1461 if (retval)
1462 goto out_idmap_error;
1463 nn->nfsd_versions = NULL;
1464 nn->nfsd4_minorversions = NULL;
1465 retval = nfsd_reply_cache_init(nn);
1466 if (retval)
1467 goto out_drc_error;
1468 nn->nfsd4_lease = 90; /* default lease time */
1469 nn->nfsd4_grace = 90;
1470 nn->somebody_reclaimed = false;
1471 nn->track_reclaim_completes = false;
1472 nn->clverifier_counter = prandom_u32();
1473 nn->clientid_base = prandom_u32();
1474 nn->clientid_counter = nn->clientid_base + 1;
1475 nn->s2s_cp_cl_id = nn->clientid_counter++;
1476
1477 atomic_set(&nn->ntf_refcnt, 0);
1478 init_waitqueue_head(&nn->ntf_wq);
1479 seqlock_init(&nn->boot_lock);
1480
1481 mnt = vfs_kern_mount(&nfsd_fs_type, SB_KERNMOUNT, "nfsd", NULL);
1482 if (IS_ERR(mnt)) {
1483 retval = PTR_ERR(mnt);
1484 goto out_mount_err;
1485 }
1486 nn->nfsd_mnt = mnt;
1487 return 0;
1488
1489out_mount_err:
1490 nfsd_reply_cache_shutdown(nn);
1491out_drc_error:
1492 nfsd_idmap_shutdown(net);
1493out_idmap_error:
1494 nfsd_export_shutdown(net);
1495out_export_error:
1496 return retval;
1497}
1498
1499static __net_exit void nfsd_exit_net(struct net *net)
1500{
1501 struct nfsd_net *nn = net_generic(net, nfsd_net_id);
1502
1503 mntput(nn->nfsd_mnt);
1504 nfsd_reply_cache_shutdown(nn);
1505 nfsd_idmap_shutdown(net);
1506 nfsd_export_shutdown(net);
1507 nfsd_netns_free_versions(net_generic(net, nfsd_net_id));
1508}
1509
1510static struct pernet_operations nfsd_net_ops = {
1511 .init = nfsd_init_net,
1512 .exit = nfsd_exit_net,
1513 .id = &nfsd_net_id,
1514 .size = sizeof(struct nfsd_net),
1515};
1516
1517static int __init init_nfsd(void)
1518{
1519 int retval;
1520 printk(KERN_INFO "Installing knfsd (copyright (C) 1996 okir@monad.swb.de).\n");
1521
1522 retval = register_pernet_subsys(&nfsd_net_ops);
1523 if (retval < 0)
1524 return retval;
1525 retval = register_cld_notifier();
1526 if (retval)
1527 goto out_unregister_pernet;
1528 retval = nfsd4_init_slabs();
1529 if (retval)
1530 goto out_unregister_notifier;
1531 retval = nfsd4_init_pnfs();
1532 if (retval)
1533 goto out_free_slabs;
1534 nfsd_fault_inject_init(); /* nfsd fault injection controls */
1535 nfsd_stat_init(); /* Statistics */
1536 nfsd_lockd_init(); /* lockd->nfsd callbacks */
1537 retval = create_proc_exports_entry();
1538 if (retval)
1539 goto out_free_lockd;
1540 retval = register_filesystem(&nfsd_fs_type);
1541 if (retval)
1542 goto out_free_all;
1543 return 0;
1544out_free_all:
1545 remove_proc_entry("fs/nfs/exports", NULL);
1546 remove_proc_entry("fs/nfs", NULL);
1547out_free_lockd:
1548 nfsd_lockd_shutdown();
1549 nfsd_stat_shutdown();
1550 nfsd_fault_inject_cleanup();
1551 nfsd4_exit_pnfs();
1552out_free_slabs:
1553 nfsd4_free_slabs();
1554out_unregister_notifier:
1555 unregister_cld_notifier();
1556out_unregister_pernet:
1557 unregister_pernet_subsys(&nfsd_net_ops);
1558 return retval;
1559}
1560
1561static void __exit exit_nfsd(void)
1562{
1563 remove_proc_entry("fs/nfs/exports", NULL);
1564 remove_proc_entry("fs/nfs", NULL);
1565 nfsd_stat_shutdown();
1566 nfsd_lockd_shutdown();
1567 nfsd4_free_slabs();
1568 nfsd4_exit_pnfs();
1569 nfsd_fault_inject_cleanup();
1570 unregister_filesystem(&nfsd_fs_type);
1571 unregister_cld_notifier();
1572 unregister_pernet_subsys(&nfsd_net_ops);
1573}
1574
1575MODULE_AUTHOR("Olaf Kirch <okir@monad.swb.de>");
1576MODULE_LICENSE("GPL");
1577module_init(init_nfsd)
1578module_exit(exit_nfsd)