Linux Audio

Check our new training course

Loading...
v3.5.6
  1/*
  2 * Central processing for nfsd.
  3 *
  4 * Authors:	Olaf Kirch (okir@monad.swb.de)
  5 *
  6 * Copyright (C) 1995, 1996, 1997 Olaf Kirch <okir@monad.swb.de>
  7 */
  8
  9#include <linux/sched.h>
 10#include <linux/freezer.h>
 11#include <linux/module.h>
 12#include <linux/fs_struct.h>
 13#include <linux/swap.h>
 14#include <linux/nsproxy.h>
 15
 16#include <linux/sunrpc/stats.h>
 17#include <linux/sunrpc/svcsock.h>
 18#include <linux/lockd/bind.h>
 19#include <linux/nfsacl.h>
 20#include <linux/seq_file.h>
 21#include <net/net_namespace.h>
 22#include "nfsd.h"
 23#include "cache.h"
 24#include "vfs.h"
 25
 26#define NFSDDBG_FACILITY	NFSDDBG_SVC
 27
 28extern struct svc_program	nfsd_program;
 29static int			nfsd(void *vrqstp);
 30struct timeval			nfssvc_boot;
 31
 32/*
 33 * nfsd_mutex protects nfsd_serv -- both the pointer itself and the members
 34 * of the svc_serv struct. In particular, ->sv_nrthreads but also to some
 35 * extent ->sv_temp_socks and ->sv_permsocks. It also protects nfsdstats.th_cnt
 36 *
 37 * If (out side the lock) nfsd_serv is non-NULL, then it must point to a
 38 * properly initialised 'struct svc_serv' with ->sv_nrthreads > 0. That number
 39 * of nfsd threads must exist and each must listed in ->sp_all_threads in each
 40 * entry of ->sv_pools[].
 41 *
 42 * Transitions of the thread count between zero and non-zero are of particular
 43 * interest since the svc_serv needs to be created and initialized at that
 44 * point, or freed.
 45 *
 46 * Finally, the nfsd_mutex also protects some of the global variables that are
 47 * accessed when nfsd starts and that are settable via the write_* routines in
 48 * nfsctl.c. In particular:
 49 *
 50 *	user_recovery_dirname
 51 *	user_lease_time
 52 *	nfsd_versions
 53 */
 54DEFINE_MUTEX(nfsd_mutex);
 55struct svc_serv 		*nfsd_serv;
 56
 57/*
 58 * nfsd_drc_lock protects nfsd_drc_max_pages and nfsd_drc_pages_used.
 59 * nfsd_drc_max_pages limits the total amount of memory available for
 60 * version 4.1 DRC caches.
 61 * nfsd_drc_pages_used tracks the current version 4.1 DRC memory usage.
 62 */
 63spinlock_t	nfsd_drc_lock;
 64unsigned int	nfsd_drc_max_mem;
 65unsigned int	nfsd_drc_mem_used;
 66
 67#if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
 68static struct svc_stat	nfsd_acl_svcstats;
 69static struct svc_version *	nfsd_acl_version[] = {
 70	[2] = &nfsd_acl_version2,
 71	[3] = &nfsd_acl_version3,
 72};
 73
 74#define NFSD_ACL_MINVERS            2
 75#define NFSD_ACL_NRVERS		ARRAY_SIZE(nfsd_acl_version)
 76static struct svc_version *nfsd_acl_versions[NFSD_ACL_NRVERS];
 77
 78static struct svc_program	nfsd_acl_program = {
 79	.pg_prog		= NFS_ACL_PROGRAM,
 80	.pg_nvers		= NFSD_ACL_NRVERS,
 81	.pg_vers		= nfsd_acl_versions,
 82	.pg_name		= "nfsacl",
 83	.pg_class		= "nfsd",
 84	.pg_stats		= &nfsd_acl_svcstats,
 85	.pg_authenticate	= &svc_set_client,
 86};
 87
 88static struct svc_stat	nfsd_acl_svcstats = {
 89	.program	= &nfsd_acl_program,
 90};
 91#endif /* defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL) */
 92
 93static struct svc_version *	nfsd_version[] = {
 94	[2] = &nfsd_version2,
 95#if defined(CONFIG_NFSD_V3)
 96	[3] = &nfsd_version3,
 97#endif
 98#if defined(CONFIG_NFSD_V4)
 99	[4] = &nfsd_version4,
100#endif
101};
102
103#define NFSD_MINVERS    	2
104#define NFSD_NRVERS		ARRAY_SIZE(nfsd_version)
105static struct svc_version *nfsd_versions[NFSD_NRVERS];
106
107struct svc_program		nfsd_program = {
108#if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
109	.pg_next		= &nfsd_acl_program,
110#endif
111	.pg_prog		= NFS_PROGRAM,		/* program number */
112	.pg_nvers		= NFSD_NRVERS,		/* nr of entries in nfsd_version */
113	.pg_vers		= nfsd_versions,	/* version table */
114	.pg_name		= "nfsd",		/* program name */
115	.pg_class		= "nfsd",		/* authentication class */
116	.pg_stats		= &nfsd_svcstats,	/* version table */
117	.pg_authenticate	= &svc_set_client,	/* export authentication */
118
119};
120
121u32 nfsd_supported_minorversion;
122
123int nfsd_vers(int vers, enum vers_op change)
124{
125	if (vers < NFSD_MINVERS || vers >= NFSD_NRVERS)
126		return 0;
127	switch(change) {
128	case NFSD_SET:
129		nfsd_versions[vers] = nfsd_version[vers];
130#if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
131		if (vers < NFSD_ACL_NRVERS)
132			nfsd_acl_versions[vers] = nfsd_acl_version[vers];
133#endif
134		break;
135	case NFSD_CLEAR:
136		nfsd_versions[vers] = NULL;
137#if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
138		if (vers < NFSD_ACL_NRVERS)
139			nfsd_acl_versions[vers] = NULL;
140#endif
141		break;
142	case NFSD_TEST:
143		return nfsd_versions[vers] != NULL;
144	case NFSD_AVAIL:
145		return nfsd_version[vers] != NULL;
146	}
147	return 0;
148}
149
150int nfsd_minorversion(u32 minorversion, enum vers_op change)
151{
152	if (minorversion > NFSD_SUPPORTED_MINOR_VERSION)
153		return -1;
154	switch(change) {
155	case NFSD_SET:
156		nfsd_supported_minorversion = minorversion;
157		break;
158	case NFSD_CLEAR:
159		if (minorversion == 0)
160			return -1;
161		nfsd_supported_minorversion = minorversion - 1;
162		break;
163	case NFSD_TEST:
164		return minorversion <= nfsd_supported_minorversion;
165	case NFSD_AVAIL:
166		return minorversion <= NFSD_SUPPORTED_MINOR_VERSION;
167	}
168	return 0;
169}
170
171/*
172 * Maximum number of nfsd processes
173 */
174#define	NFSD_MAXSERVS		8192
175
176int nfsd_nrthreads(void)
177{
178	int rv = 0;
179	mutex_lock(&nfsd_mutex);
180	if (nfsd_serv)
181		rv = nfsd_serv->sv_nrthreads;
182	mutex_unlock(&nfsd_mutex);
183	return rv;
184}
185
186static int nfsd_init_socks(int port)
187{
188	int error;
189	if (!list_empty(&nfsd_serv->sv_permsocks))
190		return 0;
191
192	error = svc_create_xprt(nfsd_serv, "udp", &init_net, PF_INET, port,
193					SVC_SOCK_DEFAULTS);
194	if (error < 0)
195		return error;
196
197	error = svc_create_xprt(nfsd_serv, "tcp", &init_net, PF_INET, port,
198					SVC_SOCK_DEFAULTS);
199	if (error < 0)
200		return error;
201
202	return 0;
203}
204
205static bool nfsd_up = false;
206
207static int nfsd_startup(unsigned short port, int nrservs)
208{
209	int ret;
210
211	if (nfsd_up)
212		return 0;
213	/*
214	 * Readahead param cache - will no-op if it already exists.
215	 * (Note therefore results will be suboptimal if number of
216	 * threads is modified after nfsd start.)
217	 */
218	ret = nfsd_racache_init(2*nrservs);
219	if (ret)
220		return ret;
221	ret = nfsd_init_socks(port);
222	if (ret)
223		goto out_racache;
224	ret = lockd_up(&init_net);
225	if (ret)
226		goto out_racache;
227	ret = nfs4_state_start();
228	if (ret)
229		goto out_lockd;
230	nfsd_up = true;
231	return 0;
232out_lockd:
233	lockd_down(&init_net);
234out_racache:
235	nfsd_racache_shutdown();
236	return ret;
237}
238
239static void nfsd_shutdown(void)
240{
241	/*
242	 * write_ports can create the server without actually starting
243	 * any threads--if we get shut down before any threads are
244	 * started, then nfsd_last_thread will be run before any of this
245	 * other initialization has been done.
246	 */
247	if (!nfsd_up)
248		return;
249	nfs4_state_shutdown();
250	lockd_down(&init_net);
251	nfsd_racache_shutdown();
252	nfsd_up = false;
253}
254
255static void nfsd_last_thread(struct svc_serv *serv, struct net *net)
256{
 
 
257	nfsd_shutdown();
258
259	svc_rpcb_cleanup(serv, net);
260
261	printk(KERN_WARNING "nfsd: last server has exited, flushing export "
262			    "cache\n");
263	nfsd_export_flush(net);
264}
265
266void nfsd_reset_versions(void)
267{
268	int found_one = 0;
269	int i;
270
271	for (i = NFSD_MINVERS; i < NFSD_NRVERS; i++) {
272		if (nfsd_program.pg_vers[i])
273			found_one = 1;
274	}
275
276	if (!found_one) {
277		for (i = NFSD_MINVERS; i < NFSD_NRVERS; i++)
278			nfsd_program.pg_vers[i] = nfsd_version[i];
279#if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
280		for (i = NFSD_ACL_MINVERS; i < NFSD_ACL_NRVERS; i++)
281			nfsd_acl_program.pg_vers[i] =
282				nfsd_acl_version[i];
283#endif
284	}
285}
286
287/*
288 * Each session guarantees a negotiated per slot memory cache for replies
289 * which in turn consumes memory beyond the v2/v3/v4.0 server. A dedicated
290 * NFSv4.1 server might want to use more memory for a DRC than a machine
291 * with mutiple services.
292 *
293 * Impose a hard limit on the number of pages for the DRC which varies
294 * according to the machines free pages. This is of course only a default.
295 *
296 * For now this is a #defined shift which could be under admin control
297 * in the future.
298 */
299static void set_max_drc(void)
300{
301	#define NFSD_DRC_SIZE_SHIFT	10
302	nfsd_drc_max_mem = (nr_free_buffer_pages()
303					>> NFSD_DRC_SIZE_SHIFT) * PAGE_SIZE;
304	nfsd_drc_mem_used = 0;
305	spin_lock_init(&nfsd_drc_lock);
306	dprintk("%s nfsd_drc_max_mem %u \n", __func__, nfsd_drc_max_mem);
307}
308
309static int nfsd_get_default_max_blksize(void)
310{
311	struct sysinfo i;
312	unsigned long long target;
313	unsigned long ret;
314
315	si_meminfo(&i);
316	target = (i.totalram - i.totalhigh) << PAGE_SHIFT;
317	/*
318	 * Aim for 1/4096 of memory per thread This gives 1MB on 4Gig
319	 * machines, but only uses 32K on 128M machines.  Bottom out at
320	 * 8K on 32M and smaller.  Of course, this is only a default.
321	 */
322	target >>= 12;
323
324	ret = NFSSVC_MAXBLKSIZE;
325	while (ret > target && ret >= 8*1024*2)
326		ret /= 2;
327	return ret;
328}
329
330int nfsd_create_serv(void)
331{
332	int error;
333	struct net *net = current->nsproxy->net_ns;
334
335	WARN_ON(!mutex_is_locked(&nfsd_mutex));
336	if (nfsd_serv) {
337		svc_get(nfsd_serv);
338		return 0;
339	}
340	if (nfsd_max_blksize == 0)
341		nfsd_max_blksize = nfsd_get_default_max_blksize();
 
 
 
 
 
 
 
 
 
 
 
 
 
 
342	nfsd_reset_versions();
 
343	nfsd_serv = svc_create_pooled(&nfsd_program, nfsd_max_blksize,
344				      nfsd_last_thread, nfsd, THIS_MODULE);
345	if (nfsd_serv == NULL)
346		return -ENOMEM;
347
348	error = svc_bind(nfsd_serv, net);
349	if (error < 0) {
350		svc_destroy(nfsd_serv);
351		return error;
352	}
353
354	set_max_drc();
355	do_gettimeofday(&nfssvc_boot);		/* record boot time */
356	return 0;
357}
358
359int nfsd_nrpools(void)
360{
361	if (nfsd_serv == NULL)
362		return 0;
363	else
364		return nfsd_serv->sv_nrpools;
365}
366
367int nfsd_get_nrthreads(int n, int *nthreads)
368{
369	int i = 0;
370
371	if (nfsd_serv != NULL) {
372		for (i = 0; i < nfsd_serv->sv_nrpools && i < n; i++)
373			nthreads[i] = nfsd_serv->sv_pools[i].sp_nrthreads;
374	}
375
376	return 0;
377}
378
379int nfsd_set_nrthreads(int n, int *nthreads)
380{
381	int i = 0;
382	int tot = 0;
383	int err = 0;
384	struct net *net = &init_net;
385
386	WARN_ON(!mutex_is_locked(&nfsd_mutex));
387
388	if (nfsd_serv == NULL || n <= 0)
389		return 0;
390
391	if (n > nfsd_serv->sv_nrpools)
392		n = nfsd_serv->sv_nrpools;
393
394	/* enforce a global maximum number of threads */
395	tot = 0;
396	for (i = 0; i < n; i++) {
397		if (nthreads[i] > NFSD_MAXSERVS)
398			nthreads[i] = NFSD_MAXSERVS;
399		tot += nthreads[i];
400	}
401	if (tot > NFSD_MAXSERVS) {
402		/* total too large: scale down requested numbers */
403		for (i = 0; i < n && tot > 0; i++) {
404		    	int new = nthreads[i] * NFSD_MAXSERVS / tot;
405			tot -= (nthreads[i] - new);
406			nthreads[i] = new;
407		}
408		for (i = 0; i < n && tot > 0; i++) {
409			nthreads[i]--;
410			tot--;
411		}
412	}
413
414	/*
415	 * There must always be a thread in pool 0; the admin
416	 * can't shut down NFS completely using pool_threads.
417	 */
418	if (nthreads[0] == 0)
419		nthreads[0] = 1;
420
421	/* apply the new numbers */
422	svc_get(nfsd_serv);
423	for (i = 0; i < n; i++) {
424		err = svc_set_num_threads(nfsd_serv, &nfsd_serv->sv_pools[i],
425				    	  nthreads[i]);
426		if (err)
427			break;
428	}
429	nfsd_destroy(net);
 
430	return err;
431}
432
433/*
434 * Adjust the number of threads and return the new number of threads.
435 * This is also the function that starts the server if necessary, if
436 * this is the first time nrservs is nonzero.
437 */
438int
439nfsd_svc(unsigned short port, int nrservs)
440{
441	int	error;
442	bool	nfsd_up_before;
443	struct net *net = &init_net;
444
445	mutex_lock(&nfsd_mutex);
446	dprintk("nfsd: creating service\n");
447	if (nrservs <= 0)
448		nrservs = 0;
449	if (nrservs > NFSD_MAXSERVS)
450		nrservs = NFSD_MAXSERVS;
451	error = 0;
452	if (nrservs == 0 && nfsd_serv == NULL)
453		goto out;
454
455	error = nfsd_create_serv();
456	if (error)
457		goto out;
458
459	nfsd_up_before = nfsd_up;
460
461	error = nfsd_startup(port, nrservs);
462	if (error)
463		goto out_destroy;
464	error = svc_set_num_threads(nfsd_serv, NULL, nrservs);
465	if (error)
466		goto out_shutdown;
467	/* We are holding a reference to nfsd_serv which
468	 * we don't want to count in the return value,
469	 * so subtract 1
470	 */
471	error = nfsd_serv->sv_nrthreads - 1;
472out_shutdown:
473	if (error < 0 && !nfsd_up_before)
474		nfsd_shutdown();
475out_destroy:
476	nfsd_destroy(net);		/* Release server */
477out:
478	mutex_unlock(&nfsd_mutex);
479	return error;
480}
481
482
483/*
484 * This is the NFS server kernel thread
485 */
486static int
487nfsd(void *vrqstp)
488{
489	struct svc_rqst *rqstp = (struct svc_rqst *) vrqstp;
490	int err, preverr = 0;
491
492	/* Lock module and set up kernel thread */
493	mutex_lock(&nfsd_mutex);
494
495	/* At this point, the thread shares current->fs
496	 * with the init process. We need to create files with a
497	 * umask of 0 instead of init's umask. */
498	if (unshare_fs_struct() < 0) {
499		printk("Unable to start nfsd thread: out of memory\n");
500		goto out;
501	}
502
503	current->fs->umask = 0;
504
505	/*
506	 * thread is spawned with all signals set to SIG_IGN, re-enable
507	 * the ones that will bring down the thread
508	 */
509	allow_signal(SIGKILL);
510	allow_signal(SIGHUP);
511	allow_signal(SIGINT);
512	allow_signal(SIGQUIT);
513
514	nfsdstats.th_cnt++;
515	mutex_unlock(&nfsd_mutex);
516
517	/*
518	 * We want less throttling in balance_dirty_pages() so that nfs to
519	 * localhost doesn't cause nfsd to lock up due to all the client's
520	 * dirty pages.
521	 */
522	current->flags |= PF_LESS_THROTTLE;
523	set_freezable();
524
525	/*
526	 * The main request loop
527	 */
528	for (;;) {
529		/*
530		 * Find a socket with data available and call its
531		 * recvfrom routine.
532		 */
533		while ((err = svc_recv(rqstp, 60*60*HZ)) == -EAGAIN)
534			;
535		if (err == -EINTR)
536			break;
537		else if (err < 0) {
538			if (err != preverr) {
539				printk(KERN_WARNING "%s: unexpected error "
540					"from svc_recv (%d)\n", __func__, -err);
541				preverr = err;
542			}
543			schedule_timeout_uninterruptible(HZ);
544			continue;
545		}
546
547		validate_process_creds();
548		svc_process(rqstp);
549		validate_process_creds();
550	}
551
552	/* Clear signals before calling svc_exit_thread() */
553	flush_signals(current);
554
555	mutex_lock(&nfsd_mutex);
556	nfsdstats.th_cnt --;
557
558out:
559	rqstp->rq_server = NULL;
560
561	/* Release the thread */
562	svc_exit_thread(rqstp);
563
564	nfsd_destroy(&init_net);
565
566	/* Release module */
567	mutex_unlock(&nfsd_mutex);
568	module_put_and_exit(0);
569	return 0;
570}
571
572static __be32 map_new_errors(u32 vers, __be32 nfserr)
573{
574	if (nfserr == nfserr_jukebox && vers == 2)
575		return nfserr_dropit;
576	if (nfserr == nfserr_wrongsec && vers < 4)
577		return nfserr_acces;
578	return nfserr;
579}
580
581int
582nfsd_dispatch(struct svc_rqst *rqstp, __be32 *statp)
583{
584	struct svc_procedure	*proc;
585	kxdrproc_t		xdr;
586	__be32			nfserr;
587	__be32			*nfserrp;
588
589	dprintk("nfsd_dispatch: vers %d proc %d\n",
590				rqstp->rq_vers, rqstp->rq_proc);
591	proc = rqstp->rq_procinfo;
592
593	/*
594	 * Give the xdr decoder a chance to change this if it wants
595	 * (necessary in the NFSv4.0 compound case)
596	 */
597	rqstp->rq_cachetype = proc->pc_cachetype;
598	/* Decode arguments */
599	xdr = proc->pc_decode;
600	if (xdr && !xdr(rqstp, (__be32*)rqstp->rq_arg.head[0].iov_base,
601			rqstp->rq_argp)) {
602		dprintk("nfsd: failed to decode arguments!\n");
603		*statp = rpc_garbage_args;
604		return 1;
605	}
606
607	/* Check whether we have this call in the cache. */
608	switch (nfsd_cache_lookup(rqstp)) {
609	case RC_INTR:
610	case RC_DROPIT:
611		return 0;
612	case RC_REPLY:
613		return 1;
614	case RC_DOIT:;
615		/* do it */
616	}
617
618	/* need to grab the location to store the status, as
619	 * nfsv4 does some encoding while processing 
620	 */
621	nfserrp = rqstp->rq_res.head[0].iov_base
622		+ rqstp->rq_res.head[0].iov_len;
623	rqstp->rq_res.head[0].iov_len += sizeof(__be32);
624
625	/* Now call the procedure handler, and encode NFS status. */
626	nfserr = proc->pc_func(rqstp, rqstp->rq_argp, rqstp->rq_resp);
627	nfserr = map_new_errors(rqstp->rq_vers, nfserr);
628	if (nfserr == nfserr_dropit || rqstp->rq_dropme) {
629		dprintk("nfsd: Dropping request; may be revisited later\n");
630		nfsd_cache_update(rqstp, RC_NOCACHE, NULL);
631		return 0;
632	}
633
634	if (rqstp->rq_proc != 0)
635		*nfserrp++ = nfserr;
636
637	/* Encode result.
638	 * For NFSv2, additional info is never returned in case of an error.
639	 */
640	if (!(nfserr && rqstp->rq_vers == 2)) {
641		xdr = proc->pc_encode;
642		if (xdr && !xdr(rqstp, nfserrp,
643				rqstp->rq_resp)) {
644			/* Failed to encode result. Release cache entry */
645			dprintk("nfsd: failed to encode result!\n");
646			nfsd_cache_update(rqstp, RC_NOCACHE, NULL);
647			*statp = rpc_system_err;
648			return 1;
649		}
650	}
651
652	/* Store reply in cache. */
653	nfsd_cache_update(rqstp, proc->pc_cachetype, statp + 1);
654	return 1;
655}
656
657int nfsd_pool_stats_open(struct inode *inode, struct file *file)
658{
659	int ret;
660	mutex_lock(&nfsd_mutex);
661	if (nfsd_serv == NULL) {
662		mutex_unlock(&nfsd_mutex);
663		return -ENODEV;
664	}
665	/* bump up the psudo refcount while traversing */
666	svc_get(nfsd_serv);
667	ret = svc_pool_stats_open(nfsd_serv, file);
668	mutex_unlock(&nfsd_mutex);
669	return ret;
670}
671
672int nfsd_pool_stats_release(struct inode *inode, struct file *file)
673{
674	int ret = seq_release(inode, file);
675	struct net *net = &init_net;
676
677	mutex_lock(&nfsd_mutex);
678	/* this function really, really should have been called svc_put() */
679	nfsd_destroy(net);
680	mutex_unlock(&nfsd_mutex);
681	return ret;
682}
v3.1
  1/*
  2 * Central processing for nfsd.
  3 *
  4 * Authors:	Olaf Kirch (okir@monad.swb.de)
  5 *
  6 * Copyright (C) 1995, 1996, 1997 Olaf Kirch <okir@monad.swb.de>
  7 */
  8
  9#include <linux/sched.h>
 10#include <linux/freezer.h>
 
 11#include <linux/fs_struct.h>
 12#include <linux/swap.h>
 
 13
 14#include <linux/sunrpc/stats.h>
 15#include <linux/sunrpc/svcsock.h>
 16#include <linux/lockd/bind.h>
 17#include <linux/nfsacl.h>
 18#include <linux/seq_file.h>
 19#include <net/net_namespace.h>
 20#include "nfsd.h"
 21#include "cache.h"
 22#include "vfs.h"
 23
 24#define NFSDDBG_FACILITY	NFSDDBG_SVC
 25
 26extern struct svc_program	nfsd_program;
 27static int			nfsd(void *vrqstp);
 28struct timeval			nfssvc_boot;
 29
 30/*
 31 * nfsd_mutex protects nfsd_serv -- both the pointer itself and the members
 32 * of the svc_serv struct. In particular, ->sv_nrthreads but also to some
 33 * extent ->sv_temp_socks and ->sv_permsocks. It also protects nfsdstats.th_cnt
 34 *
 35 * If (out side the lock) nfsd_serv is non-NULL, then it must point to a
 36 * properly initialised 'struct svc_serv' with ->sv_nrthreads > 0. That number
 37 * of nfsd threads must exist and each must listed in ->sp_all_threads in each
 38 * entry of ->sv_pools[].
 39 *
 40 * Transitions of the thread count between zero and non-zero are of particular
 41 * interest since the svc_serv needs to be created and initialized at that
 42 * point, or freed.
 43 *
 44 * Finally, the nfsd_mutex also protects some of the global variables that are
 45 * accessed when nfsd starts and that are settable via the write_* routines in
 46 * nfsctl.c. In particular:
 47 *
 48 *	user_recovery_dirname
 49 *	user_lease_time
 50 *	nfsd_versions
 51 */
 52DEFINE_MUTEX(nfsd_mutex);
 53struct svc_serv 		*nfsd_serv;
 54
 55/*
 56 * nfsd_drc_lock protects nfsd_drc_max_pages and nfsd_drc_pages_used.
 57 * nfsd_drc_max_pages limits the total amount of memory available for
 58 * version 4.1 DRC caches.
 59 * nfsd_drc_pages_used tracks the current version 4.1 DRC memory usage.
 60 */
 61spinlock_t	nfsd_drc_lock;
 62unsigned int	nfsd_drc_max_mem;
 63unsigned int	nfsd_drc_mem_used;
 64
 65#if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
 66static struct svc_stat	nfsd_acl_svcstats;
 67static struct svc_version *	nfsd_acl_version[] = {
 68	[2] = &nfsd_acl_version2,
 69	[3] = &nfsd_acl_version3,
 70};
 71
 72#define NFSD_ACL_MINVERS            2
 73#define NFSD_ACL_NRVERS		ARRAY_SIZE(nfsd_acl_version)
 74static struct svc_version *nfsd_acl_versions[NFSD_ACL_NRVERS];
 75
 76static struct svc_program	nfsd_acl_program = {
 77	.pg_prog		= NFS_ACL_PROGRAM,
 78	.pg_nvers		= NFSD_ACL_NRVERS,
 79	.pg_vers		= nfsd_acl_versions,
 80	.pg_name		= "nfsacl",
 81	.pg_class		= "nfsd",
 82	.pg_stats		= &nfsd_acl_svcstats,
 83	.pg_authenticate	= &svc_set_client,
 84};
 85
 86static struct svc_stat	nfsd_acl_svcstats = {
 87	.program	= &nfsd_acl_program,
 88};
 89#endif /* defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL) */
 90
 91static struct svc_version *	nfsd_version[] = {
 92	[2] = &nfsd_version2,
 93#if defined(CONFIG_NFSD_V3)
 94	[3] = &nfsd_version3,
 95#endif
 96#if defined(CONFIG_NFSD_V4)
 97	[4] = &nfsd_version4,
 98#endif
 99};
100
101#define NFSD_MINVERS    	2
102#define NFSD_NRVERS		ARRAY_SIZE(nfsd_version)
103static struct svc_version *nfsd_versions[NFSD_NRVERS];
104
105struct svc_program		nfsd_program = {
106#if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
107	.pg_next		= &nfsd_acl_program,
108#endif
109	.pg_prog		= NFS_PROGRAM,		/* program number */
110	.pg_nvers		= NFSD_NRVERS,		/* nr of entries in nfsd_version */
111	.pg_vers		= nfsd_versions,	/* version table */
112	.pg_name		= "nfsd",		/* program name */
113	.pg_class		= "nfsd",		/* authentication class */
114	.pg_stats		= &nfsd_svcstats,	/* version table */
115	.pg_authenticate	= &svc_set_client,	/* export authentication */
116
117};
118
119u32 nfsd_supported_minorversion;
120
121int nfsd_vers(int vers, enum vers_op change)
122{
123	if (vers < NFSD_MINVERS || vers >= NFSD_NRVERS)
124		return 0;
125	switch(change) {
126	case NFSD_SET:
127		nfsd_versions[vers] = nfsd_version[vers];
128#if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
129		if (vers < NFSD_ACL_NRVERS)
130			nfsd_acl_versions[vers] = nfsd_acl_version[vers];
131#endif
132		break;
133	case NFSD_CLEAR:
134		nfsd_versions[vers] = NULL;
135#if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
136		if (vers < NFSD_ACL_NRVERS)
137			nfsd_acl_versions[vers] = NULL;
138#endif
139		break;
140	case NFSD_TEST:
141		return nfsd_versions[vers] != NULL;
142	case NFSD_AVAIL:
143		return nfsd_version[vers] != NULL;
144	}
145	return 0;
146}
147
148int nfsd_minorversion(u32 minorversion, enum vers_op change)
149{
150	if (minorversion > NFSD_SUPPORTED_MINOR_VERSION)
151		return -1;
152	switch(change) {
153	case NFSD_SET:
154		nfsd_supported_minorversion = minorversion;
155		break;
156	case NFSD_CLEAR:
157		if (minorversion == 0)
158			return -1;
159		nfsd_supported_minorversion = minorversion - 1;
160		break;
161	case NFSD_TEST:
162		return minorversion <= nfsd_supported_minorversion;
163	case NFSD_AVAIL:
164		return minorversion <= NFSD_SUPPORTED_MINOR_VERSION;
165	}
166	return 0;
167}
168
169/*
170 * Maximum number of nfsd processes
171 */
172#define	NFSD_MAXSERVS		8192
173
174int nfsd_nrthreads(void)
175{
176	int rv = 0;
177	mutex_lock(&nfsd_mutex);
178	if (nfsd_serv)
179		rv = nfsd_serv->sv_nrthreads;
180	mutex_unlock(&nfsd_mutex);
181	return rv;
182}
183
184static int nfsd_init_socks(int port)
185{
186	int error;
187	if (!list_empty(&nfsd_serv->sv_permsocks))
188		return 0;
189
190	error = svc_create_xprt(nfsd_serv, "udp", &init_net, PF_INET, port,
191					SVC_SOCK_DEFAULTS);
192	if (error < 0)
193		return error;
194
195	error = svc_create_xprt(nfsd_serv, "tcp", &init_net, PF_INET, port,
196					SVC_SOCK_DEFAULTS);
197	if (error < 0)
198		return error;
199
200	return 0;
201}
202
203static bool nfsd_up = false;
204
205static int nfsd_startup(unsigned short port, int nrservs)
206{
207	int ret;
208
209	if (nfsd_up)
210		return 0;
211	/*
212	 * Readahead param cache - will no-op if it already exists.
213	 * (Note therefore results will be suboptimal if number of
214	 * threads is modified after nfsd start.)
215	 */
216	ret = nfsd_racache_init(2*nrservs);
217	if (ret)
218		return ret;
219	ret = nfsd_init_socks(port);
220	if (ret)
221		goto out_racache;
222	ret = lockd_up();
223	if (ret)
224		goto out_racache;
225	ret = nfs4_state_start();
226	if (ret)
227		goto out_lockd;
228	nfsd_up = true;
229	return 0;
230out_lockd:
231	lockd_down();
232out_racache:
233	nfsd_racache_shutdown();
234	return ret;
235}
236
237static void nfsd_shutdown(void)
238{
239	/*
240	 * write_ports can create the server without actually starting
241	 * any threads--if we get shut down before any threads are
242	 * started, then nfsd_last_thread will be run before any of this
243	 * other initialization has been done.
244	 */
245	if (!nfsd_up)
246		return;
247	nfs4_state_shutdown();
248	lockd_down();
249	nfsd_racache_shutdown();
250	nfsd_up = false;
251}
252
253static void nfsd_last_thread(struct svc_serv *serv)
254{
255	/* When last nfsd thread exits we need to do some clean-up */
256	nfsd_serv = NULL;
257	nfsd_shutdown();
258
 
 
259	printk(KERN_WARNING "nfsd: last server has exited, flushing export "
260			    "cache\n");
261	nfsd_export_flush();
262}
263
264void nfsd_reset_versions(void)
265{
266	int found_one = 0;
267	int i;
268
269	for (i = NFSD_MINVERS; i < NFSD_NRVERS; i++) {
270		if (nfsd_program.pg_vers[i])
271			found_one = 1;
272	}
273
274	if (!found_one) {
275		for (i = NFSD_MINVERS; i < NFSD_NRVERS; i++)
276			nfsd_program.pg_vers[i] = nfsd_version[i];
277#if defined(CONFIG_NFSD_V2_ACL) || defined(CONFIG_NFSD_V3_ACL)
278		for (i = NFSD_ACL_MINVERS; i < NFSD_ACL_NRVERS; i++)
279			nfsd_acl_program.pg_vers[i] =
280				nfsd_acl_version[i];
281#endif
282	}
283}
284
285/*
286 * Each session guarantees a negotiated per slot memory cache for replies
287 * which in turn consumes memory beyond the v2/v3/v4.0 server. A dedicated
288 * NFSv4.1 server might want to use more memory for a DRC than a machine
289 * with mutiple services.
290 *
291 * Impose a hard limit on the number of pages for the DRC which varies
292 * according to the machines free pages. This is of course only a default.
293 *
294 * For now this is a #defined shift which could be under admin control
295 * in the future.
296 */
297static void set_max_drc(void)
298{
299	#define NFSD_DRC_SIZE_SHIFT	10
300	nfsd_drc_max_mem = (nr_free_buffer_pages()
301					>> NFSD_DRC_SIZE_SHIFT) * PAGE_SIZE;
302	nfsd_drc_mem_used = 0;
303	spin_lock_init(&nfsd_drc_lock);
304	dprintk("%s nfsd_drc_max_mem %u \n", __func__, nfsd_drc_max_mem);
305}
306
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
307int nfsd_create_serv(void)
308{
309	int err = 0;
 
310
311	WARN_ON(!mutex_is_locked(&nfsd_mutex));
312	if (nfsd_serv) {
313		svc_get(nfsd_serv);
314		return 0;
315	}
316	if (nfsd_max_blksize == 0) {
317		/* choose a suitable default */
318		struct sysinfo i;
319		si_meminfo(&i);
320		/* Aim for 1/4096 of memory per thread
321		 * This gives 1MB on 4Gig machines
322		 * But only uses 32K on 128M machines.
323		 * Bottom out at 8K on 32M and smaller.
324		 * Of course, this is only a default.
325		 */
326		nfsd_max_blksize = NFSSVC_MAXBLKSIZE;
327		i.totalram <<= PAGE_SHIFT - 12;
328		while (nfsd_max_blksize > i.totalram &&
329		       nfsd_max_blksize >= 8*1024*2)
330			nfsd_max_blksize /= 2;
331	}
332	nfsd_reset_versions();
333
334	nfsd_serv = svc_create_pooled(&nfsd_program, nfsd_max_blksize,
335				      nfsd_last_thread, nfsd, THIS_MODULE);
336	if (nfsd_serv == NULL)
337		return -ENOMEM;
338
 
 
 
 
 
 
339	set_max_drc();
340	do_gettimeofday(&nfssvc_boot);		/* record boot time */
341	return err;
342}
343
344int nfsd_nrpools(void)
345{
346	if (nfsd_serv == NULL)
347		return 0;
348	else
349		return nfsd_serv->sv_nrpools;
350}
351
352int nfsd_get_nrthreads(int n, int *nthreads)
353{
354	int i = 0;
355
356	if (nfsd_serv != NULL) {
357		for (i = 0; i < nfsd_serv->sv_nrpools && i < n; i++)
358			nthreads[i] = nfsd_serv->sv_pools[i].sp_nrthreads;
359	}
360
361	return 0;
362}
363
364int nfsd_set_nrthreads(int n, int *nthreads)
365{
366	int i = 0;
367	int tot = 0;
368	int err = 0;
 
369
370	WARN_ON(!mutex_is_locked(&nfsd_mutex));
371
372	if (nfsd_serv == NULL || n <= 0)
373		return 0;
374
375	if (n > nfsd_serv->sv_nrpools)
376		n = nfsd_serv->sv_nrpools;
377
378	/* enforce a global maximum number of threads */
379	tot = 0;
380	for (i = 0; i < n; i++) {
381		if (nthreads[i] > NFSD_MAXSERVS)
382			nthreads[i] = NFSD_MAXSERVS;
383		tot += nthreads[i];
384	}
385	if (tot > NFSD_MAXSERVS) {
386		/* total too large: scale down requested numbers */
387		for (i = 0; i < n && tot > 0; i++) {
388		    	int new = nthreads[i] * NFSD_MAXSERVS / tot;
389			tot -= (nthreads[i] - new);
390			nthreads[i] = new;
391		}
392		for (i = 0; i < n && tot > 0; i++) {
393			nthreads[i]--;
394			tot--;
395		}
396	}
397
398	/*
399	 * There must always be a thread in pool 0; the admin
400	 * can't shut down NFS completely using pool_threads.
401	 */
402	if (nthreads[0] == 0)
403		nthreads[0] = 1;
404
405	/* apply the new numbers */
406	svc_get(nfsd_serv);
407	for (i = 0; i < n; i++) {
408		err = svc_set_num_threads(nfsd_serv, &nfsd_serv->sv_pools[i],
409				    	  nthreads[i]);
410		if (err)
411			break;
412	}
413	svc_destroy(nfsd_serv);
414
415	return err;
416}
417
418/*
419 * Adjust the number of threads and return the new number of threads.
420 * This is also the function that starts the server if necessary, if
421 * this is the first time nrservs is nonzero.
422 */
423int
424nfsd_svc(unsigned short port, int nrservs)
425{
426	int	error;
427	bool	nfsd_up_before;
 
428
429	mutex_lock(&nfsd_mutex);
430	dprintk("nfsd: creating service\n");
431	if (nrservs <= 0)
432		nrservs = 0;
433	if (nrservs > NFSD_MAXSERVS)
434		nrservs = NFSD_MAXSERVS;
435	error = 0;
436	if (nrservs == 0 && nfsd_serv == NULL)
437		goto out;
438
439	error = nfsd_create_serv();
440	if (error)
441		goto out;
442
443	nfsd_up_before = nfsd_up;
444
445	error = nfsd_startup(port, nrservs);
446	if (error)
447		goto out_destroy;
448	error = svc_set_num_threads(nfsd_serv, NULL, nrservs);
449	if (error)
450		goto out_shutdown;
451	/* We are holding a reference to nfsd_serv which
452	 * we don't want to count in the return value,
453	 * so subtract 1
454	 */
455	error = nfsd_serv->sv_nrthreads - 1;
456out_shutdown:
457	if (error < 0 && !nfsd_up_before)
458		nfsd_shutdown();
459out_destroy:
460	svc_destroy(nfsd_serv);		/* Release server */
461out:
462	mutex_unlock(&nfsd_mutex);
463	return error;
464}
465
466
467/*
468 * This is the NFS server kernel thread
469 */
470static int
471nfsd(void *vrqstp)
472{
473	struct svc_rqst *rqstp = (struct svc_rqst *) vrqstp;
474	int err, preverr = 0;
475
476	/* Lock module and set up kernel thread */
477	mutex_lock(&nfsd_mutex);
478
479	/* At this point, the thread shares current->fs
480	 * with the init process. We need to create files with a
481	 * umask of 0 instead of init's umask. */
482	if (unshare_fs_struct() < 0) {
483		printk("Unable to start nfsd thread: out of memory\n");
484		goto out;
485	}
486
487	current->fs->umask = 0;
488
489	/*
490	 * thread is spawned with all signals set to SIG_IGN, re-enable
491	 * the ones that will bring down the thread
492	 */
493	allow_signal(SIGKILL);
494	allow_signal(SIGHUP);
495	allow_signal(SIGINT);
496	allow_signal(SIGQUIT);
497
498	nfsdstats.th_cnt++;
499	mutex_unlock(&nfsd_mutex);
500
501	/*
502	 * We want less throttling in balance_dirty_pages() so that nfs to
503	 * localhost doesn't cause nfsd to lock up due to all the client's
504	 * dirty pages.
505	 */
506	current->flags |= PF_LESS_THROTTLE;
507	set_freezable();
508
509	/*
510	 * The main request loop
511	 */
512	for (;;) {
513		/*
514		 * Find a socket with data available and call its
515		 * recvfrom routine.
516		 */
517		while ((err = svc_recv(rqstp, 60*60*HZ)) == -EAGAIN)
518			;
519		if (err == -EINTR)
520			break;
521		else if (err < 0) {
522			if (err != preverr) {
523				printk(KERN_WARNING "%s: unexpected error "
524					"from svc_recv (%d)\n", __func__, -err);
525				preverr = err;
526			}
527			schedule_timeout_uninterruptible(HZ);
528			continue;
529		}
530
531		validate_process_creds();
532		svc_process(rqstp);
533		validate_process_creds();
534	}
535
536	/* Clear signals before calling svc_exit_thread() */
537	flush_signals(current);
538
539	mutex_lock(&nfsd_mutex);
540	nfsdstats.th_cnt --;
541
542out:
 
 
543	/* Release the thread */
544	svc_exit_thread(rqstp);
545
 
 
546	/* Release module */
547	mutex_unlock(&nfsd_mutex);
548	module_put_and_exit(0);
549	return 0;
550}
551
552static __be32 map_new_errors(u32 vers, __be32 nfserr)
553{
554	if (nfserr == nfserr_jukebox && vers == 2)
555		return nfserr_dropit;
556	if (nfserr == nfserr_wrongsec && vers < 4)
557		return nfserr_acces;
558	return nfserr;
559}
560
561int
562nfsd_dispatch(struct svc_rqst *rqstp, __be32 *statp)
563{
564	struct svc_procedure	*proc;
565	kxdrproc_t		xdr;
566	__be32			nfserr;
567	__be32			*nfserrp;
568
569	dprintk("nfsd_dispatch: vers %d proc %d\n",
570				rqstp->rq_vers, rqstp->rq_proc);
571	proc = rqstp->rq_procinfo;
572
573	/*
574	 * Give the xdr decoder a chance to change this if it wants
575	 * (necessary in the NFSv4.0 compound case)
576	 */
577	rqstp->rq_cachetype = proc->pc_cachetype;
578	/* Decode arguments */
579	xdr = proc->pc_decode;
580	if (xdr && !xdr(rqstp, (__be32*)rqstp->rq_arg.head[0].iov_base,
581			rqstp->rq_argp)) {
582		dprintk("nfsd: failed to decode arguments!\n");
583		*statp = rpc_garbage_args;
584		return 1;
585	}
586
587	/* Check whether we have this call in the cache. */
588	switch (nfsd_cache_lookup(rqstp)) {
589	case RC_INTR:
590	case RC_DROPIT:
591		return 0;
592	case RC_REPLY:
593		return 1;
594	case RC_DOIT:;
595		/* do it */
596	}
597
598	/* need to grab the location to store the status, as
599	 * nfsv4 does some encoding while processing 
600	 */
601	nfserrp = rqstp->rq_res.head[0].iov_base
602		+ rqstp->rq_res.head[0].iov_len;
603	rqstp->rq_res.head[0].iov_len += sizeof(__be32);
604
605	/* Now call the procedure handler, and encode NFS status. */
606	nfserr = proc->pc_func(rqstp, rqstp->rq_argp, rqstp->rq_resp);
607	nfserr = map_new_errors(rqstp->rq_vers, nfserr);
608	if (nfserr == nfserr_dropit || rqstp->rq_dropme) {
609		dprintk("nfsd: Dropping request; may be revisited later\n");
610		nfsd_cache_update(rqstp, RC_NOCACHE, NULL);
611		return 0;
612	}
613
614	if (rqstp->rq_proc != 0)
615		*nfserrp++ = nfserr;
616
617	/* Encode result.
618	 * For NFSv2, additional info is never returned in case of an error.
619	 */
620	if (!(nfserr && rqstp->rq_vers == 2)) {
621		xdr = proc->pc_encode;
622		if (xdr && !xdr(rqstp, nfserrp,
623				rqstp->rq_resp)) {
624			/* Failed to encode result. Release cache entry */
625			dprintk("nfsd: failed to encode result!\n");
626			nfsd_cache_update(rqstp, RC_NOCACHE, NULL);
627			*statp = rpc_system_err;
628			return 1;
629		}
630	}
631
632	/* Store reply in cache. */
633	nfsd_cache_update(rqstp, proc->pc_cachetype, statp + 1);
634	return 1;
635}
636
637int nfsd_pool_stats_open(struct inode *inode, struct file *file)
638{
639	int ret;
640	mutex_lock(&nfsd_mutex);
641	if (nfsd_serv == NULL) {
642		mutex_unlock(&nfsd_mutex);
643		return -ENODEV;
644	}
645	/* bump up the psudo refcount while traversing */
646	svc_get(nfsd_serv);
647	ret = svc_pool_stats_open(nfsd_serv, file);
648	mutex_unlock(&nfsd_mutex);
649	return ret;
650}
651
652int nfsd_pool_stats_release(struct inode *inode, struct file *file)
653{
654	int ret = seq_release(inode, file);
 
 
655	mutex_lock(&nfsd_mutex);
656	/* this function really, really should have been called svc_put() */
657	svc_destroy(nfsd_serv);
658	mutex_unlock(&nfsd_mutex);
659	return ret;
660}