Linux Audio

Check our new training course

Loading...
v4.10.11
 
  1/*
  2 *  linux/fs/ioctl.c
  3 *
  4 *  Copyright (C) 1991, 1992  Linus Torvalds
  5 */
  6
  7#include <linux/syscalls.h>
  8#include <linux/mm.h>
  9#include <linux/capability.h>
 10#include <linux/file.h>
 11#include <linux/fs.h>
 12#include <linux/security.h>
 13#include <linux/export.h>
 14#include <linux/uaccess.h>
 15#include <linux/writeback.h>
 16#include <linux/buffer_head.h>
 17#include <linux/falloc.h>
 
 
 18#include "internal.h"
 19
 20#include <asm/ioctls.h>
 21
 22/* So that the fiemap access checks can't overflow on 32 bit machines. */
 23#define FIEMAP_MAX_EXTENTS	(UINT_MAX / sizeof(struct fiemap_extent))
 24
 25/**
 26 * vfs_ioctl - call filesystem specific ioctl methods
 27 * @filp:	open file to invoke ioctl method on
 28 * @cmd:	ioctl command to execute
 29 * @arg:	command-specific argument for ioctl
 30 *
 31 * Invokes filesystem specific ->unlocked_ioctl, if one exists; otherwise
 32 * returns -ENOTTY.
 33 *
 34 * Returns 0 on success, -errno on error.
 35 */
 36long vfs_ioctl(struct file *filp, unsigned int cmd, unsigned long arg)
 37{
 38	int error = -ENOTTY;
 39
 40	if (!filp->f_op->unlocked_ioctl)
 41		goto out;
 42
 43	error = filp->f_op->unlocked_ioctl(filp, cmd, arg);
 44	if (error == -ENOIOCTLCMD)
 45		error = -ENOTTY;
 46 out:
 47	return error;
 48}
 
 49
 50static int ioctl_fibmap(struct file *filp, int __user *p)
 51{
 52	struct address_space *mapping = filp->f_mapping;
 53	int res, block;
 54
 55	/* do we support this mess? */
 56	if (!mapping->a_ops->bmap)
 57		return -EINVAL;
 58	if (!capable(CAP_SYS_RAWIO))
 59		return -EPERM;
 60	res = get_user(block, p);
 61	if (res)
 62		return res;
 63	res = mapping->a_ops->bmap(mapping, block);
 64	return put_user(res, p);
 65}
 66
 67/**
 68 * fiemap_fill_next_extent - Fiemap helper function
 69 * @fieinfo:	Fiemap context passed into ->fiemap
 70 * @logical:	Extent logical start offset, in bytes
 71 * @phys:	Extent physical start offset, in bytes
 72 * @len:	Extent length, in bytes
 73 * @flags:	FIEMAP_EXTENT flags that describe this extent
 74 *
 75 * Called from file system ->fiemap callback. Will populate extent
 76 * info as passed in via arguments and copy to user memory. On
 77 * success, extent count on fieinfo is incremented.
 78 *
 79 * Returns 0 on success, -errno on error, 1 if this was the last
 80 * extent that will fit in user array.
 81 */
 82#define SET_UNKNOWN_FLAGS	(FIEMAP_EXTENT_DELALLOC)
 83#define SET_NO_UNMOUNTED_IO_FLAGS	(FIEMAP_EXTENT_DATA_ENCRYPTED)
 84#define SET_NOT_ALIGNED_FLAGS	(FIEMAP_EXTENT_DATA_TAIL|FIEMAP_EXTENT_DATA_INLINE)
 85int fiemap_fill_next_extent(struct fiemap_extent_info *fieinfo, u64 logical,
 86			    u64 phys, u64 len, u32 flags)
 87{
 88	struct fiemap_extent extent;
 89	struct fiemap_extent __user *dest = fieinfo->fi_extents_start;
 90
 91	/* only count the extents */
 92	if (fieinfo->fi_extents_max == 0) {
 93		fieinfo->fi_extents_mapped++;
 94		return (flags & FIEMAP_EXTENT_LAST) ? 1 : 0;
 95	}
 96
 97	if (fieinfo->fi_extents_mapped >= fieinfo->fi_extents_max)
 98		return 1;
 99
100	if (flags & SET_UNKNOWN_FLAGS)
101		flags |= FIEMAP_EXTENT_UNKNOWN;
102	if (flags & SET_NO_UNMOUNTED_IO_FLAGS)
103		flags |= FIEMAP_EXTENT_ENCODED;
104	if (flags & SET_NOT_ALIGNED_FLAGS)
105		flags |= FIEMAP_EXTENT_NOT_ALIGNED;
106
107	memset(&extent, 0, sizeof(extent));
108	extent.fe_logical = logical;
109	extent.fe_physical = phys;
110	extent.fe_length = len;
111	extent.fe_flags = flags;
112
113	dest += fieinfo->fi_extents_mapped;
114	if (copy_to_user(dest, &extent, sizeof(extent)))
115		return -EFAULT;
116
117	fieinfo->fi_extents_mapped++;
118	if (fieinfo->fi_extents_mapped == fieinfo->fi_extents_max)
119		return 1;
120	return (flags & FIEMAP_EXTENT_LAST) ? 1 : 0;
121}
122EXPORT_SYMBOL(fiemap_fill_next_extent);
123
124/**
125 * fiemap_check_flags - check validity of requested flags for fiemap
126 * @fieinfo:	Fiemap context passed into ->fiemap
127 * @fs_flags:	Set of fiemap flags that the file system understands
128 *
129 * Called from file system ->fiemap callback. This will compute the
130 * intersection of valid fiemap flags and those that the fs supports. That
131 * value is then compared against the user supplied flags. In case of bad user
132 * flags, the invalid values will be written into the fieinfo structure, and
133 * -EBADR is returned, which tells ioctl_fiemap() to return those values to
134 * userspace. For this reason, a return code of -EBADR should be preserved.
135 *
136 * Returns 0 on success, -EBADR on bad flags.
137 */
138int fiemap_check_flags(struct fiemap_extent_info *fieinfo, u32 fs_flags)
139{
140	u32 incompat_flags;
141
142	incompat_flags = fieinfo->fi_flags & ~(FIEMAP_FLAGS_COMPAT & fs_flags);
143	if (incompat_flags) {
144		fieinfo->fi_flags = incompat_flags;
145		return -EBADR;
146	}
147	return 0;
148}
149EXPORT_SYMBOL(fiemap_check_flags);
150
151static int fiemap_check_ranges(struct super_block *sb,
152			       u64 start, u64 len, u64 *new_len)
153{
154	u64 maxbytes = (u64) sb->s_maxbytes;
155
156	*new_len = len;
157
158	if (len == 0)
159		return -EINVAL;
160
161	if (start > maxbytes)
162		return -EFBIG;
163
164	/*
165	 * Shrink request scope to what the fs can actually handle.
166	 */
167	if (len > maxbytes || (maxbytes - len) < start)
168		*new_len = maxbytes - start;
169
170	return 0;
171}
172
173static int ioctl_fiemap(struct file *filp, unsigned long arg)
174{
175	struct fiemap fiemap;
176	struct fiemap __user *ufiemap = (struct fiemap __user *) arg;
177	struct fiemap_extent_info fieinfo = { 0, };
178	struct inode *inode = file_inode(filp);
179	struct super_block *sb = inode->i_sb;
180	u64 len;
181	int error;
182
183	if (!inode->i_op->fiemap)
184		return -EOPNOTSUPP;
185
186	if (copy_from_user(&fiemap, ufiemap, sizeof(fiemap)))
187		return -EFAULT;
188
189	if (fiemap.fm_extent_count > FIEMAP_MAX_EXTENTS)
190		return -EINVAL;
191
192	error = fiemap_check_ranges(sb, fiemap.fm_start, fiemap.fm_length,
193				    &len);
194	if (error)
195		return error;
196
197	fieinfo.fi_flags = fiemap.fm_flags;
198	fieinfo.fi_extents_max = fiemap.fm_extent_count;
199	fieinfo.fi_extents_start = ufiemap->fm_extents;
200
201	if (fiemap.fm_extent_count != 0 &&
202	    !access_ok(VERIFY_WRITE, fieinfo.fi_extents_start,
203		       fieinfo.fi_extents_max * sizeof(struct fiemap_extent)))
204		return -EFAULT;
205
206	if (fieinfo.fi_flags & FIEMAP_FLAG_SYNC)
207		filemap_write_and_wait(inode->i_mapping);
208
209	error = inode->i_op->fiemap(inode, &fieinfo, fiemap.fm_start, len);
210	fiemap.fm_flags = fieinfo.fi_flags;
211	fiemap.fm_mapped_extents = fieinfo.fi_extents_mapped;
212	if (copy_to_user(ufiemap, &fiemap, sizeof(fiemap)))
213		error = -EFAULT;
214
215	return error;
216}
217
218static long ioctl_file_clone(struct file *dst_file, unsigned long srcfd,
219			     u64 off, u64 olen, u64 destoff)
220{
221	struct fd src_file = fdget(srcfd);
 
222	int ret;
223
224	if (!src_file.file)
225		return -EBADF;
226	ret = -EXDEV;
227	if (src_file.file->f_path.mnt != dst_file->f_path.mnt)
228		goto fdput;
229	ret = do_clone_file_range(src_file.file, off, dst_file, destoff, olen);
 
 
 
 
 
 
 
230fdput:
231	fdput(src_file);
232	return ret;
233}
234
235static long ioctl_file_clone_range(struct file *file, void __user *argp)
236{
237	struct file_clone_range args;
238
239	if (copy_from_user(&args, argp, sizeof(args)))
240		return -EFAULT;
241	return ioctl_file_clone(file, args.src_fd, args.src_offset,
242				args.src_length, args.dest_offset);
243}
244
245#ifdef CONFIG_BLOCK
246
247static inline sector_t logical_to_blk(struct inode *inode, loff_t offset)
248{
249	return (offset >> inode->i_blkbits);
250}
251
252static inline loff_t blk_to_logical(struct inode *inode, sector_t blk)
253{
254	return (blk << inode->i_blkbits);
255}
256
257/**
258 * __generic_block_fiemap - FIEMAP for block based inodes (no locking)
259 * @inode: the inode to map
260 * @fieinfo: the fiemap info struct that will be passed back to userspace
261 * @start: where to start mapping in the inode
262 * @len: how much space to map
263 * @get_block: the fs's get_block function
264 *
265 * This does FIEMAP for block based inodes.  Basically it will just loop
266 * through get_block until we hit the number of extents we want to map, or we
267 * go past the end of the file and hit a hole.
268 *
269 * If it is possible to have data blocks beyond a hole past @inode->i_size, then
270 * please do not use this function, it will stop at the first unmapped block
271 * beyond i_size.
272 *
273 * If you use this function directly, you need to do your own locking. Use
274 * generic_block_fiemap if you want the locking done for you.
275 */
276
277int __generic_block_fiemap(struct inode *inode,
278			   struct fiemap_extent_info *fieinfo, loff_t start,
279			   loff_t len, get_block_t *get_block)
280{
281	struct buffer_head map_bh;
282	sector_t start_blk, last_blk;
283	loff_t isize = i_size_read(inode);
284	u64 logical = 0, phys = 0, size = 0;
285	u32 flags = FIEMAP_EXTENT_MERGED;
286	bool past_eof = false, whole_file = false;
287	int ret = 0;
288
289	ret = fiemap_check_flags(fieinfo, FIEMAP_FLAG_SYNC);
290	if (ret)
291		return ret;
292
293	/*
294	 * Either the i_mutex or other appropriate locking needs to be held
295	 * since we expect isize to not change at all through the duration of
296	 * this call.
297	 */
298	if (len >= isize) {
299		whole_file = true;
300		len = isize;
301	}
302
303	/*
304	 * Some filesystems can't deal with being asked to map less than
305	 * blocksize, so make sure our len is at least block length.
306	 */
307	if (logical_to_blk(inode, len) == 0)
308		len = blk_to_logical(inode, 1);
309
310	start_blk = logical_to_blk(inode, start);
311	last_blk = logical_to_blk(inode, start + len - 1);
312
313	do {
314		/*
315		 * we set b_size to the total size we want so it will map as
316		 * many contiguous blocks as possible at once
317		 */
318		memset(&map_bh, 0, sizeof(struct buffer_head));
319		map_bh.b_size = len;
320
321		ret = get_block(inode, start_blk, &map_bh, 0);
322		if (ret)
323			break;
324
325		/* HOLE */
326		if (!buffer_mapped(&map_bh)) {
327			start_blk++;
328
329			/*
330			 * We want to handle the case where there is an
331			 * allocated block at the front of the file, and then
332			 * nothing but holes up to the end of the file properly,
333			 * to make sure that extent at the front gets properly
334			 * marked with FIEMAP_EXTENT_LAST
335			 */
336			if (!past_eof &&
337			    blk_to_logical(inode, start_blk) >= isize)
338				past_eof = 1;
339
340			/*
341			 * First hole after going past the EOF, this is our
342			 * last extent
343			 */
344			if (past_eof && size) {
345				flags = FIEMAP_EXTENT_MERGED|FIEMAP_EXTENT_LAST;
346				ret = fiemap_fill_next_extent(fieinfo, logical,
347							      phys, size,
348							      flags);
349			} else if (size) {
350				ret = fiemap_fill_next_extent(fieinfo, logical,
351							      phys, size, flags);
352				size = 0;
353			}
354
355			/* if we have holes up to/past EOF then we're done */
356			if (start_blk > last_blk || past_eof || ret)
357				break;
358		} else {
359			/*
360			 * We have gone over the length of what we wanted to
361			 * map, and it wasn't the entire file, so add the extent
362			 * we got last time and exit.
363			 *
364			 * This is for the case where say we want to map all the
365			 * way up to the second to the last block in a file, but
366			 * the last block is a hole, making the second to last
367			 * block FIEMAP_EXTENT_LAST.  In this case we want to
368			 * see if there is a hole after the second to last block
369			 * so we can mark it properly.  If we found data after
370			 * we exceeded the length we were requesting, then we
371			 * are good to go, just add the extent to the fieinfo
372			 * and break
373			 */
374			if (start_blk > last_blk && !whole_file) {
375				ret = fiemap_fill_next_extent(fieinfo, logical,
376							      phys, size,
377							      flags);
378				break;
379			}
380
381			/*
382			 * if size != 0 then we know we already have an extent
383			 * to add, so add it.
384			 */
385			if (size) {
386				ret = fiemap_fill_next_extent(fieinfo, logical,
387							      phys, size,
388							      flags);
389				if (ret)
390					break;
391			}
392
393			logical = blk_to_logical(inode, start_blk);
394			phys = blk_to_logical(inode, map_bh.b_blocknr);
395			size = map_bh.b_size;
396			flags = FIEMAP_EXTENT_MERGED;
397
398			start_blk += logical_to_blk(inode, size);
399
400			/*
401			 * If we are past the EOF, then we need to make sure as
402			 * soon as we find a hole that the last extent we found
403			 * is marked with FIEMAP_EXTENT_LAST
404			 */
405			if (!past_eof && logical + size >= isize)
406				past_eof = true;
407		}
408		cond_resched();
409		if (fatal_signal_pending(current)) {
410			ret = -EINTR;
411			break;
412		}
413
414	} while (1);
415
416	/* If ret is 1 then we just hit the end of the extent array */
417	if (ret == 1)
418		ret = 0;
419
420	return ret;
421}
422EXPORT_SYMBOL(__generic_block_fiemap);
423
424/**
425 * generic_block_fiemap - FIEMAP for block based inodes
426 * @inode: The inode to map
427 * @fieinfo: The mapping information
428 * @start: The initial block to map
429 * @len: The length of the extect to attempt to map
430 * @get_block: The block mapping function for the fs
431 *
432 * Calls __generic_block_fiemap to map the inode, after taking
433 * the inode's mutex lock.
434 */
435
436int generic_block_fiemap(struct inode *inode,
437			 struct fiemap_extent_info *fieinfo, u64 start,
438			 u64 len, get_block_t *get_block)
439{
440	int ret;
441	inode_lock(inode);
442	ret = __generic_block_fiemap(inode, fieinfo, start, len, get_block);
443	inode_unlock(inode);
444	return ret;
445}
446EXPORT_SYMBOL(generic_block_fiemap);
447
448#endif  /*  CONFIG_BLOCK  */
449
450/*
451 * This provides compatibility with legacy XFS pre-allocation ioctls
452 * which predate the fallocate syscall.
453 *
454 * Only the l_start, l_len and l_whence fields of the 'struct space_resv'
455 * are used here, rest are ignored.
456 */
457int ioctl_preallocate(struct file *filp, void __user *argp)
458{
459	struct inode *inode = file_inode(filp);
460	struct space_resv sr;
461
462	if (copy_from_user(&sr, argp, sizeof(sr)))
463		return -EFAULT;
464
465	switch (sr.l_whence) {
466	case SEEK_SET:
467		break;
468	case SEEK_CUR:
469		sr.l_start += filp->f_pos;
470		break;
471	case SEEK_END:
472		sr.l_start += i_size_read(inode);
473		break;
474	default:
475		return -EINVAL;
476	}
477
478	return vfs_fallocate(filp, FALLOC_FL_KEEP_SIZE, sr.l_start, sr.l_len);
479}
480
481static int file_ioctl(struct file *filp, unsigned int cmd,
482		unsigned long arg)
483{
484	struct inode *inode = file_inode(filp);
485	int __user *p = (int __user *)arg;
486
487	switch (cmd) {
488	case FIBMAP:
489		return ioctl_fibmap(filp, p);
490	case FIONREAD:
491		return put_user(i_size_read(inode) - filp->f_pos, p);
492	case FS_IOC_RESVSP:
493	case FS_IOC_RESVSP64:
494		return ioctl_preallocate(filp, p);
495	}
496
497	return vfs_ioctl(filp, cmd, arg);
498}
499
500static int ioctl_fionbio(struct file *filp, int __user *argp)
501{
502	unsigned int flag;
503	int on, error;
504
505	error = get_user(on, argp);
506	if (error)
507		return error;
508	flag = O_NONBLOCK;
509#ifdef __sparc__
510	/* SunOS compatibility item. */
511	if (O_NONBLOCK != O_NDELAY)
512		flag |= O_NDELAY;
513#endif
514	spin_lock(&filp->f_lock);
515	if (on)
516		filp->f_flags |= flag;
517	else
518		filp->f_flags &= ~flag;
519	spin_unlock(&filp->f_lock);
520	return error;
521}
522
523static int ioctl_fioasync(unsigned int fd, struct file *filp,
524			  int __user *argp)
525{
526	unsigned int flag;
527	int on, error;
528
529	error = get_user(on, argp);
530	if (error)
531		return error;
532	flag = on ? FASYNC : 0;
533
534	/* Did FASYNC state change ? */
535	if ((flag ^ filp->f_flags) & FASYNC) {
536		if (filp->f_op->fasync)
537			/* fasync() adjusts filp->f_flags */
538			error = filp->f_op->fasync(fd, filp, on);
539		else
540			error = -ENOTTY;
541	}
542	return error < 0 ? error : 0;
543}
544
545static int ioctl_fsfreeze(struct file *filp)
546{
547	struct super_block *sb = file_inode(filp)->i_sb;
548
549	if (!capable(CAP_SYS_ADMIN))
550		return -EPERM;
551
552	/* If filesystem doesn't support freeze feature, return. */
553	if (sb->s_op->freeze_fs == NULL && sb->s_op->freeze_super == NULL)
554		return -EOPNOTSUPP;
555
556	/* Freeze */
557	if (sb->s_op->freeze_super)
558		return sb->s_op->freeze_super(sb);
559	return freeze_super(sb);
560}
561
562static int ioctl_fsthaw(struct file *filp)
563{
564	struct super_block *sb = file_inode(filp)->i_sb;
565
566	if (!capable(CAP_SYS_ADMIN))
567		return -EPERM;
568
569	/* Thaw */
570	if (sb->s_op->thaw_super)
571		return sb->s_op->thaw_super(sb);
572	return thaw_super(sb);
573}
574
575static int ioctl_file_dedupe_range(struct file *file, void __user *arg)
576{
577	struct file_dedupe_range __user *argp = arg;
578	struct file_dedupe_range *same = NULL;
579	int ret;
580	unsigned long size;
581	u16 count;
582
583	if (get_user(count, &argp->dest_count)) {
584		ret = -EFAULT;
585		goto out;
586	}
587
588	size = offsetof(struct file_dedupe_range __user, info[count]);
589	if (size > PAGE_SIZE) {
590		ret = -ENOMEM;
591		goto out;
592	}
593
594	same = memdup_user(argp, size);
595	if (IS_ERR(same)) {
596		ret = PTR_ERR(same);
597		same = NULL;
598		goto out;
599	}
600
601	same->dest_count = count;
602	ret = vfs_dedupe_file_range(file, same);
603	if (ret)
604		goto out;
605
606	ret = copy_to_user(argp, same, size);
607	if (ret)
608		ret = -EFAULT;
609
610out:
611	kfree(same);
612	return ret;
613}
614
615/*
616 * When you add any new common ioctls to the switches above and below
617 * please update compat_sys_ioctl() too.
618 *
619 * do_vfs_ioctl() is not for drivers and not intended to be EXPORT_SYMBOL()'d.
620 * It's just a simple helper for sys_ioctl and compat_sys_ioctl.
621 */
622int do_vfs_ioctl(struct file *filp, unsigned int fd, unsigned int cmd,
623	     unsigned long arg)
624{
625	int error = 0;
626	int __user *argp = (int __user *)arg;
627	struct inode *inode = file_inode(filp);
628
629	switch (cmd) {
630	case FIOCLEX:
631		set_close_on_exec(fd, 1);
632		break;
633
634	case FIONCLEX:
635		set_close_on_exec(fd, 0);
636		break;
637
638	case FIONBIO:
639		error = ioctl_fionbio(filp, argp);
640		break;
641
642	case FIOASYNC:
643		error = ioctl_fioasync(fd, filp, argp);
644		break;
645
646	case FIOQSIZE:
647		if (S_ISDIR(inode->i_mode) || S_ISREG(inode->i_mode) ||
648		    S_ISLNK(inode->i_mode)) {
649			loff_t res = inode_get_bytes(inode);
650			error = copy_to_user(argp, &res, sizeof(res)) ?
651					-EFAULT : 0;
652		} else
653			error = -ENOTTY;
654		break;
655
656	case FIFREEZE:
657		error = ioctl_fsfreeze(filp);
658		break;
659
660	case FITHAW:
661		error = ioctl_fsthaw(filp);
662		break;
663
664	case FS_IOC_FIEMAP:
665		return ioctl_fiemap(filp, arg);
666
667	case FIGETBSZ:
 
 
 
668		return put_user(inode->i_sb->s_blocksize, argp);
669
670	case FICLONE:
671		return ioctl_file_clone(filp, arg, 0, 0, 0);
672
673	case FICLONERANGE:
674		return ioctl_file_clone_range(filp, argp);
675
676	case FIDEDUPERANGE:
677		return ioctl_file_dedupe_range(filp, argp);
678
679	default:
680		if (S_ISREG(inode->i_mode))
681			error = file_ioctl(filp, cmd, arg);
682		else
683			error = vfs_ioctl(filp, cmd, arg);
684		break;
685	}
686	return error;
687}
688
689SYSCALL_DEFINE3(ioctl, unsigned int, fd, unsigned int, cmd, unsigned long, arg)
690{
691	int error;
692	struct fd f = fdget(fd);
693
694	if (!f.file)
695		return -EBADF;
696	error = security_file_ioctl(f.file, cmd, arg);
697	if (!error)
698		error = do_vfs_ioctl(f.file, fd, cmd, arg);
699	fdput(f);
700	return error;
 
 
 
 
 
701}
v5.4
  1// SPDX-License-Identifier: GPL-2.0
  2/*
  3 *  linux/fs/ioctl.c
  4 *
  5 *  Copyright (C) 1991, 1992  Linus Torvalds
  6 */
  7
  8#include <linux/syscalls.h>
  9#include <linux/mm.h>
 10#include <linux/capability.h>
 11#include <linux/file.h>
 12#include <linux/fs.h>
 13#include <linux/security.h>
 14#include <linux/export.h>
 15#include <linux/uaccess.h>
 16#include <linux/writeback.h>
 17#include <linux/buffer_head.h>
 18#include <linux/falloc.h>
 19#include <linux/sched/signal.h>
 20
 21#include "internal.h"
 22
 23#include <asm/ioctls.h>
 24
 25/* So that the fiemap access checks can't overflow on 32 bit machines. */
 26#define FIEMAP_MAX_EXTENTS	(UINT_MAX / sizeof(struct fiemap_extent))
 27
 28/**
 29 * vfs_ioctl - call filesystem specific ioctl methods
 30 * @filp:	open file to invoke ioctl method on
 31 * @cmd:	ioctl command to execute
 32 * @arg:	command-specific argument for ioctl
 33 *
 34 * Invokes filesystem specific ->unlocked_ioctl, if one exists; otherwise
 35 * returns -ENOTTY.
 36 *
 37 * Returns 0 on success, -errno on error.
 38 */
 39long vfs_ioctl(struct file *filp, unsigned int cmd, unsigned long arg)
 40{
 41	int error = -ENOTTY;
 42
 43	if (!filp->f_op->unlocked_ioctl)
 44		goto out;
 45
 46	error = filp->f_op->unlocked_ioctl(filp, cmd, arg);
 47	if (error == -ENOIOCTLCMD)
 48		error = -ENOTTY;
 49 out:
 50	return error;
 51}
 52EXPORT_SYMBOL(vfs_ioctl);
 53
 54static int ioctl_fibmap(struct file *filp, int __user *p)
 55{
 56	struct address_space *mapping = filp->f_mapping;
 57	int res, block;
 58
 59	/* do we support this mess? */
 60	if (!mapping->a_ops->bmap)
 61		return -EINVAL;
 62	if (!capable(CAP_SYS_RAWIO))
 63		return -EPERM;
 64	res = get_user(block, p);
 65	if (res)
 66		return res;
 67	res = mapping->a_ops->bmap(mapping, block);
 68	return put_user(res, p);
 69}
 70
 71/**
 72 * fiemap_fill_next_extent - Fiemap helper function
 73 * @fieinfo:	Fiemap context passed into ->fiemap
 74 * @logical:	Extent logical start offset, in bytes
 75 * @phys:	Extent physical start offset, in bytes
 76 * @len:	Extent length, in bytes
 77 * @flags:	FIEMAP_EXTENT flags that describe this extent
 78 *
 79 * Called from file system ->fiemap callback. Will populate extent
 80 * info as passed in via arguments and copy to user memory. On
 81 * success, extent count on fieinfo is incremented.
 82 *
 83 * Returns 0 on success, -errno on error, 1 if this was the last
 84 * extent that will fit in user array.
 85 */
 86#define SET_UNKNOWN_FLAGS	(FIEMAP_EXTENT_DELALLOC)
 87#define SET_NO_UNMOUNTED_IO_FLAGS	(FIEMAP_EXTENT_DATA_ENCRYPTED)
 88#define SET_NOT_ALIGNED_FLAGS	(FIEMAP_EXTENT_DATA_TAIL|FIEMAP_EXTENT_DATA_INLINE)
 89int fiemap_fill_next_extent(struct fiemap_extent_info *fieinfo, u64 logical,
 90			    u64 phys, u64 len, u32 flags)
 91{
 92	struct fiemap_extent extent;
 93	struct fiemap_extent __user *dest = fieinfo->fi_extents_start;
 94
 95	/* only count the extents */
 96	if (fieinfo->fi_extents_max == 0) {
 97		fieinfo->fi_extents_mapped++;
 98		return (flags & FIEMAP_EXTENT_LAST) ? 1 : 0;
 99	}
100
101	if (fieinfo->fi_extents_mapped >= fieinfo->fi_extents_max)
102		return 1;
103
104	if (flags & SET_UNKNOWN_FLAGS)
105		flags |= FIEMAP_EXTENT_UNKNOWN;
106	if (flags & SET_NO_UNMOUNTED_IO_FLAGS)
107		flags |= FIEMAP_EXTENT_ENCODED;
108	if (flags & SET_NOT_ALIGNED_FLAGS)
109		flags |= FIEMAP_EXTENT_NOT_ALIGNED;
110
111	memset(&extent, 0, sizeof(extent));
112	extent.fe_logical = logical;
113	extent.fe_physical = phys;
114	extent.fe_length = len;
115	extent.fe_flags = flags;
116
117	dest += fieinfo->fi_extents_mapped;
118	if (copy_to_user(dest, &extent, sizeof(extent)))
119		return -EFAULT;
120
121	fieinfo->fi_extents_mapped++;
122	if (fieinfo->fi_extents_mapped == fieinfo->fi_extents_max)
123		return 1;
124	return (flags & FIEMAP_EXTENT_LAST) ? 1 : 0;
125}
126EXPORT_SYMBOL(fiemap_fill_next_extent);
127
128/**
129 * fiemap_check_flags - check validity of requested flags for fiemap
130 * @fieinfo:	Fiemap context passed into ->fiemap
131 * @fs_flags:	Set of fiemap flags that the file system understands
132 *
133 * Called from file system ->fiemap callback. This will compute the
134 * intersection of valid fiemap flags and those that the fs supports. That
135 * value is then compared against the user supplied flags. In case of bad user
136 * flags, the invalid values will be written into the fieinfo structure, and
137 * -EBADR is returned, which tells ioctl_fiemap() to return those values to
138 * userspace. For this reason, a return code of -EBADR should be preserved.
139 *
140 * Returns 0 on success, -EBADR on bad flags.
141 */
142int fiemap_check_flags(struct fiemap_extent_info *fieinfo, u32 fs_flags)
143{
144	u32 incompat_flags;
145
146	incompat_flags = fieinfo->fi_flags & ~(FIEMAP_FLAGS_COMPAT & fs_flags);
147	if (incompat_flags) {
148		fieinfo->fi_flags = incompat_flags;
149		return -EBADR;
150	}
151	return 0;
152}
153EXPORT_SYMBOL(fiemap_check_flags);
154
155static int fiemap_check_ranges(struct super_block *sb,
156			       u64 start, u64 len, u64 *new_len)
157{
158	u64 maxbytes = (u64) sb->s_maxbytes;
159
160	*new_len = len;
161
162	if (len == 0)
163		return -EINVAL;
164
165	if (start > maxbytes)
166		return -EFBIG;
167
168	/*
169	 * Shrink request scope to what the fs can actually handle.
170	 */
171	if (len > maxbytes || (maxbytes - len) < start)
172		*new_len = maxbytes - start;
173
174	return 0;
175}
176
177static int ioctl_fiemap(struct file *filp, unsigned long arg)
178{
179	struct fiemap fiemap;
180	struct fiemap __user *ufiemap = (struct fiemap __user *) arg;
181	struct fiemap_extent_info fieinfo = { 0, };
182	struct inode *inode = file_inode(filp);
183	struct super_block *sb = inode->i_sb;
184	u64 len;
185	int error;
186
187	if (!inode->i_op->fiemap)
188		return -EOPNOTSUPP;
189
190	if (copy_from_user(&fiemap, ufiemap, sizeof(fiemap)))
191		return -EFAULT;
192
193	if (fiemap.fm_extent_count > FIEMAP_MAX_EXTENTS)
194		return -EINVAL;
195
196	error = fiemap_check_ranges(sb, fiemap.fm_start, fiemap.fm_length,
197				    &len);
198	if (error)
199		return error;
200
201	fieinfo.fi_flags = fiemap.fm_flags;
202	fieinfo.fi_extents_max = fiemap.fm_extent_count;
203	fieinfo.fi_extents_start = ufiemap->fm_extents;
204
205	if (fiemap.fm_extent_count != 0 &&
206	    !access_ok(fieinfo.fi_extents_start,
207		       fieinfo.fi_extents_max * sizeof(struct fiemap_extent)))
208		return -EFAULT;
209
210	if (fieinfo.fi_flags & FIEMAP_FLAG_SYNC)
211		filemap_write_and_wait(inode->i_mapping);
212
213	error = inode->i_op->fiemap(inode, &fieinfo, fiemap.fm_start, len);
214	fiemap.fm_flags = fieinfo.fi_flags;
215	fiemap.fm_mapped_extents = fieinfo.fi_extents_mapped;
216	if (copy_to_user(ufiemap, &fiemap, sizeof(fiemap)))
217		error = -EFAULT;
218
219	return error;
220}
221
222static long ioctl_file_clone(struct file *dst_file, unsigned long srcfd,
223			     u64 off, u64 olen, u64 destoff)
224{
225	struct fd src_file = fdget(srcfd);
226	loff_t cloned;
227	int ret;
228
229	if (!src_file.file)
230		return -EBADF;
231	ret = -EXDEV;
232	if (src_file.file->f_path.mnt != dst_file->f_path.mnt)
233		goto fdput;
234	cloned = vfs_clone_file_range(src_file.file, off, dst_file, destoff,
235				      olen, 0);
236	if (cloned < 0)
237		ret = cloned;
238	else if (olen && cloned != olen)
239		ret = -EINVAL;
240	else
241		ret = 0;
242fdput:
243	fdput(src_file);
244	return ret;
245}
246
247static long ioctl_file_clone_range(struct file *file, void __user *argp)
248{
249	struct file_clone_range args;
250
251	if (copy_from_user(&args, argp, sizeof(args)))
252		return -EFAULT;
253	return ioctl_file_clone(file, args.src_fd, args.src_offset,
254				args.src_length, args.dest_offset);
255}
256
257#ifdef CONFIG_BLOCK
258
259static inline sector_t logical_to_blk(struct inode *inode, loff_t offset)
260{
261	return (offset >> inode->i_blkbits);
262}
263
264static inline loff_t blk_to_logical(struct inode *inode, sector_t blk)
265{
266	return (blk << inode->i_blkbits);
267}
268
269/**
270 * __generic_block_fiemap - FIEMAP for block based inodes (no locking)
271 * @inode: the inode to map
272 * @fieinfo: the fiemap info struct that will be passed back to userspace
273 * @start: where to start mapping in the inode
274 * @len: how much space to map
275 * @get_block: the fs's get_block function
276 *
277 * This does FIEMAP for block based inodes.  Basically it will just loop
278 * through get_block until we hit the number of extents we want to map, or we
279 * go past the end of the file and hit a hole.
280 *
281 * If it is possible to have data blocks beyond a hole past @inode->i_size, then
282 * please do not use this function, it will stop at the first unmapped block
283 * beyond i_size.
284 *
285 * If you use this function directly, you need to do your own locking. Use
286 * generic_block_fiemap if you want the locking done for you.
287 */
288
289int __generic_block_fiemap(struct inode *inode,
290			   struct fiemap_extent_info *fieinfo, loff_t start,
291			   loff_t len, get_block_t *get_block)
292{
293	struct buffer_head map_bh;
294	sector_t start_blk, last_blk;
295	loff_t isize = i_size_read(inode);
296	u64 logical = 0, phys = 0, size = 0;
297	u32 flags = FIEMAP_EXTENT_MERGED;
298	bool past_eof = false, whole_file = false;
299	int ret = 0;
300
301	ret = fiemap_check_flags(fieinfo, FIEMAP_FLAG_SYNC);
302	if (ret)
303		return ret;
304
305	/*
306	 * Either the i_mutex or other appropriate locking needs to be held
307	 * since we expect isize to not change at all through the duration of
308	 * this call.
309	 */
310	if (len >= isize) {
311		whole_file = true;
312		len = isize;
313	}
314
315	/*
316	 * Some filesystems can't deal with being asked to map less than
317	 * blocksize, so make sure our len is at least block length.
318	 */
319	if (logical_to_blk(inode, len) == 0)
320		len = blk_to_logical(inode, 1);
321
322	start_blk = logical_to_blk(inode, start);
323	last_blk = logical_to_blk(inode, start + len - 1);
324
325	do {
326		/*
327		 * we set b_size to the total size we want so it will map as
328		 * many contiguous blocks as possible at once
329		 */
330		memset(&map_bh, 0, sizeof(struct buffer_head));
331		map_bh.b_size = len;
332
333		ret = get_block(inode, start_blk, &map_bh, 0);
334		if (ret)
335			break;
336
337		/* HOLE */
338		if (!buffer_mapped(&map_bh)) {
339			start_blk++;
340
341			/*
342			 * We want to handle the case where there is an
343			 * allocated block at the front of the file, and then
344			 * nothing but holes up to the end of the file properly,
345			 * to make sure that extent at the front gets properly
346			 * marked with FIEMAP_EXTENT_LAST
347			 */
348			if (!past_eof &&
349			    blk_to_logical(inode, start_blk) >= isize)
350				past_eof = 1;
351
352			/*
353			 * First hole after going past the EOF, this is our
354			 * last extent
355			 */
356			if (past_eof && size) {
357				flags = FIEMAP_EXTENT_MERGED|FIEMAP_EXTENT_LAST;
358				ret = fiemap_fill_next_extent(fieinfo, logical,
359							      phys, size,
360							      flags);
361			} else if (size) {
362				ret = fiemap_fill_next_extent(fieinfo, logical,
363							      phys, size, flags);
364				size = 0;
365			}
366
367			/* if we have holes up to/past EOF then we're done */
368			if (start_blk > last_blk || past_eof || ret)
369				break;
370		} else {
371			/*
372			 * We have gone over the length of what we wanted to
373			 * map, and it wasn't the entire file, so add the extent
374			 * we got last time and exit.
375			 *
376			 * This is for the case where say we want to map all the
377			 * way up to the second to the last block in a file, but
378			 * the last block is a hole, making the second to last
379			 * block FIEMAP_EXTENT_LAST.  In this case we want to
380			 * see if there is a hole after the second to last block
381			 * so we can mark it properly.  If we found data after
382			 * we exceeded the length we were requesting, then we
383			 * are good to go, just add the extent to the fieinfo
384			 * and break
385			 */
386			if (start_blk > last_blk && !whole_file) {
387				ret = fiemap_fill_next_extent(fieinfo, logical,
388							      phys, size,
389							      flags);
390				break;
391			}
392
393			/*
394			 * if size != 0 then we know we already have an extent
395			 * to add, so add it.
396			 */
397			if (size) {
398				ret = fiemap_fill_next_extent(fieinfo, logical,
399							      phys, size,
400							      flags);
401				if (ret)
402					break;
403			}
404
405			logical = blk_to_logical(inode, start_blk);
406			phys = blk_to_logical(inode, map_bh.b_blocknr);
407			size = map_bh.b_size;
408			flags = FIEMAP_EXTENT_MERGED;
409
410			start_blk += logical_to_blk(inode, size);
411
412			/*
413			 * If we are past the EOF, then we need to make sure as
414			 * soon as we find a hole that the last extent we found
415			 * is marked with FIEMAP_EXTENT_LAST
416			 */
417			if (!past_eof && logical + size >= isize)
418				past_eof = true;
419		}
420		cond_resched();
421		if (fatal_signal_pending(current)) {
422			ret = -EINTR;
423			break;
424		}
425
426	} while (1);
427
428	/* If ret is 1 then we just hit the end of the extent array */
429	if (ret == 1)
430		ret = 0;
431
432	return ret;
433}
434EXPORT_SYMBOL(__generic_block_fiemap);
435
436/**
437 * generic_block_fiemap - FIEMAP for block based inodes
438 * @inode: The inode to map
439 * @fieinfo: The mapping information
440 * @start: The initial block to map
441 * @len: The length of the extect to attempt to map
442 * @get_block: The block mapping function for the fs
443 *
444 * Calls __generic_block_fiemap to map the inode, after taking
445 * the inode's mutex lock.
446 */
447
448int generic_block_fiemap(struct inode *inode,
449			 struct fiemap_extent_info *fieinfo, u64 start,
450			 u64 len, get_block_t *get_block)
451{
452	int ret;
453	inode_lock(inode);
454	ret = __generic_block_fiemap(inode, fieinfo, start, len, get_block);
455	inode_unlock(inode);
456	return ret;
457}
458EXPORT_SYMBOL(generic_block_fiemap);
459
460#endif  /*  CONFIG_BLOCK  */
461
462/*
463 * This provides compatibility with legacy XFS pre-allocation ioctls
464 * which predate the fallocate syscall.
465 *
466 * Only the l_start, l_len and l_whence fields of the 'struct space_resv'
467 * are used here, rest are ignored.
468 */
469int ioctl_preallocate(struct file *filp, void __user *argp)
470{
471	struct inode *inode = file_inode(filp);
472	struct space_resv sr;
473
474	if (copy_from_user(&sr, argp, sizeof(sr)))
475		return -EFAULT;
476
477	switch (sr.l_whence) {
478	case SEEK_SET:
479		break;
480	case SEEK_CUR:
481		sr.l_start += filp->f_pos;
482		break;
483	case SEEK_END:
484		sr.l_start += i_size_read(inode);
485		break;
486	default:
487		return -EINVAL;
488	}
489
490	return vfs_fallocate(filp, FALLOC_FL_KEEP_SIZE, sr.l_start, sr.l_len);
491}
492
493static int file_ioctl(struct file *filp, unsigned int cmd,
494		unsigned long arg)
495{
496	struct inode *inode = file_inode(filp);
497	int __user *p = (int __user *)arg;
498
499	switch (cmd) {
500	case FIBMAP:
501		return ioctl_fibmap(filp, p);
502	case FIONREAD:
503		return put_user(i_size_read(inode) - filp->f_pos, p);
504	case FS_IOC_RESVSP:
505	case FS_IOC_RESVSP64:
506		return ioctl_preallocate(filp, p);
507	}
508
509	return vfs_ioctl(filp, cmd, arg);
510}
511
512static int ioctl_fionbio(struct file *filp, int __user *argp)
513{
514	unsigned int flag;
515	int on, error;
516
517	error = get_user(on, argp);
518	if (error)
519		return error;
520	flag = O_NONBLOCK;
521#ifdef __sparc__
522	/* SunOS compatibility item. */
523	if (O_NONBLOCK != O_NDELAY)
524		flag |= O_NDELAY;
525#endif
526	spin_lock(&filp->f_lock);
527	if (on)
528		filp->f_flags |= flag;
529	else
530		filp->f_flags &= ~flag;
531	spin_unlock(&filp->f_lock);
532	return error;
533}
534
535static int ioctl_fioasync(unsigned int fd, struct file *filp,
536			  int __user *argp)
537{
538	unsigned int flag;
539	int on, error;
540
541	error = get_user(on, argp);
542	if (error)
543		return error;
544	flag = on ? FASYNC : 0;
545
546	/* Did FASYNC state change ? */
547	if ((flag ^ filp->f_flags) & FASYNC) {
548		if (filp->f_op->fasync)
549			/* fasync() adjusts filp->f_flags */
550			error = filp->f_op->fasync(fd, filp, on);
551		else
552			error = -ENOTTY;
553	}
554	return error < 0 ? error : 0;
555}
556
557static int ioctl_fsfreeze(struct file *filp)
558{
559	struct super_block *sb = file_inode(filp)->i_sb;
560
561	if (!ns_capable(sb->s_user_ns, CAP_SYS_ADMIN))
562		return -EPERM;
563
564	/* If filesystem doesn't support freeze feature, return. */
565	if (sb->s_op->freeze_fs == NULL && sb->s_op->freeze_super == NULL)
566		return -EOPNOTSUPP;
567
568	/* Freeze */
569	if (sb->s_op->freeze_super)
570		return sb->s_op->freeze_super(sb);
571	return freeze_super(sb);
572}
573
574static int ioctl_fsthaw(struct file *filp)
575{
576	struct super_block *sb = file_inode(filp)->i_sb;
577
578	if (!ns_capable(sb->s_user_ns, CAP_SYS_ADMIN))
579		return -EPERM;
580
581	/* Thaw */
582	if (sb->s_op->thaw_super)
583		return sb->s_op->thaw_super(sb);
584	return thaw_super(sb);
585}
586
587static int ioctl_file_dedupe_range(struct file *file, void __user *arg)
588{
589	struct file_dedupe_range __user *argp = arg;
590	struct file_dedupe_range *same = NULL;
591	int ret;
592	unsigned long size;
593	u16 count;
594
595	if (get_user(count, &argp->dest_count)) {
596		ret = -EFAULT;
597		goto out;
598	}
599
600	size = offsetof(struct file_dedupe_range __user, info[count]);
601	if (size > PAGE_SIZE) {
602		ret = -ENOMEM;
603		goto out;
604	}
605
606	same = memdup_user(argp, size);
607	if (IS_ERR(same)) {
608		ret = PTR_ERR(same);
609		same = NULL;
610		goto out;
611	}
612
613	same->dest_count = count;
614	ret = vfs_dedupe_file_range(file, same);
615	if (ret)
616		goto out;
617
618	ret = copy_to_user(argp, same, size);
619	if (ret)
620		ret = -EFAULT;
621
622out:
623	kfree(same);
624	return ret;
625}
626
627/*
628 * When you add any new common ioctls to the switches above and below
629 * please update compat_sys_ioctl() too.
630 *
631 * do_vfs_ioctl() is not for drivers and not intended to be EXPORT_SYMBOL()'d.
632 * It's just a simple helper for sys_ioctl and compat_sys_ioctl.
633 */
634int do_vfs_ioctl(struct file *filp, unsigned int fd, unsigned int cmd,
635	     unsigned long arg)
636{
637	int error = 0;
638	int __user *argp = (int __user *)arg;
639	struct inode *inode = file_inode(filp);
640
641	switch (cmd) {
642	case FIOCLEX:
643		set_close_on_exec(fd, 1);
644		break;
645
646	case FIONCLEX:
647		set_close_on_exec(fd, 0);
648		break;
649
650	case FIONBIO:
651		error = ioctl_fionbio(filp, argp);
652		break;
653
654	case FIOASYNC:
655		error = ioctl_fioasync(fd, filp, argp);
656		break;
657
658	case FIOQSIZE:
659		if (S_ISDIR(inode->i_mode) || S_ISREG(inode->i_mode) ||
660		    S_ISLNK(inode->i_mode)) {
661			loff_t res = inode_get_bytes(inode);
662			error = copy_to_user(argp, &res, sizeof(res)) ?
663					-EFAULT : 0;
664		} else
665			error = -ENOTTY;
666		break;
667
668	case FIFREEZE:
669		error = ioctl_fsfreeze(filp);
670		break;
671
672	case FITHAW:
673		error = ioctl_fsthaw(filp);
674		break;
675
676	case FS_IOC_FIEMAP:
677		return ioctl_fiemap(filp, arg);
678
679	case FIGETBSZ:
680		/* anon_bdev filesystems may not have a block size */
681		if (!inode->i_sb->s_blocksize)
682			return -EINVAL;
683		return put_user(inode->i_sb->s_blocksize, argp);
684
685	case FICLONE:
686		return ioctl_file_clone(filp, arg, 0, 0, 0);
687
688	case FICLONERANGE:
689		return ioctl_file_clone_range(filp, argp);
690
691	case FIDEDUPERANGE:
692		return ioctl_file_dedupe_range(filp, argp);
693
694	default:
695		if (S_ISREG(inode->i_mode))
696			error = file_ioctl(filp, cmd, arg);
697		else
698			error = vfs_ioctl(filp, cmd, arg);
699		break;
700	}
701	return error;
702}
703
704int ksys_ioctl(unsigned int fd, unsigned int cmd, unsigned long arg)
705{
706	int error;
707	struct fd f = fdget(fd);
708
709	if (!f.file)
710		return -EBADF;
711	error = security_file_ioctl(f.file, cmd, arg);
712	if (!error)
713		error = do_vfs_ioctl(f.file, fd, cmd, arg);
714	fdput(f);
715	return error;
716}
717
718SYSCALL_DEFINE3(ioctl, unsigned int, fd, unsigned int, cmd, unsigned long, arg)
719{
720	return ksys_ioctl(fd, cmd, arg);
721}