Linux Audio

Check our new training course

Open-source upstreaming

Need help getting support for your hardware into upstream Linux?
Loading...
v6.2
  1// SPDX-License-Identifier: GPL-2.0
  2/*
  3 *  linux/fs/ioctl.c
  4 *
  5 *  Copyright (C) 1991, 1992  Linus Torvalds
  6 */
  7
  8#include <linux/syscalls.h>
  9#include <linux/mm.h>
 10#include <linux/capability.h>
 11#include <linux/compat.h>
 12#include <linux/file.h>
 13#include <linux/fs.h>
 14#include <linux/security.h>
 15#include <linux/export.h>
 16#include <linux/uaccess.h>
 17#include <linux/writeback.h>
 18#include <linux/buffer_head.h>
 19#include <linux/falloc.h>
 20#include <linux/sched/signal.h>
 21#include <linux/fiemap.h>
 22#include <linux/mount.h>
 23#include <linux/fscrypt.h>
 24#include <linux/fileattr.h>
 25
 26#include "internal.h"
 27
 28#include <asm/ioctls.h>
 29
 30/* So that the fiemap access checks can't overflow on 32 bit machines. */
 31#define FIEMAP_MAX_EXTENTS	(UINT_MAX / sizeof(struct fiemap_extent))
 32
 33/**
 34 * vfs_ioctl - call filesystem specific ioctl methods
 35 * @filp:	open file to invoke ioctl method on
 36 * @cmd:	ioctl command to execute
 37 * @arg:	command-specific argument for ioctl
 38 *
 39 * Invokes filesystem specific ->unlocked_ioctl, if one exists; otherwise
 40 * returns -ENOTTY.
 41 *
 42 * Returns 0 on success, -errno on error.
 43 */
 44long vfs_ioctl(struct file *filp, unsigned int cmd, unsigned long arg)
 45{
 46	int error = -ENOTTY;
 47
 48	if (!filp->f_op->unlocked_ioctl)
 49		goto out;
 50
 51	error = filp->f_op->unlocked_ioctl(filp, cmd, arg);
 52	if (error == -ENOIOCTLCMD)
 53		error = -ENOTTY;
 54 out:
 55	return error;
 56}
 57EXPORT_SYMBOL(vfs_ioctl);
 58
 59static int ioctl_fibmap(struct file *filp, int __user *p)
 60{
 61	struct inode *inode = file_inode(filp);
 62	struct super_block *sb = inode->i_sb;
 63	int error, ur_block;
 64	sector_t block;
 65
 66	if (!capable(CAP_SYS_RAWIO))
 67		return -EPERM;
 68
 69	error = get_user(ur_block, p);
 70	if (error)
 71		return error;
 72
 73	if (ur_block < 0)
 74		return -EINVAL;
 75
 76	block = ur_block;
 77	error = bmap(inode, &block);
 78
 79	if (block > INT_MAX) {
 80		error = -ERANGE;
 81		pr_warn_ratelimited("[%s/%d] FS: %s File: %pD4 would truncate fibmap result\n",
 82				    current->comm, task_pid_nr(current),
 83				    sb->s_id, filp);
 84	}
 85
 86	if (error)
 87		ur_block = 0;
 88	else
 89		ur_block = block;
 90
 91	if (put_user(ur_block, p))
 92		error = -EFAULT;
 93
 94	return error;
 95}
 96
 97/**
 98 * fiemap_fill_next_extent - Fiemap helper function
 99 * @fieinfo:	Fiemap context passed into ->fiemap
100 * @logical:	Extent logical start offset, in bytes
101 * @phys:	Extent physical start offset, in bytes
102 * @len:	Extent length, in bytes
103 * @flags:	FIEMAP_EXTENT flags that describe this extent
104 *
105 * Called from file system ->fiemap callback. Will populate extent
106 * info as passed in via arguments and copy to user memory. On
107 * success, extent count on fieinfo is incremented.
108 *
109 * Returns 0 on success, -errno on error, 1 if this was the last
110 * extent that will fit in user array.
111 */
112#define SET_UNKNOWN_FLAGS	(FIEMAP_EXTENT_DELALLOC)
113#define SET_NO_UNMOUNTED_IO_FLAGS	(FIEMAP_EXTENT_DATA_ENCRYPTED)
114#define SET_NOT_ALIGNED_FLAGS	(FIEMAP_EXTENT_DATA_TAIL|FIEMAP_EXTENT_DATA_INLINE)
115int fiemap_fill_next_extent(struct fiemap_extent_info *fieinfo, u64 logical,
116			    u64 phys, u64 len, u32 flags)
117{
118	struct fiemap_extent extent;
119	struct fiemap_extent __user *dest = fieinfo->fi_extents_start;
120
121	/* only count the extents */
122	if (fieinfo->fi_extents_max == 0) {
123		fieinfo->fi_extents_mapped++;
124		return (flags & FIEMAP_EXTENT_LAST) ? 1 : 0;
125	}
126
127	if (fieinfo->fi_extents_mapped >= fieinfo->fi_extents_max)
128		return 1;
129
130	if (flags & SET_UNKNOWN_FLAGS)
131		flags |= FIEMAP_EXTENT_UNKNOWN;
132	if (flags & SET_NO_UNMOUNTED_IO_FLAGS)
133		flags |= FIEMAP_EXTENT_ENCODED;
134	if (flags & SET_NOT_ALIGNED_FLAGS)
135		flags |= FIEMAP_EXTENT_NOT_ALIGNED;
136
137	memset(&extent, 0, sizeof(extent));
138	extent.fe_logical = logical;
139	extent.fe_physical = phys;
140	extent.fe_length = len;
141	extent.fe_flags = flags;
142
143	dest += fieinfo->fi_extents_mapped;
144	if (copy_to_user(dest, &extent, sizeof(extent)))
145		return -EFAULT;
146
147	fieinfo->fi_extents_mapped++;
148	if (fieinfo->fi_extents_mapped == fieinfo->fi_extents_max)
149		return 1;
150	return (flags & FIEMAP_EXTENT_LAST) ? 1 : 0;
151}
152EXPORT_SYMBOL(fiemap_fill_next_extent);
153
154/**
155 * fiemap_prep - check validity of requested flags for fiemap
156 * @inode:	Inode to operate on
157 * @fieinfo:	Fiemap context passed into ->fiemap
158 * @start:	Start of the mapped range
159 * @len:	Length of the mapped range, can be truncated by this function.
160 * @supported_flags:	Set of fiemap flags that the file system understands
161 *
162 * This function must be called from each ->fiemap instance to validate the
163 * fiemap request against the file system parameters.
164 *
165 * Returns 0 on success, or a negative error on failure.
166 */
167int fiemap_prep(struct inode *inode, struct fiemap_extent_info *fieinfo,
168		u64 start, u64 *len, u32 supported_flags)
169{
170	u64 maxbytes = inode->i_sb->s_maxbytes;
171	u32 incompat_flags;
172	int ret = 0;
173
174	if (*len == 0)
175		return -EINVAL;
176	if (start >= maxbytes)
177		return -EFBIG;
178
179	/*
180	 * Shrink request scope to what the fs can actually handle.
181	 */
182	if (*len > maxbytes || (maxbytes - *len) < start)
183		*len = maxbytes - start;
184
185	supported_flags |= FIEMAP_FLAG_SYNC;
186	supported_flags &= FIEMAP_FLAGS_COMPAT;
187	incompat_flags = fieinfo->fi_flags & ~supported_flags;
188	if (incompat_flags) {
189		fieinfo->fi_flags = incompat_flags;
190		return -EBADR;
191	}
192
193	if (fieinfo->fi_flags & FIEMAP_FLAG_SYNC)
194		ret = filemap_write_and_wait(inode->i_mapping);
195	return ret;
196}
197EXPORT_SYMBOL(fiemap_prep);
198
199static int ioctl_fiemap(struct file *filp, struct fiemap __user *ufiemap)
200{
201	struct fiemap fiemap;
202	struct fiemap_extent_info fieinfo = { 0, };
203	struct inode *inode = file_inode(filp);
204	int error;
205
206	if (!inode->i_op->fiemap)
207		return -EOPNOTSUPP;
208
209	if (copy_from_user(&fiemap, ufiemap, sizeof(fiemap)))
210		return -EFAULT;
211
212	if (fiemap.fm_extent_count > FIEMAP_MAX_EXTENTS)
213		return -EINVAL;
214
215	fieinfo.fi_flags = fiemap.fm_flags;
216	fieinfo.fi_extents_max = fiemap.fm_extent_count;
217	fieinfo.fi_extents_start = ufiemap->fm_extents;
218
219	error = inode->i_op->fiemap(inode, &fieinfo, fiemap.fm_start,
220			fiemap.fm_length);
221
222	fiemap.fm_flags = fieinfo.fi_flags;
223	fiemap.fm_mapped_extents = fieinfo.fi_extents_mapped;
224	if (copy_to_user(ufiemap, &fiemap, sizeof(fiemap)))
225		error = -EFAULT;
226
227	return error;
228}
229
230static long ioctl_file_clone(struct file *dst_file, unsigned long srcfd,
231			     u64 off, u64 olen, u64 destoff)
232{
233	struct fd src_file = fdget(srcfd);
234	loff_t cloned;
235	int ret;
236
237	if (!src_file.file)
238		return -EBADF;
 
 
 
239	cloned = vfs_clone_file_range(src_file.file, off, dst_file, destoff,
240				      olen, 0);
241	if (cloned < 0)
242		ret = cloned;
243	else if (olen && cloned != olen)
244		ret = -EINVAL;
245	else
246		ret = 0;
 
247	fdput(src_file);
248	return ret;
249}
250
251static long ioctl_file_clone_range(struct file *file,
252				   struct file_clone_range __user *argp)
253{
254	struct file_clone_range args;
255
256	if (copy_from_user(&args, argp, sizeof(args)))
257		return -EFAULT;
258	return ioctl_file_clone(file, args.src_fd, args.src_offset,
259				args.src_length, args.dest_offset);
260}
261
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
262/*
263 * This provides compatibility with legacy XFS pre-allocation ioctls
264 * which predate the fallocate syscall.
265 *
266 * Only the l_start, l_len and l_whence fields of the 'struct space_resv'
267 * are used here, rest are ignored.
268 */
269static int ioctl_preallocate(struct file *filp, int mode, void __user *argp)
270{
271	struct inode *inode = file_inode(filp);
272	struct space_resv sr;
273
274	if (copy_from_user(&sr, argp, sizeof(sr)))
275		return -EFAULT;
276
277	switch (sr.l_whence) {
278	case SEEK_SET:
279		break;
280	case SEEK_CUR:
281		sr.l_start += filp->f_pos;
282		break;
283	case SEEK_END:
284		sr.l_start += i_size_read(inode);
285		break;
286	default:
287		return -EINVAL;
288	}
289
290	return vfs_fallocate(filp, mode | FALLOC_FL_KEEP_SIZE, sr.l_start,
291			sr.l_len);
292}
293
/* on ia32 l_start is on a 32-bit boundary */
#if defined CONFIG_COMPAT && defined(CONFIG_X86_64)
/*
 * Same as ioctl_preallocate(), but reads the request through
 * 'struct space_resv_32' to account for the different alignment.
 */
static int compat_ioctl_preallocate(struct file *file, int mode,
				    struct space_resv_32 __user *argp)
{
	struct inode *inode = file_inode(file);
	struct space_resv_32 sr;

	if (copy_from_user(&sr, argp, sizeof(sr)))
		return -EFAULT;

	/* Turn l_start into an absolute offset according to l_whence. */
	if (sr.l_whence == SEEK_CUR)
		sr.l_start += file->f_pos;
	else if (sr.l_whence == SEEK_END)
		sr.l_start += i_size_read(inode);
	else if (sr.l_whence != SEEK_SET)
		return -EINVAL;

	return vfs_fallocate(file, mode | FALLOC_FL_KEEP_SIZE, sr.l_start,
			     sr.l_len);
}
#endif
322
323static int file_ioctl(struct file *filp, unsigned int cmd, int __user *p)
324{
325	switch (cmd) {
326	case FIBMAP:
327		return ioctl_fibmap(filp, p);
328	case FS_IOC_RESVSP:
329	case FS_IOC_RESVSP64:
330		return ioctl_preallocate(filp, 0, p);
331	case FS_IOC_UNRESVSP:
332	case FS_IOC_UNRESVSP64:
333		return ioctl_preallocate(filp, FALLOC_FL_PUNCH_HOLE, p);
334	case FS_IOC_ZERO_RANGE:
335		return ioctl_preallocate(filp, FALLOC_FL_ZERO_RANGE, p);
336	}
337
338	return -ENOIOCTLCMD;
339}
340
341static int ioctl_fionbio(struct file *filp, int __user *argp)
342{
343	unsigned int flag;
344	int on, error;
345
346	error = get_user(on, argp);
347	if (error)
348		return error;
349	flag = O_NONBLOCK;
350#ifdef __sparc__
351	/* SunOS compatibility item. */
352	if (O_NONBLOCK != O_NDELAY)
353		flag |= O_NDELAY;
354#endif
355	spin_lock(&filp->f_lock);
356	if (on)
357		filp->f_flags |= flag;
358	else
359		filp->f_flags &= ~flag;
360	spin_unlock(&filp->f_lock);
361	return error;
362}
363
364static int ioctl_fioasync(unsigned int fd, struct file *filp,
365			  int __user *argp)
366{
367	unsigned int flag;
368	int on, error;
369
370	error = get_user(on, argp);
371	if (error)
372		return error;
373	flag = on ? FASYNC : 0;
374
375	/* Did FASYNC state change ? */
376	if ((flag ^ filp->f_flags) & FASYNC) {
377		if (filp->f_op->fasync)
378			/* fasync() adjusts filp->f_flags */
379			error = filp->f_op->fasync(fd, filp, on);
380		else
381			error = -ENOTTY;
382	}
383	return error < 0 ? error : 0;
384}
385
386static int ioctl_fsfreeze(struct file *filp)
387{
388	struct super_block *sb = file_inode(filp)->i_sb;
389
390	if (!ns_capable(sb->s_user_ns, CAP_SYS_ADMIN))
391		return -EPERM;
392
393	/* If filesystem doesn't support freeze feature, return. */
394	if (sb->s_op->freeze_fs == NULL && sb->s_op->freeze_super == NULL)
395		return -EOPNOTSUPP;
396
397	/* Freeze */
398	if (sb->s_op->freeze_super)
399		return sb->s_op->freeze_super(sb);
400	return freeze_super(sb);
401}
402
403static int ioctl_fsthaw(struct file *filp)
404{
405	struct super_block *sb = file_inode(filp)->i_sb;
406
407	if (!ns_capable(sb->s_user_ns, CAP_SYS_ADMIN))
408		return -EPERM;
409
410	/* Thaw */
411	if (sb->s_op->thaw_super)
412		return sb->s_op->thaw_super(sb);
413	return thaw_super(sb);
414}
415
416static int ioctl_file_dedupe_range(struct file *file,
417				   struct file_dedupe_range __user *argp)
418{
419	struct file_dedupe_range *same = NULL;
420	int ret;
421	unsigned long size;
422	u16 count;
423
424	if (get_user(count, &argp->dest_count)) {
425		ret = -EFAULT;
426		goto out;
427	}
428
429	size = offsetof(struct file_dedupe_range, info[count]);
430	if (size > PAGE_SIZE) {
431		ret = -ENOMEM;
432		goto out;
433	}
434
435	same = memdup_user(argp, size);
436	if (IS_ERR(same)) {
437		ret = PTR_ERR(same);
438		same = NULL;
439		goto out;
440	}
441
442	same->dest_count = count;
443	ret = vfs_dedupe_file_range(file, same);
444	if (ret)
445		goto out;
446
447	ret = copy_to_user(argp, same, size);
448	if (ret)
449		ret = -EFAULT;
450
451out:
452	kfree(same);
453	return ret;
454}
455
456/**
457 * fileattr_fill_xflags - initialize fileattr with xflags
458 * @fa:		fileattr pointer
459 * @xflags:	FS_XFLAG_* flags
460 *
461 * Set ->fsx_xflags, ->fsx_valid and ->flags (translated xflags).  All
462 * other fields are zeroed.
463 */
464void fileattr_fill_xflags(struct fileattr *fa, u32 xflags)
465{
466	memset(fa, 0, sizeof(*fa));
467	fa->fsx_valid = true;
468	fa->fsx_xflags = xflags;
469	if (fa->fsx_xflags & FS_XFLAG_IMMUTABLE)
470		fa->flags |= FS_IMMUTABLE_FL;
471	if (fa->fsx_xflags & FS_XFLAG_APPEND)
472		fa->flags |= FS_APPEND_FL;
473	if (fa->fsx_xflags & FS_XFLAG_SYNC)
474		fa->flags |= FS_SYNC_FL;
475	if (fa->fsx_xflags & FS_XFLAG_NOATIME)
476		fa->flags |= FS_NOATIME_FL;
477	if (fa->fsx_xflags & FS_XFLAG_NODUMP)
478		fa->flags |= FS_NODUMP_FL;
479	if (fa->fsx_xflags & FS_XFLAG_DAX)
480		fa->flags |= FS_DAX_FL;
481	if (fa->fsx_xflags & FS_XFLAG_PROJINHERIT)
482		fa->flags |= FS_PROJINHERIT_FL;
483}
484EXPORT_SYMBOL(fileattr_fill_xflags);
485
486/**
487 * fileattr_fill_flags - initialize fileattr with flags
488 * @fa:		fileattr pointer
489 * @flags:	FS_*_FL flags
490 *
491 * Set ->flags, ->flags_valid and ->fsx_xflags (translated flags).
492 * All other fields are zeroed.
493 */
494void fileattr_fill_flags(struct fileattr *fa, u32 flags)
495{
496	memset(fa, 0, sizeof(*fa));
497	fa->flags_valid = true;
498	fa->flags = flags;
499	if (fa->flags & FS_SYNC_FL)
500		fa->fsx_xflags |= FS_XFLAG_SYNC;
501	if (fa->flags & FS_IMMUTABLE_FL)
502		fa->fsx_xflags |= FS_XFLAG_IMMUTABLE;
503	if (fa->flags & FS_APPEND_FL)
504		fa->fsx_xflags |= FS_XFLAG_APPEND;
505	if (fa->flags & FS_NODUMP_FL)
506		fa->fsx_xflags |= FS_XFLAG_NODUMP;
507	if (fa->flags & FS_NOATIME_FL)
508		fa->fsx_xflags |= FS_XFLAG_NOATIME;
509	if (fa->flags & FS_DAX_FL)
510		fa->fsx_xflags |= FS_XFLAG_DAX;
511	if (fa->flags & FS_PROJINHERIT_FL)
512		fa->fsx_xflags |= FS_XFLAG_PROJINHERIT;
513}
514EXPORT_SYMBOL(fileattr_fill_flags);
515
516/**
517 * vfs_fileattr_get - retrieve miscellaneous file attributes
518 * @dentry:	the object to retrieve from
519 * @fa:		fileattr pointer
520 *
521 * Call i_op->fileattr_get() callback, if exists.
522 *
523 * Return: 0 on success, or a negative error on failure.
524 */
525int vfs_fileattr_get(struct dentry *dentry, struct fileattr *fa)
526{
527	struct inode *inode = d_inode(dentry);
528
529	if (!inode->i_op->fileattr_get)
530		return -ENOIOCTLCMD;
531
532	return inode->i_op->fileattr_get(dentry, fa);
533}
534EXPORT_SYMBOL(vfs_fileattr_get);
535
536/**
537 * copy_fsxattr_to_user - copy fsxattr to userspace.
538 * @fa:		fileattr pointer
539 * @ufa:	fsxattr user pointer
540 *
541 * Return: 0 on success, or -EFAULT on failure.
542 */
543int copy_fsxattr_to_user(const struct fileattr *fa, struct fsxattr __user *ufa)
544{
545	struct fsxattr xfa;
546
547	memset(&xfa, 0, sizeof(xfa));
548	xfa.fsx_xflags = fa->fsx_xflags;
549	xfa.fsx_extsize = fa->fsx_extsize;
550	xfa.fsx_nextents = fa->fsx_nextents;
551	xfa.fsx_projid = fa->fsx_projid;
552	xfa.fsx_cowextsize = fa->fsx_cowextsize;
553
554	if (copy_to_user(ufa, &xfa, sizeof(xfa)))
555		return -EFAULT;
556
557	return 0;
558}
559EXPORT_SYMBOL(copy_fsxattr_to_user);
560
561static int copy_fsxattr_from_user(struct fileattr *fa,
562				  struct fsxattr __user *ufa)
563{
564	struct fsxattr xfa;
565
566	if (copy_from_user(&xfa, ufa, sizeof(xfa)))
567		return -EFAULT;
568
569	fileattr_fill_xflags(fa, xfa.fsx_xflags);
570	fa->fsx_extsize = xfa.fsx_extsize;
571	fa->fsx_nextents = xfa.fsx_nextents;
572	fa->fsx_projid = xfa.fsx_projid;
573	fa->fsx_cowextsize = xfa.fsx_cowextsize;
574
575	return 0;
576}
577
578/*
579 * Generic function to check FS_IOC_FSSETXATTR/FS_IOC_SETFLAGS values and reject
580 * any invalid configurations.
581 *
582 * Note: must be called with inode lock held.
583 */
584static int fileattr_set_prepare(struct inode *inode,
585			      const struct fileattr *old_ma,
586			      struct fileattr *fa)
587{
588	int err;
589
590	/*
591	 * The IMMUTABLE and APPEND_ONLY flags can only be changed by
592	 * the relevant capability.
593	 */
594	if ((fa->flags ^ old_ma->flags) & (FS_APPEND_FL | FS_IMMUTABLE_FL) &&
595	    !capable(CAP_LINUX_IMMUTABLE))
596		return -EPERM;
597
598	err = fscrypt_prepare_setflags(inode, old_ma->flags, fa->flags);
599	if (err)
600		return err;
601
602	/*
603	 * Project Quota ID state is only allowed to change from within the init
604	 * namespace. Enforce that restriction only if we are trying to change
605	 * the quota ID state. Everything else is allowed in user namespaces.
606	 */
607	if (current_user_ns() != &init_user_ns) {
608		if (old_ma->fsx_projid != fa->fsx_projid)
609			return -EINVAL;
610		if ((old_ma->fsx_xflags ^ fa->fsx_xflags) &
611				FS_XFLAG_PROJINHERIT)
612			return -EINVAL;
613	} else {
614		/*
615		 * Caller is allowed to change the project ID. If it is being
616		 * changed, make sure that the new value is valid.
617		 */
618		if (old_ma->fsx_projid != fa->fsx_projid &&
619		    !projid_valid(make_kprojid(&init_user_ns, fa->fsx_projid)))
620			return -EINVAL;
621	}
622
623	/* Check extent size hints. */
624	if ((fa->fsx_xflags & FS_XFLAG_EXTSIZE) && !S_ISREG(inode->i_mode))
625		return -EINVAL;
626
627	if ((fa->fsx_xflags & FS_XFLAG_EXTSZINHERIT) &&
628			!S_ISDIR(inode->i_mode))
629		return -EINVAL;
630
631	if ((fa->fsx_xflags & FS_XFLAG_COWEXTSIZE) &&
632	    !S_ISREG(inode->i_mode) && !S_ISDIR(inode->i_mode))
633		return -EINVAL;
634
635	/*
636	 * It is only valid to set the DAX flag on regular files and
637	 * directories on filesystems.
638	 */
639	if ((fa->fsx_xflags & FS_XFLAG_DAX) &&
640	    !(S_ISREG(inode->i_mode) || S_ISDIR(inode->i_mode)))
641		return -EINVAL;
642
643	/* Extent size hints of zero turn off the flags. */
644	if (fa->fsx_extsize == 0)
645		fa->fsx_xflags &= ~(FS_XFLAG_EXTSIZE | FS_XFLAG_EXTSZINHERIT);
646	if (fa->fsx_cowextsize == 0)
647		fa->fsx_xflags &= ~FS_XFLAG_COWEXTSIZE;
648
649	return 0;
650}
651
652/**
653 * vfs_fileattr_set - change miscellaneous file attributes
654 * @mnt_userns:	user namespace of the mount
655 * @dentry:	the object to change
656 * @fa:		fileattr pointer
657 *
658 * After verifying permissions, call i_op->fileattr_set() callback, if
659 * exists.
660 *
661 * Verifying attributes involves retrieving current attributes with
662 * i_op->fileattr_get(), this also allows initializing attributes that have
663 * not been set by the caller to current values.  Inode lock is held
664 * thoughout to prevent racing with another instance.
665 *
666 * Return: 0 on success, or a negative error on failure.
667 */
668int vfs_fileattr_set(struct user_namespace *mnt_userns, struct dentry *dentry,
669		     struct fileattr *fa)
670{
671	struct inode *inode = d_inode(dentry);
672	struct fileattr old_ma = {};
673	int err;
674
675	if (!inode->i_op->fileattr_set)
676		return -ENOIOCTLCMD;
677
678	if (!inode_owner_or_capable(mnt_userns, inode))
679		return -EPERM;
680
681	inode_lock(inode);
682	err = vfs_fileattr_get(dentry, &old_ma);
683	if (!err) {
684		/* initialize missing bits from old_ma */
685		if (fa->flags_valid) {
686			fa->fsx_xflags |= old_ma.fsx_xflags & ~FS_XFLAG_COMMON;
687			fa->fsx_extsize = old_ma.fsx_extsize;
688			fa->fsx_nextents = old_ma.fsx_nextents;
689			fa->fsx_projid = old_ma.fsx_projid;
690			fa->fsx_cowextsize = old_ma.fsx_cowextsize;
691		} else {
692			fa->flags |= old_ma.flags & ~FS_COMMON_FL;
693		}
694		err = fileattr_set_prepare(inode, &old_ma, fa);
695		if (!err)
696			err = inode->i_op->fileattr_set(mnt_userns, dentry, fa);
697	}
698	inode_unlock(inode);
699
700	return err;
701}
702EXPORT_SYMBOL(vfs_fileattr_set);
703
704static int ioctl_getflags(struct file *file, unsigned int __user *argp)
705{
706	struct fileattr fa = { .flags_valid = true }; /* hint only */
707	int err;
708
709	err = vfs_fileattr_get(file->f_path.dentry, &fa);
710	if (!err)
711		err = put_user(fa.flags, argp);
712	return err;
713}
714
715static int ioctl_setflags(struct file *file, unsigned int __user *argp)
716{
717	struct user_namespace *mnt_userns = file_mnt_user_ns(file);
718	struct dentry *dentry = file->f_path.dentry;
719	struct fileattr fa;
720	unsigned int flags;
721	int err;
722
723	err = get_user(flags, argp);
724	if (!err) {
725		err = mnt_want_write_file(file);
726		if (!err) {
727			fileattr_fill_flags(&fa, flags);
728			err = vfs_fileattr_set(mnt_userns, dentry, &fa);
729			mnt_drop_write_file(file);
730		}
731	}
732	return err;
733}
734
735static int ioctl_fsgetxattr(struct file *file, void __user *argp)
736{
737	struct fileattr fa = { .fsx_valid = true }; /* hint only */
738	int err;
739
740	err = vfs_fileattr_get(file->f_path.dentry, &fa);
741	if (!err)
742		err = copy_fsxattr_to_user(&fa, argp);
743
744	return err;
745}
746
747static int ioctl_fssetxattr(struct file *file, void __user *argp)
748{
749	struct user_namespace *mnt_userns = file_mnt_user_ns(file);
750	struct dentry *dentry = file->f_path.dentry;
751	struct fileattr fa;
752	int err;
753
754	err = copy_fsxattr_from_user(&fa, argp);
755	if (!err) {
756		err = mnt_want_write_file(file);
757		if (!err) {
758			err = vfs_fileattr_set(mnt_userns, dentry, &fa);
759			mnt_drop_write_file(file);
760		}
761	}
762	return err;
763}
764
765/*
766 * do_vfs_ioctl() is not for drivers and not intended to be EXPORT_SYMBOL()'d.
767 * It's just a simple helper for sys_ioctl and compat_sys_ioctl.
768 *
769 * When you add any new common ioctls to the switches above and below,
770 * please ensure they have compatible arguments in compat mode.
771 */
772static int do_vfs_ioctl(struct file *filp, unsigned int fd,
773			unsigned int cmd, unsigned long arg)
774{
775	void __user *argp = (void __user *)arg;
776	struct inode *inode = file_inode(filp);
777
778	switch (cmd) {
779	case FIOCLEX:
780		set_close_on_exec(fd, 1);
781		return 0;
782
783	case FIONCLEX:
784		set_close_on_exec(fd, 0);
785		return 0;
786
787	case FIONBIO:
788		return ioctl_fionbio(filp, argp);
789
790	case FIOASYNC:
791		return ioctl_fioasync(fd, filp, argp);
792
793	case FIOQSIZE:
794		if (S_ISDIR(inode->i_mode) || S_ISREG(inode->i_mode) ||
795		    S_ISLNK(inode->i_mode)) {
796			loff_t res = inode_get_bytes(inode);
797			return copy_to_user(argp, &res, sizeof(res)) ?
798					    -EFAULT : 0;
799		}
800
801		return -ENOTTY;
802
803	case FIFREEZE:
804		return ioctl_fsfreeze(filp);
805
806	case FITHAW:
807		return ioctl_fsthaw(filp);
808
809	case FS_IOC_FIEMAP:
810		return ioctl_fiemap(filp, argp);
811
812	case FIGETBSZ:
813		/* anon_bdev filesystems may not have a block size */
814		if (!inode->i_sb->s_blocksize)
815			return -EINVAL;
816
817		return put_user(inode->i_sb->s_blocksize, (int __user *)argp);
818
819	case FICLONE:
820		return ioctl_file_clone(filp, arg, 0, 0, 0);
821
822	case FICLONERANGE:
823		return ioctl_file_clone_range(filp, argp);
824
825	case FIDEDUPERANGE:
826		return ioctl_file_dedupe_range(filp, argp);
827
828	case FIONREAD:
829		if (!S_ISREG(inode->i_mode))
830			return vfs_ioctl(filp, cmd, arg);
831
832		return put_user(i_size_read(inode) - filp->f_pos,
833				(int __user *)argp);
834
835	case FS_IOC_GETFLAGS:
836		return ioctl_getflags(filp, argp);
837
838	case FS_IOC_SETFLAGS:
839		return ioctl_setflags(filp, argp);
840
841	case FS_IOC_FSGETXATTR:
842		return ioctl_fsgetxattr(filp, argp);
843
844	case FS_IOC_FSSETXATTR:
845		return ioctl_fssetxattr(filp, argp);
846
847	default:
848		if (S_ISREG(inode->i_mode))
849			return file_ioctl(filp, cmd, argp);
850		break;
851	}
852
853	return -ENOIOCTLCMD;
854}
855
856SYSCALL_DEFINE3(ioctl, unsigned int, fd, unsigned int, cmd, unsigned long, arg)
857{
858	struct fd f = fdget(fd);
859	int error;
860
861	if (!f.file)
862		return -EBADF;
863
864	error = security_file_ioctl(f.file, cmd, arg);
865	if (error)
866		goto out;
867
868	error = do_vfs_ioctl(f.file, fd, cmd, arg);
869	if (error == -ENOIOCTLCMD)
870		error = vfs_ioctl(f.file, cmd, arg);
871
872out:
873	fdput(f);
874	return error;
875}
876
877#ifdef CONFIG_COMPAT
878/**
879 * compat_ptr_ioctl - generic implementation of .compat_ioctl file operation
880 *
881 * This is not normally called as a function, but instead set in struct
882 * file_operations as
883 *
884 *     .compat_ioctl = compat_ptr_ioctl,
885 *
886 * On most architectures, the compat_ptr_ioctl() just passes all arguments
887 * to the corresponding ->ioctl handler. The exception is arch/s390, where
888 * compat_ptr() clears the top bit of a 32-bit pointer value, so user space
889 * pointers to the second 2GB alias the first 2GB, as is the case for
890 * native 32-bit s390 user space.
891 *
892 * The compat_ptr_ioctl() function must therefore be used only with ioctl
893 * functions that either ignore the argument or pass a pointer to a
894 * compatible data type.
895 *
896 * If any ioctl command handled by fops->unlocked_ioctl passes a plain
897 * integer instead of a pointer, or any of the passed data types
898 * is incompatible between 32-bit and 64-bit architectures, a proper
899 * handler is required instead of compat_ptr_ioctl.
900 */
901long compat_ptr_ioctl(struct file *file, unsigned int cmd, unsigned long arg)
902{
903	if (!file->f_op->unlocked_ioctl)
904		return -ENOIOCTLCMD;
905
906	return file->f_op->unlocked_ioctl(file, cmd, (unsigned long)compat_ptr(arg));
907}
908EXPORT_SYMBOL(compat_ptr_ioctl);
909
910COMPAT_SYSCALL_DEFINE3(ioctl, unsigned int, fd, unsigned int, cmd,
911		       compat_ulong_t, arg)
912{
913	struct fd f = fdget(fd);
914	int error;
915
916	if (!f.file)
917		return -EBADF;
918
919	/* RED-PEN how should LSM module know it's handling 32bit? */
920	error = security_file_ioctl(f.file, cmd, arg);
921	if (error)
922		goto out;
923
924	switch (cmd) {
925	/* FICLONE takes an int argument, so don't use compat_ptr() */
926	case FICLONE:
927		error = ioctl_file_clone(f.file, arg, 0, 0, 0);
928		break;
929
930#if defined(CONFIG_X86_64)
931	/* these get messy on amd64 due to alignment differences */
932	case FS_IOC_RESVSP_32:
933	case FS_IOC_RESVSP64_32:
934		error = compat_ioctl_preallocate(f.file, 0, compat_ptr(arg));
935		break;
936	case FS_IOC_UNRESVSP_32:
937	case FS_IOC_UNRESVSP64_32:
938		error = compat_ioctl_preallocate(f.file, FALLOC_FL_PUNCH_HOLE,
939				compat_ptr(arg));
940		break;
941	case FS_IOC_ZERO_RANGE_32:
942		error = compat_ioctl_preallocate(f.file, FALLOC_FL_ZERO_RANGE,
943				compat_ptr(arg));
944		break;
945#endif
946
947	/*
948	 * These access 32-bit values anyway so no further handling is
949	 * necessary.
950	 */
951	case FS_IOC32_GETFLAGS:
952	case FS_IOC32_SETFLAGS:
953		cmd = (cmd == FS_IOC32_GETFLAGS) ?
954			FS_IOC_GETFLAGS : FS_IOC_SETFLAGS;
955		fallthrough;
956	/*
957	 * everything else in do_vfs_ioctl() takes either a compatible
958	 * pointer argument or no argument -- call it with a modified
959	 * argument.
960	 */
961	default:
962		error = do_vfs_ioctl(f.file, fd, cmd,
963				     (unsigned long)compat_ptr(arg));
964		if (error != -ENOIOCTLCMD)
965			break;
966
967		if (f.file->f_op->compat_ioctl)
968			error = f.file->f_op->compat_ioctl(f.file, cmd, arg);
969		if (error == -ENOIOCTLCMD)
970			error = -ENOTTY;
971		break;
972	}
973
974 out:
975	fdput(f);
976
977	return error;
978}
979#endif
v5.14.15
   1// SPDX-License-Identifier: GPL-2.0
   2/*
   3 *  linux/fs/ioctl.c
   4 *
   5 *  Copyright (C) 1991, 1992  Linus Torvalds
   6 */
   7
   8#include <linux/syscalls.h>
   9#include <linux/mm.h>
  10#include <linux/capability.h>
  11#include <linux/compat.h>
  12#include <linux/file.h>
  13#include <linux/fs.h>
  14#include <linux/security.h>
  15#include <linux/export.h>
  16#include <linux/uaccess.h>
  17#include <linux/writeback.h>
  18#include <linux/buffer_head.h>
  19#include <linux/falloc.h>
  20#include <linux/sched/signal.h>
  21#include <linux/fiemap.h>
  22#include <linux/mount.h>
  23#include <linux/fscrypt.h>
  24#include <linux/fileattr.h>
  25
  26#include "internal.h"
  27
  28#include <asm/ioctls.h>
  29
  30/* So that the fiemap access checks can't overflow on 32 bit machines. */
  31#define FIEMAP_MAX_EXTENTS	(UINT_MAX / sizeof(struct fiemap_extent))
  32
  33/**
  34 * vfs_ioctl - call filesystem specific ioctl methods
  35 * @filp:	open file to invoke ioctl method on
  36 * @cmd:	ioctl command to execute
  37 * @arg:	command-specific argument for ioctl
  38 *
  39 * Invokes filesystem specific ->unlocked_ioctl, if one exists; otherwise
  40 * returns -ENOTTY.
  41 *
  42 * Returns 0 on success, -errno on error.
  43 */
  44long vfs_ioctl(struct file *filp, unsigned int cmd, unsigned long arg)
  45{
  46	int error = -ENOTTY;
  47
  48	if (!filp->f_op->unlocked_ioctl)
  49		goto out;
  50
  51	error = filp->f_op->unlocked_ioctl(filp, cmd, arg);
  52	if (error == -ENOIOCTLCMD)
  53		error = -ENOTTY;
  54 out:
  55	return error;
  56}
  57EXPORT_SYMBOL(vfs_ioctl);
  58
  59static int ioctl_fibmap(struct file *filp, int __user *p)
  60{
  61	struct inode *inode = file_inode(filp);
  62	struct super_block *sb = inode->i_sb;
  63	int error, ur_block;
  64	sector_t block;
  65
  66	if (!capable(CAP_SYS_RAWIO))
  67		return -EPERM;
  68
  69	error = get_user(ur_block, p);
  70	if (error)
  71		return error;
  72
  73	if (ur_block < 0)
  74		return -EINVAL;
  75
  76	block = ur_block;
  77	error = bmap(inode, &block);
  78
  79	if (block > INT_MAX) {
  80		error = -ERANGE;
  81		pr_warn_ratelimited("[%s/%d] FS: %s File: %pD4 would truncate fibmap result\n",
  82				    current->comm, task_pid_nr(current),
  83				    sb->s_id, filp);
  84	}
  85
  86	if (error)
  87		ur_block = 0;
  88	else
  89		ur_block = block;
  90
  91	if (put_user(ur_block, p))
  92		error = -EFAULT;
  93
  94	return error;
  95}
  96
  97/**
  98 * fiemap_fill_next_extent - Fiemap helper function
  99 * @fieinfo:	Fiemap context passed into ->fiemap
 100 * @logical:	Extent logical start offset, in bytes
 101 * @phys:	Extent physical start offset, in bytes
 102 * @len:	Extent length, in bytes
 103 * @flags:	FIEMAP_EXTENT flags that describe this extent
 104 *
 105 * Called from file system ->fiemap callback. Will populate extent
 106 * info as passed in via arguments and copy to user memory. On
 107 * success, extent count on fieinfo is incremented.
 108 *
 109 * Returns 0 on success, -errno on error, 1 if this was the last
 110 * extent that will fit in user array.
 111 */
 112#define SET_UNKNOWN_FLAGS	(FIEMAP_EXTENT_DELALLOC)
 113#define SET_NO_UNMOUNTED_IO_FLAGS	(FIEMAP_EXTENT_DATA_ENCRYPTED)
 114#define SET_NOT_ALIGNED_FLAGS	(FIEMAP_EXTENT_DATA_TAIL|FIEMAP_EXTENT_DATA_INLINE)
 115int fiemap_fill_next_extent(struct fiemap_extent_info *fieinfo, u64 logical,
 116			    u64 phys, u64 len, u32 flags)
 117{
 118	struct fiemap_extent extent;
 119	struct fiemap_extent __user *dest = fieinfo->fi_extents_start;
 120
 121	/* only count the extents */
 122	if (fieinfo->fi_extents_max == 0) {
 123		fieinfo->fi_extents_mapped++;
 124		return (flags & FIEMAP_EXTENT_LAST) ? 1 : 0;
 125	}
 126
 127	if (fieinfo->fi_extents_mapped >= fieinfo->fi_extents_max)
 128		return 1;
 129
 130	if (flags & SET_UNKNOWN_FLAGS)
 131		flags |= FIEMAP_EXTENT_UNKNOWN;
 132	if (flags & SET_NO_UNMOUNTED_IO_FLAGS)
 133		flags |= FIEMAP_EXTENT_ENCODED;
 134	if (flags & SET_NOT_ALIGNED_FLAGS)
 135		flags |= FIEMAP_EXTENT_NOT_ALIGNED;
 136
 137	memset(&extent, 0, sizeof(extent));
 138	extent.fe_logical = logical;
 139	extent.fe_physical = phys;
 140	extent.fe_length = len;
 141	extent.fe_flags = flags;
 142
 143	dest += fieinfo->fi_extents_mapped;
 144	if (copy_to_user(dest, &extent, sizeof(extent)))
 145		return -EFAULT;
 146
 147	fieinfo->fi_extents_mapped++;
 148	if (fieinfo->fi_extents_mapped == fieinfo->fi_extents_max)
 149		return 1;
 150	return (flags & FIEMAP_EXTENT_LAST) ? 1 : 0;
 151}
 152EXPORT_SYMBOL(fiemap_fill_next_extent);
 153
 154/**
 155 * fiemap_prep - check validity of requested flags for fiemap
 156 * @inode:	Inode to operate on
 157 * @fieinfo:	Fiemap context passed into ->fiemap
 158 * @start:	Start of the mapped range
 159 * @len:	Length of the mapped range, can be truncated by this function.
 160 * @supported_flags:	Set of fiemap flags that the file system understands
 161 *
 162 * This function must be called from each ->fiemap instance to validate the
 163 * fiemap request against the file system parameters.
 164 *
 165 * Returns 0 on success, or a negative error on failure.
 166 */
 167int fiemap_prep(struct inode *inode, struct fiemap_extent_info *fieinfo,
 168		u64 start, u64 *len, u32 supported_flags)
 169{
 170	u64 maxbytes = inode->i_sb->s_maxbytes;
 171	u32 incompat_flags;
 172	int ret = 0;
 173
 174	if (*len == 0)
 175		return -EINVAL;
 176	if (start > maxbytes)
 177		return -EFBIG;
 178
 179	/*
 180	 * Shrink request scope to what the fs can actually handle.
 181	 */
 182	if (*len > maxbytes || (maxbytes - *len) < start)
 183		*len = maxbytes - start;
 184
 185	supported_flags |= FIEMAP_FLAG_SYNC;
 186	supported_flags &= FIEMAP_FLAGS_COMPAT;
 187	incompat_flags = fieinfo->fi_flags & ~supported_flags;
 188	if (incompat_flags) {
 189		fieinfo->fi_flags = incompat_flags;
 190		return -EBADR;
 191	}
 192
 193	if (fieinfo->fi_flags & FIEMAP_FLAG_SYNC)
 194		ret = filemap_write_and_wait(inode->i_mapping);
 195	return ret;
 196}
 197EXPORT_SYMBOL(fiemap_prep);
 198
 199static int ioctl_fiemap(struct file *filp, struct fiemap __user *ufiemap)
 200{
 201	struct fiemap fiemap;
 202	struct fiemap_extent_info fieinfo = { 0, };
 203	struct inode *inode = file_inode(filp);
 204	int error;
 205
 206	if (!inode->i_op->fiemap)
 207		return -EOPNOTSUPP;
 208
 209	if (copy_from_user(&fiemap, ufiemap, sizeof(fiemap)))
 210		return -EFAULT;
 211
 212	if (fiemap.fm_extent_count > FIEMAP_MAX_EXTENTS)
 213		return -EINVAL;
 214
 215	fieinfo.fi_flags = fiemap.fm_flags;
 216	fieinfo.fi_extents_max = fiemap.fm_extent_count;
 217	fieinfo.fi_extents_start = ufiemap->fm_extents;
 218
 219	error = inode->i_op->fiemap(inode, &fieinfo, fiemap.fm_start,
 220			fiemap.fm_length);
 221
 222	fiemap.fm_flags = fieinfo.fi_flags;
 223	fiemap.fm_mapped_extents = fieinfo.fi_extents_mapped;
 224	if (copy_to_user(ufiemap, &fiemap, sizeof(fiemap)))
 225		error = -EFAULT;
 226
 227	return error;
 228}
 229
 230static long ioctl_file_clone(struct file *dst_file, unsigned long srcfd,
 231			     u64 off, u64 olen, u64 destoff)
 232{
 233	struct fd src_file = fdget(srcfd);
 234	loff_t cloned;
 235	int ret;
 236
 237	if (!src_file.file)
 238		return -EBADF;
 239	ret = -EXDEV;
 240	if (src_file.file->f_path.mnt != dst_file->f_path.mnt)
 241		goto fdput;
 242	cloned = vfs_clone_file_range(src_file.file, off, dst_file, destoff,
 243				      olen, 0);
 244	if (cloned < 0)
 245		ret = cloned;
 246	else if (olen && cloned != olen)
 247		ret = -EINVAL;
 248	else
 249		ret = 0;
 250fdput:
 251	fdput(src_file);
 252	return ret;
 253}
 254
 255static long ioctl_file_clone_range(struct file *file,
 256				   struct file_clone_range __user *argp)
 257{
 258	struct file_clone_range args;
 259
 260	if (copy_from_user(&args, argp, sizeof(args)))
 261		return -EFAULT;
 262	return ioctl_file_clone(file, args.src_fd, args.src_offset,
 263				args.src_length, args.dest_offset);
 264}
 265
 266#ifdef CONFIG_BLOCK
 267
 268static inline sector_t logical_to_blk(struct inode *inode, loff_t offset)
 269{
 270	return (offset >> inode->i_blkbits);
 271}
 272
 273static inline loff_t blk_to_logical(struct inode *inode, sector_t blk)
 274{
 275	return (blk << inode->i_blkbits);
 276}
 277
 278/**
 279 * __generic_block_fiemap - FIEMAP for block based inodes (no locking)
 280 * @inode: the inode to map
 281 * @fieinfo: the fiemap info struct that will be passed back to userspace
 282 * @start: where to start mapping in the inode
 283 * @len: how much space to map
 284 * @get_block: the fs's get_block function
 285 *
 286 * This does FIEMAP for block based inodes.  Basically it will just loop
 287 * through get_block until we hit the number of extents we want to map, or we
 288 * go past the end of the file and hit a hole.
 289 *
 290 * If it is possible to have data blocks beyond a hole past @inode->i_size, then
 291 * please do not use this function, it will stop at the first unmapped block
 292 * beyond i_size.
 293 *
 294 * If you use this function directly, you need to do your own locking. Use
 295 * generic_block_fiemap if you want the locking done for you.
 296 */
 297static int __generic_block_fiemap(struct inode *inode,
 298			   struct fiemap_extent_info *fieinfo, loff_t start,
 299			   loff_t len, get_block_t *get_block)
 300{
 301	struct buffer_head map_bh;
 302	sector_t start_blk, last_blk;
 303	loff_t isize = i_size_read(inode);
 304	u64 logical = 0, phys = 0, size = 0;
 305	u32 flags = FIEMAP_EXTENT_MERGED;
 306	bool past_eof = false, whole_file = false;
 307	int ret = 0;
 308
 309	ret = fiemap_prep(inode, fieinfo, start, &len, FIEMAP_FLAG_SYNC);
 310	if (ret)
 311		return ret;
 312
 313	/*
 314	 * Either the i_mutex or other appropriate locking needs to be held
 315	 * since we expect isize to not change at all through the duration of
 316	 * this call.
 317	 */
 318	if (len >= isize) {
 319		whole_file = true;
 320		len = isize;
 321	}
 322
 323	/*
 324	 * Some filesystems can't deal with being asked to map less than
 325	 * blocksize, so make sure our len is at least block length.
 326	 */
 327	if (logical_to_blk(inode, len) == 0)
 328		len = blk_to_logical(inode, 1);
 329
 330	start_blk = logical_to_blk(inode, start);
 331	last_blk = logical_to_blk(inode, start + len - 1);
 332
 333	do {
 334		/*
 335		 * we set b_size to the total size we want so it will map as
 336		 * many contiguous blocks as possible at once
 337		 */
 338		memset(&map_bh, 0, sizeof(struct buffer_head));
 339		map_bh.b_size = len;
 340
 341		ret = get_block(inode, start_blk, &map_bh, 0);
 342		if (ret)
 343			break;
 344
 345		/* HOLE */
 346		if (!buffer_mapped(&map_bh)) {
 347			start_blk++;
 348
 349			/*
 350			 * We want to handle the case where there is an
 351			 * allocated block at the front of the file, and then
 352			 * nothing but holes up to the end of the file properly,
 353			 * to make sure that extent at the front gets properly
 354			 * marked with FIEMAP_EXTENT_LAST
 355			 */
 356			if (!past_eof &&
 357			    blk_to_logical(inode, start_blk) >= isize)
 358				past_eof = 1;
 359
 360			/*
 361			 * First hole after going past the EOF, this is our
 362			 * last extent
 363			 */
 364			if (past_eof && size) {
 365				flags = FIEMAP_EXTENT_MERGED|FIEMAP_EXTENT_LAST;
 366				ret = fiemap_fill_next_extent(fieinfo, logical,
 367							      phys, size,
 368							      flags);
 369			} else if (size) {
 370				ret = fiemap_fill_next_extent(fieinfo, logical,
 371							      phys, size, flags);
 372				size = 0;
 373			}
 374
 375			/* if we have holes up to/past EOF then we're done */
 376			if (start_blk > last_blk || past_eof || ret)
 377				break;
 378		} else {
 379			/*
 380			 * We have gone over the length of what we wanted to
 381			 * map, and it wasn't the entire file, so add the extent
 382			 * we got last time and exit.
 383			 *
 384			 * This is for the case where say we want to map all the
 385			 * way up to the second to the last block in a file, but
 386			 * the last block is a hole, making the second to last
 387			 * block FIEMAP_EXTENT_LAST.  In this case we want to
 388			 * see if there is a hole after the second to last block
 389			 * so we can mark it properly.  If we found data after
 390			 * we exceeded the length we were requesting, then we
 391			 * are good to go, just add the extent to the fieinfo
 392			 * and break
 393			 */
 394			if (start_blk > last_blk && !whole_file) {
 395				ret = fiemap_fill_next_extent(fieinfo, logical,
 396							      phys, size,
 397							      flags);
 398				break;
 399			}
 400
 401			/*
 402			 * if size != 0 then we know we already have an extent
 403			 * to add, so add it.
 404			 */
 405			if (size) {
 406				ret = fiemap_fill_next_extent(fieinfo, logical,
 407							      phys, size,
 408							      flags);
 409				if (ret)
 410					break;
 411			}
 412
 413			logical = blk_to_logical(inode, start_blk);
 414			phys = blk_to_logical(inode, map_bh.b_blocknr);
 415			size = map_bh.b_size;
 416			flags = FIEMAP_EXTENT_MERGED;
 417
 418			start_blk += logical_to_blk(inode, size);
 419
 420			/*
 421			 * If we are past the EOF, then we need to make sure as
 422			 * soon as we find a hole that the last extent we found
 423			 * is marked with FIEMAP_EXTENT_LAST
 424			 */
 425			if (!past_eof && logical + size >= isize)
 426				past_eof = true;
 427		}
 428		cond_resched();
 429		if (fatal_signal_pending(current)) {
 430			ret = -EINTR;
 431			break;
 432		}
 433
 434	} while (1);
 435
 436	/* If ret is 1 then we just hit the end of the extent array */
 437	if (ret == 1)
 438		ret = 0;
 439
 440	return ret;
 441}
 442
 443/**
 444 * generic_block_fiemap - FIEMAP for block based inodes
 445 * @inode: The inode to map
 446 * @fieinfo: The mapping information
 447 * @start: The initial block to map
 448 * @len: The length of the extect to attempt to map
 449 * @get_block: The block mapping function for the fs
 450 *
 451 * Calls __generic_block_fiemap to map the inode, after taking
 452 * the inode's mutex lock.
 453 */
 454
 455int generic_block_fiemap(struct inode *inode,
 456			 struct fiemap_extent_info *fieinfo, u64 start,
 457			 u64 len, get_block_t *get_block)
 458{
 459	int ret;
 460	inode_lock(inode);
 461	ret = __generic_block_fiemap(inode, fieinfo, start, len, get_block);
 462	inode_unlock(inode);
 463	return ret;
 464}
 465EXPORT_SYMBOL(generic_block_fiemap);
 466
 467#endif  /*  CONFIG_BLOCK  */
 468
 469/*
 470 * This provides compatibility with legacy XFS pre-allocation ioctls
 471 * which predate the fallocate syscall.
 472 *
 473 * Only the l_start, l_len and l_whence fields of the 'struct space_resv'
 474 * are used here, rest are ignored.
 475 */
 476static int ioctl_preallocate(struct file *filp, int mode, void __user *argp)
 477{
 478	struct inode *inode = file_inode(filp);
 479	struct space_resv sr;
 480
 481	if (copy_from_user(&sr, argp, sizeof(sr)))
 482		return -EFAULT;
 483
 484	switch (sr.l_whence) {
 485	case SEEK_SET:
 486		break;
 487	case SEEK_CUR:
 488		sr.l_start += filp->f_pos;
 489		break;
 490	case SEEK_END:
 491		sr.l_start += i_size_read(inode);
 492		break;
 493	default:
 494		return -EINVAL;
 495	}
 496
 497	return vfs_fallocate(filp, mode | FALLOC_FL_KEEP_SIZE, sr.l_start,
 498			sr.l_len);
 499}
 500
 501/* on ia32 l_start is on a 32-bit boundary */
 502#if defined CONFIG_COMPAT && defined(CONFIG_X86_64)
 503/* just account for different alignment */
 504static int compat_ioctl_preallocate(struct file *file, int mode,
 505				    struct space_resv_32 __user *argp)
 506{
 507	struct inode *inode = file_inode(file);
 508	struct space_resv_32 sr;
 509
 510	if (copy_from_user(&sr, argp, sizeof(sr)))
 511		return -EFAULT;
 512
 513	switch (sr.l_whence) {
 514	case SEEK_SET:
 515		break;
 516	case SEEK_CUR:
 517		sr.l_start += file->f_pos;
 518		break;
 519	case SEEK_END:
 520		sr.l_start += i_size_read(inode);
 521		break;
 522	default:
 523		return -EINVAL;
 524	}
 525
 526	return vfs_fallocate(file, mode | FALLOC_FL_KEEP_SIZE, sr.l_start, sr.l_len);
 527}
 528#endif
 529
 530static int file_ioctl(struct file *filp, unsigned int cmd, int __user *p)
 531{
 532	switch (cmd) {
 533	case FIBMAP:
 534		return ioctl_fibmap(filp, p);
 535	case FS_IOC_RESVSP:
 536	case FS_IOC_RESVSP64:
 537		return ioctl_preallocate(filp, 0, p);
 538	case FS_IOC_UNRESVSP:
 539	case FS_IOC_UNRESVSP64:
 540		return ioctl_preallocate(filp, FALLOC_FL_PUNCH_HOLE, p);
 541	case FS_IOC_ZERO_RANGE:
 542		return ioctl_preallocate(filp, FALLOC_FL_ZERO_RANGE, p);
 543	}
 544
 545	return -ENOIOCTLCMD;
 546}
 547
 548static int ioctl_fionbio(struct file *filp, int __user *argp)
 549{
 550	unsigned int flag;
 551	int on, error;
 552
 553	error = get_user(on, argp);
 554	if (error)
 555		return error;
 556	flag = O_NONBLOCK;
 557#ifdef __sparc__
 558	/* SunOS compatibility item. */
 559	if (O_NONBLOCK != O_NDELAY)
 560		flag |= O_NDELAY;
 561#endif
 562	spin_lock(&filp->f_lock);
 563	if (on)
 564		filp->f_flags |= flag;
 565	else
 566		filp->f_flags &= ~flag;
 567	spin_unlock(&filp->f_lock);
 568	return error;
 569}
 570
 571static int ioctl_fioasync(unsigned int fd, struct file *filp,
 572			  int __user *argp)
 573{
 574	unsigned int flag;
 575	int on, error;
 576
 577	error = get_user(on, argp);
 578	if (error)
 579		return error;
 580	flag = on ? FASYNC : 0;
 581
 582	/* Did FASYNC state change ? */
 583	if ((flag ^ filp->f_flags) & FASYNC) {
 584		if (filp->f_op->fasync)
 585			/* fasync() adjusts filp->f_flags */
 586			error = filp->f_op->fasync(fd, filp, on);
 587		else
 588			error = -ENOTTY;
 589	}
 590	return error < 0 ? error : 0;
 591}
 592
 593static int ioctl_fsfreeze(struct file *filp)
 594{
 595	struct super_block *sb = file_inode(filp)->i_sb;
 596
 597	if (!ns_capable(sb->s_user_ns, CAP_SYS_ADMIN))
 598		return -EPERM;
 599
 600	/* If filesystem doesn't support freeze feature, return. */
 601	if (sb->s_op->freeze_fs == NULL && sb->s_op->freeze_super == NULL)
 602		return -EOPNOTSUPP;
 603
 604	/* Freeze */
 605	if (sb->s_op->freeze_super)
 606		return sb->s_op->freeze_super(sb);
 607	return freeze_super(sb);
 608}
 609
 610static int ioctl_fsthaw(struct file *filp)
 611{
 612	struct super_block *sb = file_inode(filp)->i_sb;
 613
 614	if (!ns_capable(sb->s_user_ns, CAP_SYS_ADMIN))
 615		return -EPERM;
 616
 617	/* Thaw */
 618	if (sb->s_op->thaw_super)
 619		return sb->s_op->thaw_super(sb);
 620	return thaw_super(sb);
 621}
 622
 623static int ioctl_file_dedupe_range(struct file *file,
 624				   struct file_dedupe_range __user *argp)
 625{
 626	struct file_dedupe_range *same = NULL;
 627	int ret;
 628	unsigned long size;
 629	u16 count;
 630
 631	if (get_user(count, &argp->dest_count)) {
 632		ret = -EFAULT;
 633		goto out;
 634	}
 635
 636	size = offsetof(struct file_dedupe_range __user, info[count]);
 637	if (size > PAGE_SIZE) {
 638		ret = -ENOMEM;
 639		goto out;
 640	}
 641
 642	same = memdup_user(argp, size);
 643	if (IS_ERR(same)) {
 644		ret = PTR_ERR(same);
 645		same = NULL;
 646		goto out;
 647	}
 648
 649	same->dest_count = count;
 650	ret = vfs_dedupe_file_range(file, same);
 651	if (ret)
 652		goto out;
 653
 654	ret = copy_to_user(argp, same, size);
 655	if (ret)
 656		ret = -EFAULT;
 657
 658out:
 659	kfree(same);
 660	return ret;
 661}
 662
 663/**
 664 * fileattr_fill_xflags - initialize fileattr with xflags
 665 * @fa:		fileattr pointer
 666 * @xflags:	FS_XFLAG_* flags
 667 *
 668 * Set ->fsx_xflags, ->fsx_valid and ->flags (translated xflags).  All
 669 * other fields are zeroed.
 670 */
 671void fileattr_fill_xflags(struct fileattr *fa, u32 xflags)
 672{
 673	memset(fa, 0, sizeof(*fa));
 674	fa->fsx_valid = true;
 675	fa->fsx_xflags = xflags;
 676	if (fa->fsx_xflags & FS_XFLAG_IMMUTABLE)
 677		fa->flags |= FS_IMMUTABLE_FL;
 678	if (fa->fsx_xflags & FS_XFLAG_APPEND)
 679		fa->flags |= FS_APPEND_FL;
 680	if (fa->fsx_xflags & FS_XFLAG_SYNC)
 681		fa->flags |= FS_SYNC_FL;
 682	if (fa->fsx_xflags & FS_XFLAG_NOATIME)
 683		fa->flags |= FS_NOATIME_FL;
 684	if (fa->fsx_xflags & FS_XFLAG_NODUMP)
 685		fa->flags |= FS_NODUMP_FL;
 686	if (fa->fsx_xflags & FS_XFLAG_DAX)
 687		fa->flags |= FS_DAX_FL;
 688	if (fa->fsx_xflags & FS_XFLAG_PROJINHERIT)
 689		fa->flags |= FS_PROJINHERIT_FL;
 690}
 691EXPORT_SYMBOL(fileattr_fill_xflags);
 692
 693/**
 694 * fileattr_fill_flags - initialize fileattr with flags
 695 * @fa:		fileattr pointer
 696 * @flags:	FS_*_FL flags
 697 *
 698 * Set ->flags, ->flags_valid and ->fsx_xflags (translated flags).
 699 * All other fields are zeroed.
 700 */
 701void fileattr_fill_flags(struct fileattr *fa, u32 flags)
 702{
 703	memset(fa, 0, sizeof(*fa));
 704	fa->flags_valid = true;
 705	fa->flags = flags;
 706	if (fa->flags & FS_SYNC_FL)
 707		fa->fsx_xflags |= FS_XFLAG_SYNC;
 708	if (fa->flags & FS_IMMUTABLE_FL)
 709		fa->fsx_xflags |= FS_XFLAG_IMMUTABLE;
 710	if (fa->flags & FS_APPEND_FL)
 711		fa->fsx_xflags |= FS_XFLAG_APPEND;
 712	if (fa->flags & FS_NODUMP_FL)
 713		fa->fsx_xflags |= FS_XFLAG_NODUMP;
 714	if (fa->flags & FS_NOATIME_FL)
 715		fa->fsx_xflags |= FS_XFLAG_NOATIME;
 716	if (fa->flags & FS_DAX_FL)
 717		fa->fsx_xflags |= FS_XFLAG_DAX;
 718	if (fa->flags & FS_PROJINHERIT_FL)
 719		fa->fsx_xflags |= FS_XFLAG_PROJINHERIT;
 720}
 721EXPORT_SYMBOL(fileattr_fill_flags);
 722
 723/**
 724 * vfs_fileattr_get - retrieve miscellaneous file attributes
 725 * @dentry:	the object to retrieve from
 726 * @fa:		fileattr pointer
 727 *
 728 * Call i_op->fileattr_get() callback, if exists.
 729 *
 730 * Return: 0 on success, or a negative error on failure.
 731 */
 732int vfs_fileattr_get(struct dentry *dentry, struct fileattr *fa)
 733{
 734	struct inode *inode = d_inode(dentry);
 735
 736	if (!inode->i_op->fileattr_get)
 737		return -ENOIOCTLCMD;
 738
 739	return inode->i_op->fileattr_get(dentry, fa);
 740}
 741EXPORT_SYMBOL(vfs_fileattr_get);
 742
 743/**
 744 * copy_fsxattr_to_user - copy fsxattr to userspace.
 745 * @fa:		fileattr pointer
 746 * @ufa:	fsxattr user pointer
 747 *
 748 * Return: 0 on success, or -EFAULT on failure.
 749 */
 750int copy_fsxattr_to_user(const struct fileattr *fa, struct fsxattr __user *ufa)
 751{
 752	struct fsxattr xfa;
 753
 754	memset(&xfa, 0, sizeof(xfa));
 755	xfa.fsx_xflags = fa->fsx_xflags;
 756	xfa.fsx_extsize = fa->fsx_extsize;
 757	xfa.fsx_nextents = fa->fsx_nextents;
 758	xfa.fsx_projid = fa->fsx_projid;
 759	xfa.fsx_cowextsize = fa->fsx_cowextsize;
 760
 761	if (copy_to_user(ufa, &xfa, sizeof(xfa)))
 762		return -EFAULT;
 763
 764	return 0;
 765}
 766EXPORT_SYMBOL(copy_fsxattr_to_user);
 767
 768static int copy_fsxattr_from_user(struct fileattr *fa,
 769				  struct fsxattr __user *ufa)
 770{
 771	struct fsxattr xfa;
 772
 773	if (copy_from_user(&xfa, ufa, sizeof(xfa)))
 774		return -EFAULT;
 775
 776	fileattr_fill_xflags(fa, xfa.fsx_xflags);
 777	fa->fsx_extsize = xfa.fsx_extsize;
 778	fa->fsx_nextents = xfa.fsx_nextents;
 779	fa->fsx_projid = xfa.fsx_projid;
 780	fa->fsx_cowextsize = xfa.fsx_cowextsize;
 781
 782	return 0;
 783}
 784
 785/*
 786 * Generic function to check FS_IOC_FSSETXATTR/FS_IOC_SETFLAGS values and reject
 787 * any invalid configurations.
 788 *
 789 * Note: must be called with inode lock held.
 790 */
 791static int fileattr_set_prepare(struct inode *inode,
 792			      const struct fileattr *old_ma,
 793			      struct fileattr *fa)
 794{
 795	int err;
 796
 797	/*
 798	 * The IMMUTABLE and APPEND_ONLY flags can only be changed by
 799	 * the relevant capability.
 800	 */
 801	if ((fa->flags ^ old_ma->flags) & (FS_APPEND_FL | FS_IMMUTABLE_FL) &&
 802	    !capable(CAP_LINUX_IMMUTABLE))
 803		return -EPERM;
 804
 805	err = fscrypt_prepare_setflags(inode, old_ma->flags, fa->flags);
 806	if (err)
 807		return err;
 808
 809	/*
 810	 * Project Quota ID state is only allowed to change from within the init
 811	 * namespace. Enforce that restriction only if we are trying to change
 812	 * the quota ID state. Everything else is allowed in user namespaces.
 813	 */
 814	if (current_user_ns() != &init_user_ns) {
 815		if (old_ma->fsx_projid != fa->fsx_projid)
 816			return -EINVAL;
 817		if ((old_ma->fsx_xflags ^ fa->fsx_xflags) &
 818				FS_XFLAG_PROJINHERIT)
 
 
 
 
 
 
 
 
 819			return -EINVAL;
 820	}
 821
 822	/* Check extent size hints. */
 823	if ((fa->fsx_xflags & FS_XFLAG_EXTSIZE) && !S_ISREG(inode->i_mode))
 824		return -EINVAL;
 825
 826	if ((fa->fsx_xflags & FS_XFLAG_EXTSZINHERIT) &&
 827			!S_ISDIR(inode->i_mode))
 828		return -EINVAL;
 829
 830	if ((fa->fsx_xflags & FS_XFLAG_COWEXTSIZE) &&
 831	    !S_ISREG(inode->i_mode) && !S_ISDIR(inode->i_mode))
 832		return -EINVAL;
 833
 834	/*
 835	 * It is only valid to set the DAX flag on regular files and
 836	 * directories on filesystems.
 837	 */
 838	if ((fa->fsx_xflags & FS_XFLAG_DAX) &&
 839	    !(S_ISREG(inode->i_mode) || S_ISDIR(inode->i_mode)))
 840		return -EINVAL;
 841
 842	/* Extent size hints of zero turn off the flags. */
 843	if (fa->fsx_extsize == 0)
 844		fa->fsx_xflags &= ~(FS_XFLAG_EXTSIZE | FS_XFLAG_EXTSZINHERIT);
 845	if (fa->fsx_cowextsize == 0)
 846		fa->fsx_xflags &= ~FS_XFLAG_COWEXTSIZE;
 847
 848	return 0;
 849}
 850
 851/**
 852 * vfs_fileattr_set - change miscellaneous file attributes
 853 * @mnt_userns:	user namespace of the mount
 854 * @dentry:	the object to change
 855 * @fa:		fileattr pointer
 856 *
 857 * After verifying permissions, call i_op->fileattr_set() callback, if
 858 * exists.
 859 *
 860 * Verifying attributes involves retrieving current attributes with
 861 * i_op->fileattr_get(), this also allows initializing attributes that have
 862 * not been set by the caller to current values.  Inode lock is held
 863 * thoughout to prevent racing with another instance.
 864 *
 865 * Return: 0 on success, or a negative error on failure.
 866 */
 867int vfs_fileattr_set(struct user_namespace *mnt_userns, struct dentry *dentry,
 868		     struct fileattr *fa)
 869{
 870	struct inode *inode = d_inode(dentry);
 871	struct fileattr old_ma = {};
 872	int err;
 873
 874	if (!inode->i_op->fileattr_set)
 875		return -ENOIOCTLCMD;
 876
 877	if (!inode_owner_or_capable(mnt_userns, inode))
 878		return -EPERM;
 879
 880	inode_lock(inode);
 881	err = vfs_fileattr_get(dentry, &old_ma);
 882	if (!err) {
 883		/* initialize missing bits from old_ma */
 884		if (fa->flags_valid) {
 885			fa->fsx_xflags |= old_ma.fsx_xflags & ~FS_XFLAG_COMMON;
 886			fa->fsx_extsize = old_ma.fsx_extsize;
 887			fa->fsx_nextents = old_ma.fsx_nextents;
 888			fa->fsx_projid = old_ma.fsx_projid;
 889			fa->fsx_cowextsize = old_ma.fsx_cowextsize;
 890		} else {
 891			fa->flags |= old_ma.flags & ~FS_COMMON_FL;
 892		}
 893		err = fileattr_set_prepare(inode, &old_ma, fa);
 894		if (!err)
 895			err = inode->i_op->fileattr_set(mnt_userns, dentry, fa);
 896	}
 897	inode_unlock(inode);
 898
 899	return err;
 900}
 901EXPORT_SYMBOL(vfs_fileattr_set);
 902
 903static int ioctl_getflags(struct file *file, unsigned int __user *argp)
 904{
 905	struct fileattr fa = { .flags_valid = true }; /* hint only */
 906	int err;
 907
 908	err = vfs_fileattr_get(file->f_path.dentry, &fa);
 909	if (!err)
 910		err = put_user(fa.flags, argp);
 911	return err;
 912}
 913
 914static int ioctl_setflags(struct file *file, unsigned int __user *argp)
 915{
 916	struct user_namespace *mnt_userns = file_mnt_user_ns(file);
 917	struct dentry *dentry = file->f_path.dentry;
 918	struct fileattr fa;
 919	unsigned int flags;
 920	int err;
 921
 922	err = get_user(flags, argp);
 923	if (!err) {
 924		err = mnt_want_write_file(file);
 925		if (!err) {
 926			fileattr_fill_flags(&fa, flags);
 927			err = vfs_fileattr_set(mnt_userns, dentry, &fa);
 928			mnt_drop_write_file(file);
 929		}
 930	}
 931	return err;
 932}
 933
 934static int ioctl_fsgetxattr(struct file *file, void __user *argp)
 935{
 936	struct fileattr fa = { .fsx_valid = true }; /* hint only */
 937	int err;
 938
 939	err = vfs_fileattr_get(file->f_path.dentry, &fa);
 940	if (!err)
 941		err = copy_fsxattr_to_user(&fa, argp);
 942
 943	return err;
 944}
 945
 946static int ioctl_fssetxattr(struct file *file, void __user *argp)
 947{
 948	struct user_namespace *mnt_userns = file_mnt_user_ns(file);
 949	struct dentry *dentry = file->f_path.dentry;
 950	struct fileattr fa;
 951	int err;
 952
 953	err = copy_fsxattr_from_user(&fa, argp);
 954	if (!err) {
 955		err = mnt_want_write_file(file);
 956		if (!err) {
 957			err = vfs_fileattr_set(mnt_userns, dentry, &fa);
 958			mnt_drop_write_file(file);
 959		}
 960	}
 961	return err;
 962}
 963
 964/*
 965 * do_vfs_ioctl() is not for drivers and not intended to be EXPORT_SYMBOL()'d.
 966 * It's just a simple helper for sys_ioctl and compat_sys_ioctl.
 967 *
 968 * When you add any new common ioctls to the switches above and below,
 969 * please ensure they have compatible arguments in compat mode.
 970 */
 971static int do_vfs_ioctl(struct file *filp, unsigned int fd,
 972			unsigned int cmd, unsigned long arg)
 973{
 974	void __user *argp = (void __user *)arg;
 975	struct inode *inode = file_inode(filp);
 976
 977	switch (cmd) {
 978	case FIOCLEX:
 979		set_close_on_exec(fd, 1);
 980		return 0;
 981
 982	case FIONCLEX:
 983		set_close_on_exec(fd, 0);
 984		return 0;
 985
 986	case FIONBIO:
 987		return ioctl_fionbio(filp, argp);
 988
 989	case FIOASYNC:
 990		return ioctl_fioasync(fd, filp, argp);
 991
 992	case FIOQSIZE:
 993		if (S_ISDIR(inode->i_mode) || S_ISREG(inode->i_mode) ||
 994		    S_ISLNK(inode->i_mode)) {
 995			loff_t res = inode_get_bytes(inode);
 996			return copy_to_user(argp, &res, sizeof(res)) ?
 997					    -EFAULT : 0;
 998		}
 999
1000		return -ENOTTY;
1001
1002	case FIFREEZE:
1003		return ioctl_fsfreeze(filp);
1004
1005	case FITHAW:
1006		return ioctl_fsthaw(filp);
1007
1008	case FS_IOC_FIEMAP:
1009		return ioctl_fiemap(filp, argp);
1010
1011	case FIGETBSZ:
1012		/* anon_bdev filesystems may not have a block size */
1013		if (!inode->i_sb->s_blocksize)
1014			return -EINVAL;
1015
1016		return put_user(inode->i_sb->s_blocksize, (int __user *)argp);
1017
1018	case FICLONE:
1019		return ioctl_file_clone(filp, arg, 0, 0, 0);
1020
1021	case FICLONERANGE:
1022		return ioctl_file_clone_range(filp, argp);
1023
1024	case FIDEDUPERANGE:
1025		return ioctl_file_dedupe_range(filp, argp);
1026
1027	case FIONREAD:
1028		if (!S_ISREG(inode->i_mode))
1029			return vfs_ioctl(filp, cmd, arg);
1030
1031		return put_user(i_size_read(inode) - filp->f_pos,
1032				(int __user *)argp);
1033
1034	case FS_IOC_GETFLAGS:
1035		return ioctl_getflags(filp, argp);
1036
1037	case FS_IOC_SETFLAGS:
1038		return ioctl_setflags(filp, argp);
1039
1040	case FS_IOC_FSGETXATTR:
1041		return ioctl_fsgetxattr(filp, argp);
1042
1043	case FS_IOC_FSSETXATTR:
1044		return ioctl_fssetxattr(filp, argp);
1045
1046	default:
1047		if (S_ISREG(inode->i_mode))
1048			return file_ioctl(filp, cmd, argp);
1049		break;
1050	}
1051
1052	return -ENOIOCTLCMD;
1053}
1054
1055SYSCALL_DEFINE3(ioctl, unsigned int, fd, unsigned int, cmd, unsigned long, arg)
1056{
1057	struct fd f = fdget(fd);
1058	int error;
1059
1060	if (!f.file)
1061		return -EBADF;
1062
1063	error = security_file_ioctl(f.file, cmd, arg);
1064	if (error)
1065		goto out;
1066
1067	error = do_vfs_ioctl(f.file, fd, cmd, arg);
1068	if (error == -ENOIOCTLCMD)
1069		error = vfs_ioctl(f.file, cmd, arg);
1070
1071out:
1072	fdput(f);
1073	return error;
1074}
1075
1076#ifdef CONFIG_COMPAT
1077/**
1078 * compat_ptr_ioctl - generic implementation of .compat_ioctl file operation
1079 *
1080 * This is not normally called as a function, but instead set in struct
1081 * file_operations as
1082 *
1083 *     .compat_ioctl = compat_ptr_ioctl,
1084 *
1085 * On most architectures, the compat_ptr_ioctl() just passes all arguments
1086 * to the corresponding ->ioctl handler. The exception is arch/s390, where
1087 * compat_ptr() clears the top bit of a 32-bit pointer value, so user space
1088 * pointers to the second 2GB alias the first 2GB, as is the case for
1089 * native 32-bit s390 user space.
1090 *
1091 * The compat_ptr_ioctl() function must therefore be used only with ioctl
1092 * functions that either ignore the argument or pass a pointer to a
1093 * compatible data type.
1094 *
1095 * If any ioctl command handled by fops->unlocked_ioctl passes a plain
1096 * integer instead of a pointer, or any of the passed data types
1097 * is incompatible between 32-bit and 64-bit architectures, a proper
1098 * handler is required instead of compat_ptr_ioctl.
1099 */
1100long compat_ptr_ioctl(struct file *file, unsigned int cmd, unsigned long arg)
1101{
1102	if (!file->f_op->unlocked_ioctl)
1103		return -ENOIOCTLCMD;
1104
1105	return file->f_op->unlocked_ioctl(file, cmd, (unsigned long)compat_ptr(arg));
1106}
1107EXPORT_SYMBOL(compat_ptr_ioctl);
1108
1109COMPAT_SYSCALL_DEFINE3(ioctl, unsigned int, fd, unsigned int, cmd,
1110		       compat_ulong_t, arg)
1111{
1112	struct fd f = fdget(fd);
1113	int error;
1114
1115	if (!f.file)
1116		return -EBADF;
1117
1118	/* RED-PEN how should LSM module know it's handling 32bit? */
1119	error = security_file_ioctl(f.file, cmd, arg);
1120	if (error)
1121		goto out;
1122
1123	switch (cmd) {
1124	/* FICLONE takes an int argument, so don't use compat_ptr() */
1125	case FICLONE:
1126		error = ioctl_file_clone(f.file, arg, 0, 0, 0);
1127		break;
1128
1129#if defined(CONFIG_X86_64)
1130	/* these get messy on amd64 due to alignment differences */
1131	case FS_IOC_RESVSP_32:
1132	case FS_IOC_RESVSP64_32:
1133		error = compat_ioctl_preallocate(f.file, 0, compat_ptr(arg));
1134		break;
1135	case FS_IOC_UNRESVSP_32:
1136	case FS_IOC_UNRESVSP64_32:
1137		error = compat_ioctl_preallocate(f.file, FALLOC_FL_PUNCH_HOLE,
1138				compat_ptr(arg));
1139		break;
1140	case FS_IOC_ZERO_RANGE_32:
1141		error = compat_ioctl_preallocate(f.file, FALLOC_FL_ZERO_RANGE,
1142				compat_ptr(arg));
1143		break;
1144#endif
1145
1146	/*
1147	 * These access 32-bit values anyway so no further handling is
1148	 * necessary.
1149	 */
1150	case FS_IOC32_GETFLAGS:
1151	case FS_IOC32_SETFLAGS:
1152		cmd = (cmd == FS_IOC32_GETFLAGS) ?
1153			FS_IOC_GETFLAGS : FS_IOC_SETFLAGS;
1154		fallthrough;
1155	/*
1156	 * everything else in do_vfs_ioctl() takes either a compatible
1157	 * pointer argument or no argument -- call it with a modified
1158	 * argument.
1159	 */
1160	default:
1161		error = do_vfs_ioctl(f.file, fd, cmd,
1162				     (unsigned long)compat_ptr(arg));
1163		if (error != -ENOIOCTLCMD)
1164			break;
1165
1166		if (f.file->f_op->compat_ioctl)
1167			error = f.file->f_op->compat_ioctl(f.file, cmd, arg);
1168		if (error == -ENOIOCTLCMD)
1169			error = -ENOTTY;
1170		break;
1171	}
1172
1173 out:
1174	fdput(f);
1175
1176	return error;
1177}
1178#endif