Loading...
1// SPDX-License-Identifier: GPL-2.0
2/*
3 * linux/fs/ocfs2/ioctl.c
4 *
5 * Copyright (C) 2006 Herbert Poetzl
6 * adapted from Remy Card's ext2/ioctl.c
7 */
8
9#include <linux/fs.h>
10#include <linux/mount.h>
11#include <linux/blkdev.h>
12#include <linux/compat.h>
13#include <linux/fileattr.h>
14
15#include <cluster/masklog.h>
16
17#include "ocfs2.h"
18#include "alloc.h"
19#include "dlmglue.h"
20#include "file.h"
21#include "inode.h"
22#include "journal.h"
23
24#include "ocfs2_fs.h"
25#include "ioctl.h"
26#include "resize.h"
27#include "refcounttree.h"
28#include "sysfile.h"
29#include "dir.h"
30#include "buffer_head_io.h"
31#include "suballoc.h"
32#include "move_extents.h"
33
/*
 * Copy one complete o2info request structure between kernel and user
 * space.  The transfer length is always sizeof(a), where 'a' is the
 * kernel-side structure (an lvalue) and 'b' is the user-space pointer.
 * Callers in this file treat any non-zero result as -EFAULT.
 *
 * 'b' is parenthesized so that an expression argument (for instance
 * "base + idx") is cast as a whole rather than only its first operand.
 */
#define o2info_from_user(a, b)	\
		copy_from_user(&(a), (b), sizeof(a))
#define o2info_to_user(a, b)	\
		copy_to_user((typeof(a) __user *)(b), &(a), sizeof(a))
38
39/*
40 * This is just a best-effort to tell userspace that this request
41 * caused the error.
42 */
43static inline void o2info_set_request_error(struct ocfs2_info_request *kreq,
44 struct ocfs2_info_request __user *req)
45{
46 kreq->ir_flags |= OCFS2_INFO_FL_ERROR;
47 (void)put_user(kreq->ir_flags, (__u32 __user *)&(req->ir_flags));
48}
49
50static inline void o2info_set_request_filled(struct ocfs2_info_request *req)
51{
52 req->ir_flags |= OCFS2_INFO_FL_FILLED;
53}
54
55static inline void o2info_clear_request_filled(struct ocfs2_info_request *req)
56{
57 req->ir_flags &= ~OCFS2_INFO_FL_FILLED;
58}
59
60static inline int o2info_coherent(struct ocfs2_info_request *req)
61{
62 return (!(req->ir_flags & OCFS2_INFO_FL_NON_COHERENT));
63}
64
65int ocfs2_fileattr_get(struct dentry *dentry, struct fileattr *fa)
66{
67 struct inode *inode = d_inode(dentry);
68 unsigned int flags;
69 int status;
70
71 status = ocfs2_inode_lock(inode, NULL, 0);
72 if (status < 0) {
73 mlog_errno(status);
74 return status;
75 }
76 ocfs2_get_inode_flags(OCFS2_I(inode));
77 flags = OCFS2_I(inode)->ip_attr;
78 ocfs2_inode_unlock(inode, 0);
79
80 fileattr_fill_flags(fa, flags & OCFS2_FL_VISIBLE);
81
82 return status;
83}
84
85int ocfs2_fileattr_set(struct user_namespace *mnt_userns,
86 struct dentry *dentry, struct fileattr *fa)
87{
88 struct inode *inode = d_inode(dentry);
89 unsigned int flags = fa->flags;
90 struct ocfs2_inode_info *ocfs2_inode = OCFS2_I(inode);
91 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
92 handle_t *handle = NULL;
93 struct buffer_head *bh = NULL;
94 unsigned oldflags;
95 int status;
96
97 if (fileattr_has_fsx(fa))
98 return -EOPNOTSUPP;
99
100 status = ocfs2_inode_lock(inode, &bh, 1);
101 if (status < 0) {
102 mlog_errno(status);
103 goto bail;
104 }
105
106 if (!S_ISDIR(inode->i_mode))
107 flags &= ~OCFS2_DIRSYNC_FL;
108
109 oldflags = ocfs2_inode->ip_attr;
110 flags = flags & OCFS2_FL_MODIFIABLE;
111 flags |= oldflags & ~OCFS2_FL_MODIFIABLE;
112
113 /* Check already done by VFS, but repeat with ocfs lock */
114 status = -EPERM;
115 if ((flags ^ oldflags) & (FS_APPEND_FL | FS_IMMUTABLE_FL) &&
116 !capable(CAP_LINUX_IMMUTABLE))
117 goto bail_unlock;
118
119 handle = ocfs2_start_trans(osb, OCFS2_INODE_UPDATE_CREDITS);
120 if (IS_ERR(handle)) {
121 status = PTR_ERR(handle);
122 mlog_errno(status);
123 goto bail_unlock;
124 }
125
126 ocfs2_inode->ip_attr = flags;
127 ocfs2_set_inode_flags(inode);
128
129 status = ocfs2_mark_inode_dirty(handle, inode, bh);
130 if (status < 0)
131 mlog_errno(status);
132
133 ocfs2_commit_trans(osb, handle);
134
135bail_unlock:
136 ocfs2_inode_unlock(inode, 1);
137bail:
138 brelse(bh);
139
140 return status;
141}
142
143static int ocfs2_info_handle_blocksize(struct inode *inode,
144 struct ocfs2_info_request __user *req)
145{
146 struct ocfs2_info_blocksize oib;
147
148 if (o2info_from_user(oib, req))
149 return -EFAULT;
150
151 oib.ib_blocksize = inode->i_sb->s_blocksize;
152
153 o2info_set_request_filled(&oib.ib_req);
154
155 if (o2info_to_user(oib, req))
156 return -EFAULT;
157
158 return 0;
159}
160
161static int ocfs2_info_handle_clustersize(struct inode *inode,
162 struct ocfs2_info_request __user *req)
163{
164 struct ocfs2_info_clustersize oic;
165 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
166
167 if (o2info_from_user(oic, req))
168 return -EFAULT;
169
170 oic.ic_clustersize = osb->s_clustersize;
171
172 o2info_set_request_filled(&oic.ic_req);
173
174 if (o2info_to_user(oic, req))
175 return -EFAULT;
176
177 return 0;
178}
179
180static int ocfs2_info_handle_maxslots(struct inode *inode,
181 struct ocfs2_info_request __user *req)
182{
183 struct ocfs2_info_maxslots oim;
184 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
185
186 if (o2info_from_user(oim, req))
187 return -EFAULT;
188
189 oim.im_max_slots = osb->max_slots;
190
191 o2info_set_request_filled(&oim.im_req);
192
193 if (o2info_to_user(oim, req))
194 return -EFAULT;
195
196 return 0;
197}
198
199static int ocfs2_info_handle_label(struct inode *inode,
200 struct ocfs2_info_request __user *req)
201{
202 struct ocfs2_info_label oil;
203 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
204
205 if (o2info_from_user(oil, req))
206 return -EFAULT;
207
208 memcpy(oil.il_label, osb->vol_label, OCFS2_MAX_VOL_LABEL_LEN);
209
210 o2info_set_request_filled(&oil.il_req);
211
212 if (o2info_to_user(oil, req))
213 return -EFAULT;
214
215 return 0;
216}
217
218static int ocfs2_info_handle_uuid(struct inode *inode,
219 struct ocfs2_info_request __user *req)
220{
221 struct ocfs2_info_uuid oiu;
222 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
223
224 if (o2info_from_user(oiu, req))
225 return -EFAULT;
226
227 memcpy(oiu.iu_uuid_str, osb->uuid_str, OCFS2_TEXT_UUID_LEN + 1);
228
229 o2info_set_request_filled(&oiu.iu_req);
230
231 if (o2info_to_user(oiu, req))
232 return -EFAULT;
233
234 return 0;
235}
236
237static int ocfs2_info_handle_fs_features(struct inode *inode,
238 struct ocfs2_info_request __user *req)
239{
240 struct ocfs2_info_fs_features oif;
241 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
242
243 if (o2info_from_user(oif, req))
244 return -EFAULT;
245
246 oif.if_compat_features = osb->s_feature_compat;
247 oif.if_incompat_features = osb->s_feature_incompat;
248 oif.if_ro_compat_features = osb->s_feature_ro_compat;
249
250 o2info_set_request_filled(&oif.if_req);
251
252 if (o2info_to_user(oif, req))
253 return -EFAULT;
254
255 return 0;
256}
257
258static int ocfs2_info_handle_journal_size(struct inode *inode,
259 struct ocfs2_info_request __user *req)
260{
261 struct ocfs2_info_journal_size oij;
262 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
263
264 if (o2info_from_user(oij, req))
265 return -EFAULT;
266
267 oij.ij_journal_size = i_size_read(osb->journal->j_inode);
268
269 o2info_set_request_filled(&oij.ij_req);
270
271 if (o2info_to_user(oij, req))
272 return -EFAULT;
273
274 return 0;
275}
276
277static int ocfs2_info_scan_inode_alloc(struct ocfs2_super *osb,
278 struct inode *inode_alloc, u64 blkno,
279 struct ocfs2_info_freeinode *fi,
280 u32 slot)
281{
282 int status = 0, unlock = 0;
283
284 struct buffer_head *bh = NULL;
285 struct ocfs2_dinode *dinode_alloc = NULL;
286
287 if (inode_alloc)
288 inode_lock(inode_alloc);
289
290 if (inode_alloc && o2info_coherent(&fi->ifi_req)) {
291 status = ocfs2_inode_lock(inode_alloc, &bh, 0);
292 if (status < 0) {
293 mlog_errno(status);
294 goto bail;
295 }
296 unlock = 1;
297 } else {
298 status = ocfs2_read_blocks_sync(osb, blkno, 1, &bh);
299 if (status < 0) {
300 mlog_errno(status);
301 goto bail;
302 }
303 }
304
305 dinode_alloc = (struct ocfs2_dinode *)bh->b_data;
306
307 fi->ifi_stat[slot].lfi_total =
308 le32_to_cpu(dinode_alloc->id1.bitmap1.i_total);
309 fi->ifi_stat[slot].lfi_free =
310 le32_to_cpu(dinode_alloc->id1.bitmap1.i_total) -
311 le32_to_cpu(dinode_alloc->id1.bitmap1.i_used);
312
313bail:
314 if (unlock)
315 ocfs2_inode_unlock(inode_alloc, 0);
316
317 if (inode_alloc)
318 inode_unlock(inode_alloc);
319
320 brelse(bh);
321
322 return status;
323}
324
325static int ocfs2_info_handle_freeinode(struct inode *inode,
326 struct ocfs2_info_request __user *req)
327{
328 u32 i;
329 u64 blkno = -1;
330 char namebuf[40];
331 int status, type = INODE_ALLOC_SYSTEM_INODE;
332 struct ocfs2_info_freeinode *oifi = NULL;
333 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
334 struct inode *inode_alloc = NULL;
335
336 oifi = kzalloc(sizeof(struct ocfs2_info_freeinode), GFP_KERNEL);
337 if (!oifi) {
338 status = -ENOMEM;
339 mlog_errno(status);
340 goto out_err;
341 }
342
343 if (o2info_from_user(*oifi, req)) {
344 status = -EFAULT;
345 goto out_free;
346 }
347
348 oifi->ifi_slotnum = osb->max_slots;
349
350 for (i = 0; i < oifi->ifi_slotnum; i++) {
351 if (o2info_coherent(&oifi->ifi_req)) {
352 inode_alloc = ocfs2_get_system_file_inode(osb, type, i);
353 if (!inode_alloc) {
354 mlog(ML_ERROR, "unable to get alloc inode in "
355 "slot %u\n", i);
356 status = -EIO;
357 goto bail;
358 }
359 } else {
360 ocfs2_sprintf_system_inode_name(namebuf,
361 sizeof(namebuf),
362 type, i);
363 status = ocfs2_lookup_ino_from_name(osb->sys_root_inode,
364 namebuf,
365 strlen(namebuf),
366 &blkno);
367 if (status < 0) {
368 status = -ENOENT;
369 goto bail;
370 }
371 }
372
373 status = ocfs2_info_scan_inode_alloc(osb, inode_alloc, blkno, oifi, i);
374
375 iput(inode_alloc);
376 inode_alloc = NULL;
377
378 if (status < 0)
379 goto bail;
380 }
381
382 o2info_set_request_filled(&oifi->ifi_req);
383
384 if (o2info_to_user(*oifi, req)) {
385 status = -EFAULT;
386 goto out_free;
387 }
388
389 status = 0;
390bail:
391 if (status)
392 o2info_set_request_error(&oifi->ifi_req, req);
393out_free:
394 kfree(oifi);
395out_err:
396 return status;
397}
398
399static void o2ffg_update_histogram(struct ocfs2_info_free_chunk_list *hist,
400 unsigned int chunksize)
401{
402 u32 index;
403
404 index = __ilog2_u32(chunksize);
405 if (index >= OCFS2_INFO_MAX_HIST)
406 index = OCFS2_INFO_MAX_HIST - 1;
407
408 hist->fc_chunks[index]++;
409 hist->fc_clusters[index] += chunksize;
410}
411
412static void o2ffg_update_stats(struct ocfs2_info_freefrag_stats *stats,
413 unsigned int chunksize)
414{
415 if (chunksize > stats->ffs_max)
416 stats->ffs_max = chunksize;
417
418 if (chunksize < stats->ffs_min)
419 stats->ffs_min = chunksize;
420
421 stats->ffs_avg += chunksize;
422 stats->ffs_free_chunks_real++;
423}
424
425static void ocfs2_info_update_ffg(struct ocfs2_info_freefrag *ffg,
426 unsigned int chunksize)
427{
428 o2ffg_update_histogram(&(ffg->iff_ffs.ffs_fc_hist), chunksize);
429 o2ffg_update_stats(&(ffg->iff_ffs), chunksize);
430}
431
432static int ocfs2_info_freefrag_scan_chain(struct ocfs2_super *osb,
433 struct inode *gb_inode,
434 struct ocfs2_dinode *gb_dinode,
435 struct ocfs2_chain_rec *rec,
436 struct ocfs2_info_freefrag *ffg,
437 u32 chunks_in_group)
438{
439 int status = 0, used;
440 u64 blkno;
441
442 struct buffer_head *bh = NULL;
443 struct ocfs2_group_desc *bg = NULL;
444
445 unsigned int max_bits, num_clusters;
446 unsigned int offset = 0, cluster, chunk;
447 unsigned int chunk_free, last_chunksize = 0;
448
449 if (!le32_to_cpu(rec->c_free))
450 goto bail;
451
452 do {
453 if (!bg)
454 blkno = le64_to_cpu(rec->c_blkno);
455 else
456 blkno = le64_to_cpu(bg->bg_next_group);
457
458 if (bh) {
459 brelse(bh);
460 bh = NULL;
461 }
462
463 if (o2info_coherent(&ffg->iff_req))
464 status = ocfs2_read_group_descriptor(gb_inode,
465 gb_dinode,
466 blkno, &bh);
467 else
468 status = ocfs2_read_blocks_sync(osb, blkno, 1, &bh);
469
470 if (status < 0) {
471 mlog(ML_ERROR, "Can't read the group descriptor # "
472 "%llu from device.", (unsigned long long)blkno);
473 status = -EIO;
474 goto bail;
475 }
476
477 bg = (struct ocfs2_group_desc *)bh->b_data;
478
479 if (!le16_to_cpu(bg->bg_free_bits_count))
480 continue;
481
482 max_bits = le16_to_cpu(bg->bg_bits);
483 offset = 0;
484
485 for (chunk = 0; chunk < chunks_in_group; chunk++) {
486 /*
487 * last chunk may be not an entire one.
488 */
489 if ((offset + ffg->iff_chunksize) > max_bits)
490 num_clusters = max_bits - offset;
491 else
492 num_clusters = ffg->iff_chunksize;
493
494 chunk_free = 0;
495 for (cluster = 0; cluster < num_clusters; cluster++) {
496 used = ocfs2_test_bit(offset,
497 (unsigned long *)bg->bg_bitmap);
498 /*
499 * - chunk_free counts free clusters in #N chunk.
500 * - last_chunksize records the size(in) clusters
501 * for the last real free chunk being counted.
502 */
503 if (!used) {
504 last_chunksize++;
505 chunk_free++;
506 }
507
508 if (used && last_chunksize) {
509 ocfs2_info_update_ffg(ffg,
510 last_chunksize);
511 last_chunksize = 0;
512 }
513
514 offset++;
515 }
516
517 if (chunk_free == ffg->iff_chunksize)
518 ffg->iff_ffs.ffs_free_chunks++;
519 }
520
521 /*
522 * need to update the info for last free chunk.
523 */
524 if (last_chunksize)
525 ocfs2_info_update_ffg(ffg, last_chunksize);
526
527 } while (le64_to_cpu(bg->bg_next_group));
528
529bail:
530 brelse(bh);
531
532 return status;
533}
534
535static int ocfs2_info_freefrag_scan_bitmap(struct ocfs2_super *osb,
536 struct inode *gb_inode, u64 blkno,
537 struct ocfs2_info_freefrag *ffg)
538{
539 u32 chunks_in_group;
540 int status = 0, unlock = 0, i;
541
542 struct buffer_head *bh = NULL;
543 struct ocfs2_chain_list *cl = NULL;
544 struct ocfs2_chain_rec *rec = NULL;
545 struct ocfs2_dinode *gb_dinode = NULL;
546
547 if (gb_inode)
548 inode_lock(gb_inode);
549
550 if (o2info_coherent(&ffg->iff_req)) {
551 status = ocfs2_inode_lock(gb_inode, &bh, 0);
552 if (status < 0) {
553 mlog_errno(status);
554 goto bail;
555 }
556 unlock = 1;
557 } else {
558 status = ocfs2_read_blocks_sync(osb, blkno, 1, &bh);
559 if (status < 0) {
560 mlog_errno(status);
561 goto bail;
562 }
563 }
564
565 gb_dinode = (struct ocfs2_dinode *)bh->b_data;
566 cl = &(gb_dinode->id2.i_chain);
567
568 /*
569 * Chunksize(in) clusters from userspace should be
570 * less than clusters in a group.
571 */
572 if (ffg->iff_chunksize > le16_to_cpu(cl->cl_cpg)) {
573 status = -EINVAL;
574 goto bail;
575 }
576
577 memset(&ffg->iff_ffs, 0, sizeof(struct ocfs2_info_freefrag_stats));
578
579 ffg->iff_ffs.ffs_min = ~0U;
580 ffg->iff_ffs.ffs_clusters =
581 le32_to_cpu(gb_dinode->id1.bitmap1.i_total);
582 ffg->iff_ffs.ffs_free_clusters = ffg->iff_ffs.ffs_clusters -
583 le32_to_cpu(gb_dinode->id1.bitmap1.i_used);
584
585 chunks_in_group = le16_to_cpu(cl->cl_cpg) / ffg->iff_chunksize + 1;
586
587 for (i = 0; i < le16_to_cpu(cl->cl_next_free_rec); i++) {
588 rec = &(cl->cl_recs[i]);
589 status = ocfs2_info_freefrag_scan_chain(osb, gb_inode,
590 gb_dinode,
591 rec, ffg,
592 chunks_in_group);
593 if (status)
594 goto bail;
595 }
596
597 if (ffg->iff_ffs.ffs_free_chunks_real)
598 ffg->iff_ffs.ffs_avg = (ffg->iff_ffs.ffs_avg /
599 ffg->iff_ffs.ffs_free_chunks_real);
600bail:
601 if (unlock)
602 ocfs2_inode_unlock(gb_inode, 0);
603
604 if (gb_inode)
605 inode_unlock(gb_inode);
606
607 iput(gb_inode);
608 brelse(bh);
609
610 return status;
611}
612
613static int ocfs2_info_handle_freefrag(struct inode *inode,
614 struct ocfs2_info_request __user *req)
615{
616 u64 blkno = -1;
617 char namebuf[40];
618 int status, type = GLOBAL_BITMAP_SYSTEM_INODE;
619
620 struct ocfs2_info_freefrag *oiff;
621 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
622 struct inode *gb_inode = NULL;
623
624 oiff = kzalloc(sizeof(struct ocfs2_info_freefrag), GFP_KERNEL);
625 if (!oiff) {
626 status = -ENOMEM;
627 mlog_errno(status);
628 goto out_err;
629 }
630
631 if (o2info_from_user(*oiff, req)) {
632 status = -EFAULT;
633 goto out_free;
634 }
635 /*
636 * chunksize from userspace should be power of 2.
637 */
638 if ((oiff->iff_chunksize & (oiff->iff_chunksize - 1)) ||
639 (!oiff->iff_chunksize)) {
640 status = -EINVAL;
641 goto bail;
642 }
643
644 if (o2info_coherent(&oiff->iff_req)) {
645 gb_inode = ocfs2_get_system_file_inode(osb, type,
646 OCFS2_INVALID_SLOT);
647 if (!gb_inode) {
648 mlog(ML_ERROR, "unable to get global_bitmap inode\n");
649 status = -EIO;
650 goto bail;
651 }
652 } else {
653 ocfs2_sprintf_system_inode_name(namebuf, sizeof(namebuf), type,
654 OCFS2_INVALID_SLOT);
655 status = ocfs2_lookup_ino_from_name(osb->sys_root_inode,
656 namebuf,
657 strlen(namebuf),
658 &blkno);
659 if (status < 0) {
660 status = -ENOENT;
661 goto bail;
662 }
663 }
664
665 status = ocfs2_info_freefrag_scan_bitmap(osb, gb_inode, blkno, oiff);
666 if (status < 0)
667 goto bail;
668
669 o2info_set_request_filled(&oiff->iff_req);
670
671 if (o2info_to_user(*oiff, req)) {
672 status = -EFAULT;
673 goto out_free;
674 }
675
676 status = 0;
677bail:
678 if (status)
679 o2info_set_request_error(&oiff->iff_req, req);
680out_free:
681 kfree(oiff);
682out_err:
683 return status;
684}
685
686static int ocfs2_info_handle_unknown(struct inode *inode,
687 struct ocfs2_info_request __user *req)
688{
689 struct ocfs2_info_request oir;
690
691 if (o2info_from_user(oir, req))
692 return -EFAULT;
693
694 o2info_clear_request_filled(&oir);
695
696 if (o2info_to_user(oir, req))
697 return -EFAULT;
698
699 return 0;
700}
701
702/*
703 * Validate and distinguish OCFS2_IOC_INFO requests.
704 *
705 * - validate the magic number.
706 * - distinguish different requests.
707 * - validate size of different requests.
708 */
709static int ocfs2_info_handle_request(struct inode *inode,
710 struct ocfs2_info_request __user *req)
711{
712 int status = -EFAULT;
713 struct ocfs2_info_request oir;
714
715 if (o2info_from_user(oir, req))
716 goto bail;
717
718 status = -EINVAL;
719 if (oir.ir_magic != OCFS2_INFO_MAGIC)
720 goto bail;
721
722 switch (oir.ir_code) {
723 case OCFS2_INFO_BLOCKSIZE:
724 if (oir.ir_size == sizeof(struct ocfs2_info_blocksize))
725 status = ocfs2_info_handle_blocksize(inode, req);
726 break;
727 case OCFS2_INFO_CLUSTERSIZE:
728 if (oir.ir_size == sizeof(struct ocfs2_info_clustersize))
729 status = ocfs2_info_handle_clustersize(inode, req);
730 break;
731 case OCFS2_INFO_MAXSLOTS:
732 if (oir.ir_size == sizeof(struct ocfs2_info_maxslots))
733 status = ocfs2_info_handle_maxslots(inode, req);
734 break;
735 case OCFS2_INFO_LABEL:
736 if (oir.ir_size == sizeof(struct ocfs2_info_label))
737 status = ocfs2_info_handle_label(inode, req);
738 break;
739 case OCFS2_INFO_UUID:
740 if (oir.ir_size == sizeof(struct ocfs2_info_uuid))
741 status = ocfs2_info_handle_uuid(inode, req);
742 break;
743 case OCFS2_INFO_FS_FEATURES:
744 if (oir.ir_size == sizeof(struct ocfs2_info_fs_features))
745 status = ocfs2_info_handle_fs_features(inode, req);
746 break;
747 case OCFS2_INFO_JOURNAL_SIZE:
748 if (oir.ir_size == sizeof(struct ocfs2_info_journal_size))
749 status = ocfs2_info_handle_journal_size(inode, req);
750 break;
751 case OCFS2_INFO_FREEINODE:
752 if (oir.ir_size == sizeof(struct ocfs2_info_freeinode))
753 status = ocfs2_info_handle_freeinode(inode, req);
754 break;
755 case OCFS2_INFO_FREEFRAG:
756 if (oir.ir_size == sizeof(struct ocfs2_info_freefrag))
757 status = ocfs2_info_handle_freefrag(inode, req);
758 break;
759 default:
760 status = ocfs2_info_handle_unknown(inode, req);
761 break;
762 }
763
764bail:
765 return status;
766}
767
768static int ocfs2_get_request_ptr(struct ocfs2_info *info, int idx,
769 u64 *req_addr, int compat_flag)
770{
771 int status = -EFAULT;
772 u64 __user *bp = NULL;
773
774 if (compat_flag) {
775#ifdef CONFIG_COMPAT
776 /*
777 * pointer bp stores the base address of a pointers array,
778 * which collects all addresses of separate request.
779 */
780 bp = (u64 __user *)(unsigned long)compat_ptr(info->oi_requests);
781#else
782 BUG();
783#endif
784 } else
785 bp = (u64 __user *)(unsigned long)(info->oi_requests);
786
787 if (o2info_from_user(*req_addr, bp + idx))
788 goto bail;
789
790 status = 0;
791bail:
792 return status;
793}
794
795/*
796 * OCFS2_IOC_INFO handles an array of requests passed from userspace.
797 *
798 * ocfs2_info_handle() recevies a large info aggregation, grab and
799 * validate the request count from header, then break it into small
800 * pieces, later specific handlers can handle them one by one.
801 *
802 * Idea here is to make each separate request small enough to ensure
803 * a better backward&forward compatibility, since a small piece of
804 * request will be less likely to be broken if disk layout get changed.
805 */
806static int ocfs2_info_handle(struct inode *inode, struct ocfs2_info *info,
807 int compat_flag)
808{
809 int i, status = 0;
810 u64 req_addr;
811 struct ocfs2_info_request __user *reqp;
812
813 if ((info->oi_count > OCFS2_INFO_MAX_REQUEST) ||
814 (!info->oi_requests)) {
815 status = -EINVAL;
816 goto bail;
817 }
818
819 for (i = 0; i < info->oi_count; i++) {
820
821 status = ocfs2_get_request_ptr(info, i, &req_addr, compat_flag);
822 if (status)
823 break;
824
825 reqp = (struct ocfs2_info_request __user *)(unsigned long)req_addr;
826 if (!reqp) {
827 status = -EINVAL;
828 goto bail;
829 }
830
831 status = ocfs2_info_handle_request(inode, reqp);
832 if (status)
833 break;
834 }
835
836bail:
837 return status;
838}
839
840long ocfs2_ioctl(struct file *filp, unsigned int cmd, unsigned long arg)
841{
842 struct inode *inode = file_inode(filp);
843 int new_clusters;
844 int status;
845 struct ocfs2_space_resv sr;
846 struct ocfs2_new_group_input input;
847 struct reflink_arguments args;
848 const char __user *old_path;
849 const char __user *new_path;
850 bool preserve;
851 struct ocfs2_info info;
852 void __user *argp = (void __user *)arg;
853
854 switch (cmd) {
855 case OCFS2_IOC_RESVSP:
856 case OCFS2_IOC_RESVSP64:
857 case OCFS2_IOC_UNRESVSP:
858 case OCFS2_IOC_UNRESVSP64:
859 if (copy_from_user(&sr, (int __user *) arg, sizeof(sr)))
860 return -EFAULT;
861
862 return ocfs2_change_file_space(filp, cmd, &sr);
863 case OCFS2_IOC_GROUP_EXTEND:
864 if (!capable(CAP_SYS_RESOURCE))
865 return -EPERM;
866
867 if (get_user(new_clusters, (int __user *)arg))
868 return -EFAULT;
869
870 status = mnt_want_write_file(filp);
871 if (status)
872 return status;
873 status = ocfs2_group_extend(inode, new_clusters);
874 mnt_drop_write_file(filp);
875 return status;
876 case OCFS2_IOC_GROUP_ADD:
877 case OCFS2_IOC_GROUP_ADD64:
878 if (!capable(CAP_SYS_RESOURCE))
879 return -EPERM;
880
881 if (copy_from_user(&input, (int __user *) arg, sizeof(input)))
882 return -EFAULT;
883
884 status = mnt_want_write_file(filp);
885 if (status)
886 return status;
887 status = ocfs2_group_add(inode, &input);
888 mnt_drop_write_file(filp);
889 return status;
890 case OCFS2_IOC_REFLINK:
891 if (copy_from_user(&args, argp, sizeof(args)))
892 return -EFAULT;
893 old_path = (const char __user *)(unsigned long)args.old_path;
894 new_path = (const char __user *)(unsigned long)args.new_path;
895 preserve = (args.preserve != 0);
896
897 return ocfs2_reflink_ioctl(inode, old_path, new_path, preserve);
898 case OCFS2_IOC_INFO:
899 if (copy_from_user(&info, argp, sizeof(struct ocfs2_info)))
900 return -EFAULT;
901
902 return ocfs2_info_handle(inode, &info, 0);
903 case FITRIM:
904 {
905 struct super_block *sb = inode->i_sb;
906 struct fstrim_range range;
907 int ret = 0;
908
909 if (!capable(CAP_SYS_ADMIN))
910 return -EPERM;
911
912 if (!bdev_max_discard_sectors(sb->s_bdev))
913 return -EOPNOTSUPP;
914
915 if (copy_from_user(&range, argp, sizeof(range)))
916 return -EFAULT;
917
918 range.minlen = max_t(u64, bdev_discard_granularity(sb->s_bdev),
919 range.minlen);
920 ret = ocfs2_trim_fs(sb, &range);
921 if (ret < 0)
922 return ret;
923
924 if (copy_to_user(argp, &range, sizeof(range)))
925 return -EFAULT;
926
927 return 0;
928 }
929 case OCFS2_IOC_MOVE_EXT:
930 return ocfs2_ioctl_move_extents(filp, argp);
931 default:
932 return -ENOTTY;
933 }
934}
935
#ifdef CONFIG_COMPAT
/*
 * compat ioctl entry point.
 *
 * OCFS2_IOC_REFLINK and OCFS2_IOC_INFO carry user pointers and are
 * handled here (paths through compat_ptr(), info with the compat flag
 * set).  The other known commands are forwarded unchanged to
 * ocfs2_ioctl(); anything else returns -ENOIOCTLCMD.
 */
long ocfs2_compat_ioctl(struct file *file, unsigned cmd, unsigned long arg)
{
	struct inode *inode = file_inode(file);
	void __user *argp = (void __user *)arg;

	switch (cmd) {
	case OCFS2_IOC_REFLINK:
	{
		struct reflink_arguments args;
		bool preserve;

		if (copy_from_user(&args, argp, sizeof(args)))
			return -EFAULT;
		preserve = (args.preserve != 0);

		return ocfs2_reflink_ioctl(inode, compat_ptr(args.old_path),
					   compat_ptr(args.new_path), preserve);
	}
	case OCFS2_IOC_INFO:
	{
		struct ocfs2_info info;

		if (copy_from_user(&info, argp, sizeof(struct ocfs2_info)))
			return -EFAULT;

		return ocfs2_info_handle(inode, &info, 1);
	}
	case OCFS2_IOC_RESVSP:
	case OCFS2_IOC_RESVSP64:
	case OCFS2_IOC_UNRESVSP:
	case OCFS2_IOC_UNRESVSP64:
	case OCFS2_IOC_GROUP_EXTEND:
	case OCFS2_IOC_GROUP_ADD:
	case OCFS2_IOC_GROUP_ADD64:
	case FITRIM:
	case OCFS2_IOC_MOVE_EXT:
		/* These are passed straight to the native handler. */
		return ocfs2_ioctl(file, cmd, arg);
	default:
		return -ENOIOCTLCMD;
	}
}
#endif
1/*
2 * linux/fs/ocfs2/ioctl.c
3 *
4 * Copyright (C) 2006 Herbert Poetzl
5 * adapted from Remy Card's ext2/ioctl.c
6 */
7
8#include <linux/fs.h>
9#include <linux/mount.h>
10#include <linux/compat.h>
11
12#include <cluster/masklog.h>
13
14#include "ocfs2.h"
15#include "alloc.h"
16#include "dlmglue.h"
17#include "file.h"
18#include "inode.h"
19#include "journal.h"
20
21#include "ocfs2_fs.h"
22#include "ioctl.h"
23#include "resize.h"
24#include "refcounttree.h"
25#include "sysfile.h"
26#include "dir.h"
27#include "buffer_head_io.h"
28#include "suballoc.h"
29#include "move_extents.h"
30
/*
 * Copy one complete o2info request structure between kernel and user
 * space.  The transfer length is always sizeof(a), where 'a' is the
 * kernel-side structure (an lvalue) and 'b' is the user-space pointer.
 * Callers in this file treat any non-zero result as a fault.
 *
 * 'b' is parenthesized so that an expression argument (for instance
 * "base + idx") is cast as a whole rather than only its first operand.
 */
#define o2info_from_user(a, b)	\
		copy_from_user(&(a), (b), sizeof(a))
#define o2info_to_user(a, b)	\
		copy_to_user((typeof(a) __user *)(b), &(a), sizeof(a))
35
36/*
37 * This call is void because we are already reporting an error that may
38 * be -EFAULT. The error will be returned from the ioctl(2) call. It's
39 * just a best-effort to tell userspace that this request caused the error.
40 */
41static inline void o2info_set_request_error(struct ocfs2_info_request *kreq,
42 struct ocfs2_info_request __user *req)
43{
44 kreq->ir_flags |= OCFS2_INFO_FL_ERROR;
45 (void)put_user(kreq->ir_flags, (__u32 __user *)&(req->ir_flags));
46}
47
48static inline void o2info_set_request_filled(struct ocfs2_info_request *req)
49{
50 req->ir_flags |= OCFS2_INFO_FL_FILLED;
51}
52
53static inline void o2info_clear_request_filled(struct ocfs2_info_request *req)
54{
55 req->ir_flags &= ~OCFS2_INFO_FL_FILLED;
56}
57
58static inline int o2info_coherent(struct ocfs2_info_request *req)
59{
60 return (!(req->ir_flags & OCFS2_INFO_FL_NON_COHERENT));
61}
62
63static int ocfs2_get_inode_attr(struct inode *inode, unsigned *flags)
64{
65 int status;
66
67 status = ocfs2_inode_lock(inode, NULL, 0);
68 if (status < 0) {
69 mlog_errno(status);
70 return status;
71 }
72 ocfs2_get_inode_flags(OCFS2_I(inode));
73 *flags = OCFS2_I(inode)->ip_attr;
74 ocfs2_inode_unlock(inode, 0);
75
76 return status;
77}
78
79static int ocfs2_set_inode_attr(struct inode *inode, unsigned flags,
80 unsigned mask)
81{
82 struct ocfs2_inode_info *ocfs2_inode = OCFS2_I(inode);
83 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
84 handle_t *handle = NULL;
85 struct buffer_head *bh = NULL;
86 unsigned oldflags;
87 int status;
88
89 mutex_lock(&inode->i_mutex);
90
91 status = ocfs2_inode_lock(inode, &bh, 1);
92 if (status < 0) {
93 mlog_errno(status);
94 goto bail;
95 }
96
97 status = -EACCES;
98 if (!inode_owner_or_capable(inode))
99 goto bail_unlock;
100
101 if (!S_ISDIR(inode->i_mode))
102 flags &= ~OCFS2_DIRSYNC_FL;
103
104 handle = ocfs2_start_trans(osb, OCFS2_INODE_UPDATE_CREDITS);
105 if (IS_ERR(handle)) {
106 status = PTR_ERR(handle);
107 mlog_errno(status);
108 goto bail_unlock;
109 }
110
111 oldflags = ocfs2_inode->ip_attr;
112 flags = flags & mask;
113 flags |= oldflags & ~mask;
114
115 /*
116 * The IMMUTABLE and APPEND_ONLY flags can only be changed by
117 * the relevant capability.
118 */
119 status = -EPERM;
120 if ((oldflags & OCFS2_IMMUTABLE_FL) || ((flags ^ oldflags) &
121 (OCFS2_APPEND_FL | OCFS2_IMMUTABLE_FL))) {
122 if (!capable(CAP_LINUX_IMMUTABLE))
123 goto bail_commit;
124 }
125
126 ocfs2_inode->ip_attr = flags;
127 ocfs2_set_inode_flags(inode);
128
129 status = ocfs2_mark_inode_dirty(handle, inode, bh);
130 if (status < 0)
131 mlog_errno(status);
132
133bail_commit:
134 ocfs2_commit_trans(osb, handle);
135bail_unlock:
136 ocfs2_inode_unlock(inode, 1);
137bail:
138 mutex_unlock(&inode->i_mutex);
139
140 brelse(bh);
141
142 return status;
143}
144
145int ocfs2_info_handle_blocksize(struct inode *inode,
146 struct ocfs2_info_request __user *req)
147{
148 int status = -EFAULT;
149 struct ocfs2_info_blocksize oib;
150
151 if (o2info_from_user(oib, req))
152 goto bail;
153
154 oib.ib_blocksize = inode->i_sb->s_blocksize;
155
156 o2info_set_request_filled(&oib.ib_req);
157
158 if (o2info_to_user(oib, req))
159 goto bail;
160
161 status = 0;
162bail:
163 if (status)
164 o2info_set_request_error(&oib.ib_req, req);
165
166 return status;
167}
168
169int ocfs2_info_handle_clustersize(struct inode *inode,
170 struct ocfs2_info_request __user *req)
171{
172 int status = -EFAULT;
173 struct ocfs2_info_clustersize oic;
174 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
175
176 if (o2info_from_user(oic, req))
177 goto bail;
178
179 oic.ic_clustersize = osb->s_clustersize;
180
181 o2info_set_request_filled(&oic.ic_req);
182
183 if (o2info_to_user(oic, req))
184 goto bail;
185
186 status = 0;
187bail:
188 if (status)
189 o2info_set_request_error(&oic.ic_req, req);
190
191 return status;
192}
193
194int ocfs2_info_handle_maxslots(struct inode *inode,
195 struct ocfs2_info_request __user *req)
196{
197 int status = -EFAULT;
198 struct ocfs2_info_maxslots oim;
199 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
200
201 if (o2info_from_user(oim, req))
202 goto bail;
203
204 oim.im_max_slots = osb->max_slots;
205
206 o2info_set_request_filled(&oim.im_req);
207
208 if (o2info_to_user(oim, req))
209 goto bail;
210
211 status = 0;
212bail:
213 if (status)
214 o2info_set_request_error(&oim.im_req, req);
215
216 return status;
217}
218
219int ocfs2_info_handle_label(struct inode *inode,
220 struct ocfs2_info_request __user *req)
221{
222 int status = -EFAULT;
223 struct ocfs2_info_label oil;
224 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
225
226 if (o2info_from_user(oil, req))
227 goto bail;
228
229 memcpy(oil.il_label, osb->vol_label, OCFS2_MAX_VOL_LABEL_LEN);
230
231 o2info_set_request_filled(&oil.il_req);
232
233 if (o2info_to_user(oil, req))
234 goto bail;
235
236 status = 0;
237bail:
238 if (status)
239 o2info_set_request_error(&oil.il_req, req);
240
241 return status;
242}
243
244int ocfs2_info_handle_uuid(struct inode *inode,
245 struct ocfs2_info_request __user *req)
246{
247 int status = -EFAULT;
248 struct ocfs2_info_uuid oiu;
249 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
250
251 if (o2info_from_user(oiu, req))
252 goto bail;
253
254 memcpy(oiu.iu_uuid_str, osb->uuid_str, OCFS2_TEXT_UUID_LEN + 1);
255
256 o2info_set_request_filled(&oiu.iu_req);
257
258 if (o2info_to_user(oiu, req))
259 goto bail;
260
261 status = 0;
262bail:
263 if (status)
264 o2info_set_request_error(&oiu.iu_req, req);
265
266 return status;
267}
268
269int ocfs2_info_handle_fs_features(struct inode *inode,
270 struct ocfs2_info_request __user *req)
271{
272 int status = -EFAULT;
273 struct ocfs2_info_fs_features oif;
274 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
275
276 if (o2info_from_user(oif, req))
277 goto bail;
278
279 oif.if_compat_features = osb->s_feature_compat;
280 oif.if_incompat_features = osb->s_feature_incompat;
281 oif.if_ro_compat_features = osb->s_feature_ro_compat;
282
283 o2info_set_request_filled(&oif.if_req);
284
285 if (o2info_to_user(oif, req))
286 goto bail;
287
288 status = 0;
289bail:
290 if (status)
291 o2info_set_request_error(&oif.if_req, req);
292
293 return status;
294}
295
296int ocfs2_info_handle_journal_size(struct inode *inode,
297 struct ocfs2_info_request __user *req)
298{
299 int status = -EFAULT;
300 struct ocfs2_info_journal_size oij;
301 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
302
303 if (o2info_from_user(oij, req))
304 goto bail;
305
306 oij.ij_journal_size = osb->journal->j_inode->i_size;
307
308 o2info_set_request_filled(&oij.ij_req);
309
310 if (o2info_to_user(oij, req))
311 goto bail;
312
313 status = 0;
314bail:
315 if (status)
316 o2info_set_request_error(&oij.ij_req, req);
317
318 return status;
319}
320
321int ocfs2_info_scan_inode_alloc(struct ocfs2_super *osb,
322 struct inode *inode_alloc, u64 blkno,
323 struct ocfs2_info_freeinode *fi, u32 slot)
324{
325 int status = 0, unlock = 0;
326
327 struct buffer_head *bh = NULL;
328 struct ocfs2_dinode *dinode_alloc = NULL;
329
330 if (inode_alloc)
331 mutex_lock(&inode_alloc->i_mutex);
332
333 if (o2info_coherent(&fi->ifi_req)) {
334 status = ocfs2_inode_lock(inode_alloc, &bh, 0);
335 if (status < 0) {
336 mlog_errno(status);
337 goto bail;
338 }
339 unlock = 1;
340 } else {
341 status = ocfs2_read_blocks_sync(osb, blkno, 1, &bh);
342 if (status < 0) {
343 mlog_errno(status);
344 goto bail;
345 }
346 }
347
348 dinode_alloc = (struct ocfs2_dinode *)bh->b_data;
349
350 fi->ifi_stat[slot].lfi_total =
351 le32_to_cpu(dinode_alloc->id1.bitmap1.i_total);
352 fi->ifi_stat[slot].lfi_free =
353 le32_to_cpu(dinode_alloc->id1.bitmap1.i_total) -
354 le32_to_cpu(dinode_alloc->id1.bitmap1.i_used);
355
356bail:
357 if (unlock)
358 ocfs2_inode_unlock(inode_alloc, 0);
359
360 if (inode_alloc)
361 mutex_unlock(&inode_alloc->i_mutex);
362
363 brelse(bh);
364
365 return status;
366}
367
368int ocfs2_info_handle_freeinode(struct inode *inode,
369 struct ocfs2_info_request __user *req)
370{
371 u32 i;
372 u64 blkno = -1;
373 char namebuf[40];
374 int status = -EFAULT, type = INODE_ALLOC_SYSTEM_INODE;
375 struct ocfs2_info_freeinode *oifi = NULL;
376 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
377 struct inode *inode_alloc = NULL;
378
379 oifi = kzalloc(sizeof(struct ocfs2_info_freeinode), GFP_KERNEL);
380 if (!oifi) {
381 status = -ENOMEM;
382 mlog_errno(status);
383 goto out_err;
384 }
385
386 if (o2info_from_user(*oifi, req))
387 goto bail;
388
389 oifi->ifi_slotnum = osb->max_slots;
390
391 for (i = 0; i < oifi->ifi_slotnum; i++) {
392 if (o2info_coherent(&oifi->ifi_req)) {
393 inode_alloc = ocfs2_get_system_file_inode(osb, type, i);
394 if (!inode_alloc) {
395 mlog(ML_ERROR, "unable to get alloc inode in "
396 "slot %u\n", i);
397 status = -EIO;
398 goto bail;
399 }
400 } else {
401 ocfs2_sprintf_system_inode_name(namebuf,
402 sizeof(namebuf),
403 type, i);
404 status = ocfs2_lookup_ino_from_name(osb->sys_root_inode,
405 namebuf,
406 strlen(namebuf),
407 &blkno);
408 if (status < 0) {
409 status = -ENOENT;
410 goto bail;
411 }
412 }
413
414 status = ocfs2_info_scan_inode_alloc(osb, inode_alloc, blkno, oifi, i);
415 if (status < 0)
416 goto bail;
417
418 iput(inode_alloc);
419 inode_alloc = NULL;
420 }
421
422 o2info_set_request_filled(&oifi->ifi_req);
423
424 if (o2info_to_user(*oifi, req))
425 goto bail;
426
427 status = 0;
428bail:
429 if (status)
430 o2info_set_request_error(&oifi->ifi_req, req);
431
432 kfree(oifi);
433out_err:
434 return status;
435}
436
437static void o2ffg_update_histogram(struct ocfs2_info_free_chunk_list *hist,
438 unsigned int chunksize)
439{
440 int index;
441
442 index = __ilog2_u32(chunksize);
443 if (index >= OCFS2_INFO_MAX_HIST)
444 index = OCFS2_INFO_MAX_HIST - 1;
445
446 hist->fc_chunks[index]++;
447 hist->fc_clusters[index] += chunksize;
448}
449
450static void o2ffg_update_stats(struct ocfs2_info_freefrag_stats *stats,
451 unsigned int chunksize)
452{
453 if (chunksize > stats->ffs_max)
454 stats->ffs_max = chunksize;
455
456 if (chunksize < stats->ffs_min)
457 stats->ffs_min = chunksize;
458
459 stats->ffs_avg += chunksize;
460 stats->ffs_free_chunks_real++;
461}
462
463void ocfs2_info_update_ffg(struct ocfs2_info_freefrag *ffg,
464 unsigned int chunksize)
465{
466 o2ffg_update_histogram(&(ffg->iff_ffs.ffs_fc_hist), chunksize);
467 o2ffg_update_stats(&(ffg->iff_ffs), chunksize);
468}
469
470int ocfs2_info_freefrag_scan_chain(struct ocfs2_super *osb,
471 struct inode *gb_inode,
472 struct ocfs2_dinode *gb_dinode,
473 struct ocfs2_chain_rec *rec,
474 struct ocfs2_info_freefrag *ffg,
475 u32 chunks_in_group)
476{
477 int status = 0, used;
478 u64 blkno;
479
480 struct buffer_head *bh = NULL;
481 struct ocfs2_group_desc *bg = NULL;
482
483 unsigned int max_bits, num_clusters;
484 unsigned int offset = 0, cluster, chunk;
485 unsigned int chunk_free, last_chunksize = 0;
486
487 if (!le32_to_cpu(rec->c_free))
488 goto bail;
489
490 do {
491 if (!bg)
492 blkno = le64_to_cpu(rec->c_blkno);
493 else
494 blkno = le64_to_cpu(bg->bg_next_group);
495
496 if (bh) {
497 brelse(bh);
498 bh = NULL;
499 }
500
501 if (o2info_coherent(&ffg->iff_req))
502 status = ocfs2_read_group_descriptor(gb_inode,
503 gb_dinode,
504 blkno, &bh);
505 else
506 status = ocfs2_read_blocks_sync(osb, blkno, 1, &bh);
507
508 if (status < 0) {
509 mlog(ML_ERROR, "Can't read the group descriptor # "
510 "%llu from device.", (unsigned long long)blkno);
511 status = -EIO;
512 goto bail;
513 }
514
515 bg = (struct ocfs2_group_desc *)bh->b_data;
516
517 if (!le16_to_cpu(bg->bg_free_bits_count))
518 continue;
519
520 max_bits = le16_to_cpu(bg->bg_bits);
521 offset = 0;
522
523 for (chunk = 0; chunk < chunks_in_group; chunk++) {
524 /*
525 * last chunk may be not an entire one.
526 */
527 if ((offset + ffg->iff_chunksize) > max_bits)
528 num_clusters = max_bits - offset;
529 else
530 num_clusters = ffg->iff_chunksize;
531
532 chunk_free = 0;
533 for (cluster = 0; cluster < num_clusters; cluster++) {
534 used = ocfs2_test_bit(offset,
535 (unsigned long *)bg->bg_bitmap);
536 /*
537 * - chunk_free counts free clusters in #N chunk.
538 * - last_chunksize records the size(in) clusters
539 * for the last real free chunk being counted.
540 */
541 if (!used) {
542 last_chunksize++;
543 chunk_free++;
544 }
545
546 if (used && last_chunksize) {
547 ocfs2_info_update_ffg(ffg,
548 last_chunksize);
549 last_chunksize = 0;
550 }
551
552 offset++;
553 }
554
555 if (chunk_free == ffg->iff_chunksize)
556 ffg->iff_ffs.ffs_free_chunks++;
557 }
558
559 /*
560 * need to update the info for last free chunk.
561 */
562 if (last_chunksize)
563 ocfs2_info_update_ffg(ffg, last_chunksize);
564
565 } while (le64_to_cpu(bg->bg_next_group));
566
567bail:
568 brelse(bh);
569
570 return status;
571}
572
573int ocfs2_info_freefrag_scan_bitmap(struct ocfs2_super *osb,
574 struct inode *gb_inode, u64 blkno,
575 struct ocfs2_info_freefrag *ffg)
576{
577 u32 chunks_in_group;
578 int status = 0, unlock = 0, i;
579
580 struct buffer_head *bh = NULL;
581 struct ocfs2_chain_list *cl = NULL;
582 struct ocfs2_chain_rec *rec = NULL;
583 struct ocfs2_dinode *gb_dinode = NULL;
584
585 if (gb_inode)
586 mutex_lock(&gb_inode->i_mutex);
587
588 if (o2info_coherent(&ffg->iff_req)) {
589 status = ocfs2_inode_lock(gb_inode, &bh, 0);
590 if (status < 0) {
591 mlog_errno(status);
592 goto bail;
593 }
594 unlock = 1;
595 } else {
596 status = ocfs2_read_blocks_sync(osb, blkno, 1, &bh);
597 if (status < 0) {
598 mlog_errno(status);
599 goto bail;
600 }
601 }
602
603 gb_dinode = (struct ocfs2_dinode *)bh->b_data;
604 cl = &(gb_dinode->id2.i_chain);
605
606 /*
607 * Chunksize(in) clusters from userspace should be
608 * less than clusters in a group.
609 */
610 if (ffg->iff_chunksize > le16_to_cpu(cl->cl_cpg)) {
611 status = -EINVAL;
612 goto bail;
613 }
614
615 memset(&ffg->iff_ffs, 0, sizeof(struct ocfs2_info_freefrag_stats));
616
617 ffg->iff_ffs.ffs_min = ~0U;
618 ffg->iff_ffs.ffs_clusters =
619 le32_to_cpu(gb_dinode->id1.bitmap1.i_total);
620 ffg->iff_ffs.ffs_free_clusters = ffg->iff_ffs.ffs_clusters -
621 le32_to_cpu(gb_dinode->id1.bitmap1.i_used);
622
623 chunks_in_group = le16_to_cpu(cl->cl_cpg) / ffg->iff_chunksize + 1;
624
625 for (i = 0; i < le16_to_cpu(cl->cl_next_free_rec); i++) {
626 rec = &(cl->cl_recs[i]);
627 status = ocfs2_info_freefrag_scan_chain(osb, gb_inode,
628 gb_dinode,
629 rec, ffg,
630 chunks_in_group);
631 if (status)
632 goto bail;
633 }
634
635 if (ffg->iff_ffs.ffs_free_chunks_real)
636 ffg->iff_ffs.ffs_avg = (ffg->iff_ffs.ffs_avg /
637 ffg->iff_ffs.ffs_free_chunks_real);
638bail:
639 if (unlock)
640 ocfs2_inode_unlock(gb_inode, 0);
641
642 if (gb_inode)
643 mutex_unlock(&gb_inode->i_mutex);
644
645 if (gb_inode)
646 iput(gb_inode);
647
648 brelse(bh);
649
650 return status;
651}
652
653int ocfs2_info_handle_freefrag(struct inode *inode,
654 struct ocfs2_info_request __user *req)
655{
656 u64 blkno = -1;
657 char namebuf[40];
658 int status = -EFAULT, type = GLOBAL_BITMAP_SYSTEM_INODE;
659
660 struct ocfs2_info_freefrag *oiff;
661 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
662 struct inode *gb_inode = NULL;
663
664 oiff = kzalloc(sizeof(struct ocfs2_info_freefrag), GFP_KERNEL);
665 if (!oiff) {
666 status = -ENOMEM;
667 mlog_errno(status);
668 goto out_err;
669 }
670
671 if (o2info_from_user(*oiff, req))
672 goto bail;
673 /*
674 * chunksize from userspace should be power of 2.
675 */
676 if ((oiff->iff_chunksize & (oiff->iff_chunksize - 1)) ||
677 (!oiff->iff_chunksize)) {
678 status = -EINVAL;
679 goto bail;
680 }
681
682 if (o2info_coherent(&oiff->iff_req)) {
683 gb_inode = ocfs2_get_system_file_inode(osb, type,
684 OCFS2_INVALID_SLOT);
685 if (!gb_inode) {
686 mlog(ML_ERROR, "unable to get global_bitmap inode\n");
687 status = -EIO;
688 goto bail;
689 }
690 } else {
691 ocfs2_sprintf_system_inode_name(namebuf, sizeof(namebuf), type,
692 OCFS2_INVALID_SLOT);
693 status = ocfs2_lookup_ino_from_name(osb->sys_root_inode,
694 namebuf,
695 strlen(namebuf),
696 &blkno);
697 if (status < 0) {
698 status = -ENOENT;
699 goto bail;
700 }
701 }
702
703 status = ocfs2_info_freefrag_scan_bitmap(osb, gb_inode, blkno, oiff);
704 if (status < 0)
705 goto bail;
706
707 o2info_set_request_filled(&oiff->iff_req);
708
709 if (o2info_to_user(*oiff, req))
710 goto bail;
711
712 status = 0;
713bail:
714 if (status)
715 o2info_set_request_error(&oiff->iff_req, req);
716
717 kfree(oiff);
718out_err:
719 return status;
720}
721
722int ocfs2_info_handle_unknown(struct inode *inode,
723 struct ocfs2_info_request __user *req)
724{
725 int status = -EFAULT;
726 struct ocfs2_info_request oir;
727
728 if (o2info_from_user(oir, req))
729 goto bail;
730
731 o2info_clear_request_filled(&oir);
732
733 if (o2info_to_user(oir, req))
734 goto bail;
735
736 status = 0;
737bail:
738 if (status)
739 o2info_set_request_error(&oir, req);
740
741 return status;
742}
743
744/*
745 * Validate and distinguish OCFS2_IOC_INFO requests.
746 *
747 * - validate the magic number.
748 * - distinguish different requests.
749 * - validate size of different requests.
750 */
751int ocfs2_info_handle_request(struct inode *inode,
752 struct ocfs2_info_request __user *req)
753{
754 int status = -EFAULT;
755 struct ocfs2_info_request oir;
756
757 if (o2info_from_user(oir, req))
758 goto bail;
759
760 status = -EINVAL;
761 if (oir.ir_magic != OCFS2_INFO_MAGIC)
762 goto bail;
763
764 switch (oir.ir_code) {
765 case OCFS2_INFO_BLOCKSIZE:
766 if (oir.ir_size == sizeof(struct ocfs2_info_blocksize))
767 status = ocfs2_info_handle_blocksize(inode, req);
768 break;
769 case OCFS2_INFO_CLUSTERSIZE:
770 if (oir.ir_size == sizeof(struct ocfs2_info_clustersize))
771 status = ocfs2_info_handle_clustersize(inode, req);
772 break;
773 case OCFS2_INFO_MAXSLOTS:
774 if (oir.ir_size == sizeof(struct ocfs2_info_maxslots))
775 status = ocfs2_info_handle_maxslots(inode, req);
776 break;
777 case OCFS2_INFO_LABEL:
778 if (oir.ir_size == sizeof(struct ocfs2_info_label))
779 status = ocfs2_info_handle_label(inode, req);
780 break;
781 case OCFS2_INFO_UUID:
782 if (oir.ir_size == sizeof(struct ocfs2_info_uuid))
783 status = ocfs2_info_handle_uuid(inode, req);
784 break;
785 case OCFS2_INFO_FS_FEATURES:
786 if (oir.ir_size == sizeof(struct ocfs2_info_fs_features))
787 status = ocfs2_info_handle_fs_features(inode, req);
788 break;
789 case OCFS2_INFO_JOURNAL_SIZE:
790 if (oir.ir_size == sizeof(struct ocfs2_info_journal_size))
791 status = ocfs2_info_handle_journal_size(inode, req);
792 break;
793 case OCFS2_INFO_FREEINODE:
794 if (oir.ir_size == sizeof(struct ocfs2_info_freeinode))
795 status = ocfs2_info_handle_freeinode(inode, req);
796 break;
797 case OCFS2_INFO_FREEFRAG:
798 if (oir.ir_size == sizeof(struct ocfs2_info_freefrag))
799 status = ocfs2_info_handle_freefrag(inode, req);
800 break;
801 default:
802 status = ocfs2_info_handle_unknown(inode, req);
803 break;
804 }
805
806bail:
807 return status;
808}
809
810int ocfs2_get_request_ptr(struct ocfs2_info *info, int idx,
811 u64 *req_addr, int compat_flag)
812{
813 int status = -EFAULT;
814 u64 __user *bp = NULL;
815
816 if (compat_flag) {
817#ifdef CONFIG_COMPAT
818 /*
819 * pointer bp stores the base address of a pointers array,
820 * which collects all addresses of separate request.
821 */
822 bp = (u64 __user *)(unsigned long)compat_ptr(info->oi_requests);
823#else
824 BUG();
825#endif
826 } else
827 bp = (u64 __user *)(unsigned long)(info->oi_requests);
828
829 if (o2info_from_user(*req_addr, bp + idx))
830 goto bail;
831
832 status = 0;
833bail:
834 return status;
835}
836
/*
 * OCFS2_IOC_INFO handles an array of requests passed from userspace.
 *
 * ocfs2_info_handle() receives a large info aggregation, grabs and
 * validates the request count from the header, then breaks it into
 * small pieces so that specific handlers can process them one by one.
 *
 * The idea is to keep each separate request small enough to ensure
 * better backward and forward compatibility, since a small request is
 * less likely to break if the disk layout changes.
 */
848int ocfs2_info_handle(struct inode *inode, struct ocfs2_info *info,
849 int compat_flag)
850{
851 int i, status = 0;
852 u64 req_addr;
853 struct ocfs2_info_request __user *reqp;
854
855 if ((info->oi_count > OCFS2_INFO_MAX_REQUEST) ||
856 (!info->oi_requests)) {
857 status = -EINVAL;
858 goto bail;
859 }
860
861 for (i = 0; i < info->oi_count; i++) {
862
863 status = ocfs2_get_request_ptr(info, i, &req_addr, compat_flag);
864 if (status)
865 break;
866
867 reqp = (struct ocfs2_info_request __user *)(unsigned long)req_addr;
868 if (!reqp) {
869 status = -EINVAL;
870 goto bail;
871 }
872
873 status = ocfs2_info_handle_request(inode, reqp);
874 if (status)
875 break;
876 }
877
878bail:
879 return status;
880}
881
882long ocfs2_ioctl(struct file *filp, unsigned int cmd, unsigned long arg)
883{
884 struct inode *inode = filp->f_path.dentry->d_inode;
885 unsigned int flags;
886 int new_clusters;
887 int status;
888 struct ocfs2_space_resv sr;
889 struct ocfs2_new_group_input input;
890 struct reflink_arguments args;
891 const char __user *old_path;
892 const char __user *new_path;
893 bool preserve;
894 struct ocfs2_info info;
895 void __user *argp = (void __user *)arg;
896
897 switch (cmd) {
898 case OCFS2_IOC_GETFLAGS:
899 status = ocfs2_get_inode_attr(inode, &flags);
900 if (status < 0)
901 return status;
902
903 flags &= OCFS2_FL_VISIBLE;
904 return put_user(flags, (int __user *) arg);
905 case OCFS2_IOC_SETFLAGS:
906 if (get_user(flags, (int __user *) arg))
907 return -EFAULT;
908
909 status = mnt_want_write_file(filp);
910 if (status)
911 return status;
912 status = ocfs2_set_inode_attr(inode, flags,
913 OCFS2_FL_MODIFIABLE);
914 mnt_drop_write_file(filp);
915 return status;
916 case OCFS2_IOC_RESVSP:
917 case OCFS2_IOC_RESVSP64:
918 case OCFS2_IOC_UNRESVSP:
919 case OCFS2_IOC_UNRESVSP64:
920 if (copy_from_user(&sr, (int __user *) arg, sizeof(sr)))
921 return -EFAULT;
922
923 return ocfs2_change_file_space(filp, cmd, &sr);
924 case OCFS2_IOC_GROUP_EXTEND:
925 if (!capable(CAP_SYS_RESOURCE))
926 return -EPERM;
927
928 if (get_user(new_clusters, (int __user *)arg))
929 return -EFAULT;
930
931 return ocfs2_group_extend(inode, new_clusters);
932 case OCFS2_IOC_GROUP_ADD:
933 case OCFS2_IOC_GROUP_ADD64:
934 if (!capable(CAP_SYS_RESOURCE))
935 return -EPERM;
936
937 if (copy_from_user(&input, (int __user *) arg, sizeof(input)))
938 return -EFAULT;
939
940 return ocfs2_group_add(inode, &input);
941 case OCFS2_IOC_REFLINK:
942 if (copy_from_user(&args, argp, sizeof(args)))
943 return -EFAULT;
944 old_path = (const char __user *)(unsigned long)args.old_path;
945 new_path = (const char __user *)(unsigned long)args.new_path;
946 preserve = (args.preserve != 0);
947
948 return ocfs2_reflink_ioctl(inode, old_path, new_path, preserve);
949 case OCFS2_IOC_INFO:
950 if (copy_from_user(&info, argp, sizeof(struct ocfs2_info)))
951 return -EFAULT;
952
953 return ocfs2_info_handle(inode, &info, 0);
954 case FITRIM:
955 {
956 struct super_block *sb = inode->i_sb;
957 struct fstrim_range range;
958 int ret = 0;
959
960 if (!capable(CAP_SYS_ADMIN))
961 return -EPERM;
962
963 if (copy_from_user(&range, argp, sizeof(range)))
964 return -EFAULT;
965
966 ret = ocfs2_trim_fs(sb, &range);
967 if (ret < 0)
968 return ret;
969
970 if (copy_to_user(argp, &range, sizeof(range)))
971 return -EFAULT;
972
973 return 0;
974 }
975 case OCFS2_IOC_MOVE_EXT:
976 return ocfs2_ioctl_move_extents(filp, argp);
977 default:
978 return -ENOTTY;
979 }
980}
981
982#ifdef CONFIG_COMPAT
983long ocfs2_compat_ioctl(struct file *file, unsigned cmd, unsigned long arg)
984{
985 bool preserve;
986 struct reflink_arguments args;
987 struct inode *inode = file->f_path.dentry->d_inode;
988 struct ocfs2_info info;
989 void __user *argp = (void __user *)arg;
990
991 switch (cmd) {
992 case OCFS2_IOC32_GETFLAGS:
993 cmd = OCFS2_IOC_GETFLAGS;
994 break;
995 case OCFS2_IOC32_SETFLAGS:
996 cmd = OCFS2_IOC_SETFLAGS;
997 break;
998 case OCFS2_IOC_RESVSP:
999 case OCFS2_IOC_RESVSP64:
1000 case OCFS2_IOC_UNRESVSP:
1001 case OCFS2_IOC_UNRESVSP64:
1002 case OCFS2_IOC_GROUP_EXTEND:
1003 case OCFS2_IOC_GROUP_ADD:
1004 case OCFS2_IOC_GROUP_ADD64:
1005 case FITRIM:
1006 break;
1007 case OCFS2_IOC_REFLINK:
1008 if (copy_from_user(&args, argp, sizeof(args)))
1009 return -EFAULT;
1010 preserve = (args.preserve != 0);
1011
1012 return ocfs2_reflink_ioctl(inode, compat_ptr(args.old_path),
1013 compat_ptr(args.new_path), preserve);
1014 case OCFS2_IOC_INFO:
1015 if (copy_from_user(&info, argp, sizeof(struct ocfs2_info)))
1016 return -EFAULT;
1017
1018 return ocfs2_info_handle(inode, &info, 1);
1019 case OCFS2_IOC_MOVE_EXT:
1020 break;
1021 default:
1022 return -ENOIOCTLCMD;
1023 }
1024
1025 return ocfs2_ioctl(file, cmd, arg);
1026}
1027#endif