Loading...
1/*
2 * linux/fs/ocfs2/ioctl.c
3 *
4 * Copyright (C) 2006 Herbert Poetzl
5 * adapted from Remy Card's ext2/ioctl.c
6 */
7
8#include <linux/fs.h>
9#include <linux/mount.h>
10#include <linux/compat.h>
11
12#include <cluster/masklog.h>
13
14#include "ocfs2.h"
15#include "alloc.h"
16#include "dlmglue.h"
17#include "file.h"
18#include "inode.h"
19#include "journal.h"
20
21#include "ocfs2_fs.h"
22#include "ioctl.h"
23#include "resize.h"
24#include "refcounttree.h"
25#include "sysfile.h"
26#include "dir.h"
27#include "buffer_head_io.h"
28#include "suballoc.h"
29#include "move_extents.h"
30
31#include <linux/ext2_fs.h>
32
/*
 * Copy a whole request structure between kernel and user space.
 *
 * @a: kernel-side object (an lvalue; its size determines the copy length).
 * @b: user-space pointer to the matching request.
 *
 * Both expand to copy_{from,to}_user(); callers in this file treat a
 * non-zero result as failure. Every macro argument is parenthesized so
 * that an expression passed as @b cannot bind to the cast.
 */
#define o2info_from_user(a, b)	\
		copy_from_user(&(a), (b), sizeof(a))
#define o2info_to_user(a, b)	\
		copy_to_user((typeof(a) __user *)(b), &(a), sizeof(a))
37
38/*
39 * This call is void because we are already reporting an error that may
40 * be -EFAULT. The error will be returned from the ioctl(2) call. It's
41 * just a best-effort to tell userspace that this request caused the error.
42 */
43static inline void o2info_set_request_error(struct ocfs2_info_request *kreq,
44 struct ocfs2_info_request __user *req)
45{
46 kreq->ir_flags |= OCFS2_INFO_FL_ERROR;
47 (void)put_user(kreq->ir_flags, (__u32 __user *)&(req->ir_flags));
48}
49
50static inline void o2info_set_request_filled(struct ocfs2_info_request *req)
51{
52 req->ir_flags |= OCFS2_INFO_FL_FILLED;
53}
54
55static inline void o2info_clear_request_filled(struct ocfs2_info_request *req)
56{
57 req->ir_flags &= ~OCFS2_INFO_FL_FILLED;
58}
59
60static inline int o2info_coherent(struct ocfs2_info_request *req)
61{
62 return (!(req->ir_flags & OCFS2_INFO_FL_NON_COHERENT));
63}
64
65static int ocfs2_get_inode_attr(struct inode *inode, unsigned *flags)
66{
67 int status;
68
69 status = ocfs2_inode_lock(inode, NULL, 0);
70 if (status < 0) {
71 mlog_errno(status);
72 return status;
73 }
74 ocfs2_get_inode_flags(OCFS2_I(inode));
75 *flags = OCFS2_I(inode)->ip_attr;
76 ocfs2_inode_unlock(inode, 0);
77
78 return status;
79}
80
81static int ocfs2_set_inode_attr(struct inode *inode, unsigned flags,
82 unsigned mask)
83{
84 struct ocfs2_inode_info *ocfs2_inode = OCFS2_I(inode);
85 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
86 handle_t *handle = NULL;
87 struct buffer_head *bh = NULL;
88 unsigned oldflags;
89 int status;
90
91 mutex_lock(&inode->i_mutex);
92
93 status = ocfs2_inode_lock(inode, &bh, 1);
94 if (status < 0) {
95 mlog_errno(status);
96 goto bail;
97 }
98
99 status = -EACCES;
100 if (!inode_owner_or_capable(inode))
101 goto bail_unlock;
102
103 if (!S_ISDIR(inode->i_mode))
104 flags &= ~OCFS2_DIRSYNC_FL;
105
106 handle = ocfs2_start_trans(osb, OCFS2_INODE_UPDATE_CREDITS);
107 if (IS_ERR(handle)) {
108 status = PTR_ERR(handle);
109 mlog_errno(status);
110 goto bail_unlock;
111 }
112
113 oldflags = ocfs2_inode->ip_attr;
114 flags = flags & mask;
115 flags |= oldflags & ~mask;
116
117 /*
118 * The IMMUTABLE and APPEND_ONLY flags can only be changed by
119 * the relevant capability.
120 */
121 status = -EPERM;
122 if ((oldflags & OCFS2_IMMUTABLE_FL) || ((flags ^ oldflags) &
123 (OCFS2_APPEND_FL | OCFS2_IMMUTABLE_FL))) {
124 if (!capable(CAP_LINUX_IMMUTABLE))
125 goto bail_unlock;
126 }
127
128 ocfs2_inode->ip_attr = flags;
129 ocfs2_set_inode_flags(inode);
130
131 status = ocfs2_mark_inode_dirty(handle, inode, bh);
132 if (status < 0)
133 mlog_errno(status);
134
135 ocfs2_commit_trans(osb, handle);
136bail_unlock:
137 ocfs2_inode_unlock(inode, 1);
138bail:
139 mutex_unlock(&inode->i_mutex);
140
141 brelse(bh);
142
143 return status;
144}
145
146int ocfs2_info_handle_blocksize(struct inode *inode,
147 struct ocfs2_info_request __user *req)
148{
149 int status = -EFAULT;
150 struct ocfs2_info_blocksize oib;
151
152 if (o2info_from_user(oib, req))
153 goto bail;
154
155 oib.ib_blocksize = inode->i_sb->s_blocksize;
156
157 o2info_set_request_filled(&oib.ib_req);
158
159 if (o2info_to_user(oib, req))
160 goto bail;
161
162 status = 0;
163bail:
164 if (status)
165 o2info_set_request_error(&oib.ib_req, req);
166
167 return status;
168}
169
170int ocfs2_info_handle_clustersize(struct inode *inode,
171 struct ocfs2_info_request __user *req)
172{
173 int status = -EFAULT;
174 struct ocfs2_info_clustersize oic;
175 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
176
177 if (o2info_from_user(oic, req))
178 goto bail;
179
180 oic.ic_clustersize = osb->s_clustersize;
181
182 o2info_set_request_filled(&oic.ic_req);
183
184 if (o2info_to_user(oic, req))
185 goto bail;
186
187 status = 0;
188bail:
189 if (status)
190 o2info_set_request_error(&oic.ic_req, req);
191
192 return status;
193}
194
195int ocfs2_info_handle_maxslots(struct inode *inode,
196 struct ocfs2_info_request __user *req)
197{
198 int status = -EFAULT;
199 struct ocfs2_info_maxslots oim;
200 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
201
202 if (o2info_from_user(oim, req))
203 goto bail;
204
205 oim.im_max_slots = osb->max_slots;
206
207 o2info_set_request_filled(&oim.im_req);
208
209 if (o2info_to_user(oim, req))
210 goto bail;
211
212 status = 0;
213bail:
214 if (status)
215 o2info_set_request_error(&oim.im_req, req);
216
217 return status;
218}
219
220int ocfs2_info_handle_label(struct inode *inode,
221 struct ocfs2_info_request __user *req)
222{
223 int status = -EFAULT;
224 struct ocfs2_info_label oil;
225 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
226
227 if (o2info_from_user(oil, req))
228 goto bail;
229
230 memcpy(oil.il_label, osb->vol_label, OCFS2_MAX_VOL_LABEL_LEN);
231
232 o2info_set_request_filled(&oil.il_req);
233
234 if (o2info_to_user(oil, req))
235 goto bail;
236
237 status = 0;
238bail:
239 if (status)
240 o2info_set_request_error(&oil.il_req, req);
241
242 return status;
243}
244
245int ocfs2_info_handle_uuid(struct inode *inode,
246 struct ocfs2_info_request __user *req)
247{
248 int status = -EFAULT;
249 struct ocfs2_info_uuid oiu;
250 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
251
252 if (o2info_from_user(oiu, req))
253 goto bail;
254
255 memcpy(oiu.iu_uuid_str, osb->uuid_str, OCFS2_TEXT_UUID_LEN + 1);
256
257 o2info_set_request_filled(&oiu.iu_req);
258
259 if (o2info_to_user(oiu, req))
260 goto bail;
261
262 status = 0;
263bail:
264 if (status)
265 o2info_set_request_error(&oiu.iu_req, req);
266
267 return status;
268}
269
270int ocfs2_info_handle_fs_features(struct inode *inode,
271 struct ocfs2_info_request __user *req)
272{
273 int status = -EFAULT;
274 struct ocfs2_info_fs_features oif;
275 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
276
277 if (o2info_from_user(oif, req))
278 goto bail;
279
280 oif.if_compat_features = osb->s_feature_compat;
281 oif.if_incompat_features = osb->s_feature_incompat;
282 oif.if_ro_compat_features = osb->s_feature_ro_compat;
283
284 o2info_set_request_filled(&oif.if_req);
285
286 if (o2info_to_user(oif, req))
287 goto bail;
288
289 status = 0;
290bail:
291 if (status)
292 o2info_set_request_error(&oif.if_req, req);
293
294 return status;
295}
296
297int ocfs2_info_handle_journal_size(struct inode *inode,
298 struct ocfs2_info_request __user *req)
299{
300 int status = -EFAULT;
301 struct ocfs2_info_journal_size oij;
302 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
303
304 if (o2info_from_user(oij, req))
305 goto bail;
306
307 oij.ij_journal_size = osb->journal->j_inode->i_size;
308
309 o2info_set_request_filled(&oij.ij_req);
310
311 if (o2info_to_user(oij, req))
312 goto bail;
313
314 status = 0;
315bail:
316 if (status)
317 o2info_set_request_error(&oij.ij_req, req);
318
319 return status;
320}
321
322int ocfs2_info_scan_inode_alloc(struct ocfs2_super *osb,
323 struct inode *inode_alloc, u64 blkno,
324 struct ocfs2_info_freeinode *fi, u32 slot)
325{
326 int status = 0, unlock = 0;
327
328 struct buffer_head *bh = NULL;
329 struct ocfs2_dinode *dinode_alloc = NULL;
330
331 if (inode_alloc)
332 mutex_lock(&inode_alloc->i_mutex);
333
334 if (o2info_coherent(&fi->ifi_req)) {
335 status = ocfs2_inode_lock(inode_alloc, &bh, 0);
336 if (status < 0) {
337 mlog_errno(status);
338 goto bail;
339 }
340 unlock = 1;
341 } else {
342 status = ocfs2_read_blocks_sync(osb, blkno, 1, &bh);
343 if (status < 0) {
344 mlog_errno(status);
345 goto bail;
346 }
347 }
348
349 dinode_alloc = (struct ocfs2_dinode *)bh->b_data;
350
351 fi->ifi_stat[slot].lfi_total =
352 le32_to_cpu(dinode_alloc->id1.bitmap1.i_total);
353 fi->ifi_stat[slot].lfi_free =
354 le32_to_cpu(dinode_alloc->id1.bitmap1.i_total) -
355 le32_to_cpu(dinode_alloc->id1.bitmap1.i_used);
356
357bail:
358 if (unlock)
359 ocfs2_inode_unlock(inode_alloc, 0);
360
361 if (inode_alloc)
362 mutex_unlock(&inode_alloc->i_mutex);
363
364 brelse(bh);
365
366 return status;
367}
368
369int ocfs2_info_handle_freeinode(struct inode *inode,
370 struct ocfs2_info_request __user *req)
371{
372 u32 i;
373 u64 blkno = -1;
374 char namebuf[40];
375 int status = -EFAULT, type = INODE_ALLOC_SYSTEM_INODE;
376 struct ocfs2_info_freeinode *oifi = NULL;
377 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
378 struct inode *inode_alloc = NULL;
379
380 oifi = kzalloc(sizeof(struct ocfs2_info_freeinode), GFP_KERNEL);
381 if (!oifi) {
382 status = -ENOMEM;
383 mlog_errno(status);
384 goto bail;
385 }
386
387 if (o2info_from_user(*oifi, req))
388 goto bail;
389
390 oifi->ifi_slotnum = osb->max_slots;
391
392 for (i = 0; i < oifi->ifi_slotnum; i++) {
393 if (o2info_coherent(&oifi->ifi_req)) {
394 inode_alloc = ocfs2_get_system_file_inode(osb, type, i);
395 if (!inode_alloc) {
396 mlog(ML_ERROR, "unable to get alloc inode in "
397 "slot %u\n", i);
398 status = -EIO;
399 goto bail;
400 }
401 } else {
402 ocfs2_sprintf_system_inode_name(namebuf,
403 sizeof(namebuf),
404 type, i);
405 status = ocfs2_lookup_ino_from_name(osb->sys_root_inode,
406 namebuf,
407 strlen(namebuf),
408 &blkno);
409 if (status < 0) {
410 status = -ENOENT;
411 goto bail;
412 }
413 }
414
415 status = ocfs2_info_scan_inode_alloc(osb, inode_alloc, blkno, oifi, i);
416 if (status < 0)
417 goto bail;
418
419 iput(inode_alloc);
420 inode_alloc = NULL;
421 }
422
423 o2info_set_request_filled(&oifi->ifi_req);
424
425 if (o2info_to_user(*oifi, req))
426 goto bail;
427
428 status = 0;
429bail:
430 if (status)
431 o2info_set_request_error(&oifi->ifi_req, req);
432
433 kfree(oifi);
434
435 return status;
436}
437
438static void o2ffg_update_histogram(struct ocfs2_info_free_chunk_list *hist,
439 unsigned int chunksize)
440{
441 int index;
442
443 index = __ilog2_u32(chunksize);
444 if (index >= OCFS2_INFO_MAX_HIST)
445 index = OCFS2_INFO_MAX_HIST - 1;
446
447 hist->fc_chunks[index]++;
448 hist->fc_clusters[index] += chunksize;
449}
450
451static void o2ffg_update_stats(struct ocfs2_info_freefrag_stats *stats,
452 unsigned int chunksize)
453{
454 if (chunksize > stats->ffs_max)
455 stats->ffs_max = chunksize;
456
457 if (chunksize < stats->ffs_min)
458 stats->ffs_min = chunksize;
459
460 stats->ffs_avg += chunksize;
461 stats->ffs_free_chunks_real++;
462}
463
464void ocfs2_info_update_ffg(struct ocfs2_info_freefrag *ffg,
465 unsigned int chunksize)
466{
467 o2ffg_update_histogram(&(ffg->iff_ffs.ffs_fc_hist), chunksize);
468 o2ffg_update_stats(&(ffg->iff_ffs), chunksize);
469}
470
471int ocfs2_info_freefrag_scan_chain(struct ocfs2_super *osb,
472 struct inode *gb_inode,
473 struct ocfs2_dinode *gb_dinode,
474 struct ocfs2_chain_rec *rec,
475 struct ocfs2_info_freefrag *ffg,
476 u32 chunks_in_group)
477{
478 int status = 0, used;
479 u64 blkno;
480
481 struct buffer_head *bh = NULL;
482 struct ocfs2_group_desc *bg = NULL;
483
484 unsigned int max_bits, num_clusters;
485 unsigned int offset = 0, cluster, chunk;
486 unsigned int chunk_free, last_chunksize = 0;
487
488 if (!le32_to_cpu(rec->c_free))
489 goto bail;
490
491 do {
492 if (!bg)
493 blkno = le64_to_cpu(rec->c_blkno);
494 else
495 blkno = le64_to_cpu(bg->bg_next_group);
496
497 if (bh) {
498 brelse(bh);
499 bh = NULL;
500 }
501
502 if (o2info_coherent(&ffg->iff_req))
503 status = ocfs2_read_group_descriptor(gb_inode,
504 gb_dinode,
505 blkno, &bh);
506 else
507 status = ocfs2_read_blocks_sync(osb, blkno, 1, &bh);
508
509 if (status < 0) {
510 mlog(ML_ERROR, "Can't read the group descriptor # "
511 "%llu from device.", (unsigned long long)blkno);
512 status = -EIO;
513 goto bail;
514 }
515
516 bg = (struct ocfs2_group_desc *)bh->b_data;
517
518 if (!le16_to_cpu(bg->bg_free_bits_count))
519 continue;
520
521 max_bits = le16_to_cpu(bg->bg_bits);
522 offset = 0;
523
524 for (chunk = 0; chunk < chunks_in_group; chunk++) {
525 /*
526 * last chunk may be not an entire one.
527 */
528 if ((offset + ffg->iff_chunksize) > max_bits)
529 num_clusters = max_bits - offset;
530 else
531 num_clusters = ffg->iff_chunksize;
532
533 chunk_free = 0;
534 for (cluster = 0; cluster < num_clusters; cluster++) {
535 used = ocfs2_test_bit(offset,
536 (unsigned long *)bg->bg_bitmap);
537 /*
538 * - chunk_free counts free clusters in #N chunk.
539 * - last_chunksize records the size(in) clusters
540 * for the last real free chunk being counted.
541 */
542 if (!used) {
543 last_chunksize++;
544 chunk_free++;
545 }
546
547 if (used && last_chunksize) {
548 ocfs2_info_update_ffg(ffg,
549 last_chunksize);
550 last_chunksize = 0;
551 }
552
553 offset++;
554 }
555
556 if (chunk_free == ffg->iff_chunksize)
557 ffg->iff_ffs.ffs_free_chunks++;
558 }
559
560 /*
561 * need to update the info for last free chunk.
562 */
563 if (last_chunksize)
564 ocfs2_info_update_ffg(ffg, last_chunksize);
565
566 } while (le64_to_cpu(bg->bg_next_group));
567
568bail:
569 brelse(bh);
570
571 return status;
572}
573
574int ocfs2_info_freefrag_scan_bitmap(struct ocfs2_super *osb,
575 struct inode *gb_inode, u64 blkno,
576 struct ocfs2_info_freefrag *ffg)
577{
578 u32 chunks_in_group;
579 int status = 0, unlock = 0, i;
580
581 struct buffer_head *bh = NULL;
582 struct ocfs2_chain_list *cl = NULL;
583 struct ocfs2_chain_rec *rec = NULL;
584 struct ocfs2_dinode *gb_dinode = NULL;
585
586 if (gb_inode)
587 mutex_lock(&gb_inode->i_mutex);
588
589 if (o2info_coherent(&ffg->iff_req)) {
590 status = ocfs2_inode_lock(gb_inode, &bh, 0);
591 if (status < 0) {
592 mlog_errno(status);
593 goto bail;
594 }
595 unlock = 1;
596 } else {
597 status = ocfs2_read_blocks_sync(osb, blkno, 1, &bh);
598 if (status < 0) {
599 mlog_errno(status);
600 goto bail;
601 }
602 }
603
604 gb_dinode = (struct ocfs2_dinode *)bh->b_data;
605 cl = &(gb_dinode->id2.i_chain);
606
607 /*
608 * Chunksize(in) clusters from userspace should be
609 * less than clusters in a group.
610 */
611 if (ffg->iff_chunksize > le16_to_cpu(cl->cl_cpg)) {
612 status = -EINVAL;
613 goto bail;
614 }
615
616 memset(&ffg->iff_ffs, 0, sizeof(struct ocfs2_info_freefrag_stats));
617
618 ffg->iff_ffs.ffs_min = ~0U;
619 ffg->iff_ffs.ffs_clusters =
620 le32_to_cpu(gb_dinode->id1.bitmap1.i_total);
621 ffg->iff_ffs.ffs_free_clusters = ffg->iff_ffs.ffs_clusters -
622 le32_to_cpu(gb_dinode->id1.bitmap1.i_used);
623
624 chunks_in_group = le16_to_cpu(cl->cl_cpg) / ffg->iff_chunksize + 1;
625
626 for (i = 0; i < le16_to_cpu(cl->cl_next_free_rec); i++) {
627 rec = &(cl->cl_recs[i]);
628 status = ocfs2_info_freefrag_scan_chain(osb, gb_inode,
629 gb_dinode,
630 rec, ffg,
631 chunks_in_group);
632 if (status)
633 goto bail;
634 }
635
636 if (ffg->iff_ffs.ffs_free_chunks_real)
637 ffg->iff_ffs.ffs_avg = (ffg->iff_ffs.ffs_avg /
638 ffg->iff_ffs.ffs_free_chunks_real);
639bail:
640 if (unlock)
641 ocfs2_inode_unlock(gb_inode, 0);
642
643 if (gb_inode)
644 mutex_unlock(&gb_inode->i_mutex);
645
646 if (gb_inode)
647 iput(gb_inode);
648
649 brelse(bh);
650
651 return status;
652}
653
654int ocfs2_info_handle_freefrag(struct inode *inode,
655 struct ocfs2_info_request __user *req)
656{
657 u64 blkno = -1;
658 char namebuf[40];
659 int status = -EFAULT, type = GLOBAL_BITMAP_SYSTEM_INODE;
660
661 struct ocfs2_info_freefrag *oiff;
662 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
663 struct inode *gb_inode = NULL;
664
665 oiff = kzalloc(sizeof(struct ocfs2_info_freefrag), GFP_KERNEL);
666 if (!oiff) {
667 status = -ENOMEM;
668 mlog_errno(status);
669 goto bail;
670 }
671
672 if (o2info_from_user(*oiff, req))
673 goto bail;
674 /*
675 * chunksize from userspace should be power of 2.
676 */
677 if ((oiff->iff_chunksize & (oiff->iff_chunksize - 1)) ||
678 (!oiff->iff_chunksize)) {
679 status = -EINVAL;
680 goto bail;
681 }
682
683 if (o2info_coherent(&oiff->iff_req)) {
684 gb_inode = ocfs2_get_system_file_inode(osb, type,
685 OCFS2_INVALID_SLOT);
686 if (!gb_inode) {
687 mlog(ML_ERROR, "unable to get global_bitmap inode\n");
688 status = -EIO;
689 goto bail;
690 }
691 } else {
692 ocfs2_sprintf_system_inode_name(namebuf, sizeof(namebuf), type,
693 OCFS2_INVALID_SLOT);
694 status = ocfs2_lookup_ino_from_name(osb->sys_root_inode,
695 namebuf,
696 strlen(namebuf),
697 &blkno);
698 if (status < 0) {
699 status = -ENOENT;
700 goto bail;
701 }
702 }
703
704 status = ocfs2_info_freefrag_scan_bitmap(osb, gb_inode, blkno, oiff);
705 if (status < 0)
706 goto bail;
707
708 o2info_set_request_filled(&oiff->iff_req);
709
710 if (o2info_to_user(*oiff, req))
711 goto bail;
712
713 status = 0;
714bail:
715 if (status)
716 o2info_set_request_error(&oiff->iff_req, req);
717
718 kfree(oiff);
719
720 return status;
721}
722
723int ocfs2_info_handle_unknown(struct inode *inode,
724 struct ocfs2_info_request __user *req)
725{
726 int status = -EFAULT;
727 struct ocfs2_info_request oir;
728
729 if (o2info_from_user(oir, req))
730 goto bail;
731
732 o2info_clear_request_filled(&oir);
733
734 if (o2info_to_user(oir, req))
735 goto bail;
736
737 status = 0;
738bail:
739 if (status)
740 o2info_set_request_error(&oir, req);
741
742 return status;
743}
744
745/*
746 * Validate and distinguish OCFS2_IOC_INFO requests.
747 *
748 * - validate the magic number.
749 * - distinguish different requests.
750 * - validate size of different requests.
751 */
752int ocfs2_info_handle_request(struct inode *inode,
753 struct ocfs2_info_request __user *req)
754{
755 int status = -EFAULT;
756 struct ocfs2_info_request oir;
757
758 if (o2info_from_user(oir, req))
759 goto bail;
760
761 status = -EINVAL;
762 if (oir.ir_magic != OCFS2_INFO_MAGIC)
763 goto bail;
764
765 switch (oir.ir_code) {
766 case OCFS2_INFO_BLOCKSIZE:
767 if (oir.ir_size == sizeof(struct ocfs2_info_blocksize))
768 status = ocfs2_info_handle_blocksize(inode, req);
769 break;
770 case OCFS2_INFO_CLUSTERSIZE:
771 if (oir.ir_size == sizeof(struct ocfs2_info_clustersize))
772 status = ocfs2_info_handle_clustersize(inode, req);
773 break;
774 case OCFS2_INFO_MAXSLOTS:
775 if (oir.ir_size == sizeof(struct ocfs2_info_maxslots))
776 status = ocfs2_info_handle_maxslots(inode, req);
777 break;
778 case OCFS2_INFO_LABEL:
779 if (oir.ir_size == sizeof(struct ocfs2_info_label))
780 status = ocfs2_info_handle_label(inode, req);
781 break;
782 case OCFS2_INFO_UUID:
783 if (oir.ir_size == sizeof(struct ocfs2_info_uuid))
784 status = ocfs2_info_handle_uuid(inode, req);
785 break;
786 case OCFS2_INFO_FS_FEATURES:
787 if (oir.ir_size == sizeof(struct ocfs2_info_fs_features))
788 status = ocfs2_info_handle_fs_features(inode, req);
789 break;
790 case OCFS2_INFO_JOURNAL_SIZE:
791 if (oir.ir_size == sizeof(struct ocfs2_info_journal_size))
792 status = ocfs2_info_handle_journal_size(inode, req);
793 break;
794 case OCFS2_INFO_FREEINODE:
795 if (oir.ir_size == sizeof(struct ocfs2_info_freeinode))
796 status = ocfs2_info_handle_freeinode(inode, req);
797 break;
798 case OCFS2_INFO_FREEFRAG:
799 if (oir.ir_size == sizeof(struct ocfs2_info_freefrag))
800 status = ocfs2_info_handle_freefrag(inode, req);
801 break;
802 default:
803 status = ocfs2_info_handle_unknown(inode, req);
804 break;
805 }
806
807bail:
808 return status;
809}
810
811int ocfs2_get_request_ptr(struct ocfs2_info *info, int idx,
812 u64 *req_addr, int compat_flag)
813{
814 int status = -EFAULT;
815 u64 __user *bp = NULL;
816
817 if (compat_flag) {
818#ifdef CONFIG_COMPAT
819 /*
820 * pointer bp stores the base address of a pointers array,
821 * which collects all addresses of separate request.
822 */
823 bp = (u64 __user *)(unsigned long)compat_ptr(info->oi_requests);
824#else
825 BUG();
826#endif
827 } else
828 bp = (u64 __user *)(unsigned long)(info->oi_requests);
829
830 if (o2info_from_user(*req_addr, bp + idx))
831 goto bail;
832
833 status = 0;
834bail:
835 return status;
836}
837
838/*
839 * OCFS2_IOC_INFO handles an array of requests passed from userspace.
840 *
841 * ocfs2_info_handle() receives a large info aggregation, grabs and
842 * validates the request count from the header, then breaks it into small
843 * pieces, so that specific handlers can handle them one by one.
844 *
845 * The idea here is to make each separate request small enough to ensure
846 * better backward and forward compatibility, since a small request
847 * is less likely to be broken if the disk layout gets changed.
848 */
849int ocfs2_info_handle(struct inode *inode, struct ocfs2_info *info,
850 int compat_flag)
851{
852 int i, status = 0;
853 u64 req_addr;
854 struct ocfs2_info_request __user *reqp;
855
856 if ((info->oi_count > OCFS2_INFO_MAX_REQUEST) ||
857 (!info->oi_requests)) {
858 status = -EINVAL;
859 goto bail;
860 }
861
862 for (i = 0; i < info->oi_count; i++) {
863
864 status = ocfs2_get_request_ptr(info, i, &req_addr, compat_flag);
865 if (status)
866 break;
867
868 reqp = (struct ocfs2_info_request *)(unsigned long)req_addr;
869 if (!reqp) {
870 status = -EINVAL;
871 goto bail;
872 }
873
874 status = ocfs2_info_handle_request(inode, reqp);
875 if (status)
876 break;
877 }
878
879bail:
880 return status;
881}
882
883long ocfs2_ioctl(struct file *filp, unsigned int cmd, unsigned long arg)
884{
885 struct inode *inode = filp->f_path.dentry->d_inode;
886 unsigned int flags;
887 int new_clusters;
888 int status;
889 struct ocfs2_space_resv sr;
890 struct ocfs2_new_group_input input;
891 struct reflink_arguments args;
892 const char *old_path, *new_path;
893 bool preserve;
894 struct ocfs2_info info;
895
896 switch (cmd) {
897 case OCFS2_IOC_GETFLAGS:
898 status = ocfs2_get_inode_attr(inode, &flags);
899 if (status < 0)
900 return status;
901
902 flags &= OCFS2_FL_VISIBLE;
903 return put_user(flags, (int __user *) arg);
904 case OCFS2_IOC_SETFLAGS:
905 if (get_user(flags, (int __user *) arg))
906 return -EFAULT;
907
908 status = mnt_want_write(filp->f_path.mnt);
909 if (status)
910 return status;
911 status = ocfs2_set_inode_attr(inode, flags,
912 OCFS2_FL_MODIFIABLE);
913 mnt_drop_write(filp->f_path.mnt);
914 return status;
915 case OCFS2_IOC_RESVSP:
916 case OCFS2_IOC_RESVSP64:
917 case OCFS2_IOC_UNRESVSP:
918 case OCFS2_IOC_UNRESVSP64:
919 if (copy_from_user(&sr, (int __user *) arg, sizeof(sr)))
920 return -EFAULT;
921
922 return ocfs2_change_file_space(filp, cmd, &sr);
923 case OCFS2_IOC_GROUP_EXTEND:
924 if (!capable(CAP_SYS_RESOURCE))
925 return -EPERM;
926
927 if (get_user(new_clusters, (int __user *)arg))
928 return -EFAULT;
929
930 return ocfs2_group_extend(inode, new_clusters);
931 case OCFS2_IOC_GROUP_ADD:
932 case OCFS2_IOC_GROUP_ADD64:
933 if (!capable(CAP_SYS_RESOURCE))
934 return -EPERM;
935
936 if (copy_from_user(&input, (int __user *) arg, sizeof(input)))
937 return -EFAULT;
938
939 return ocfs2_group_add(inode, &input);
940 case OCFS2_IOC_REFLINK:
941 if (copy_from_user(&args, (struct reflink_arguments *)arg,
942 sizeof(args)))
943 return -EFAULT;
944 old_path = (const char *)(unsigned long)args.old_path;
945 new_path = (const char *)(unsigned long)args.new_path;
946 preserve = (args.preserve != 0);
947
948 return ocfs2_reflink_ioctl(inode, old_path, new_path, preserve);
949 case OCFS2_IOC_INFO:
950 if (copy_from_user(&info, (struct ocfs2_info __user *)arg,
951 sizeof(struct ocfs2_info)))
952 return -EFAULT;
953
954 return ocfs2_info_handle(inode, &info, 0);
955 case FITRIM:
956 {
957 struct super_block *sb = inode->i_sb;
958 struct fstrim_range range;
959 int ret = 0;
960
961 if (!capable(CAP_SYS_ADMIN))
962 return -EPERM;
963
964 if (copy_from_user(&range, (struct fstrim_range *)arg,
965 sizeof(range)))
966 return -EFAULT;
967
968 ret = ocfs2_trim_fs(sb, &range);
969 if (ret < 0)
970 return ret;
971
972 if (copy_to_user((struct fstrim_range *)arg, &range,
973 sizeof(range)))
974 return -EFAULT;
975
976 return 0;
977 }
978 case OCFS2_IOC_MOVE_EXT:
979 return ocfs2_ioctl_move_extents(filp, (void __user *)arg);
980 default:
981 return -ENOTTY;
982 }
983}
984
985#ifdef CONFIG_COMPAT
986long ocfs2_compat_ioctl(struct file *file, unsigned cmd, unsigned long arg)
987{
988 bool preserve;
989 struct reflink_arguments args;
990 struct inode *inode = file->f_path.dentry->d_inode;
991 struct ocfs2_info info;
992
993 switch (cmd) {
994 case OCFS2_IOC32_GETFLAGS:
995 cmd = OCFS2_IOC_GETFLAGS;
996 break;
997 case OCFS2_IOC32_SETFLAGS:
998 cmd = OCFS2_IOC_SETFLAGS;
999 break;
1000 case OCFS2_IOC_RESVSP:
1001 case OCFS2_IOC_RESVSP64:
1002 case OCFS2_IOC_UNRESVSP:
1003 case OCFS2_IOC_UNRESVSP64:
1004 case OCFS2_IOC_GROUP_EXTEND:
1005 case OCFS2_IOC_GROUP_ADD:
1006 case OCFS2_IOC_GROUP_ADD64:
1007 case FITRIM:
1008 break;
1009 case OCFS2_IOC_REFLINK:
1010 if (copy_from_user(&args, (struct reflink_arguments *)arg,
1011 sizeof(args)))
1012 return -EFAULT;
1013 preserve = (args.preserve != 0);
1014
1015 return ocfs2_reflink_ioctl(inode, compat_ptr(args.old_path),
1016 compat_ptr(args.new_path), preserve);
1017 case OCFS2_IOC_INFO:
1018 if (copy_from_user(&info, (struct ocfs2_info __user *)arg,
1019 sizeof(struct ocfs2_info)))
1020 return -EFAULT;
1021
1022 return ocfs2_info_handle(inode, &info, 1);
1023 case OCFS2_IOC_MOVE_EXT:
1024 break;
1025 default:
1026 return -ENOIOCTLCMD;
1027 }
1028
1029 return ocfs2_ioctl(file, cmd, arg);
1030}
1031#endif
1// SPDX-License-Identifier: GPL-2.0
2/*
3 * linux/fs/ocfs2/ioctl.c
4 *
5 * Copyright (C) 2006 Herbert Poetzl
6 * adapted from Remy Card's ext2/ioctl.c
7 */
8
9#include <linux/fs.h>
10#include <linux/mount.h>
11#include <linux/blkdev.h>
12#include <linux/compat.h>
13
14#include <cluster/masklog.h>
15
16#include "ocfs2.h"
17#include "alloc.h"
18#include "dlmglue.h"
19#include "file.h"
20#include "inode.h"
21#include "journal.h"
22
23#include "ocfs2_fs.h"
24#include "ioctl.h"
25#include "resize.h"
26#include "refcounttree.h"
27#include "sysfile.h"
28#include "dir.h"
29#include "buffer_head_io.h"
30#include "suballoc.h"
31#include "move_extents.h"
32
/*
 * Copy a whole request structure between kernel and user space.
 *
 * @a: kernel-side object (an lvalue; its size determines the copy length).
 * @b: user-space pointer to the matching request.
 *
 * Both expand to copy_{from,to}_user(); callers in this file treat a
 * non-zero result as failure. Every macro argument is parenthesized so
 * that an expression passed as @b cannot bind to the cast.
 */
#define o2info_from_user(a, b)	\
		copy_from_user(&(a), (b), sizeof(a))
#define o2info_to_user(a, b)	\
		copy_to_user((typeof(a) __user *)(b), &(a), sizeof(a))
37
38/*
39 * This is just a best-effort to tell userspace that this request
40 * caused the error.
41 */
42static inline void o2info_set_request_error(struct ocfs2_info_request *kreq,
43 struct ocfs2_info_request __user *req)
44{
45 kreq->ir_flags |= OCFS2_INFO_FL_ERROR;
46 (void)put_user(kreq->ir_flags, (__u32 __user *)&(req->ir_flags));
47}
48
49static inline void o2info_set_request_filled(struct ocfs2_info_request *req)
50{
51 req->ir_flags |= OCFS2_INFO_FL_FILLED;
52}
53
54static inline void o2info_clear_request_filled(struct ocfs2_info_request *req)
55{
56 req->ir_flags &= ~OCFS2_INFO_FL_FILLED;
57}
58
59static inline int o2info_coherent(struct ocfs2_info_request *req)
60{
61 return (!(req->ir_flags & OCFS2_INFO_FL_NON_COHERENT));
62}
63
64static int ocfs2_get_inode_attr(struct inode *inode, unsigned *flags)
65{
66 int status;
67
68 status = ocfs2_inode_lock(inode, NULL, 0);
69 if (status < 0) {
70 mlog_errno(status);
71 return status;
72 }
73 ocfs2_get_inode_flags(OCFS2_I(inode));
74 *flags = OCFS2_I(inode)->ip_attr;
75 ocfs2_inode_unlock(inode, 0);
76
77 return status;
78}
79
80static int ocfs2_set_inode_attr(struct inode *inode, unsigned flags,
81 unsigned mask)
82{
83 struct ocfs2_inode_info *ocfs2_inode = OCFS2_I(inode);
84 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
85 handle_t *handle = NULL;
86 struct buffer_head *bh = NULL;
87 unsigned oldflags;
88 int status;
89
90 inode_lock(inode);
91
92 status = ocfs2_inode_lock(inode, &bh, 1);
93 if (status < 0) {
94 mlog_errno(status);
95 goto bail;
96 }
97
98 status = -EACCES;
99 if (!inode_owner_or_capable(inode))
100 goto bail_unlock;
101
102 if (!S_ISDIR(inode->i_mode))
103 flags &= ~OCFS2_DIRSYNC_FL;
104
105 oldflags = ocfs2_inode->ip_attr;
106 flags = flags & mask;
107 flags |= oldflags & ~mask;
108
109 status = vfs_ioc_setflags_prepare(inode, oldflags, flags);
110 if (status)
111 goto bail_unlock;
112
113 handle = ocfs2_start_trans(osb, OCFS2_INODE_UPDATE_CREDITS);
114 if (IS_ERR(handle)) {
115 status = PTR_ERR(handle);
116 mlog_errno(status);
117 goto bail_unlock;
118 }
119
120 ocfs2_inode->ip_attr = flags;
121 ocfs2_set_inode_flags(inode);
122
123 status = ocfs2_mark_inode_dirty(handle, inode, bh);
124 if (status < 0)
125 mlog_errno(status);
126
127 ocfs2_commit_trans(osb, handle);
128
129bail_unlock:
130 ocfs2_inode_unlock(inode, 1);
131bail:
132 inode_unlock(inode);
133
134 brelse(bh);
135
136 return status;
137}
138
139static int ocfs2_info_handle_blocksize(struct inode *inode,
140 struct ocfs2_info_request __user *req)
141{
142 struct ocfs2_info_blocksize oib;
143
144 if (o2info_from_user(oib, req))
145 return -EFAULT;
146
147 oib.ib_blocksize = inode->i_sb->s_blocksize;
148
149 o2info_set_request_filled(&oib.ib_req);
150
151 if (o2info_to_user(oib, req))
152 return -EFAULT;
153
154 return 0;
155}
156
157static int ocfs2_info_handle_clustersize(struct inode *inode,
158 struct ocfs2_info_request __user *req)
159{
160 struct ocfs2_info_clustersize oic;
161 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
162
163 if (o2info_from_user(oic, req))
164 return -EFAULT;
165
166 oic.ic_clustersize = osb->s_clustersize;
167
168 o2info_set_request_filled(&oic.ic_req);
169
170 if (o2info_to_user(oic, req))
171 return -EFAULT;
172
173 return 0;
174}
175
176static int ocfs2_info_handle_maxslots(struct inode *inode,
177 struct ocfs2_info_request __user *req)
178{
179 struct ocfs2_info_maxslots oim;
180 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
181
182 if (o2info_from_user(oim, req))
183 return -EFAULT;
184
185 oim.im_max_slots = osb->max_slots;
186
187 o2info_set_request_filled(&oim.im_req);
188
189 if (o2info_to_user(oim, req))
190 return -EFAULT;
191
192 return 0;
193}
194
195static int ocfs2_info_handle_label(struct inode *inode,
196 struct ocfs2_info_request __user *req)
197{
198 struct ocfs2_info_label oil;
199 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
200
201 if (o2info_from_user(oil, req))
202 return -EFAULT;
203
204 memcpy(oil.il_label, osb->vol_label, OCFS2_MAX_VOL_LABEL_LEN);
205
206 o2info_set_request_filled(&oil.il_req);
207
208 if (o2info_to_user(oil, req))
209 return -EFAULT;
210
211 return 0;
212}
213
214static int ocfs2_info_handle_uuid(struct inode *inode,
215 struct ocfs2_info_request __user *req)
216{
217 struct ocfs2_info_uuid oiu;
218 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
219
220 if (o2info_from_user(oiu, req))
221 return -EFAULT;
222
223 memcpy(oiu.iu_uuid_str, osb->uuid_str, OCFS2_TEXT_UUID_LEN + 1);
224
225 o2info_set_request_filled(&oiu.iu_req);
226
227 if (o2info_to_user(oiu, req))
228 return -EFAULT;
229
230 return 0;
231}
232
233static int ocfs2_info_handle_fs_features(struct inode *inode,
234 struct ocfs2_info_request __user *req)
235{
236 struct ocfs2_info_fs_features oif;
237 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
238
239 if (o2info_from_user(oif, req))
240 return -EFAULT;
241
242 oif.if_compat_features = osb->s_feature_compat;
243 oif.if_incompat_features = osb->s_feature_incompat;
244 oif.if_ro_compat_features = osb->s_feature_ro_compat;
245
246 o2info_set_request_filled(&oif.if_req);
247
248 if (o2info_to_user(oif, req))
249 return -EFAULT;
250
251 return 0;
252}
253
254static int ocfs2_info_handle_journal_size(struct inode *inode,
255 struct ocfs2_info_request __user *req)
256{
257 struct ocfs2_info_journal_size oij;
258 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
259
260 if (o2info_from_user(oij, req))
261 return -EFAULT;
262
263 oij.ij_journal_size = i_size_read(osb->journal->j_inode);
264
265 o2info_set_request_filled(&oij.ij_req);
266
267 if (o2info_to_user(oij, req))
268 return -EFAULT;
269
270 return 0;
271}
272
273static int ocfs2_info_scan_inode_alloc(struct ocfs2_super *osb,
274 struct inode *inode_alloc, u64 blkno,
275 struct ocfs2_info_freeinode *fi,
276 u32 slot)
277{
278 int status = 0, unlock = 0;
279
280 struct buffer_head *bh = NULL;
281 struct ocfs2_dinode *dinode_alloc = NULL;
282
283 if (inode_alloc)
284 inode_lock(inode_alloc);
285
286 if (inode_alloc && o2info_coherent(&fi->ifi_req)) {
287 status = ocfs2_inode_lock(inode_alloc, &bh, 0);
288 if (status < 0) {
289 mlog_errno(status);
290 goto bail;
291 }
292 unlock = 1;
293 } else {
294 status = ocfs2_read_blocks_sync(osb, blkno, 1, &bh);
295 if (status < 0) {
296 mlog_errno(status);
297 goto bail;
298 }
299 }
300
301 dinode_alloc = (struct ocfs2_dinode *)bh->b_data;
302
303 fi->ifi_stat[slot].lfi_total =
304 le32_to_cpu(dinode_alloc->id1.bitmap1.i_total);
305 fi->ifi_stat[slot].lfi_free =
306 le32_to_cpu(dinode_alloc->id1.bitmap1.i_total) -
307 le32_to_cpu(dinode_alloc->id1.bitmap1.i_used);
308
309bail:
310 if (unlock)
311 ocfs2_inode_unlock(inode_alloc, 0);
312
313 if (inode_alloc)
314 inode_unlock(inode_alloc);
315
316 brelse(bh);
317
318 return status;
319}
320
321static int ocfs2_info_handle_freeinode(struct inode *inode,
322 struct ocfs2_info_request __user *req)
323{
324 u32 i;
325 u64 blkno = -1;
326 char namebuf[40];
327 int status, type = INODE_ALLOC_SYSTEM_INODE;
328 struct ocfs2_info_freeinode *oifi = NULL;
329 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
330 struct inode *inode_alloc = NULL;
331
332 oifi = kzalloc(sizeof(struct ocfs2_info_freeinode), GFP_KERNEL);
333 if (!oifi) {
334 status = -ENOMEM;
335 mlog_errno(status);
336 goto out_err;
337 }
338
339 if (o2info_from_user(*oifi, req)) {
340 status = -EFAULT;
341 goto out_free;
342 }
343
344 oifi->ifi_slotnum = osb->max_slots;
345
346 for (i = 0; i < oifi->ifi_slotnum; i++) {
347 if (o2info_coherent(&oifi->ifi_req)) {
348 inode_alloc = ocfs2_get_system_file_inode(osb, type, i);
349 if (!inode_alloc) {
350 mlog(ML_ERROR, "unable to get alloc inode in "
351 "slot %u\n", i);
352 status = -EIO;
353 goto bail;
354 }
355 } else {
356 ocfs2_sprintf_system_inode_name(namebuf,
357 sizeof(namebuf),
358 type, i);
359 status = ocfs2_lookup_ino_from_name(osb->sys_root_inode,
360 namebuf,
361 strlen(namebuf),
362 &blkno);
363 if (status < 0) {
364 status = -ENOENT;
365 goto bail;
366 }
367 }
368
369 status = ocfs2_info_scan_inode_alloc(osb, inode_alloc, blkno, oifi, i);
370
371 iput(inode_alloc);
372 inode_alloc = NULL;
373
374 if (status < 0)
375 goto bail;
376 }
377
378 o2info_set_request_filled(&oifi->ifi_req);
379
380 if (o2info_to_user(*oifi, req)) {
381 status = -EFAULT;
382 goto out_free;
383 }
384
385 status = 0;
386bail:
387 if (status)
388 o2info_set_request_error(&oifi->ifi_req, req);
389out_free:
390 kfree(oifi);
391out_err:
392 return status;
393}
394
395static void o2ffg_update_histogram(struct ocfs2_info_free_chunk_list *hist,
396 unsigned int chunksize)
397{
398 u32 index;
399
400 index = __ilog2_u32(chunksize);
401 if (index >= OCFS2_INFO_MAX_HIST)
402 index = OCFS2_INFO_MAX_HIST - 1;
403
404 hist->fc_chunks[index]++;
405 hist->fc_clusters[index] += chunksize;
406}
407
408static void o2ffg_update_stats(struct ocfs2_info_freefrag_stats *stats,
409 unsigned int chunksize)
410{
411 if (chunksize > stats->ffs_max)
412 stats->ffs_max = chunksize;
413
414 if (chunksize < stats->ffs_min)
415 stats->ffs_min = chunksize;
416
417 stats->ffs_avg += chunksize;
418 stats->ffs_free_chunks_real++;
419}
420
421static void ocfs2_info_update_ffg(struct ocfs2_info_freefrag *ffg,
422 unsigned int chunksize)
423{
424 o2ffg_update_histogram(&(ffg->iff_ffs.ffs_fc_hist), chunksize);
425 o2ffg_update_stats(&(ffg->iff_ffs), chunksize);
426}
427
428static int ocfs2_info_freefrag_scan_chain(struct ocfs2_super *osb,
429 struct inode *gb_inode,
430 struct ocfs2_dinode *gb_dinode,
431 struct ocfs2_chain_rec *rec,
432 struct ocfs2_info_freefrag *ffg,
433 u32 chunks_in_group)
434{
435 int status = 0, used;
436 u64 blkno;
437
438 struct buffer_head *bh = NULL;
439 struct ocfs2_group_desc *bg = NULL;
440
441 unsigned int max_bits, num_clusters;
442 unsigned int offset = 0, cluster, chunk;
443 unsigned int chunk_free, last_chunksize = 0;
444
445 if (!le32_to_cpu(rec->c_free))
446 goto bail;
447
448 do {
449 if (!bg)
450 blkno = le64_to_cpu(rec->c_blkno);
451 else
452 blkno = le64_to_cpu(bg->bg_next_group);
453
454 if (bh) {
455 brelse(bh);
456 bh = NULL;
457 }
458
459 if (o2info_coherent(&ffg->iff_req))
460 status = ocfs2_read_group_descriptor(gb_inode,
461 gb_dinode,
462 blkno, &bh);
463 else
464 status = ocfs2_read_blocks_sync(osb, blkno, 1, &bh);
465
466 if (status < 0) {
467 mlog(ML_ERROR, "Can't read the group descriptor # "
468 "%llu from device.", (unsigned long long)blkno);
469 status = -EIO;
470 goto bail;
471 }
472
473 bg = (struct ocfs2_group_desc *)bh->b_data;
474
475 if (!le16_to_cpu(bg->bg_free_bits_count))
476 continue;
477
478 max_bits = le16_to_cpu(bg->bg_bits);
479 offset = 0;
480
481 for (chunk = 0; chunk < chunks_in_group; chunk++) {
482 /*
483 * last chunk may be not an entire one.
484 */
485 if ((offset + ffg->iff_chunksize) > max_bits)
486 num_clusters = max_bits - offset;
487 else
488 num_clusters = ffg->iff_chunksize;
489
490 chunk_free = 0;
491 for (cluster = 0; cluster < num_clusters; cluster++) {
492 used = ocfs2_test_bit(offset,
493 (unsigned long *)bg->bg_bitmap);
494 /*
495 * - chunk_free counts free clusters in #N chunk.
496 * - last_chunksize records the size(in) clusters
497 * for the last real free chunk being counted.
498 */
499 if (!used) {
500 last_chunksize++;
501 chunk_free++;
502 }
503
504 if (used && last_chunksize) {
505 ocfs2_info_update_ffg(ffg,
506 last_chunksize);
507 last_chunksize = 0;
508 }
509
510 offset++;
511 }
512
513 if (chunk_free == ffg->iff_chunksize)
514 ffg->iff_ffs.ffs_free_chunks++;
515 }
516
517 /*
518 * need to update the info for last free chunk.
519 */
520 if (last_chunksize)
521 ocfs2_info_update_ffg(ffg, last_chunksize);
522
523 } while (le64_to_cpu(bg->bg_next_group));
524
525bail:
526 brelse(bh);
527
528 return status;
529}
530
531static int ocfs2_info_freefrag_scan_bitmap(struct ocfs2_super *osb,
532 struct inode *gb_inode, u64 blkno,
533 struct ocfs2_info_freefrag *ffg)
534{
535 u32 chunks_in_group;
536 int status = 0, unlock = 0, i;
537
538 struct buffer_head *bh = NULL;
539 struct ocfs2_chain_list *cl = NULL;
540 struct ocfs2_chain_rec *rec = NULL;
541 struct ocfs2_dinode *gb_dinode = NULL;
542
543 if (gb_inode)
544 inode_lock(gb_inode);
545
546 if (o2info_coherent(&ffg->iff_req)) {
547 status = ocfs2_inode_lock(gb_inode, &bh, 0);
548 if (status < 0) {
549 mlog_errno(status);
550 goto bail;
551 }
552 unlock = 1;
553 } else {
554 status = ocfs2_read_blocks_sync(osb, blkno, 1, &bh);
555 if (status < 0) {
556 mlog_errno(status);
557 goto bail;
558 }
559 }
560
561 gb_dinode = (struct ocfs2_dinode *)bh->b_data;
562 cl = &(gb_dinode->id2.i_chain);
563
564 /*
565 * Chunksize(in) clusters from userspace should be
566 * less than clusters in a group.
567 */
568 if (ffg->iff_chunksize > le16_to_cpu(cl->cl_cpg)) {
569 status = -EINVAL;
570 goto bail;
571 }
572
573 memset(&ffg->iff_ffs, 0, sizeof(struct ocfs2_info_freefrag_stats));
574
575 ffg->iff_ffs.ffs_min = ~0U;
576 ffg->iff_ffs.ffs_clusters =
577 le32_to_cpu(gb_dinode->id1.bitmap1.i_total);
578 ffg->iff_ffs.ffs_free_clusters = ffg->iff_ffs.ffs_clusters -
579 le32_to_cpu(gb_dinode->id1.bitmap1.i_used);
580
581 chunks_in_group = le16_to_cpu(cl->cl_cpg) / ffg->iff_chunksize + 1;
582
583 for (i = 0; i < le16_to_cpu(cl->cl_next_free_rec); i++) {
584 rec = &(cl->cl_recs[i]);
585 status = ocfs2_info_freefrag_scan_chain(osb, gb_inode,
586 gb_dinode,
587 rec, ffg,
588 chunks_in_group);
589 if (status)
590 goto bail;
591 }
592
593 if (ffg->iff_ffs.ffs_free_chunks_real)
594 ffg->iff_ffs.ffs_avg = (ffg->iff_ffs.ffs_avg /
595 ffg->iff_ffs.ffs_free_chunks_real);
596bail:
597 if (unlock)
598 ocfs2_inode_unlock(gb_inode, 0);
599
600 if (gb_inode)
601 inode_unlock(gb_inode);
602
603 iput(gb_inode);
604 brelse(bh);
605
606 return status;
607}
608
609static int ocfs2_info_handle_freefrag(struct inode *inode,
610 struct ocfs2_info_request __user *req)
611{
612 u64 blkno = -1;
613 char namebuf[40];
614 int status, type = GLOBAL_BITMAP_SYSTEM_INODE;
615
616 struct ocfs2_info_freefrag *oiff;
617 struct ocfs2_super *osb = OCFS2_SB(inode->i_sb);
618 struct inode *gb_inode = NULL;
619
620 oiff = kzalloc(sizeof(struct ocfs2_info_freefrag), GFP_KERNEL);
621 if (!oiff) {
622 status = -ENOMEM;
623 mlog_errno(status);
624 goto out_err;
625 }
626
627 if (o2info_from_user(*oiff, req)) {
628 status = -EFAULT;
629 goto out_free;
630 }
631 /*
632 * chunksize from userspace should be power of 2.
633 */
634 if ((oiff->iff_chunksize & (oiff->iff_chunksize - 1)) ||
635 (!oiff->iff_chunksize)) {
636 status = -EINVAL;
637 goto bail;
638 }
639
640 if (o2info_coherent(&oiff->iff_req)) {
641 gb_inode = ocfs2_get_system_file_inode(osb, type,
642 OCFS2_INVALID_SLOT);
643 if (!gb_inode) {
644 mlog(ML_ERROR, "unable to get global_bitmap inode\n");
645 status = -EIO;
646 goto bail;
647 }
648 } else {
649 ocfs2_sprintf_system_inode_name(namebuf, sizeof(namebuf), type,
650 OCFS2_INVALID_SLOT);
651 status = ocfs2_lookup_ino_from_name(osb->sys_root_inode,
652 namebuf,
653 strlen(namebuf),
654 &blkno);
655 if (status < 0) {
656 status = -ENOENT;
657 goto bail;
658 }
659 }
660
661 status = ocfs2_info_freefrag_scan_bitmap(osb, gb_inode, blkno, oiff);
662 if (status < 0)
663 goto bail;
664
665 o2info_set_request_filled(&oiff->iff_req);
666
667 if (o2info_to_user(*oiff, req)) {
668 status = -EFAULT;
669 goto out_free;
670 }
671
672 status = 0;
673bail:
674 if (status)
675 o2info_set_request_error(&oiff->iff_req, req);
676out_free:
677 kfree(oiff);
678out_err:
679 return status;
680}
681
682static int ocfs2_info_handle_unknown(struct inode *inode,
683 struct ocfs2_info_request __user *req)
684{
685 struct ocfs2_info_request oir;
686
687 if (o2info_from_user(oir, req))
688 return -EFAULT;
689
690 o2info_clear_request_filled(&oir);
691
692 if (o2info_to_user(oir, req))
693 return -EFAULT;
694
695 return 0;
696}
697
698/*
699 * Validate and distinguish OCFS2_IOC_INFO requests.
700 *
701 * - validate the magic number.
702 * - distinguish different requests.
703 * - validate size of different requests.
704 */
705static int ocfs2_info_handle_request(struct inode *inode,
706 struct ocfs2_info_request __user *req)
707{
708 int status = -EFAULT;
709 struct ocfs2_info_request oir;
710
711 if (o2info_from_user(oir, req))
712 goto bail;
713
714 status = -EINVAL;
715 if (oir.ir_magic != OCFS2_INFO_MAGIC)
716 goto bail;
717
718 switch (oir.ir_code) {
719 case OCFS2_INFO_BLOCKSIZE:
720 if (oir.ir_size == sizeof(struct ocfs2_info_blocksize))
721 status = ocfs2_info_handle_blocksize(inode, req);
722 break;
723 case OCFS2_INFO_CLUSTERSIZE:
724 if (oir.ir_size == sizeof(struct ocfs2_info_clustersize))
725 status = ocfs2_info_handle_clustersize(inode, req);
726 break;
727 case OCFS2_INFO_MAXSLOTS:
728 if (oir.ir_size == sizeof(struct ocfs2_info_maxslots))
729 status = ocfs2_info_handle_maxslots(inode, req);
730 break;
731 case OCFS2_INFO_LABEL:
732 if (oir.ir_size == sizeof(struct ocfs2_info_label))
733 status = ocfs2_info_handle_label(inode, req);
734 break;
735 case OCFS2_INFO_UUID:
736 if (oir.ir_size == sizeof(struct ocfs2_info_uuid))
737 status = ocfs2_info_handle_uuid(inode, req);
738 break;
739 case OCFS2_INFO_FS_FEATURES:
740 if (oir.ir_size == sizeof(struct ocfs2_info_fs_features))
741 status = ocfs2_info_handle_fs_features(inode, req);
742 break;
743 case OCFS2_INFO_JOURNAL_SIZE:
744 if (oir.ir_size == sizeof(struct ocfs2_info_journal_size))
745 status = ocfs2_info_handle_journal_size(inode, req);
746 break;
747 case OCFS2_INFO_FREEINODE:
748 if (oir.ir_size == sizeof(struct ocfs2_info_freeinode))
749 status = ocfs2_info_handle_freeinode(inode, req);
750 break;
751 case OCFS2_INFO_FREEFRAG:
752 if (oir.ir_size == sizeof(struct ocfs2_info_freefrag))
753 status = ocfs2_info_handle_freefrag(inode, req);
754 break;
755 default:
756 status = ocfs2_info_handle_unknown(inode, req);
757 break;
758 }
759
760bail:
761 return status;
762}
763
764static int ocfs2_get_request_ptr(struct ocfs2_info *info, int idx,
765 u64 *req_addr, int compat_flag)
766{
767 int status = -EFAULT;
768 u64 __user *bp = NULL;
769
770 if (compat_flag) {
771#ifdef CONFIG_COMPAT
772 /*
773 * pointer bp stores the base address of a pointers array,
774 * which collects all addresses of separate request.
775 */
776 bp = (u64 __user *)(unsigned long)compat_ptr(info->oi_requests);
777#else
778 BUG();
779#endif
780 } else
781 bp = (u64 __user *)(unsigned long)(info->oi_requests);
782
783 if (o2info_from_user(*req_addr, bp + idx))
784 goto bail;
785
786 status = 0;
787bail:
788 return status;
789}
790
791/*
792 * OCFS2_IOC_INFO handles an array of requests passed from userspace.
793 *
794 * ocfs2_info_handle() recevies a large info aggregation, grab and
795 * validate the request count from header, then break it into small
796 * pieces, later specific handlers can handle them one by one.
797 *
798 * Idea here is to make each separate request small enough to ensure
799 * a better backward&forward compatibility, since a small piece of
800 * request will be less likely to be broken if disk layout get changed.
801 */
802static int ocfs2_info_handle(struct inode *inode, struct ocfs2_info *info,
803 int compat_flag)
804{
805 int i, status = 0;
806 u64 req_addr;
807 struct ocfs2_info_request __user *reqp;
808
809 if ((info->oi_count > OCFS2_INFO_MAX_REQUEST) ||
810 (!info->oi_requests)) {
811 status = -EINVAL;
812 goto bail;
813 }
814
815 for (i = 0; i < info->oi_count; i++) {
816
817 status = ocfs2_get_request_ptr(info, i, &req_addr, compat_flag);
818 if (status)
819 break;
820
821 reqp = (struct ocfs2_info_request __user *)(unsigned long)req_addr;
822 if (!reqp) {
823 status = -EINVAL;
824 goto bail;
825 }
826
827 status = ocfs2_info_handle_request(inode, reqp);
828 if (status)
829 break;
830 }
831
832bail:
833 return status;
834}
835
836long ocfs2_ioctl(struct file *filp, unsigned int cmd, unsigned long arg)
837{
838 struct inode *inode = file_inode(filp);
839 unsigned int flags;
840 int new_clusters;
841 int status;
842 struct ocfs2_space_resv sr;
843 struct ocfs2_new_group_input input;
844 struct reflink_arguments args;
845 const char __user *old_path;
846 const char __user *new_path;
847 bool preserve;
848 struct ocfs2_info info;
849 void __user *argp = (void __user *)arg;
850
851 switch (cmd) {
852 case OCFS2_IOC_GETFLAGS:
853 status = ocfs2_get_inode_attr(inode, &flags);
854 if (status < 0)
855 return status;
856
857 flags &= OCFS2_FL_VISIBLE;
858 return put_user(flags, (int __user *) arg);
859 case OCFS2_IOC_SETFLAGS:
860 if (get_user(flags, (int __user *) arg))
861 return -EFAULT;
862
863 status = mnt_want_write_file(filp);
864 if (status)
865 return status;
866 status = ocfs2_set_inode_attr(inode, flags,
867 OCFS2_FL_MODIFIABLE);
868 mnt_drop_write_file(filp);
869 return status;
870 case OCFS2_IOC_RESVSP:
871 case OCFS2_IOC_RESVSP64:
872 case OCFS2_IOC_UNRESVSP:
873 case OCFS2_IOC_UNRESVSP64:
874 if (copy_from_user(&sr, (int __user *) arg, sizeof(sr)))
875 return -EFAULT;
876
877 return ocfs2_change_file_space(filp, cmd, &sr);
878 case OCFS2_IOC_GROUP_EXTEND:
879 if (!capable(CAP_SYS_RESOURCE))
880 return -EPERM;
881
882 if (get_user(new_clusters, (int __user *)arg))
883 return -EFAULT;
884
885 status = mnt_want_write_file(filp);
886 if (status)
887 return status;
888 status = ocfs2_group_extend(inode, new_clusters);
889 mnt_drop_write_file(filp);
890 return status;
891 case OCFS2_IOC_GROUP_ADD:
892 case OCFS2_IOC_GROUP_ADD64:
893 if (!capable(CAP_SYS_RESOURCE))
894 return -EPERM;
895
896 if (copy_from_user(&input, (int __user *) arg, sizeof(input)))
897 return -EFAULT;
898
899 status = mnt_want_write_file(filp);
900 if (status)
901 return status;
902 status = ocfs2_group_add(inode, &input);
903 mnt_drop_write_file(filp);
904 return status;
905 case OCFS2_IOC_REFLINK:
906 if (copy_from_user(&args, argp, sizeof(args)))
907 return -EFAULT;
908 old_path = (const char __user *)(unsigned long)args.old_path;
909 new_path = (const char __user *)(unsigned long)args.new_path;
910 preserve = (args.preserve != 0);
911
912 return ocfs2_reflink_ioctl(inode, old_path, new_path, preserve);
913 case OCFS2_IOC_INFO:
914 if (copy_from_user(&info, argp, sizeof(struct ocfs2_info)))
915 return -EFAULT;
916
917 return ocfs2_info_handle(inode, &info, 0);
918 case FITRIM:
919 {
920 struct super_block *sb = inode->i_sb;
921 struct request_queue *q = bdev_get_queue(sb->s_bdev);
922 struct fstrim_range range;
923 int ret = 0;
924
925 if (!capable(CAP_SYS_ADMIN))
926 return -EPERM;
927
928 if (!blk_queue_discard(q))
929 return -EOPNOTSUPP;
930
931 if (copy_from_user(&range, argp, sizeof(range)))
932 return -EFAULT;
933
934 range.minlen = max_t(u64, q->limits.discard_granularity,
935 range.minlen);
936 ret = ocfs2_trim_fs(sb, &range);
937 if (ret < 0)
938 return ret;
939
940 if (copy_to_user(argp, &range, sizeof(range)))
941 return -EFAULT;
942
943 return 0;
944 }
945 case OCFS2_IOC_MOVE_EXT:
946 return ocfs2_ioctl_move_extents(filp, argp);
947 default:
948 return -ENOTTY;
949 }
950}
951
#ifdef CONFIG_COMPAT
/*
 * Compat ioctl entry point.
 *
 * The 32-bit flag commands are translated to their native command numbers,
 * REFLINK and INFO are handled here because they carry user pointers that
 * need compat_ptr() conversion, and the remaining known commands are
 * forwarded unchanged to ocfs2_ioctl().
 *
 * Returns -ENOIOCTLCMD for commands not listed here.
 */
long ocfs2_compat_ioctl(struct file *file, unsigned cmd, unsigned long arg)
{
	struct inode *inode = file_inode(file);
	void __user *argp = (void __user *)arg;

	switch (cmd) {
	case OCFS2_IOC32_GETFLAGS:
		return ocfs2_ioctl(file, OCFS2_IOC_GETFLAGS, arg);
	case OCFS2_IOC32_SETFLAGS:
		return ocfs2_ioctl(file, OCFS2_IOC_SETFLAGS, arg);
	case OCFS2_IOC_RESVSP:
	case OCFS2_IOC_RESVSP64:
	case OCFS2_IOC_UNRESVSP:
	case OCFS2_IOC_UNRESVSP64:
	case OCFS2_IOC_GROUP_EXTEND:
	case OCFS2_IOC_GROUP_ADD:
	case OCFS2_IOC_GROUP_ADD64:
	case OCFS2_IOC_MOVE_EXT:
		/* Same command number in both ABIs: forward as-is. */
		return ocfs2_ioctl(file, cmd, arg);
	case OCFS2_IOC_REFLINK:
	{
		struct reflink_arguments ra;

		if (copy_from_user(&ra, argp, sizeof(ra)))
			return -EFAULT;

		return ocfs2_reflink_ioctl(inode, compat_ptr(ra.old_path),
					   compat_ptr(ra.new_path),
					   ra.preserve != 0);
	}
	case OCFS2_IOC_INFO:
	{
		struct ocfs2_info info;

		if (copy_from_user(&info, argp, sizeof(info)))
			return -EFAULT;

		return ocfs2_info_handle(inode, &info, 1);
	}
	default:
		break;
	}

	return -ENOIOCTLCMD;
}
#endif