Loading...
1// SPDX-License-Identifier: GPL-2.0
2/*
3 * Copyright (c) 2014 Red Hat, Inc.
4 * All Rights Reserved.
5 */
6#include "xfs.h"
7#include "xfs_fs.h"
8#include "xfs_shared.h"
9#include "xfs_format.h"
10#include "xfs_log_format.h"
11#include "xfs_trans_resv.h"
12#include "xfs_bit.h"
13#include "xfs_mount.h"
14#include "xfs_sb.h"
15#include "xfs_defer.h"
16#include "xfs_btree.h"
17#include "xfs_trans.h"
18#include "xfs_alloc.h"
19#include "xfs_rmap.h"
20#include "xfs_rmap_btree.h"
21#include "xfs_trace.h"
22#include "xfs_errortag.h"
23#include "xfs_error.h"
24#include "xfs_inode.h"
25#include "xfs_ag.h"
26
27/*
28 * Lookup the first record less than or equal to [bno, len, owner, offset]
29 * in the btree given by cur.
30 */
31int
32xfs_rmap_lookup_le(
33 struct xfs_btree_cur *cur,
34 xfs_agblock_t bno,
35 xfs_extlen_t len,
36 uint64_t owner,
37 uint64_t offset,
38 unsigned int flags,
39 int *stat)
40{
41 cur->bc_rec.r.rm_startblock = bno;
42 cur->bc_rec.r.rm_blockcount = len;
43 cur->bc_rec.r.rm_owner = owner;
44 cur->bc_rec.r.rm_offset = offset;
45 cur->bc_rec.r.rm_flags = flags;
46 return xfs_btree_lookup(cur, XFS_LOOKUP_LE, stat);
47}
48
49/*
50 * Lookup the record exactly matching [bno, len, owner, offset]
51 * in the btree given by cur.
52 */
53int
54xfs_rmap_lookup_eq(
55 struct xfs_btree_cur *cur,
56 xfs_agblock_t bno,
57 xfs_extlen_t len,
58 uint64_t owner,
59 uint64_t offset,
60 unsigned int flags,
61 int *stat)
62{
63 cur->bc_rec.r.rm_startblock = bno;
64 cur->bc_rec.r.rm_blockcount = len;
65 cur->bc_rec.r.rm_owner = owner;
66 cur->bc_rec.r.rm_offset = offset;
67 cur->bc_rec.r.rm_flags = flags;
68 return xfs_btree_lookup(cur, XFS_LOOKUP_EQ, stat);
69}
70
71/*
72 * Update the record referred to by cur to the value given
73 * by [bno, len, owner, offset].
74 * This either works (return 0) or gets an EFSCORRUPTED error.
75 */
76STATIC int
77xfs_rmap_update(
78 struct xfs_btree_cur *cur,
79 struct xfs_rmap_irec *irec)
80{
81 union xfs_btree_rec rec;
82 int error;
83
84 trace_xfs_rmap_update(cur->bc_mp, cur->bc_ag.pag->pag_agno,
85 irec->rm_startblock, irec->rm_blockcount,
86 irec->rm_owner, irec->rm_offset, irec->rm_flags);
87
88 rec.rmap.rm_startblock = cpu_to_be32(irec->rm_startblock);
89 rec.rmap.rm_blockcount = cpu_to_be32(irec->rm_blockcount);
90 rec.rmap.rm_owner = cpu_to_be64(irec->rm_owner);
91 rec.rmap.rm_offset = cpu_to_be64(
92 xfs_rmap_irec_offset_pack(irec));
93 error = xfs_btree_update(cur, &rec);
94 if (error)
95 trace_xfs_rmap_update_error(cur->bc_mp,
96 cur->bc_ag.pag->pag_agno, error, _RET_IP_);
97 return error;
98}
99
100int
101xfs_rmap_insert(
102 struct xfs_btree_cur *rcur,
103 xfs_agblock_t agbno,
104 xfs_extlen_t len,
105 uint64_t owner,
106 uint64_t offset,
107 unsigned int flags)
108{
109 int i;
110 int error;
111
112 trace_xfs_rmap_insert(rcur->bc_mp, rcur->bc_ag.pag->pag_agno, agbno,
113 len, owner, offset, flags);
114
115 error = xfs_rmap_lookup_eq(rcur, agbno, len, owner, offset, flags, &i);
116 if (error)
117 goto done;
118 if (XFS_IS_CORRUPT(rcur->bc_mp, i != 0)) {
119 error = -EFSCORRUPTED;
120 goto done;
121 }
122
123 rcur->bc_rec.r.rm_startblock = agbno;
124 rcur->bc_rec.r.rm_blockcount = len;
125 rcur->bc_rec.r.rm_owner = owner;
126 rcur->bc_rec.r.rm_offset = offset;
127 rcur->bc_rec.r.rm_flags = flags;
128 error = xfs_btree_insert(rcur, &i);
129 if (error)
130 goto done;
131 if (XFS_IS_CORRUPT(rcur->bc_mp, i != 1)) {
132 error = -EFSCORRUPTED;
133 goto done;
134 }
135done:
136 if (error)
137 trace_xfs_rmap_insert_error(rcur->bc_mp,
138 rcur->bc_ag.pag->pag_agno, error, _RET_IP_);
139 return error;
140}
141
142STATIC int
143xfs_rmap_delete(
144 struct xfs_btree_cur *rcur,
145 xfs_agblock_t agbno,
146 xfs_extlen_t len,
147 uint64_t owner,
148 uint64_t offset,
149 unsigned int flags)
150{
151 int i;
152 int error;
153
154 trace_xfs_rmap_delete(rcur->bc_mp, rcur->bc_ag.pag->pag_agno, agbno,
155 len, owner, offset, flags);
156
157 error = xfs_rmap_lookup_eq(rcur, agbno, len, owner, offset, flags, &i);
158 if (error)
159 goto done;
160 if (XFS_IS_CORRUPT(rcur->bc_mp, i != 1)) {
161 error = -EFSCORRUPTED;
162 goto done;
163 }
164
165 error = xfs_btree_delete(rcur, &i);
166 if (error)
167 goto done;
168 if (XFS_IS_CORRUPT(rcur->bc_mp, i != 1)) {
169 error = -EFSCORRUPTED;
170 goto done;
171 }
172done:
173 if (error)
174 trace_xfs_rmap_delete_error(rcur->bc_mp,
175 rcur->bc_ag.pag->pag_agno, error, _RET_IP_);
176 return error;
177}
178
179/* Convert an internal btree record to an rmap record. */
180int
181xfs_rmap_btrec_to_irec(
182 union xfs_btree_rec *rec,
183 struct xfs_rmap_irec *irec)
184{
185 irec->rm_startblock = be32_to_cpu(rec->rmap.rm_startblock);
186 irec->rm_blockcount = be32_to_cpu(rec->rmap.rm_blockcount);
187 irec->rm_owner = be64_to_cpu(rec->rmap.rm_owner);
188 return xfs_rmap_irec_offset_unpack(be64_to_cpu(rec->rmap.rm_offset),
189 irec);
190}
191
192/*
193 * Get the data from the pointed-to record.
194 */
195int
196xfs_rmap_get_rec(
197 struct xfs_btree_cur *cur,
198 struct xfs_rmap_irec *irec,
199 int *stat)
200{
201 struct xfs_mount *mp = cur->bc_mp;
202 xfs_agnumber_t agno = cur->bc_ag.pag->pag_agno;
203 union xfs_btree_rec *rec;
204 int error;
205
206 error = xfs_btree_get_rec(cur, &rec, stat);
207 if (error || !*stat)
208 return error;
209
210 if (xfs_rmap_btrec_to_irec(rec, irec))
211 goto out_bad_rec;
212
213 if (irec->rm_blockcount == 0)
214 goto out_bad_rec;
215 if (irec->rm_startblock <= XFS_AGFL_BLOCK(mp)) {
216 if (irec->rm_owner != XFS_RMAP_OWN_FS)
217 goto out_bad_rec;
218 if (irec->rm_blockcount != XFS_AGFL_BLOCK(mp) + 1)
219 goto out_bad_rec;
220 } else {
221 /* check for valid extent range, including overflow */
222 if (!xfs_verify_agbno(mp, agno, irec->rm_startblock))
223 goto out_bad_rec;
224 if (irec->rm_startblock >
225 irec->rm_startblock + irec->rm_blockcount)
226 goto out_bad_rec;
227 if (!xfs_verify_agbno(mp, agno,
228 irec->rm_startblock + irec->rm_blockcount - 1))
229 goto out_bad_rec;
230 }
231
232 if (!(xfs_verify_ino(mp, irec->rm_owner) ||
233 (irec->rm_owner <= XFS_RMAP_OWN_FS &&
234 irec->rm_owner >= XFS_RMAP_OWN_MIN)))
235 goto out_bad_rec;
236
237 return 0;
238out_bad_rec:
239 xfs_warn(mp,
240 "Reverse Mapping BTree record corruption in AG %d detected!",
241 agno);
242 xfs_warn(mp,
243 "Owner 0x%llx, flags 0x%x, start block 0x%x block count 0x%x",
244 irec->rm_owner, irec->rm_flags, irec->rm_startblock,
245 irec->rm_blockcount);
246 return -EFSCORRUPTED;
247}
248
249struct xfs_find_left_neighbor_info {
250 struct xfs_rmap_irec high;
251 struct xfs_rmap_irec *irec;
252 int *stat;
253};
254
255/* For each rmap given, figure out if it matches the key we want. */
256STATIC int
257xfs_rmap_find_left_neighbor_helper(
258 struct xfs_btree_cur *cur,
259 struct xfs_rmap_irec *rec,
260 void *priv)
261{
262 struct xfs_find_left_neighbor_info *info = priv;
263
264 trace_xfs_rmap_find_left_neighbor_candidate(cur->bc_mp,
265 cur->bc_ag.pag->pag_agno, rec->rm_startblock,
266 rec->rm_blockcount, rec->rm_owner, rec->rm_offset,
267 rec->rm_flags);
268
269 if (rec->rm_owner != info->high.rm_owner)
270 return 0;
271 if (!XFS_RMAP_NON_INODE_OWNER(rec->rm_owner) &&
272 !(rec->rm_flags & XFS_RMAP_BMBT_BLOCK) &&
273 rec->rm_offset + rec->rm_blockcount - 1 != info->high.rm_offset)
274 return 0;
275
276 *info->irec = *rec;
277 *info->stat = 1;
278 return -ECANCELED;
279}
280
281/*
282 * Find the record to the left of the given extent, being careful only to
283 * return a match with the same owner and adjacent physical and logical
284 * block ranges.
285 */
286int
287xfs_rmap_find_left_neighbor(
288 struct xfs_btree_cur *cur,
289 xfs_agblock_t bno,
290 uint64_t owner,
291 uint64_t offset,
292 unsigned int flags,
293 struct xfs_rmap_irec *irec,
294 int *stat)
295{
296 struct xfs_find_left_neighbor_info info;
297 int error;
298
299 *stat = 0;
300 if (bno == 0)
301 return 0;
302 info.high.rm_startblock = bno - 1;
303 info.high.rm_owner = owner;
304 if (!XFS_RMAP_NON_INODE_OWNER(owner) &&
305 !(flags & XFS_RMAP_BMBT_BLOCK)) {
306 if (offset == 0)
307 return 0;
308 info.high.rm_offset = offset - 1;
309 } else
310 info.high.rm_offset = 0;
311 info.high.rm_flags = flags;
312 info.high.rm_blockcount = 0;
313 info.irec = irec;
314 info.stat = stat;
315
316 trace_xfs_rmap_find_left_neighbor_query(cur->bc_mp,
317 cur->bc_ag.pag->pag_agno, bno, 0, owner, offset, flags);
318
319 error = xfs_rmap_query_range(cur, &info.high, &info.high,
320 xfs_rmap_find_left_neighbor_helper, &info);
321 if (error == -ECANCELED)
322 error = 0;
323 if (*stat)
324 trace_xfs_rmap_find_left_neighbor_result(cur->bc_mp,
325 cur->bc_ag.pag->pag_agno, irec->rm_startblock,
326 irec->rm_blockcount, irec->rm_owner,
327 irec->rm_offset, irec->rm_flags);
328 return error;
329}
330
331/* For each rmap given, figure out if it matches the key we want. */
332STATIC int
333xfs_rmap_lookup_le_range_helper(
334 struct xfs_btree_cur *cur,
335 struct xfs_rmap_irec *rec,
336 void *priv)
337{
338 struct xfs_find_left_neighbor_info *info = priv;
339
340 trace_xfs_rmap_lookup_le_range_candidate(cur->bc_mp,
341 cur->bc_ag.pag->pag_agno, rec->rm_startblock,
342 rec->rm_blockcount, rec->rm_owner, rec->rm_offset,
343 rec->rm_flags);
344
345 if (rec->rm_owner != info->high.rm_owner)
346 return 0;
347 if (!XFS_RMAP_NON_INODE_OWNER(rec->rm_owner) &&
348 !(rec->rm_flags & XFS_RMAP_BMBT_BLOCK) &&
349 (rec->rm_offset > info->high.rm_offset ||
350 rec->rm_offset + rec->rm_blockcount <= info->high.rm_offset))
351 return 0;
352
353 *info->irec = *rec;
354 *info->stat = 1;
355 return -ECANCELED;
356}
357
358/*
359 * Find the record to the left of the given extent, being careful only to
360 * return a match with the same owner and overlapping physical and logical
361 * block ranges. This is the overlapping-interval version of
362 * xfs_rmap_lookup_le.
363 */
364int
365xfs_rmap_lookup_le_range(
366 struct xfs_btree_cur *cur,
367 xfs_agblock_t bno,
368 uint64_t owner,
369 uint64_t offset,
370 unsigned int flags,
371 struct xfs_rmap_irec *irec,
372 int *stat)
373{
374 struct xfs_find_left_neighbor_info info;
375 int error;
376
377 info.high.rm_startblock = bno;
378 info.high.rm_owner = owner;
379 if (!XFS_RMAP_NON_INODE_OWNER(owner) && !(flags & XFS_RMAP_BMBT_BLOCK))
380 info.high.rm_offset = offset;
381 else
382 info.high.rm_offset = 0;
383 info.high.rm_flags = flags;
384 info.high.rm_blockcount = 0;
385 *stat = 0;
386 info.irec = irec;
387 info.stat = stat;
388
389 trace_xfs_rmap_lookup_le_range(cur->bc_mp,
390 cur->bc_ag.pag->pag_agno, bno, 0, owner, offset, flags);
391 error = xfs_rmap_query_range(cur, &info.high, &info.high,
392 xfs_rmap_lookup_le_range_helper, &info);
393 if (error == -ECANCELED)
394 error = 0;
395 if (*stat)
396 trace_xfs_rmap_lookup_le_range_result(cur->bc_mp,
397 cur->bc_ag.pag->pag_agno, irec->rm_startblock,
398 irec->rm_blockcount, irec->rm_owner,
399 irec->rm_offset, irec->rm_flags);
400 return error;
401}
402
403/*
404 * Perform all the relevant owner checks for a removal op. If we're doing an
405 * unknown-owner removal then we have no owner information to check.
406 */
407static int
408xfs_rmap_free_check_owner(
409 struct xfs_mount *mp,
410 uint64_t ltoff,
411 struct xfs_rmap_irec *rec,
412 xfs_filblks_t len,
413 uint64_t owner,
414 uint64_t offset,
415 unsigned int flags)
416{
417 int error = 0;
418
419 if (owner == XFS_RMAP_OWN_UNKNOWN)
420 return 0;
421
422 /* Make sure the unwritten flag matches. */
423 if (XFS_IS_CORRUPT(mp,
424 (flags & XFS_RMAP_UNWRITTEN) !=
425 (rec->rm_flags & XFS_RMAP_UNWRITTEN))) {
426 error = -EFSCORRUPTED;
427 goto out;
428 }
429
430 /* Make sure the owner matches what we expect to find in the tree. */
431 if (XFS_IS_CORRUPT(mp, owner != rec->rm_owner)) {
432 error = -EFSCORRUPTED;
433 goto out;
434 }
435
436 /* Check the offset, if necessary. */
437 if (XFS_RMAP_NON_INODE_OWNER(owner))
438 goto out;
439
440 if (flags & XFS_RMAP_BMBT_BLOCK) {
441 if (XFS_IS_CORRUPT(mp,
442 !(rec->rm_flags & XFS_RMAP_BMBT_BLOCK))) {
443 error = -EFSCORRUPTED;
444 goto out;
445 }
446 } else {
447 if (XFS_IS_CORRUPT(mp, rec->rm_offset > offset)) {
448 error = -EFSCORRUPTED;
449 goto out;
450 }
451 if (XFS_IS_CORRUPT(mp,
452 offset + len > ltoff + rec->rm_blockcount)) {
453 error = -EFSCORRUPTED;
454 goto out;
455 }
456 }
457
458out:
459 return error;
460}
461
462/*
463 * Find the extent in the rmap btree and remove it.
464 *
465 * The record we find should always be an exact match for the extent that we're
466 * looking for, since we insert them into the btree without modification.
467 *
468 * Special Case #1: when growing the filesystem, we "free" an extent when
469 * growing the last AG. This extent is new space and so it is not tracked as
470 * used space in the btree. The growfs code will pass in an owner of
471 * XFS_RMAP_OWN_NULL to indicate that it expected that there is no owner of this
472 * extent. We verify that - the extent lookup result in a record that does not
473 * overlap.
474 *
475 * Special Case #2: EFIs do not record the owner of the extent, so when
476 * recovering EFIs from the log we pass in XFS_RMAP_OWN_UNKNOWN to tell the rmap
477 * btree to ignore the owner (i.e. wildcard match) so we don't trigger
478 * corruption checks during log recovery.
479 */
480STATIC int
481xfs_rmap_unmap(
482 struct xfs_btree_cur *cur,
483 xfs_agblock_t bno,
484 xfs_extlen_t len,
485 bool unwritten,
486 const struct xfs_owner_info *oinfo)
487{
488 struct xfs_mount *mp = cur->bc_mp;
489 struct xfs_rmap_irec ltrec;
490 uint64_t ltoff;
491 int error = 0;
492 int i;
493 uint64_t owner;
494 uint64_t offset;
495 unsigned int flags;
496 bool ignore_off;
497
498 xfs_owner_info_unpack(oinfo, &owner, &offset, &flags);
499 ignore_off = XFS_RMAP_NON_INODE_OWNER(owner) ||
500 (flags & XFS_RMAP_BMBT_BLOCK);
501 if (unwritten)
502 flags |= XFS_RMAP_UNWRITTEN;
503 trace_xfs_rmap_unmap(mp, cur->bc_ag.pag->pag_agno, bno, len,
504 unwritten, oinfo);
505
506 /*
507 * We should always have a left record because there's a static record
508 * for the AG headers at rm_startblock == 0 created by mkfs/growfs that
509 * will not ever be removed from the tree.
510 */
511 error = xfs_rmap_lookup_le(cur, bno, len, owner, offset, flags, &i);
512 if (error)
513 goto out_error;
514 if (XFS_IS_CORRUPT(mp, i != 1)) {
515 error = -EFSCORRUPTED;
516 goto out_error;
517 }
518
519 error = xfs_rmap_get_rec(cur, <rec, &i);
520 if (error)
521 goto out_error;
522 if (XFS_IS_CORRUPT(mp, i != 1)) {
523 error = -EFSCORRUPTED;
524 goto out_error;
525 }
526 trace_xfs_rmap_lookup_le_range_result(cur->bc_mp,
527 cur->bc_ag.pag->pag_agno, ltrec.rm_startblock,
528 ltrec.rm_blockcount, ltrec.rm_owner,
529 ltrec.rm_offset, ltrec.rm_flags);
530 ltoff = ltrec.rm_offset;
531
532 /*
533 * For growfs, the incoming extent must be beyond the left record we
534 * just found as it is new space and won't be used by anyone. This is
535 * just a corruption check as we don't actually do anything with this
536 * extent. Note that we need to use >= instead of > because it might
537 * be the case that the "left" extent goes all the way to EOFS.
538 */
539 if (owner == XFS_RMAP_OWN_NULL) {
540 if (XFS_IS_CORRUPT(mp,
541 bno <
542 ltrec.rm_startblock + ltrec.rm_blockcount)) {
543 error = -EFSCORRUPTED;
544 goto out_error;
545 }
546 goto out_done;
547 }
548
549 /*
550 * If we're doing an unknown-owner removal for EFI recovery, we expect
551 * to find the full range in the rmapbt or nothing at all. If we
552 * don't find any rmaps overlapping either end of the range, we're
553 * done. Hopefully this means that the EFI creator already queued
554 * (and finished) a RUI to remove the rmap.
555 */
556 if (owner == XFS_RMAP_OWN_UNKNOWN &&
557 ltrec.rm_startblock + ltrec.rm_blockcount <= bno) {
558 struct xfs_rmap_irec rtrec;
559
560 error = xfs_btree_increment(cur, 0, &i);
561 if (error)
562 goto out_error;
563 if (i == 0)
564 goto out_done;
565 error = xfs_rmap_get_rec(cur, &rtrec, &i);
566 if (error)
567 goto out_error;
568 if (XFS_IS_CORRUPT(mp, i != 1)) {
569 error = -EFSCORRUPTED;
570 goto out_error;
571 }
572 if (rtrec.rm_startblock >= bno + len)
573 goto out_done;
574 }
575
576 /* Make sure the extent we found covers the entire freeing range. */
577 if (XFS_IS_CORRUPT(mp,
578 ltrec.rm_startblock > bno ||
579 ltrec.rm_startblock + ltrec.rm_blockcount <
580 bno + len)) {
581 error = -EFSCORRUPTED;
582 goto out_error;
583 }
584
585 /* Check owner information. */
586 error = xfs_rmap_free_check_owner(mp, ltoff, <rec, len, owner,
587 offset, flags);
588 if (error)
589 goto out_error;
590
591 if (ltrec.rm_startblock == bno && ltrec.rm_blockcount == len) {
592 /* exact match, simply remove the record from rmap tree */
593 trace_xfs_rmap_delete(mp, cur->bc_ag.pag->pag_agno,
594 ltrec.rm_startblock, ltrec.rm_blockcount,
595 ltrec.rm_owner, ltrec.rm_offset,
596 ltrec.rm_flags);
597 error = xfs_btree_delete(cur, &i);
598 if (error)
599 goto out_error;
600 if (XFS_IS_CORRUPT(mp, i != 1)) {
601 error = -EFSCORRUPTED;
602 goto out_error;
603 }
604 } else if (ltrec.rm_startblock == bno) {
605 /*
606 * overlap left hand side of extent: move the start, trim the
607 * length and update the current record.
608 *
609 * ltbno ltlen
610 * Orig: |oooooooooooooooooooo|
611 * Freeing: |fffffffff|
612 * Result: |rrrrrrrrrr|
613 * bno len
614 */
615 ltrec.rm_startblock += len;
616 ltrec.rm_blockcount -= len;
617 if (!ignore_off)
618 ltrec.rm_offset += len;
619 error = xfs_rmap_update(cur, <rec);
620 if (error)
621 goto out_error;
622 } else if (ltrec.rm_startblock + ltrec.rm_blockcount == bno + len) {
623 /*
624 * overlap right hand side of extent: trim the length and update
625 * the current record.
626 *
627 * ltbno ltlen
628 * Orig: |oooooooooooooooooooo|
629 * Freeing: |fffffffff|
630 * Result: |rrrrrrrrrr|
631 * bno len
632 */
633 ltrec.rm_blockcount -= len;
634 error = xfs_rmap_update(cur, <rec);
635 if (error)
636 goto out_error;
637 } else {
638
639 /*
640 * overlap middle of extent: trim the length of the existing
641 * record to the length of the new left-extent size, increment
642 * the insertion position so we can insert a new record
643 * containing the remaining right-extent space.
644 *
645 * ltbno ltlen
646 * Orig: |oooooooooooooooooooo|
647 * Freeing: |fffffffff|
648 * Result: |rrrrr| |rrrr|
649 * bno len
650 */
651 xfs_extlen_t orig_len = ltrec.rm_blockcount;
652
653 ltrec.rm_blockcount = bno - ltrec.rm_startblock;
654 error = xfs_rmap_update(cur, <rec);
655 if (error)
656 goto out_error;
657
658 error = xfs_btree_increment(cur, 0, &i);
659 if (error)
660 goto out_error;
661
662 cur->bc_rec.r.rm_startblock = bno + len;
663 cur->bc_rec.r.rm_blockcount = orig_len - len -
664 ltrec.rm_blockcount;
665 cur->bc_rec.r.rm_owner = ltrec.rm_owner;
666 if (ignore_off)
667 cur->bc_rec.r.rm_offset = 0;
668 else
669 cur->bc_rec.r.rm_offset = offset + len;
670 cur->bc_rec.r.rm_flags = flags;
671 trace_xfs_rmap_insert(mp, cur->bc_ag.pag->pag_agno,
672 cur->bc_rec.r.rm_startblock,
673 cur->bc_rec.r.rm_blockcount,
674 cur->bc_rec.r.rm_owner,
675 cur->bc_rec.r.rm_offset,
676 cur->bc_rec.r.rm_flags);
677 error = xfs_btree_insert(cur, &i);
678 if (error)
679 goto out_error;
680 }
681
682out_done:
683 trace_xfs_rmap_unmap_done(mp, cur->bc_ag.pag->pag_agno, bno, len,
684 unwritten, oinfo);
685out_error:
686 if (error)
687 trace_xfs_rmap_unmap_error(mp, cur->bc_ag.pag->pag_agno,
688 error, _RET_IP_);
689 return error;
690}
691
692/*
693 * Remove a reference to an extent in the rmap btree.
694 */
695int
696xfs_rmap_free(
697 struct xfs_trans *tp,
698 struct xfs_buf *agbp,
699 struct xfs_perag *pag,
700 xfs_agblock_t bno,
701 xfs_extlen_t len,
702 const struct xfs_owner_info *oinfo)
703{
704 struct xfs_mount *mp = tp->t_mountp;
705 struct xfs_btree_cur *cur;
706 int error;
707
708 if (!xfs_sb_version_hasrmapbt(&mp->m_sb))
709 return 0;
710
711 cur = xfs_rmapbt_init_cursor(mp, tp, agbp, pag);
712
713 error = xfs_rmap_unmap(cur, bno, len, false, oinfo);
714
715 xfs_btree_del_cursor(cur, error);
716 return error;
717}
718
719/*
720 * A mergeable rmap must have the same owner and the same values for
721 * the unwritten, attr_fork, and bmbt flags. The startblock and
722 * offset are checked separately.
723 */
724static bool
725xfs_rmap_is_mergeable(
726 struct xfs_rmap_irec *irec,
727 uint64_t owner,
728 unsigned int flags)
729{
730 if (irec->rm_owner == XFS_RMAP_OWN_NULL)
731 return false;
732 if (irec->rm_owner != owner)
733 return false;
734 if ((flags & XFS_RMAP_UNWRITTEN) ^
735 (irec->rm_flags & XFS_RMAP_UNWRITTEN))
736 return false;
737 if ((flags & XFS_RMAP_ATTR_FORK) ^
738 (irec->rm_flags & XFS_RMAP_ATTR_FORK))
739 return false;
740 if ((flags & XFS_RMAP_BMBT_BLOCK) ^
741 (irec->rm_flags & XFS_RMAP_BMBT_BLOCK))
742 return false;
743 return true;
744}
745
746/*
747 * When we allocate a new block, the first thing we do is add a reference to
748 * the extent in the rmap btree. This takes the form of a [agbno, length,
749 * owner, offset] record. Flags are encoded in the high bits of the offset
750 * field.
751 */
752STATIC int
753xfs_rmap_map(
754 struct xfs_btree_cur *cur,
755 xfs_agblock_t bno,
756 xfs_extlen_t len,
757 bool unwritten,
758 const struct xfs_owner_info *oinfo)
759{
760 struct xfs_mount *mp = cur->bc_mp;
761 struct xfs_rmap_irec ltrec;
762 struct xfs_rmap_irec gtrec;
763 int have_gt;
764 int have_lt;
765 int error = 0;
766 int i;
767 uint64_t owner;
768 uint64_t offset;
769 unsigned int flags = 0;
770 bool ignore_off;
771
772 xfs_owner_info_unpack(oinfo, &owner, &offset, &flags);
773 ASSERT(owner != 0);
774 ignore_off = XFS_RMAP_NON_INODE_OWNER(owner) ||
775 (flags & XFS_RMAP_BMBT_BLOCK);
776 if (unwritten)
777 flags |= XFS_RMAP_UNWRITTEN;
778 trace_xfs_rmap_map(mp, cur->bc_ag.pag->pag_agno, bno, len,
779 unwritten, oinfo);
780 ASSERT(!xfs_rmap_should_skip_owner_update(oinfo));
781
782 /*
783 * For the initial lookup, look for an exact match or the left-adjacent
784 * record for our insertion point. This will also give us the record for
785 * start block contiguity tests.
786 */
787 error = xfs_rmap_lookup_le(cur, bno, len, owner, offset, flags,
788 &have_lt);
789 if (error)
790 goto out_error;
791 if (have_lt) {
792 error = xfs_rmap_get_rec(cur, <rec, &have_lt);
793 if (error)
794 goto out_error;
795 if (XFS_IS_CORRUPT(mp, have_lt != 1)) {
796 error = -EFSCORRUPTED;
797 goto out_error;
798 }
799 trace_xfs_rmap_lookup_le_range_result(cur->bc_mp,
800 cur->bc_ag.pag->pag_agno, ltrec.rm_startblock,
801 ltrec.rm_blockcount, ltrec.rm_owner,
802 ltrec.rm_offset, ltrec.rm_flags);
803
804 if (!xfs_rmap_is_mergeable(<rec, owner, flags))
805 have_lt = 0;
806 }
807
808 if (XFS_IS_CORRUPT(mp,
809 have_lt != 0 &&
810 ltrec.rm_startblock + ltrec.rm_blockcount > bno)) {
811 error = -EFSCORRUPTED;
812 goto out_error;
813 }
814
815 /*
816 * Increment the cursor to see if we have a right-adjacent record to our
817 * insertion point. This will give us the record for end block
818 * contiguity tests.
819 */
820 error = xfs_btree_increment(cur, 0, &have_gt);
821 if (error)
822 goto out_error;
823 if (have_gt) {
824 error = xfs_rmap_get_rec(cur, >rec, &have_gt);
825 if (error)
826 goto out_error;
827 if (XFS_IS_CORRUPT(mp, have_gt != 1)) {
828 error = -EFSCORRUPTED;
829 goto out_error;
830 }
831 if (XFS_IS_CORRUPT(mp, bno + len > gtrec.rm_startblock)) {
832 error = -EFSCORRUPTED;
833 goto out_error;
834 }
835 trace_xfs_rmap_find_right_neighbor_result(cur->bc_mp,
836 cur->bc_ag.pag->pag_agno, gtrec.rm_startblock,
837 gtrec.rm_blockcount, gtrec.rm_owner,
838 gtrec.rm_offset, gtrec.rm_flags);
839 if (!xfs_rmap_is_mergeable(>rec, owner, flags))
840 have_gt = 0;
841 }
842
843 /*
844 * Note: cursor currently points one record to the right of ltrec, even
845 * if there is no record in the tree to the right.
846 */
847 if (have_lt &&
848 ltrec.rm_startblock + ltrec.rm_blockcount == bno &&
849 (ignore_off || ltrec.rm_offset + ltrec.rm_blockcount == offset)) {
850 /*
851 * left edge contiguous, merge into left record.
852 *
853 * ltbno ltlen
854 * orig: |ooooooooo|
855 * adding: |aaaaaaaaa|
856 * result: |rrrrrrrrrrrrrrrrrrr|
857 * bno len
858 */
859 ltrec.rm_blockcount += len;
860 if (have_gt &&
861 bno + len == gtrec.rm_startblock &&
862 (ignore_off || offset + len == gtrec.rm_offset) &&
863 (unsigned long)ltrec.rm_blockcount + len +
864 gtrec.rm_blockcount <= XFS_RMAP_LEN_MAX) {
865 /*
866 * right edge also contiguous, delete right record
867 * and merge into left record.
868 *
869 * ltbno ltlen gtbno gtlen
870 * orig: |ooooooooo| |ooooooooo|
871 * adding: |aaaaaaaaa|
872 * result: |rrrrrrrrrrrrrrrrrrrrrrrrrrrrr|
873 */
874 ltrec.rm_blockcount += gtrec.rm_blockcount;
875 trace_xfs_rmap_delete(mp, cur->bc_ag.pag->pag_agno,
876 gtrec.rm_startblock,
877 gtrec.rm_blockcount,
878 gtrec.rm_owner,
879 gtrec.rm_offset,
880 gtrec.rm_flags);
881 error = xfs_btree_delete(cur, &i);
882 if (error)
883 goto out_error;
884 if (XFS_IS_CORRUPT(mp, i != 1)) {
885 error = -EFSCORRUPTED;
886 goto out_error;
887 }
888 }
889
890 /* point the cursor back to the left record and update */
891 error = xfs_btree_decrement(cur, 0, &have_gt);
892 if (error)
893 goto out_error;
894 error = xfs_rmap_update(cur, <rec);
895 if (error)
896 goto out_error;
897 } else if (have_gt &&
898 bno + len == gtrec.rm_startblock &&
899 (ignore_off || offset + len == gtrec.rm_offset)) {
900 /*
901 * right edge contiguous, merge into right record.
902 *
903 * gtbno gtlen
904 * Orig: |ooooooooo|
905 * adding: |aaaaaaaaa|
906 * Result: |rrrrrrrrrrrrrrrrrrr|
907 * bno len
908 */
909 gtrec.rm_startblock = bno;
910 gtrec.rm_blockcount += len;
911 if (!ignore_off)
912 gtrec.rm_offset = offset;
913 error = xfs_rmap_update(cur, >rec);
914 if (error)
915 goto out_error;
916 } else {
917 /*
918 * no contiguous edge with identical owner, insert
919 * new record at current cursor position.
920 */
921 cur->bc_rec.r.rm_startblock = bno;
922 cur->bc_rec.r.rm_blockcount = len;
923 cur->bc_rec.r.rm_owner = owner;
924 cur->bc_rec.r.rm_offset = offset;
925 cur->bc_rec.r.rm_flags = flags;
926 trace_xfs_rmap_insert(mp, cur->bc_ag.pag->pag_agno, bno, len,
927 owner, offset, flags);
928 error = xfs_btree_insert(cur, &i);
929 if (error)
930 goto out_error;
931 if (XFS_IS_CORRUPT(mp, i != 1)) {
932 error = -EFSCORRUPTED;
933 goto out_error;
934 }
935 }
936
937 trace_xfs_rmap_map_done(mp, cur->bc_ag.pag->pag_agno, bno, len,
938 unwritten, oinfo);
939out_error:
940 if (error)
941 trace_xfs_rmap_map_error(mp, cur->bc_ag.pag->pag_agno,
942 error, _RET_IP_);
943 return error;
944}
945
946/*
947 * Add a reference to an extent in the rmap btree.
948 */
949int
950xfs_rmap_alloc(
951 struct xfs_trans *tp,
952 struct xfs_buf *agbp,
953 struct xfs_perag *pag,
954 xfs_agblock_t bno,
955 xfs_extlen_t len,
956 const struct xfs_owner_info *oinfo)
957{
958 struct xfs_mount *mp = tp->t_mountp;
959 struct xfs_btree_cur *cur;
960 int error;
961
962 if (!xfs_sb_version_hasrmapbt(&mp->m_sb))
963 return 0;
964
965 cur = xfs_rmapbt_init_cursor(mp, tp, agbp, pag);
966 error = xfs_rmap_map(cur, bno, len, false, oinfo);
967
968 xfs_btree_del_cursor(cur, error);
969 return error;
970}
971
972#define RMAP_LEFT_CONTIG (1 << 0)
973#define RMAP_RIGHT_CONTIG (1 << 1)
974#define RMAP_LEFT_FILLING (1 << 2)
975#define RMAP_RIGHT_FILLING (1 << 3)
976#define RMAP_LEFT_VALID (1 << 6)
977#define RMAP_RIGHT_VALID (1 << 7)
978
979#define LEFT r[0]
980#define RIGHT r[1]
981#define PREV r[2]
982#define NEW r[3]
983
984/*
985 * Convert an unwritten extent to a real extent or vice versa.
986 * Does not handle overlapping extents.
987 */
988STATIC int
989xfs_rmap_convert(
990 struct xfs_btree_cur *cur,
991 xfs_agblock_t bno,
992 xfs_extlen_t len,
993 bool unwritten,
994 const struct xfs_owner_info *oinfo)
995{
996 struct xfs_mount *mp = cur->bc_mp;
997 struct xfs_rmap_irec r[4]; /* neighbor extent entries */
998 /* left is 0, right is 1, */
999 /* prev is 2, new is 3 */
1000 uint64_t owner;
1001 uint64_t offset;
1002 uint64_t new_endoff;
1003 unsigned int oldext;
1004 unsigned int newext;
1005 unsigned int flags = 0;
1006 int i;
1007 int state = 0;
1008 int error;
1009
1010 xfs_owner_info_unpack(oinfo, &owner, &offset, &flags);
1011 ASSERT(!(XFS_RMAP_NON_INODE_OWNER(owner) ||
1012 (flags & (XFS_RMAP_ATTR_FORK | XFS_RMAP_BMBT_BLOCK))));
1013 oldext = unwritten ? XFS_RMAP_UNWRITTEN : 0;
1014 new_endoff = offset + len;
1015 trace_xfs_rmap_convert(mp, cur->bc_ag.pag->pag_agno, bno, len,
1016 unwritten, oinfo);
1017
1018 /*
1019 * For the initial lookup, look for an exact match or the left-adjacent
1020 * record for our insertion point. This will also give us the record for
1021 * start block contiguity tests.
1022 */
1023 error = xfs_rmap_lookup_le(cur, bno, len, owner, offset, oldext, &i);
1024 if (error)
1025 goto done;
1026 if (XFS_IS_CORRUPT(mp, i != 1)) {
1027 error = -EFSCORRUPTED;
1028 goto done;
1029 }
1030
1031 error = xfs_rmap_get_rec(cur, &PREV, &i);
1032 if (error)
1033 goto done;
1034 if (XFS_IS_CORRUPT(mp, i != 1)) {
1035 error = -EFSCORRUPTED;
1036 goto done;
1037 }
1038 trace_xfs_rmap_lookup_le_range_result(cur->bc_mp,
1039 cur->bc_ag.pag->pag_agno, PREV.rm_startblock,
1040 PREV.rm_blockcount, PREV.rm_owner,
1041 PREV.rm_offset, PREV.rm_flags);
1042
1043 ASSERT(PREV.rm_offset <= offset);
1044 ASSERT(PREV.rm_offset + PREV.rm_blockcount >= new_endoff);
1045 ASSERT((PREV.rm_flags & XFS_RMAP_UNWRITTEN) == oldext);
1046 newext = ~oldext & XFS_RMAP_UNWRITTEN;
1047
1048 /*
1049 * Set flags determining what part of the previous oldext allocation
1050 * extent is being replaced by a newext allocation.
1051 */
1052 if (PREV.rm_offset == offset)
1053 state |= RMAP_LEFT_FILLING;
1054 if (PREV.rm_offset + PREV.rm_blockcount == new_endoff)
1055 state |= RMAP_RIGHT_FILLING;
1056
1057 /*
1058 * Decrement the cursor to see if we have a left-adjacent record to our
1059 * insertion point. This will give us the record for end block
1060 * contiguity tests.
1061 */
1062 error = xfs_btree_decrement(cur, 0, &i);
1063 if (error)
1064 goto done;
1065 if (i) {
1066 state |= RMAP_LEFT_VALID;
1067 error = xfs_rmap_get_rec(cur, &LEFT, &i);
1068 if (error)
1069 goto done;
1070 if (XFS_IS_CORRUPT(mp, i != 1)) {
1071 error = -EFSCORRUPTED;
1072 goto done;
1073 }
1074 if (XFS_IS_CORRUPT(mp,
1075 LEFT.rm_startblock + LEFT.rm_blockcount >
1076 bno)) {
1077 error = -EFSCORRUPTED;
1078 goto done;
1079 }
1080 trace_xfs_rmap_find_left_neighbor_result(cur->bc_mp,
1081 cur->bc_ag.pag->pag_agno, LEFT.rm_startblock,
1082 LEFT.rm_blockcount, LEFT.rm_owner,
1083 LEFT.rm_offset, LEFT.rm_flags);
1084 if (LEFT.rm_startblock + LEFT.rm_blockcount == bno &&
1085 LEFT.rm_offset + LEFT.rm_blockcount == offset &&
1086 xfs_rmap_is_mergeable(&LEFT, owner, newext))
1087 state |= RMAP_LEFT_CONTIG;
1088 }
1089
1090 /*
1091 * Increment the cursor to see if we have a right-adjacent record to our
1092 * insertion point. This will give us the record for end block
1093 * contiguity tests.
1094 */
1095 error = xfs_btree_increment(cur, 0, &i);
1096 if (error)
1097 goto done;
1098 if (XFS_IS_CORRUPT(mp, i != 1)) {
1099 error = -EFSCORRUPTED;
1100 goto done;
1101 }
1102 error = xfs_btree_increment(cur, 0, &i);
1103 if (error)
1104 goto done;
1105 if (i) {
1106 state |= RMAP_RIGHT_VALID;
1107 error = xfs_rmap_get_rec(cur, &RIGHT, &i);
1108 if (error)
1109 goto done;
1110 if (XFS_IS_CORRUPT(mp, i != 1)) {
1111 error = -EFSCORRUPTED;
1112 goto done;
1113 }
1114 if (XFS_IS_CORRUPT(mp, bno + len > RIGHT.rm_startblock)) {
1115 error = -EFSCORRUPTED;
1116 goto done;
1117 }
1118 trace_xfs_rmap_find_right_neighbor_result(cur->bc_mp,
1119 cur->bc_ag.pag->pag_agno, RIGHT.rm_startblock,
1120 RIGHT.rm_blockcount, RIGHT.rm_owner,
1121 RIGHT.rm_offset, RIGHT.rm_flags);
1122 if (bno + len == RIGHT.rm_startblock &&
1123 offset + len == RIGHT.rm_offset &&
1124 xfs_rmap_is_mergeable(&RIGHT, owner, newext))
1125 state |= RMAP_RIGHT_CONTIG;
1126 }
1127
1128 /* check that left + prev + right is not too long */
1129 if ((state & (RMAP_LEFT_FILLING | RMAP_LEFT_CONTIG |
1130 RMAP_RIGHT_FILLING | RMAP_RIGHT_CONTIG)) ==
1131 (RMAP_LEFT_FILLING | RMAP_LEFT_CONTIG |
1132 RMAP_RIGHT_FILLING | RMAP_RIGHT_CONTIG) &&
1133 (unsigned long)LEFT.rm_blockcount + len +
1134 RIGHT.rm_blockcount > XFS_RMAP_LEN_MAX)
1135 state &= ~RMAP_RIGHT_CONTIG;
1136
1137 trace_xfs_rmap_convert_state(mp, cur->bc_ag.pag->pag_agno, state,
1138 _RET_IP_);
1139
1140 /* reset the cursor back to PREV */
1141 error = xfs_rmap_lookup_le(cur, bno, len, owner, offset, oldext, &i);
1142 if (error)
1143 goto done;
1144 if (XFS_IS_CORRUPT(mp, i != 1)) {
1145 error = -EFSCORRUPTED;
1146 goto done;
1147 }
1148
1149 /*
1150 * Switch out based on the FILLING and CONTIG state bits.
1151 */
1152 switch (state & (RMAP_LEFT_FILLING | RMAP_LEFT_CONTIG |
1153 RMAP_RIGHT_FILLING | RMAP_RIGHT_CONTIG)) {
1154 case RMAP_LEFT_FILLING | RMAP_LEFT_CONTIG |
1155 RMAP_RIGHT_FILLING | RMAP_RIGHT_CONTIG:
1156 /*
1157 * Setting all of a previous oldext extent to newext.
1158 * The left and right neighbors are both contiguous with new.
1159 */
1160 error = xfs_btree_increment(cur, 0, &i);
1161 if (error)
1162 goto done;
1163 if (XFS_IS_CORRUPT(mp, i != 1)) {
1164 error = -EFSCORRUPTED;
1165 goto done;
1166 }
1167 trace_xfs_rmap_delete(mp, cur->bc_ag.pag->pag_agno,
1168 RIGHT.rm_startblock, RIGHT.rm_blockcount,
1169 RIGHT.rm_owner, RIGHT.rm_offset,
1170 RIGHT.rm_flags);
1171 error = xfs_btree_delete(cur, &i);
1172 if (error)
1173 goto done;
1174 if (XFS_IS_CORRUPT(mp, i != 1)) {
1175 error = -EFSCORRUPTED;
1176 goto done;
1177 }
1178 error = xfs_btree_decrement(cur, 0, &i);
1179 if (error)
1180 goto done;
1181 if (XFS_IS_CORRUPT(mp, i != 1)) {
1182 error = -EFSCORRUPTED;
1183 goto done;
1184 }
1185 trace_xfs_rmap_delete(mp, cur->bc_ag.pag->pag_agno,
1186 PREV.rm_startblock, PREV.rm_blockcount,
1187 PREV.rm_owner, PREV.rm_offset,
1188 PREV.rm_flags);
1189 error = xfs_btree_delete(cur, &i);
1190 if (error)
1191 goto done;
1192 if (XFS_IS_CORRUPT(mp, i != 1)) {
1193 error = -EFSCORRUPTED;
1194 goto done;
1195 }
1196 error = xfs_btree_decrement(cur, 0, &i);
1197 if (error)
1198 goto done;
1199 if (XFS_IS_CORRUPT(mp, i != 1)) {
1200 error = -EFSCORRUPTED;
1201 goto done;
1202 }
1203 NEW = LEFT;
1204 NEW.rm_blockcount += PREV.rm_blockcount + RIGHT.rm_blockcount;
1205 error = xfs_rmap_update(cur, &NEW);
1206 if (error)
1207 goto done;
1208 break;
1209
1210 case RMAP_LEFT_FILLING | RMAP_RIGHT_FILLING | RMAP_LEFT_CONTIG:
1211 /*
1212 * Setting all of a previous oldext extent to newext.
1213 * The left neighbor is contiguous, the right is not.
1214 */
1215 trace_xfs_rmap_delete(mp, cur->bc_ag.pag->pag_agno,
1216 PREV.rm_startblock, PREV.rm_blockcount,
1217 PREV.rm_owner, PREV.rm_offset,
1218 PREV.rm_flags);
1219 error = xfs_btree_delete(cur, &i);
1220 if (error)
1221 goto done;
1222 if (XFS_IS_CORRUPT(mp, i != 1)) {
1223 error = -EFSCORRUPTED;
1224 goto done;
1225 }
1226 error = xfs_btree_decrement(cur, 0, &i);
1227 if (error)
1228 goto done;
1229 if (XFS_IS_CORRUPT(mp, i != 1)) {
1230 error = -EFSCORRUPTED;
1231 goto done;
1232 }
1233 NEW = LEFT;
1234 NEW.rm_blockcount += PREV.rm_blockcount;
1235 error = xfs_rmap_update(cur, &NEW);
1236 if (error)
1237 goto done;
1238 break;
1239
1240 case RMAP_LEFT_FILLING | RMAP_RIGHT_FILLING | RMAP_RIGHT_CONTIG:
1241 /*
1242 * Setting all of a previous oldext extent to newext.
1243 * The right neighbor is contiguous, the left is not.
1244 */
1245 error = xfs_btree_increment(cur, 0, &i);
1246 if (error)
1247 goto done;
1248 if (XFS_IS_CORRUPT(mp, i != 1)) {
1249 error = -EFSCORRUPTED;
1250 goto done;
1251 }
1252 trace_xfs_rmap_delete(mp, cur->bc_ag.pag->pag_agno,
1253 RIGHT.rm_startblock, RIGHT.rm_blockcount,
1254 RIGHT.rm_owner, RIGHT.rm_offset,
1255 RIGHT.rm_flags);
1256 error = xfs_btree_delete(cur, &i);
1257 if (error)
1258 goto done;
1259 if (XFS_IS_CORRUPT(mp, i != 1)) {
1260 error = -EFSCORRUPTED;
1261 goto done;
1262 }
1263 error = xfs_btree_decrement(cur, 0, &i);
1264 if (error)
1265 goto done;
1266 if (XFS_IS_CORRUPT(mp, i != 1)) {
1267 error = -EFSCORRUPTED;
1268 goto done;
1269 }
1270 NEW = PREV;
1271 NEW.rm_blockcount = len + RIGHT.rm_blockcount;
1272 NEW.rm_flags = newext;
1273 error = xfs_rmap_update(cur, &NEW);
1274 if (error)
1275 goto done;
1276 break;
1277
1278 case RMAP_LEFT_FILLING | RMAP_RIGHT_FILLING:
1279 /*
1280 * Setting all of a previous oldext extent to newext.
1281 * Neither the left nor right neighbors are contiguous with
1282 * the new one.
1283 */
1284 NEW = PREV;
1285 NEW.rm_flags = newext;
1286 error = xfs_rmap_update(cur, &NEW);
1287 if (error)
1288 goto done;
1289 break;
1290
1291 case RMAP_LEFT_FILLING | RMAP_LEFT_CONTIG:
1292 /*
1293 * Setting the first part of a previous oldext extent to newext.
1294 * The left neighbor is contiguous.
1295 */
1296 NEW = PREV;
1297 NEW.rm_offset += len;
1298 NEW.rm_startblock += len;
1299 NEW.rm_blockcount -= len;
1300 error = xfs_rmap_update(cur, &NEW);
1301 if (error)
1302 goto done;
1303 error = xfs_btree_decrement(cur, 0, &i);
1304 if (error)
1305 goto done;
1306 NEW = LEFT;
1307 NEW.rm_blockcount += len;
1308 error = xfs_rmap_update(cur, &NEW);
1309 if (error)
1310 goto done;
1311 break;
1312
1313 case RMAP_LEFT_FILLING:
1314 /*
1315 * Setting the first part of a previous oldext extent to newext.
1316 * The left neighbor is not contiguous.
1317 */
1318 NEW = PREV;
1319 NEW.rm_startblock += len;
1320 NEW.rm_offset += len;
1321 NEW.rm_blockcount -= len;
1322 error = xfs_rmap_update(cur, &NEW);
1323 if (error)
1324 goto done;
1325 NEW.rm_startblock = bno;
1326 NEW.rm_owner = owner;
1327 NEW.rm_offset = offset;
1328 NEW.rm_blockcount = len;
1329 NEW.rm_flags = newext;
1330 cur->bc_rec.r = NEW;
1331 trace_xfs_rmap_insert(mp, cur->bc_ag.pag->pag_agno, bno,
1332 len, owner, offset, newext);
1333 error = xfs_btree_insert(cur, &i);
1334 if (error)
1335 goto done;
1336 if (XFS_IS_CORRUPT(mp, i != 1)) {
1337 error = -EFSCORRUPTED;
1338 goto done;
1339 }
1340 break;
1341
1342 case RMAP_RIGHT_FILLING | RMAP_RIGHT_CONTIG:
1343 /*
1344 * Setting the last part of a previous oldext extent to newext.
1345 * The right neighbor is contiguous with the new allocation.
1346 */
1347 NEW = PREV;
1348 NEW.rm_blockcount -= len;
1349 error = xfs_rmap_update(cur, &NEW);
1350 if (error)
1351 goto done;
1352 error = xfs_btree_increment(cur, 0, &i);
1353 if (error)
1354 goto done;
1355 NEW = RIGHT;
1356 NEW.rm_offset = offset;
1357 NEW.rm_startblock = bno;
1358 NEW.rm_blockcount += len;
1359 error = xfs_rmap_update(cur, &NEW);
1360 if (error)
1361 goto done;
1362 break;
1363
1364 case RMAP_RIGHT_FILLING:
1365 /*
1366 * Setting the last part of a previous oldext extent to newext.
1367 * The right neighbor is not contiguous.
1368 */
1369 NEW = PREV;
1370 NEW.rm_blockcount -= len;
1371 error = xfs_rmap_update(cur, &NEW);
1372 if (error)
1373 goto done;
1374 error = xfs_rmap_lookup_eq(cur, bno, len, owner, offset,
1375 oldext, &i);
1376 if (error)
1377 goto done;
1378 if (XFS_IS_CORRUPT(mp, i != 0)) {
1379 error = -EFSCORRUPTED;
1380 goto done;
1381 }
1382 NEW.rm_startblock = bno;
1383 NEW.rm_owner = owner;
1384 NEW.rm_offset = offset;
1385 NEW.rm_blockcount = len;
1386 NEW.rm_flags = newext;
1387 cur->bc_rec.r = NEW;
1388 trace_xfs_rmap_insert(mp, cur->bc_ag.pag->pag_agno, bno,
1389 len, owner, offset, newext);
1390 error = xfs_btree_insert(cur, &i);
1391 if (error)
1392 goto done;
1393 if (XFS_IS_CORRUPT(mp, i != 1)) {
1394 error = -EFSCORRUPTED;
1395 goto done;
1396 }
1397 break;
1398
1399 case 0:
1400 /*
1401 * Setting the middle part of a previous oldext extent to
1402 * newext. Contiguity is impossible here.
1403 * One extent becomes three extents.
1404 */
1405 /* new right extent - oldext */
1406 NEW.rm_startblock = bno + len;
1407 NEW.rm_owner = owner;
1408 NEW.rm_offset = new_endoff;
1409 NEW.rm_blockcount = PREV.rm_offset + PREV.rm_blockcount -
1410 new_endoff;
1411 NEW.rm_flags = PREV.rm_flags;
1412 error = xfs_rmap_update(cur, &NEW);
1413 if (error)
1414 goto done;
1415 /* new left extent - oldext */
1416 NEW = PREV;
1417 NEW.rm_blockcount = offset - PREV.rm_offset;
1418 cur->bc_rec.r = NEW;
1419 trace_xfs_rmap_insert(mp, cur->bc_ag.pag->pag_agno,
1420 NEW.rm_startblock, NEW.rm_blockcount,
1421 NEW.rm_owner, NEW.rm_offset,
1422 NEW.rm_flags);
1423 error = xfs_btree_insert(cur, &i);
1424 if (error)
1425 goto done;
1426 if (XFS_IS_CORRUPT(mp, i != 1)) {
1427 error = -EFSCORRUPTED;
1428 goto done;
1429 }
1430 /*
1431 * Reset the cursor to the position of the new extent
1432 * we are about to insert as we can't trust it after
1433 * the previous insert.
1434 */
1435 error = xfs_rmap_lookup_eq(cur, bno, len, owner, offset,
1436 oldext, &i);
1437 if (error)
1438 goto done;
1439 if (XFS_IS_CORRUPT(mp, i != 0)) {
1440 error = -EFSCORRUPTED;
1441 goto done;
1442 }
1443 /* new middle extent - newext */
1444 cur->bc_rec.r.rm_flags &= ~XFS_RMAP_UNWRITTEN;
1445 cur->bc_rec.r.rm_flags |= newext;
1446 trace_xfs_rmap_insert(mp, cur->bc_ag.pag->pag_agno, bno, len,
1447 owner, offset, newext);
1448 error = xfs_btree_insert(cur, &i);
1449 if (error)
1450 goto done;
1451 if (XFS_IS_CORRUPT(mp, i != 1)) {
1452 error = -EFSCORRUPTED;
1453 goto done;
1454 }
1455 break;
1456
1457 case RMAP_LEFT_FILLING | RMAP_LEFT_CONTIG | RMAP_RIGHT_CONTIG:
1458 case RMAP_RIGHT_FILLING | RMAP_LEFT_CONTIG | RMAP_RIGHT_CONTIG:
1459 case RMAP_LEFT_FILLING | RMAP_RIGHT_CONTIG:
1460 case RMAP_RIGHT_FILLING | RMAP_LEFT_CONTIG:
1461 case RMAP_LEFT_CONTIG | RMAP_RIGHT_CONTIG:
1462 case RMAP_LEFT_CONTIG:
1463 case RMAP_RIGHT_CONTIG:
1464 /*
1465 * These cases are all impossible.
1466 */
1467 ASSERT(0);
1468 }
1469
1470 trace_xfs_rmap_convert_done(mp, cur->bc_ag.pag->pag_agno, bno, len,
1471 unwritten, oinfo);
1472done:
1473 if (error)
1474 trace_xfs_rmap_convert_error(cur->bc_mp,
1475 cur->bc_ag.pag->pag_agno, error, _RET_IP_);
1476 return error;
1477}
1478
1479/*
1480 * Convert an unwritten extent to a real extent or vice versa. If there is no
1481 * possibility of overlapping extents, delegate to the simpler convert
1482 * function.
1483 */
1484STATIC int
1485xfs_rmap_convert_shared(
1486 struct xfs_btree_cur *cur,
1487 xfs_agblock_t bno,
1488 xfs_extlen_t len,
1489 bool unwritten,
1490 const struct xfs_owner_info *oinfo)
1491{
1492 struct xfs_mount *mp = cur->bc_mp;
1493 struct xfs_rmap_irec r[4]; /* neighbor extent entries */
1494 /* left is 0, right is 1, */
1495 /* prev is 2, new is 3 */
1496 uint64_t owner;
1497 uint64_t offset;
1498 uint64_t new_endoff;
1499 unsigned int oldext;
1500 unsigned int newext;
1501 unsigned int flags = 0;
1502 int i;
1503 int state = 0;
1504 int error;
1505
1506 xfs_owner_info_unpack(oinfo, &owner, &offset, &flags);
1507 ASSERT(!(XFS_RMAP_NON_INODE_OWNER(owner) ||
1508 (flags & (XFS_RMAP_ATTR_FORK | XFS_RMAP_BMBT_BLOCK))));
1509 oldext = unwritten ? XFS_RMAP_UNWRITTEN : 0;
1510 new_endoff = offset + len;
1511 trace_xfs_rmap_convert(mp, cur->bc_ag.pag->pag_agno, bno, len,
1512 unwritten, oinfo);
1513
1514 /*
1515 * For the initial lookup, look for and exact match or the left-adjacent
1516 * record for our insertion point. This will also give us the record for
1517 * start block contiguity tests.
1518 */
1519 error = xfs_rmap_lookup_le_range(cur, bno, owner, offset, oldext,
1520 &PREV, &i);
1521 if (error)
1522 goto done;
1523 if (XFS_IS_CORRUPT(mp, i != 1)) {
1524 error = -EFSCORRUPTED;
1525 goto done;
1526 }
1527
1528 ASSERT(PREV.rm_offset <= offset);
1529 ASSERT(PREV.rm_offset + PREV.rm_blockcount >= new_endoff);
1530 ASSERT((PREV.rm_flags & XFS_RMAP_UNWRITTEN) == oldext);
1531 newext = ~oldext & XFS_RMAP_UNWRITTEN;
1532
1533 /*
1534 * Set flags determining what part of the previous oldext allocation
1535 * extent is being replaced by a newext allocation.
1536 */
1537 if (PREV.rm_offset == offset)
1538 state |= RMAP_LEFT_FILLING;
1539 if (PREV.rm_offset + PREV.rm_blockcount == new_endoff)
1540 state |= RMAP_RIGHT_FILLING;
1541
1542 /* Is there a left record that abuts our range? */
1543 error = xfs_rmap_find_left_neighbor(cur, bno, owner, offset, newext,
1544 &LEFT, &i);
1545 if (error)
1546 goto done;
1547 if (i) {
1548 state |= RMAP_LEFT_VALID;
1549 if (XFS_IS_CORRUPT(mp,
1550 LEFT.rm_startblock + LEFT.rm_blockcount >
1551 bno)) {
1552 error = -EFSCORRUPTED;
1553 goto done;
1554 }
1555 if (xfs_rmap_is_mergeable(&LEFT, owner, newext))
1556 state |= RMAP_LEFT_CONTIG;
1557 }
1558
1559 /* Is there a right record that abuts our range? */
1560 error = xfs_rmap_lookup_eq(cur, bno + len, len, owner, offset + len,
1561 newext, &i);
1562 if (error)
1563 goto done;
1564 if (i) {
1565 state |= RMAP_RIGHT_VALID;
1566 error = xfs_rmap_get_rec(cur, &RIGHT, &i);
1567 if (error)
1568 goto done;
1569 if (XFS_IS_CORRUPT(mp, i != 1)) {
1570 error = -EFSCORRUPTED;
1571 goto done;
1572 }
1573 if (XFS_IS_CORRUPT(mp, bno + len > RIGHT.rm_startblock)) {
1574 error = -EFSCORRUPTED;
1575 goto done;
1576 }
1577 trace_xfs_rmap_find_right_neighbor_result(cur->bc_mp,
1578 cur->bc_ag.pag->pag_agno, RIGHT.rm_startblock,
1579 RIGHT.rm_blockcount, RIGHT.rm_owner,
1580 RIGHT.rm_offset, RIGHT.rm_flags);
1581 if (xfs_rmap_is_mergeable(&RIGHT, owner, newext))
1582 state |= RMAP_RIGHT_CONTIG;
1583 }
1584
1585 /* check that left + prev + right is not too long */
1586 if ((state & (RMAP_LEFT_FILLING | RMAP_LEFT_CONTIG |
1587 RMAP_RIGHT_FILLING | RMAP_RIGHT_CONTIG)) ==
1588 (RMAP_LEFT_FILLING | RMAP_LEFT_CONTIG |
1589 RMAP_RIGHT_FILLING | RMAP_RIGHT_CONTIG) &&
1590 (unsigned long)LEFT.rm_blockcount + len +
1591 RIGHT.rm_blockcount > XFS_RMAP_LEN_MAX)
1592 state &= ~RMAP_RIGHT_CONTIG;
1593
1594 trace_xfs_rmap_convert_state(mp, cur->bc_ag.pag->pag_agno, state,
1595 _RET_IP_);
1596 /*
1597 * Switch out based on the FILLING and CONTIG state bits.
1598 */
1599 switch (state & (RMAP_LEFT_FILLING | RMAP_LEFT_CONTIG |
1600 RMAP_RIGHT_FILLING | RMAP_RIGHT_CONTIG)) {
1601 case RMAP_LEFT_FILLING | RMAP_LEFT_CONTIG |
1602 RMAP_RIGHT_FILLING | RMAP_RIGHT_CONTIG:
1603 /*
1604 * Setting all of a previous oldext extent to newext.
1605 * The left and right neighbors are both contiguous with new.
1606 */
1607 error = xfs_rmap_delete(cur, RIGHT.rm_startblock,
1608 RIGHT.rm_blockcount, RIGHT.rm_owner,
1609 RIGHT.rm_offset, RIGHT.rm_flags);
1610 if (error)
1611 goto done;
1612 error = xfs_rmap_delete(cur, PREV.rm_startblock,
1613 PREV.rm_blockcount, PREV.rm_owner,
1614 PREV.rm_offset, PREV.rm_flags);
1615 if (error)
1616 goto done;
1617 NEW = LEFT;
1618 error = xfs_rmap_lookup_eq(cur, NEW.rm_startblock,
1619 NEW.rm_blockcount, NEW.rm_owner,
1620 NEW.rm_offset, NEW.rm_flags, &i);
1621 if (error)
1622 goto done;
1623 if (XFS_IS_CORRUPT(mp, i != 1)) {
1624 error = -EFSCORRUPTED;
1625 goto done;
1626 }
1627 NEW.rm_blockcount += PREV.rm_blockcount + RIGHT.rm_blockcount;
1628 error = xfs_rmap_update(cur, &NEW);
1629 if (error)
1630 goto done;
1631 break;
1632
1633 case RMAP_LEFT_FILLING | RMAP_RIGHT_FILLING | RMAP_LEFT_CONTIG:
1634 /*
1635 * Setting all of a previous oldext extent to newext.
1636 * The left neighbor is contiguous, the right is not.
1637 */
1638 error = xfs_rmap_delete(cur, PREV.rm_startblock,
1639 PREV.rm_blockcount, PREV.rm_owner,
1640 PREV.rm_offset, PREV.rm_flags);
1641 if (error)
1642 goto done;
1643 NEW = LEFT;
1644 error = xfs_rmap_lookup_eq(cur, NEW.rm_startblock,
1645 NEW.rm_blockcount, NEW.rm_owner,
1646 NEW.rm_offset, NEW.rm_flags, &i);
1647 if (error)
1648 goto done;
1649 if (XFS_IS_CORRUPT(mp, i != 1)) {
1650 error = -EFSCORRUPTED;
1651 goto done;
1652 }
1653 NEW.rm_blockcount += PREV.rm_blockcount;
1654 error = xfs_rmap_update(cur, &NEW);
1655 if (error)
1656 goto done;
1657 break;
1658
1659 case RMAP_LEFT_FILLING | RMAP_RIGHT_FILLING | RMAP_RIGHT_CONTIG:
1660 /*
1661 * Setting all of a previous oldext extent to newext.
1662 * The right neighbor is contiguous, the left is not.
1663 */
1664 error = xfs_rmap_delete(cur, RIGHT.rm_startblock,
1665 RIGHT.rm_blockcount, RIGHT.rm_owner,
1666 RIGHT.rm_offset, RIGHT.rm_flags);
1667 if (error)
1668 goto done;
1669 NEW = PREV;
1670 error = xfs_rmap_lookup_eq(cur, NEW.rm_startblock,
1671 NEW.rm_blockcount, NEW.rm_owner,
1672 NEW.rm_offset, NEW.rm_flags, &i);
1673 if (error)
1674 goto done;
1675 if (XFS_IS_CORRUPT(mp, i != 1)) {
1676 error = -EFSCORRUPTED;
1677 goto done;
1678 }
1679 NEW.rm_blockcount += RIGHT.rm_blockcount;
1680 NEW.rm_flags = RIGHT.rm_flags;
1681 error = xfs_rmap_update(cur, &NEW);
1682 if (error)
1683 goto done;
1684 break;
1685
1686 case RMAP_LEFT_FILLING | RMAP_RIGHT_FILLING:
1687 /*
1688 * Setting all of a previous oldext extent to newext.
1689 * Neither the left nor right neighbors are contiguous with
1690 * the new one.
1691 */
1692 NEW = PREV;
1693 error = xfs_rmap_lookup_eq(cur, NEW.rm_startblock,
1694 NEW.rm_blockcount, NEW.rm_owner,
1695 NEW.rm_offset, NEW.rm_flags, &i);
1696 if (error)
1697 goto done;
1698 if (XFS_IS_CORRUPT(mp, i != 1)) {
1699 error = -EFSCORRUPTED;
1700 goto done;
1701 }
1702 NEW.rm_flags = newext;
1703 error = xfs_rmap_update(cur, &NEW);
1704 if (error)
1705 goto done;
1706 break;
1707
1708 case RMAP_LEFT_FILLING | RMAP_LEFT_CONTIG:
1709 /*
1710 * Setting the first part of a previous oldext extent to newext.
1711 * The left neighbor is contiguous.
1712 */
1713 NEW = PREV;
1714 error = xfs_rmap_delete(cur, NEW.rm_startblock,
1715 NEW.rm_blockcount, NEW.rm_owner,
1716 NEW.rm_offset, NEW.rm_flags);
1717 if (error)
1718 goto done;
1719 NEW.rm_offset += len;
1720 NEW.rm_startblock += len;
1721 NEW.rm_blockcount -= len;
1722 error = xfs_rmap_insert(cur, NEW.rm_startblock,
1723 NEW.rm_blockcount, NEW.rm_owner,
1724 NEW.rm_offset, NEW.rm_flags);
1725 if (error)
1726 goto done;
1727 NEW = LEFT;
1728 error = xfs_rmap_lookup_eq(cur, NEW.rm_startblock,
1729 NEW.rm_blockcount, NEW.rm_owner,
1730 NEW.rm_offset, NEW.rm_flags, &i);
1731 if (error)
1732 goto done;
1733 if (XFS_IS_CORRUPT(mp, i != 1)) {
1734 error = -EFSCORRUPTED;
1735 goto done;
1736 }
1737 NEW.rm_blockcount += len;
1738 error = xfs_rmap_update(cur, &NEW);
1739 if (error)
1740 goto done;
1741 break;
1742
1743 case RMAP_LEFT_FILLING:
1744 /*
1745 * Setting the first part of a previous oldext extent to newext.
1746 * The left neighbor is not contiguous.
1747 */
1748 NEW = PREV;
1749 error = xfs_rmap_delete(cur, NEW.rm_startblock,
1750 NEW.rm_blockcount, NEW.rm_owner,
1751 NEW.rm_offset, NEW.rm_flags);
1752 if (error)
1753 goto done;
1754 NEW.rm_offset += len;
1755 NEW.rm_startblock += len;
1756 NEW.rm_blockcount -= len;
1757 error = xfs_rmap_insert(cur, NEW.rm_startblock,
1758 NEW.rm_blockcount, NEW.rm_owner,
1759 NEW.rm_offset, NEW.rm_flags);
1760 if (error)
1761 goto done;
1762 error = xfs_rmap_insert(cur, bno, len, owner, offset, newext);
1763 if (error)
1764 goto done;
1765 break;
1766
1767 case RMAP_RIGHT_FILLING | RMAP_RIGHT_CONTIG:
1768 /*
1769 * Setting the last part of a previous oldext extent to newext.
1770 * The right neighbor is contiguous with the new allocation.
1771 */
1772 NEW = PREV;
1773 error = xfs_rmap_lookup_eq(cur, NEW.rm_startblock,
1774 NEW.rm_blockcount, NEW.rm_owner,
1775 NEW.rm_offset, NEW.rm_flags, &i);
1776 if (error)
1777 goto done;
1778 if (XFS_IS_CORRUPT(mp, i != 1)) {
1779 error = -EFSCORRUPTED;
1780 goto done;
1781 }
1782 NEW.rm_blockcount = offset - NEW.rm_offset;
1783 error = xfs_rmap_update(cur, &NEW);
1784 if (error)
1785 goto done;
1786 NEW = RIGHT;
1787 error = xfs_rmap_delete(cur, NEW.rm_startblock,
1788 NEW.rm_blockcount, NEW.rm_owner,
1789 NEW.rm_offset, NEW.rm_flags);
1790 if (error)
1791 goto done;
1792 NEW.rm_offset = offset;
1793 NEW.rm_startblock = bno;
1794 NEW.rm_blockcount += len;
1795 error = xfs_rmap_insert(cur, NEW.rm_startblock,
1796 NEW.rm_blockcount, NEW.rm_owner,
1797 NEW.rm_offset, NEW.rm_flags);
1798 if (error)
1799 goto done;
1800 break;
1801
1802 case RMAP_RIGHT_FILLING:
1803 /*
1804 * Setting the last part of a previous oldext extent to newext.
1805 * The right neighbor is not contiguous.
1806 */
1807 NEW = PREV;
1808 error = xfs_rmap_lookup_eq(cur, NEW.rm_startblock,
1809 NEW.rm_blockcount, NEW.rm_owner,
1810 NEW.rm_offset, NEW.rm_flags, &i);
1811 if (error)
1812 goto done;
1813 if (XFS_IS_CORRUPT(mp, i != 1)) {
1814 error = -EFSCORRUPTED;
1815 goto done;
1816 }
1817 NEW.rm_blockcount -= len;
1818 error = xfs_rmap_update(cur, &NEW);
1819 if (error)
1820 goto done;
1821 error = xfs_rmap_insert(cur, bno, len, owner, offset, newext);
1822 if (error)
1823 goto done;
1824 break;
1825
1826 case 0:
1827 /*
1828 * Setting the middle part of a previous oldext extent to
1829 * newext. Contiguity is impossible here.
1830 * One extent becomes three extents.
1831 */
1832 /* new right extent - oldext */
1833 NEW.rm_startblock = bno + len;
1834 NEW.rm_owner = owner;
1835 NEW.rm_offset = new_endoff;
1836 NEW.rm_blockcount = PREV.rm_offset + PREV.rm_blockcount -
1837 new_endoff;
1838 NEW.rm_flags = PREV.rm_flags;
1839 error = xfs_rmap_insert(cur, NEW.rm_startblock,
1840 NEW.rm_blockcount, NEW.rm_owner, NEW.rm_offset,
1841 NEW.rm_flags);
1842 if (error)
1843 goto done;
1844 /* new left extent - oldext */
1845 NEW = PREV;
1846 error = xfs_rmap_lookup_eq(cur, NEW.rm_startblock,
1847 NEW.rm_blockcount, NEW.rm_owner,
1848 NEW.rm_offset, NEW.rm_flags, &i);
1849 if (error)
1850 goto done;
1851 if (XFS_IS_CORRUPT(mp, i != 1)) {
1852 error = -EFSCORRUPTED;
1853 goto done;
1854 }
1855 NEW.rm_blockcount = offset - NEW.rm_offset;
1856 error = xfs_rmap_update(cur, &NEW);
1857 if (error)
1858 goto done;
1859 /* new middle extent - newext */
1860 NEW.rm_startblock = bno;
1861 NEW.rm_blockcount = len;
1862 NEW.rm_owner = owner;
1863 NEW.rm_offset = offset;
1864 NEW.rm_flags = newext;
1865 error = xfs_rmap_insert(cur, NEW.rm_startblock,
1866 NEW.rm_blockcount, NEW.rm_owner, NEW.rm_offset,
1867 NEW.rm_flags);
1868 if (error)
1869 goto done;
1870 break;
1871
1872 case RMAP_LEFT_FILLING | RMAP_LEFT_CONTIG | RMAP_RIGHT_CONTIG:
1873 case RMAP_RIGHT_FILLING | RMAP_LEFT_CONTIG | RMAP_RIGHT_CONTIG:
1874 case RMAP_LEFT_FILLING | RMAP_RIGHT_CONTIG:
1875 case RMAP_RIGHT_FILLING | RMAP_LEFT_CONTIG:
1876 case RMAP_LEFT_CONTIG | RMAP_RIGHT_CONTIG:
1877 case RMAP_LEFT_CONTIG:
1878 case RMAP_RIGHT_CONTIG:
1879 /*
1880 * These cases are all impossible.
1881 */
1882 ASSERT(0);
1883 }
1884
1885 trace_xfs_rmap_convert_done(mp, cur->bc_ag.pag->pag_agno, bno, len,
1886 unwritten, oinfo);
1887done:
1888 if (error)
1889 trace_xfs_rmap_convert_error(cur->bc_mp,
1890 cur->bc_ag.pag->pag_agno, error, _RET_IP_);
1891 return error;
1892}
1893
1894#undef NEW
1895#undef LEFT
1896#undef RIGHT
1897#undef PREV
1898
1899/*
1900 * Find an extent in the rmap btree and unmap it. For rmap extent types that
1901 * can overlap (data fork rmaps on reflink filesystems) we must be careful
1902 * that the prev/next records in the btree might belong to another owner.
1903 * Therefore we must use delete+insert to alter any of the key fields.
1904 *
1905 * For every other situation there can only be one owner for a given extent,
1906 * so we can call the regular _free function.
1907 */
1908STATIC int
1909xfs_rmap_unmap_shared(
1910 struct xfs_btree_cur *cur,
1911 xfs_agblock_t bno,
1912 xfs_extlen_t len,
1913 bool unwritten,
1914 const struct xfs_owner_info *oinfo)
1915{
1916 struct xfs_mount *mp = cur->bc_mp;
1917 struct xfs_rmap_irec ltrec;
1918 uint64_t ltoff;
1919 int error = 0;
1920 int i;
1921 uint64_t owner;
1922 uint64_t offset;
1923 unsigned int flags;
1924
1925 xfs_owner_info_unpack(oinfo, &owner, &offset, &flags);
1926 if (unwritten)
1927 flags |= XFS_RMAP_UNWRITTEN;
1928 trace_xfs_rmap_unmap(mp, cur->bc_ag.pag->pag_agno, bno, len,
1929 unwritten, oinfo);
1930
1931 /*
1932 * We should always have a left record because there's a static record
1933 * for the AG headers at rm_startblock == 0 created by mkfs/growfs that
1934 * will not ever be removed from the tree.
1935 */
1936 error = xfs_rmap_lookup_le_range(cur, bno, owner, offset, flags,
1937 <rec, &i);
1938 if (error)
1939 goto out_error;
1940 if (XFS_IS_CORRUPT(mp, i != 1)) {
1941 error = -EFSCORRUPTED;
1942 goto out_error;
1943 }
1944 ltoff = ltrec.rm_offset;
1945
1946 /* Make sure the extent we found covers the entire freeing range. */
1947 if (XFS_IS_CORRUPT(mp,
1948 ltrec.rm_startblock > bno ||
1949 ltrec.rm_startblock + ltrec.rm_blockcount <
1950 bno + len)) {
1951 error = -EFSCORRUPTED;
1952 goto out_error;
1953 }
1954
1955 /* Make sure the owner matches what we expect to find in the tree. */
1956 if (XFS_IS_CORRUPT(mp, owner != ltrec.rm_owner)) {
1957 error = -EFSCORRUPTED;
1958 goto out_error;
1959 }
1960
1961 /* Make sure the unwritten flag matches. */
1962 if (XFS_IS_CORRUPT(mp,
1963 (flags & XFS_RMAP_UNWRITTEN) !=
1964 (ltrec.rm_flags & XFS_RMAP_UNWRITTEN))) {
1965 error = -EFSCORRUPTED;
1966 goto out_error;
1967 }
1968
1969 /* Check the offset. */
1970 if (XFS_IS_CORRUPT(mp, ltrec.rm_offset > offset)) {
1971 error = -EFSCORRUPTED;
1972 goto out_error;
1973 }
1974 if (XFS_IS_CORRUPT(mp, offset > ltoff + ltrec.rm_blockcount)) {
1975 error = -EFSCORRUPTED;
1976 goto out_error;
1977 }
1978
1979 if (ltrec.rm_startblock == bno && ltrec.rm_blockcount == len) {
1980 /* Exact match, simply remove the record from rmap tree. */
1981 error = xfs_rmap_delete(cur, ltrec.rm_startblock,
1982 ltrec.rm_blockcount, ltrec.rm_owner,
1983 ltrec.rm_offset, ltrec.rm_flags);
1984 if (error)
1985 goto out_error;
1986 } else if (ltrec.rm_startblock == bno) {
1987 /*
1988 * Overlap left hand side of extent: move the start, trim the
1989 * length and update the current record.
1990 *
1991 * ltbno ltlen
1992 * Orig: |oooooooooooooooooooo|
1993 * Freeing: |fffffffff|
1994 * Result: |rrrrrrrrrr|
1995 * bno len
1996 */
1997
1998 /* Delete prev rmap. */
1999 error = xfs_rmap_delete(cur, ltrec.rm_startblock,
2000 ltrec.rm_blockcount, ltrec.rm_owner,
2001 ltrec.rm_offset, ltrec.rm_flags);
2002 if (error)
2003 goto out_error;
2004
2005 /* Add an rmap at the new offset. */
2006 ltrec.rm_startblock += len;
2007 ltrec.rm_blockcount -= len;
2008 ltrec.rm_offset += len;
2009 error = xfs_rmap_insert(cur, ltrec.rm_startblock,
2010 ltrec.rm_blockcount, ltrec.rm_owner,
2011 ltrec.rm_offset, ltrec.rm_flags);
2012 if (error)
2013 goto out_error;
2014 } else if (ltrec.rm_startblock + ltrec.rm_blockcount == bno + len) {
2015 /*
2016 * Overlap right hand side of extent: trim the length and
2017 * update the current record.
2018 *
2019 * ltbno ltlen
2020 * Orig: |oooooooooooooooooooo|
2021 * Freeing: |fffffffff|
2022 * Result: |rrrrrrrrrr|
2023 * bno len
2024 */
2025 error = xfs_rmap_lookup_eq(cur, ltrec.rm_startblock,
2026 ltrec.rm_blockcount, ltrec.rm_owner,
2027 ltrec.rm_offset, ltrec.rm_flags, &i);
2028 if (error)
2029 goto out_error;
2030 if (XFS_IS_CORRUPT(mp, i != 1)) {
2031 error = -EFSCORRUPTED;
2032 goto out_error;
2033 }
2034 ltrec.rm_blockcount -= len;
2035 error = xfs_rmap_update(cur, <rec);
2036 if (error)
2037 goto out_error;
2038 } else {
2039 /*
2040 * Overlap middle of extent: trim the length of the existing
2041 * record to the length of the new left-extent size, increment
2042 * the insertion position so we can insert a new record
2043 * containing the remaining right-extent space.
2044 *
2045 * ltbno ltlen
2046 * Orig: |oooooooooooooooooooo|
2047 * Freeing: |fffffffff|
2048 * Result: |rrrrr| |rrrr|
2049 * bno len
2050 */
2051 xfs_extlen_t orig_len = ltrec.rm_blockcount;
2052
2053 /* Shrink the left side of the rmap */
2054 error = xfs_rmap_lookup_eq(cur, ltrec.rm_startblock,
2055 ltrec.rm_blockcount, ltrec.rm_owner,
2056 ltrec.rm_offset, ltrec.rm_flags, &i);
2057 if (error)
2058 goto out_error;
2059 if (XFS_IS_CORRUPT(mp, i != 1)) {
2060 error = -EFSCORRUPTED;
2061 goto out_error;
2062 }
2063 ltrec.rm_blockcount = bno - ltrec.rm_startblock;
2064 error = xfs_rmap_update(cur, <rec);
2065 if (error)
2066 goto out_error;
2067
2068 /* Add an rmap at the new offset */
2069 error = xfs_rmap_insert(cur, bno + len,
2070 orig_len - len - ltrec.rm_blockcount,
2071 ltrec.rm_owner, offset + len,
2072 ltrec.rm_flags);
2073 if (error)
2074 goto out_error;
2075 }
2076
2077 trace_xfs_rmap_unmap_done(mp, cur->bc_ag.pag->pag_agno, bno, len,
2078 unwritten, oinfo);
2079out_error:
2080 if (error)
2081 trace_xfs_rmap_unmap_error(cur->bc_mp,
2082 cur->bc_ag.pag->pag_agno, error, _RET_IP_);
2083 return error;
2084}
2085
2086/*
2087 * Find an extent in the rmap btree and map it. For rmap extent types that
2088 * can overlap (data fork rmaps on reflink filesystems) we must be careful
2089 * that the prev/next records in the btree might belong to another owner.
2090 * Therefore we must use delete+insert to alter any of the key fields.
2091 *
2092 * For every other situation there can only be one owner for a given extent,
2093 * so we can call the regular _alloc function.
2094 */
2095STATIC int
2096xfs_rmap_map_shared(
2097 struct xfs_btree_cur *cur,
2098 xfs_agblock_t bno,
2099 xfs_extlen_t len,
2100 bool unwritten,
2101 const struct xfs_owner_info *oinfo)
2102{
2103 struct xfs_mount *mp = cur->bc_mp;
2104 struct xfs_rmap_irec ltrec;
2105 struct xfs_rmap_irec gtrec;
2106 int have_gt;
2107 int have_lt;
2108 int error = 0;
2109 int i;
2110 uint64_t owner;
2111 uint64_t offset;
2112 unsigned int flags = 0;
2113
2114 xfs_owner_info_unpack(oinfo, &owner, &offset, &flags);
2115 if (unwritten)
2116 flags |= XFS_RMAP_UNWRITTEN;
2117 trace_xfs_rmap_map(mp, cur->bc_ag.pag->pag_agno, bno, len,
2118 unwritten, oinfo);
2119
2120 /* Is there a left record that abuts our range? */
2121 error = xfs_rmap_find_left_neighbor(cur, bno, owner, offset, flags,
2122 <rec, &have_lt);
2123 if (error)
2124 goto out_error;
2125 if (have_lt &&
2126 !xfs_rmap_is_mergeable(<rec, owner, flags))
2127 have_lt = 0;
2128
2129 /* Is there a right record that abuts our range? */
2130 error = xfs_rmap_lookup_eq(cur, bno + len, len, owner, offset + len,
2131 flags, &have_gt);
2132 if (error)
2133 goto out_error;
2134 if (have_gt) {
2135 error = xfs_rmap_get_rec(cur, >rec, &have_gt);
2136 if (error)
2137 goto out_error;
2138 if (XFS_IS_CORRUPT(mp, have_gt != 1)) {
2139 error = -EFSCORRUPTED;
2140 goto out_error;
2141 }
2142 trace_xfs_rmap_find_right_neighbor_result(cur->bc_mp,
2143 cur->bc_ag.pag->pag_agno, gtrec.rm_startblock,
2144 gtrec.rm_blockcount, gtrec.rm_owner,
2145 gtrec.rm_offset, gtrec.rm_flags);
2146
2147 if (!xfs_rmap_is_mergeable(>rec, owner, flags))
2148 have_gt = 0;
2149 }
2150
2151 if (have_lt &&
2152 ltrec.rm_startblock + ltrec.rm_blockcount == bno &&
2153 ltrec.rm_offset + ltrec.rm_blockcount == offset) {
2154 /*
2155 * Left edge contiguous, merge into left record.
2156 *
2157 * ltbno ltlen
2158 * orig: |ooooooooo|
2159 * adding: |aaaaaaaaa|
2160 * result: |rrrrrrrrrrrrrrrrrrr|
2161 * bno len
2162 */
2163 ltrec.rm_blockcount += len;
2164 if (have_gt &&
2165 bno + len == gtrec.rm_startblock &&
2166 offset + len == gtrec.rm_offset) {
2167 /*
2168 * Right edge also contiguous, delete right record
2169 * and merge into left record.
2170 *
2171 * ltbno ltlen gtbno gtlen
2172 * orig: |ooooooooo| |ooooooooo|
2173 * adding: |aaaaaaaaa|
2174 * result: |rrrrrrrrrrrrrrrrrrrrrrrrrrrrr|
2175 */
2176 ltrec.rm_blockcount += gtrec.rm_blockcount;
2177 error = xfs_rmap_delete(cur, gtrec.rm_startblock,
2178 gtrec.rm_blockcount, gtrec.rm_owner,
2179 gtrec.rm_offset, gtrec.rm_flags);
2180 if (error)
2181 goto out_error;
2182 }
2183
2184 /* Point the cursor back to the left record and update. */
2185 error = xfs_rmap_lookup_eq(cur, ltrec.rm_startblock,
2186 ltrec.rm_blockcount, ltrec.rm_owner,
2187 ltrec.rm_offset, ltrec.rm_flags, &i);
2188 if (error)
2189 goto out_error;
2190 if (XFS_IS_CORRUPT(mp, i != 1)) {
2191 error = -EFSCORRUPTED;
2192 goto out_error;
2193 }
2194
2195 error = xfs_rmap_update(cur, <rec);
2196 if (error)
2197 goto out_error;
2198 } else if (have_gt &&
2199 bno + len == gtrec.rm_startblock &&
2200 offset + len == gtrec.rm_offset) {
2201 /*
2202 * Right edge contiguous, merge into right record.
2203 *
2204 * gtbno gtlen
2205 * Orig: |ooooooooo|
2206 * adding: |aaaaaaaaa|
2207 * Result: |rrrrrrrrrrrrrrrrrrr|
2208 * bno len
2209 */
2210 /* Delete the old record. */
2211 error = xfs_rmap_delete(cur, gtrec.rm_startblock,
2212 gtrec.rm_blockcount, gtrec.rm_owner,
2213 gtrec.rm_offset, gtrec.rm_flags);
2214 if (error)
2215 goto out_error;
2216
2217 /* Move the start and re-add it. */
2218 gtrec.rm_startblock = bno;
2219 gtrec.rm_blockcount += len;
2220 gtrec.rm_offset = offset;
2221 error = xfs_rmap_insert(cur, gtrec.rm_startblock,
2222 gtrec.rm_blockcount, gtrec.rm_owner,
2223 gtrec.rm_offset, gtrec.rm_flags);
2224 if (error)
2225 goto out_error;
2226 } else {
2227 /*
2228 * No contiguous edge with identical owner, insert
2229 * new record at current cursor position.
2230 */
2231 error = xfs_rmap_insert(cur, bno, len, owner, offset, flags);
2232 if (error)
2233 goto out_error;
2234 }
2235
2236 trace_xfs_rmap_map_done(mp, cur->bc_ag.pag->pag_agno, bno, len,
2237 unwritten, oinfo);
2238out_error:
2239 if (error)
2240 trace_xfs_rmap_map_error(cur->bc_mp,
2241 cur->bc_ag.pag->pag_agno, error, _RET_IP_);
2242 return error;
2243}
2244
2245/* Insert a raw rmap into the rmapbt. */
2246int
2247xfs_rmap_map_raw(
2248 struct xfs_btree_cur *cur,
2249 struct xfs_rmap_irec *rmap)
2250{
2251 struct xfs_owner_info oinfo;
2252
2253 oinfo.oi_owner = rmap->rm_owner;
2254 oinfo.oi_offset = rmap->rm_offset;
2255 oinfo.oi_flags = 0;
2256 if (rmap->rm_flags & XFS_RMAP_ATTR_FORK)
2257 oinfo.oi_flags |= XFS_OWNER_INFO_ATTR_FORK;
2258 if (rmap->rm_flags & XFS_RMAP_BMBT_BLOCK)
2259 oinfo.oi_flags |= XFS_OWNER_INFO_BMBT_BLOCK;
2260
2261 if (rmap->rm_flags || XFS_RMAP_NON_INODE_OWNER(rmap->rm_owner))
2262 return xfs_rmap_map(cur, rmap->rm_startblock,
2263 rmap->rm_blockcount,
2264 rmap->rm_flags & XFS_RMAP_UNWRITTEN,
2265 &oinfo);
2266
2267 return xfs_rmap_map_shared(cur, rmap->rm_startblock,
2268 rmap->rm_blockcount,
2269 rmap->rm_flags & XFS_RMAP_UNWRITTEN,
2270 &oinfo);
2271}
2272
2273struct xfs_rmap_query_range_info {
2274 xfs_rmap_query_range_fn fn;
2275 void *priv;
2276};
2277
2278/* Format btree record and pass to our callback. */
2279STATIC int
2280xfs_rmap_query_range_helper(
2281 struct xfs_btree_cur *cur,
2282 union xfs_btree_rec *rec,
2283 void *priv)
2284{
2285 struct xfs_rmap_query_range_info *query = priv;
2286 struct xfs_rmap_irec irec;
2287 int error;
2288
2289 error = xfs_rmap_btrec_to_irec(rec, &irec);
2290 if (error)
2291 return error;
2292 return query->fn(cur, &irec, query->priv);
2293}
2294
2295/* Find all rmaps between two keys. */
2296int
2297xfs_rmap_query_range(
2298 struct xfs_btree_cur *cur,
2299 struct xfs_rmap_irec *low_rec,
2300 struct xfs_rmap_irec *high_rec,
2301 xfs_rmap_query_range_fn fn,
2302 void *priv)
2303{
2304 union xfs_btree_irec low_brec;
2305 union xfs_btree_irec high_brec;
2306 struct xfs_rmap_query_range_info query;
2307
2308 low_brec.r = *low_rec;
2309 high_brec.r = *high_rec;
2310 query.priv = priv;
2311 query.fn = fn;
2312 return xfs_btree_query_range(cur, &low_brec, &high_brec,
2313 xfs_rmap_query_range_helper, &query);
2314}
2315
2316/* Find all rmaps. */
2317int
2318xfs_rmap_query_all(
2319 struct xfs_btree_cur *cur,
2320 xfs_rmap_query_range_fn fn,
2321 void *priv)
2322{
2323 struct xfs_rmap_query_range_info query;
2324
2325 query.priv = priv;
2326 query.fn = fn;
2327 return xfs_btree_query_all(cur, xfs_rmap_query_range_helper, &query);
2328}
2329
2330/* Clean up after calling xfs_rmap_finish_one. */
2331void
2332xfs_rmap_finish_one_cleanup(
2333 struct xfs_trans *tp,
2334 struct xfs_btree_cur *rcur,
2335 int error)
2336{
2337 struct xfs_buf *agbp;
2338
2339 if (rcur == NULL)
2340 return;
2341 agbp = rcur->bc_ag.agbp;
2342 xfs_btree_del_cursor(rcur, error);
2343 if (error)
2344 xfs_trans_brelse(tp, agbp);
2345}
2346
2347/*
2348 * Process one of the deferred rmap operations. We pass back the
2349 * btree cursor to maintain our lock on the rmapbt between calls.
2350 * This saves time and eliminates a buffer deadlock between the
2351 * superblock and the AGF because we'll always grab them in the same
2352 * order.
2353 */
2354int
2355xfs_rmap_finish_one(
2356 struct xfs_trans *tp,
2357 enum xfs_rmap_intent_type type,
2358 uint64_t owner,
2359 int whichfork,
2360 xfs_fileoff_t startoff,
2361 xfs_fsblock_t startblock,
2362 xfs_filblks_t blockcount,
2363 xfs_exntst_t state,
2364 struct xfs_btree_cur **pcur)
2365{
2366 struct xfs_mount *mp = tp->t_mountp;
2367 struct xfs_perag *pag;
2368 struct xfs_btree_cur *rcur;
2369 struct xfs_buf *agbp = NULL;
2370 int error = 0;
2371 struct xfs_owner_info oinfo;
2372 xfs_agblock_t bno;
2373 bool unwritten;
2374
2375 pag = xfs_perag_get(mp, XFS_FSB_TO_AGNO(mp, startblock));
2376 bno = XFS_FSB_TO_AGBNO(mp, startblock);
2377
2378 trace_xfs_rmap_deferred(mp, pag->pag_agno, type, bno, owner, whichfork,
2379 startoff, blockcount, state);
2380
2381 if (XFS_TEST_ERROR(false, mp, XFS_ERRTAG_RMAP_FINISH_ONE)) {
2382 error = -EIO;
2383 goto out_drop;
2384 }
2385
2386
2387 /*
2388 * If we haven't gotten a cursor or the cursor AG doesn't match
2389 * the startblock, get one now.
2390 */
2391 rcur = *pcur;
2392 if (rcur != NULL && rcur->bc_ag.pag != pag) {
2393 xfs_rmap_finish_one_cleanup(tp, rcur, 0);
2394 rcur = NULL;
2395 *pcur = NULL;
2396 }
2397 if (rcur == NULL) {
2398 /*
2399 * Refresh the freelist before we start changing the
2400 * rmapbt, because a shape change could cause us to
2401 * allocate blocks.
2402 */
2403 error = xfs_free_extent_fix_freelist(tp, pag, &agbp);
2404 if (error)
2405 goto out_drop;
2406 if (XFS_IS_CORRUPT(tp->t_mountp, !agbp)) {
2407 error = -EFSCORRUPTED;
2408 goto out_drop;
2409 }
2410
2411 rcur = xfs_rmapbt_init_cursor(mp, tp, agbp, pag);
2412 }
2413 *pcur = rcur;
2414
2415 xfs_rmap_ino_owner(&oinfo, owner, whichfork, startoff);
2416 unwritten = state == XFS_EXT_UNWRITTEN;
2417 bno = XFS_FSB_TO_AGBNO(rcur->bc_mp, startblock);
2418
2419 switch (type) {
2420 case XFS_RMAP_ALLOC:
2421 case XFS_RMAP_MAP:
2422 error = xfs_rmap_map(rcur, bno, blockcount, unwritten, &oinfo);
2423 break;
2424 case XFS_RMAP_MAP_SHARED:
2425 error = xfs_rmap_map_shared(rcur, bno, blockcount, unwritten,
2426 &oinfo);
2427 break;
2428 case XFS_RMAP_FREE:
2429 case XFS_RMAP_UNMAP:
2430 error = xfs_rmap_unmap(rcur, bno, blockcount, unwritten,
2431 &oinfo);
2432 break;
2433 case XFS_RMAP_UNMAP_SHARED:
2434 error = xfs_rmap_unmap_shared(rcur, bno, blockcount, unwritten,
2435 &oinfo);
2436 break;
2437 case XFS_RMAP_CONVERT:
2438 error = xfs_rmap_convert(rcur, bno, blockcount, !unwritten,
2439 &oinfo);
2440 break;
2441 case XFS_RMAP_CONVERT_SHARED:
2442 error = xfs_rmap_convert_shared(rcur, bno, blockcount,
2443 !unwritten, &oinfo);
2444 break;
2445 default:
2446 ASSERT(0);
2447 error = -EFSCORRUPTED;
2448 }
2449out_drop:
2450 xfs_perag_put(pag);
2451 return error;
2452}
2453
2454/*
2455 * Don't defer an rmap if we aren't an rmap filesystem.
2456 */
2457static bool
2458xfs_rmap_update_is_needed(
2459 struct xfs_mount *mp,
2460 int whichfork)
2461{
2462 return xfs_sb_version_hasrmapbt(&mp->m_sb) && whichfork != XFS_COW_FORK;
2463}
2464
2465/*
2466 * Record a rmap intent; the list is kept sorted first by AG and then by
2467 * increasing age.
2468 */
2469static void
2470__xfs_rmap_add(
2471 struct xfs_trans *tp,
2472 enum xfs_rmap_intent_type type,
2473 uint64_t owner,
2474 int whichfork,
2475 struct xfs_bmbt_irec *bmap)
2476{
2477 struct xfs_rmap_intent *ri;
2478
2479 trace_xfs_rmap_defer(tp->t_mountp,
2480 XFS_FSB_TO_AGNO(tp->t_mountp, bmap->br_startblock),
2481 type,
2482 XFS_FSB_TO_AGBNO(tp->t_mountp, bmap->br_startblock),
2483 owner, whichfork,
2484 bmap->br_startoff,
2485 bmap->br_blockcount,
2486 bmap->br_state);
2487
2488 ri = kmem_alloc(sizeof(struct xfs_rmap_intent), KM_NOFS);
2489 INIT_LIST_HEAD(&ri->ri_list);
2490 ri->ri_type = type;
2491 ri->ri_owner = owner;
2492 ri->ri_whichfork = whichfork;
2493 ri->ri_bmap = *bmap;
2494
2495 xfs_defer_add(tp, XFS_DEFER_OPS_TYPE_RMAP, &ri->ri_list);
2496}
2497
2498/* Map an extent into a file. */
2499void
2500xfs_rmap_map_extent(
2501 struct xfs_trans *tp,
2502 struct xfs_inode *ip,
2503 int whichfork,
2504 struct xfs_bmbt_irec *PREV)
2505{
2506 enum xfs_rmap_intent_type type = XFS_RMAP_MAP;
2507
2508 if (!xfs_rmap_update_is_needed(tp->t_mountp, whichfork))
2509 return;
2510
2511 if (whichfork != XFS_ATTR_FORK && xfs_is_reflink_inode(ip))
2512 type = XFS_RMAP_MAP_SHARED;
2513
2514 __xfs_rmap_add(tp, type, ip->i_ino, whichfork, PREV);
2515}
2516
2517/* Unmap an extent out of a file. */
2518void
2519xfs_rmap_unmap_extent(
2520 struct xfs_trans *tp,
2521 struct xfs_inode *ip,
2522 int whichfork,
2523 struct xfs_bmbt_irec *PREV)
2524{
2525 enum xfs_rmap_intent_type type = XFS_RMAP_UNMAP;
2526
2527 if (!xfs_rmap_update_is_needed(tp->t_mountp, whichfork))
2528 return;
2529
2530 if (whichfork != XFS_ATTR_FORK && xfs_is_reflink_inode(ip))
2531 type = XFS_RMAP_UNMAP_SHARED;
2532
2533 __xfs_rmap_add(tp, type, ip->i_ino, whichfork, PREV);
2534}
2535
2536/*
2537 * Convert a data fork extent from unwritten to real or vice versa.
2538 *
2539 * Note that tp can be NULL here as no transaction is used for COW fork
2540 * unwritten conversion.
2541 */
2542void
2543xfs_rmap_convert_extent(
2544 struct xfs_mount *mp,
2545 struct xfs_trans *tp,
2546 struct xfs_inode *ip,
2547 int whichfork,
2548 struct xfs_bmbt_irec *PREV)
2549{
2550 enum xfs_rmap_intent_type type = XFS_RMAP_CONVERT;
2551
2552 if (!xfs_rmap_update_is_needed(mp, whichfork))
2553 return;
2554
2555 if (whichfork != XFS_ATTR_FORK && xfs_is_reflink_inode(ip))
2556 type = XFS_RMAP_CONVERT_SHARED;
2557
2558 __xfs_rmap_add(tp, type, ip->i_ino, whichfork, PREV);
2559}
2560
2561/* Schedule the creation of an rmap for non-file data. */
2562void
2563xfs_rmap_alloc_extent(
2564 struct xfs_trans *tp,
2565 xfs_agnumber_t agno,
2566 xfs_agblock_t bno,
2567 xfs_extlen_t len,
2568 uint64_t owner)
2569{
2570 struct xfs_bmbt_irec bmap;
2571
2572 if (!xfs_rmap_update_is_needed(tp->t_mountp, XFS_DATA_FORK))
2573 return;
2574
2575 bmap.br_startblock = XFS_AGB_TO_FSB(tp->t_mountp, agno, bno);
2576 bmap.br_blockcount = len;
2577 bmap.br_startoff = 0;
2578 bmap.br_state = XFS_EXT_NORM;
2579
2580 __xfs_rmap_add(tp, XFS_RMAP_ALLOC, owner, XFS_DATA_FORK, &bmap);
2581}
2582
2583/* Schedule the deletion of an rmap for non-file data. */
2584void
2585xfs_rmap_free_extent(
2586 struct xfs_trans *tp,
2587 xfs_agnumber_t agno,
2588 xfs_agblock_t bno,
2589 xfs_extlen_t len,
2590 uint64_t owner)
2591{
2592 struct xfs_bmbt_irec bmap;
2593
2594 if (!xfs_rmap_update_is_needed(tp->t_mountp, XFS_DATA_FORK))
2595 return;
2596
2597 bmap.br_startblock = XFS_AGB_TO_FSB(tp->t_mountp, agno, bno);
2598 bmap.br_blockcount = len;
2599 bmap.br_startoff = 0;
2600 bmap.br_state = XFS_EXT_NORM;
2601
2602 __xfs_rmap_add(tp, XFS_RMAP_FREE, owner, XFS_DATA_FORK, &bmap);
2603}
2604
2605/* Compare rmap records. Returns -1 if a < b, 1 if a > b, and 0 if equal. */
2606int
2607xfs_rmap_compare(
2608 const struct xfs_rmap_irec *a,
2609 const struct xfs_rmap_irec *b)
2610{
2611 __u64 oa;
2612 __u64 ob;
2613
2614 oa = xfs_rmap_irec_offset_pack(a);
2615 ob = xfs_rmap_irec_offset_pack(b);
2616
2617 if (a->rm_startblock < b->rm_startblock)
2618 return -1;
2619 else if (a->rm_startblock > b->rm_startblock)
2620 return 1;
2621 else if (a->rm_owner < b->rm_owner)
2622 return -1;
2623 else if (a->rm_owner > b->rm_owner)
2624 return 1;
2625 else if (oa < ob)
2626 return -1;
2627 else if (oa > ob)
2628 return 1;
2629 else
2630 return 0;
2631}
2632
2633/* Is there a record covering a given extent? */
2634int
2635xfs_rmap_has_record(
2636 struct xfs_btree_cur *cur,
2637 xfs_agblock_t bno,
2638 xfs_extlen_t len,
2639 bool *exists)
2640{
2641 union xfs_btree_irec low;
2642 union xfs_btree_irec high;
2643
2644 memset(&low, 0, sizeof(low));
2645 low.r.rm_startblock = bno;
2646 memset(&high, 0xFF, sizeof(high));
2647 high.r.rm_startblock = bno + len - 1;
2648
2649 return xfs_btree_has_record(cur, &low, &high, exists);
2650}
2651
2652/*
2653 * Is there a record for this owner completely covering a given physical
2654 * extent? If so, *has_rmap will be set to true. If there is no record
2655 * or the record only covers part of the range, we set *has_rmap to false.
2656 * This function doesn't perform range lookups or offset checks, so it is
2657 * not suitable for checking data fork blocks.
2658 */
2659int
2660xfs_rmap_record_exists(
2661 struct xfs_btree_cur *cur,
2662 xfs_agblock_t bno,
2663 xfs_extlen_t len,
2664 const struct xfs_owner_info *oinfo,
2665 bool *has_rmap)
2666{
2667 uint64_t owner;
2668 uint64_t offset;
2669 unsigned int flags;
2670 int has_record;
2671 struct xfs_rmap_irec irec;
2672 int error;
2673
2674 xfs_owner_info_unpack(oinfo, &owner, &offset, &flags);
2675 ASSERT(XFS_RMAP_NON_INODE_OWNER(owner) ||
2676 (flags & XFS_RMAP_BMBT_BLOCK));
2677
2678 error = xfs_rmap_lookup_le(cur, bno, len, owner, offset, flags,
2679 &has_record);
2680 if (error)
2681 return error;
2682 if (!has_record) {
2683 *has_rmap = false;
2684 return 0;
2685 }
2686
2687 error = xfs_rmap_get_rec(cur, &irec, &has_record);
2688 if (error)
2689 return error;
2690 if (!has_record) {
2691 *has_rmap = false;
2692 return 0;
2693 }
2694
2695 *has_rmap = (irec.rm_owner == owner && irec.rm_startblock <= bno &&
2696 irec.rm_startblock + irec.rm_blockcount >= bno + len);
2697 return 0;
2698}
2699
2700struct xfs_rmap_key_state {
2701 uint64_t owner;
2702 uint64_t offset;
2703 unsigned int flags;
2704};
2705
2706/* For each rmap given, figure out if it doesn't match the key we want. */
2707STATIC int
2708xfs_rmap_has_other_keys_helper(
2709 struct xfs_btree_cur *cur,
2710 struct xfs_rmap_irec *rec,
2711 void *priv)
2712{
2713 struct xfs_rmap_key_state *rks = priv;
2714
2715 if (rks->owner == rec->rm_owner && rks->offset == rec->rm_offset &&
2716 ((rks->flags & rec->rm_flags) & XFS_RMAP_KEY_FLAGS) == rks->flags)
2717 return 0;
2718 return -ECANCELED;
2719}
2720
2721/*
2722 * Given an extent and some owner info, can we find records overlapping
2723 * the extent whose owner info does not match the given owner?
2724 */
2725int
2726xfs_rmap_has_other_keys(
2727 struct xfs_btree_cur *cur,
2728 xfs_agblock_t bno,
2729 xfs_extlen_t len,
2730 const struct xfs_owner_info *oinfo,
2731 bool *has_rmap)
2732{
2733 struct xfs_rmap_irec low = {0};
2734 struct xfs_rmap_irec high;
2735 struct xfs_rmap_key_state rks;
2736 int error;
2737
2738 xfs_owner_info_unpack(oinfo, &rks.owner, &rks.offset, &rks.flags);
2739 *has_rmap = false;
2740
2741 low.rm_startblock = bno;
2742 memset(&high, 0xFF, sizeof(high));
2743 high.rm_startblock = bno + len - 1;
2744
2745 error = xfs_rmap_query_range(cur, &low, &high,
2746 xfs_rmap_has_other_keys_helper, &rks);
2747 if (error == -ECANCELED) {
2748 *has_rmap = true;
2749 return 0;
2750 }
2751
2752 return error;
2753}
2754
2755const struct xfs_owner_info XFS_RMAP_OINFO_SKIP_UPDATE = {
2756 .oi_owner = XFS_RMAP_OWN_NULL,
2757};
2758const struct xfs_owner_info XFS_RMAP_OINFO_ANY_OWNER = {
2759 .oi_owner = XFS_RMAP_OWN_UNKNOWN,
2760};
2761const struct xfs_owner_info XFS_RMAP_OINFO_FS = {
2762 .oi_owner = XFS_RMAP_OWN_FS,
2763};
2764const struct xfs_owner_info XFS_RMAP_OINFO_LOG = {
2765 .oi_owner = XFS_RMAP_OWN_LOG,
2766};
2767const struct xfs_owner_info XFS_RMAP_OINFO_AG = {
2768 .oi_owner = XFS_RMAP_OWN_AG,
2769};
2770const struct xfs_owner_info XFS_RMAP_OINFO_INOBT = {
2771 .oi_owner = XFS_RMAP_OWN_INOBT,
2772};
2773const struct xfs_owner_info XFS_RMAP_OINFO_INODES = {
2774 .oi_owner = XFS_RMAP_OWN_INODES,
2775};
2776const struct xfs_owner_info XFS_RMAP_OINFO_REFC = {
2777 .oi_owner = XFS_RMAP_OWN_REFC,
2778};
2779const struct xfs_owner_info XFS_RMAP_OINFO_COW = {
2780 .oi_owner = XFS_RMAP_OWN_COW,
2781};
1// SPDX-License-Identifier: GPL-2.0
2/*
3 * Copyright (c) 2014 Red Hat, Inc.
4 * All Rights Reserved.
5 */
6#include "xfs.h"
7#include "xfs_fs.h"
8#include "xfs_shared.h"
9#include "xfs_format.h"
10#include "xfs_log_format.h"
11#include "xfs_trans_resv.h"
12#include "xfs_bit.h"
13#include "xfs_mount.h"
14#include "xfs_sb.h"
15#include "xfs_defer.h"
16#include "xfs_btree.h"
17#include "xfs_trans.h"
18#include "xfs_alloc.h"
19#include "xfs_rmap.h"
20#include "xfs_rmap_btree.h"
21#include "xfs_trace.h"
22#include "xfs_errortag.h"
23#include "xfs_error.h"
24#include "xfs_inode.h"
25#include "xfs_ag.h"
26
27struct kmem_cache *xfs_rmap_intent_cache;
28
29/*
30 * Lookup the first record less than or equal to [bno, len, owner, offset]
31 * in the btree given by cur.
32 */
33int
34xfs_rmap_lookup_le(
35 struct xfs_btree_cur *cur,
36 xfs_agblock_t bno,
37 uint64_t owner,
38 uint64_t offset,
39 unsigned int flags,
40 struct xfs_rmap_irec *irec,
41 int *stat)
42{
43 int get_stat = 0;
44 int error;
45
46 cur->bc_rec.r.rm_startblock = bno;
47 cur->bc_rec.r.rm_blockcount = 0;
48 cur->bc_rec.r.rm_owner = owner;
49 cur->bc_rec.r.rm_offset = offset;
50 cur->bc_rec.r.rm_flags = flags;
51
52 error = xfs_btree_lookup(cur, XFS_LOOKUP_LE, stat);
53 if (error || !(*stat) || !irec)
54 return error;
55
56 error = xfs_rmap_get_rec(cur, irec, &get_stat);
57 if (error)
58 return error;
59 if (!get_stat)
60 return -EFSCORRUPTED;
61
62 return 0;
63}
64
65/*
66 * Lookup the record exactly matching [bno, len, owner, offset]
67 * in the btree given by cur.
68 */
69int
70xfs_rmap_lookup_eq(
71 struct xfs_btree_cur *cur,
72 xfs_agblock_t bno,
73 xfs_extlen_t len,
74 uint64_t owner,
75 uint64_t offset,
76 unsigned int flags,
77 int *stat)
78{
79 cur->bc_rec.r.rm_startblock = bno;
80 cur->bc_rec.r.rm_blockcount = len;
81 cur->bc_rec.r.rm_owner = owner;
82 cur->bc_rec.r.rm_offset = offset;
83 cur->bc_rec.r.rm_flags = flags;
84 return xfs_btree_lookup(cur, XFS_LOOKUP_EQ, stat);
85}
86
87/*
88 * Update the record referred to by cur to the value given
89 * by [bno, len, owner, offset].
90 * This either works (return 0) or gets an EFSCORRUPTED error.
91 */
92STATIC int
93xfs_rmap_update(
94 struct xfs_btree_cur *cur,
95 struct xfs_rmap_irec *irec)
96{
97 union xfs_btree_rec rec;
98 int error;
99
100 trace_xfs_rmap_update(cur->bc_mp, cur->bc_ag.pag->pag_agno,
101 irec->rm_startblock, irec->rm_blockcount,
102 irec->rm_owner, irec->rm_offset, irec->rm_flags);
103
104 rec.rmap.rm_startblock = cpu_to_be32(irec->rm_startblock);
105 rec.rmap.rm_blockcount = cpu_to_be32(irec->rm_blockcount);
106 rec.rmap.rm_owner = cpu_to_be64(irec->rm_owner);
107 rec.rmap.rm_offset = cpu_to_be64(
108 xfs_rmap_irec_offset_pack(irec));
109 error = xfs_btree_update(cur, &rec);
110 if (error)
111 trace_xfs_rmap_update_error(cur->bc_mp,
112 cur->bc_ag.pag->pag_agno, error, _RET_IP_);
113 return error;
114}
115
116int
117xfs_rmap_insert(
118 struct xfs_btree_cur *rcur,
119 xfs_agblock_t agbno,
120 xfs_extlen_t len,
121 uint64_t owner,
122 uint64_t offset,
123 unsigned int flags)
124{
125 int i;
126 int error;
127
128 trace_xfs_rmap_insert(rcur->bc_mp, rcur->bc_ag.pag->pag_agno, agbno,
129 len, owner, offset, flags);
130
131 error = xfs_rmap_lookup_eq(rcur, agbno, len, owner, offset, flags, &i);
132 if (error)
133 goto done;
134 if (XFS_IS_CORRUPT(rcur->bc_mp, i != 0)) {
135 error = -EFSCORRUPTED;
136 goto done;
137 }
138
139 rcur->bc_rec.r.rm_startblock = agbno;
140 rcur->bc_rec.r.rm_blockcount = len;
141 rcur->bc_rec.r.rm_owner = owner;
142 rcur->bc_rec.r.rm_offset = offset;
143 rcur->bc_rec.r.rm_flags = flags;
144 error = xfs_btree_insert(rcur, &i);
145 if (error)
146 goto done;
147 if (XFS_IS_CORRUPT(rcur->bc_mp, i != 1)) {
148 error = -EFSCORRUPTED;
149 goto done;
150 }
151done:
152 if (error)
153 trace_xfs_rmap_insert_error(rcur->bc_mp,
154 rcur->bc_ag.pag->pag_agno, error, _RET_IP_);
155 return error;
156}
157
158STATIC int
159xfs_rmap_delete(
160 struct xfs_btree_cur *rcur,
161 xfs_agblock_t agbno,
162 xfs_extlen_t len,
163 uint64_t owner,
164 uint64_t offset,
165 unsigned int flags)
166{
167 int i;
168 int error;
169
170 trace_xfs_rmap_delete(rcur->bc_mp, rcur->bc_ag.pag->pag_agno, agbno,
171 len, owner, offset, flags);
172
173 error = xfs_rmap_lookup_eq(rcur, agbno, len, owner, offset, flags, &i);
174 if (error)
175 goto done;
176 if (XFS_IS_CORRUPT(rcur->bc_mp, i != 1)) {
177 error = -EFSCORRUPTED;
178 goto done;
179 }
180
181 error = xfs_btree_delete(rcur, &i);
182 if (error)
183 goto done;
184 if (XFS_IS_CORRUPT(rcur->bc_mp, i != 1)) {
185 error = -EFSCORRUPTED;
186 goto done;
187 }
188done:
189 if (error)
190 trace_xfs_rmap_delete_error(rcur->bc_mp,
191 rcur->bc_ag.pag->pag_agno, error, _RET_IP_);
192 return error;
193}
194
195/* Convert an internal btree record to an rmap record. */
196int
197xfs_rmap_btrec_to_irec(
198 const union xfs_btree_rec *rec,
199 struct xfs_rmap_irec *irec)
200{
201 irec->rm_startblock = be32_to_cpu(rec->rmap.rm_startblock);
202 irec->rm_blockcount = be32_to_cpu(rec->rmap.rm_blockcount);
203 irec->rm_owner = be64_to_cpu(rec->rmap.rm_owner);
204 return xfs_rmap_irec_offset_unpack(be64_to_cpu(rec->rmap.rm_offset),
205 irec);
206}
207
208/*
209 * Get the data from the pointed-to record.
210 */
211int
212xfs_rmap_get_rec(
213 struct xfs_btree_cur *cur,
214 struct xfs_rmap_irec *irec,
215 int *stat)
216{
217 struct xfs_mount *mp = cur->bc_mp;
218 struct xfs_perag *pag = cur->bc_ag.pag;
219 union xfs_btree_rec *rec;
220 int error;
221
222 error = xfs_btree_get_rec(cur, &rec, stat);
223 if (error || !*stat)
224 return error;
225
226 if (xfs_rmap_btrec_to_irec(rec, irec))
227 goto out_bad_rec;
228
229 if (irec->rm_blockcount == 0)
230 goto out_bad_rec;
231 if (irec->rm_startblock <= XFS_AGFL_BLOCK(mp)) {
232 if (irec->rm_owner != XFS_RMAP_OWN_FS)
233 goto out_bad_rec;
234 if (irec->rm_blockcount != XFS_AGFL_BLOCK(mp) + 1)
235 goto out_bad_rec;
236 } else {
237 /* check for valid extent range, including overflow */
238 if (!xfs_verify_agbext(pag, irec->rm_startblock,
239 irec->rm_blockcount))
240 goto out_bad_rec;
241 }
242
243 if (!(xfs_verify_ino(mp, irec->rm_owner) ||
244 (irec->rm_owner <= XFS_RMAP_OWN_FS &&
245 irec->rm_owner >= XFS_RMAP_OWN_MIN)))
246 goto out_bad_rec;
247
248 return 0;
249out_bad_rec:
250 xfs_warn(mp,
251 "Reverse Mapping BTree record corruption in AG %d detected!",
252 pag->pag_agno);
253 xfs_warn(mp,
254 "Owner 0x%llx, flags 0x%x, start block 0x%x block count 0x%x",
255 irec->rm_owner, irec->rm_flags, irec->rm_startblock,
256 irec->rm_blockcount);
257 return -EFSCORRUPTED;
258}
259
260struct xfs_find_left_neighbor_info {
261 struct xfs_rmap_irec high;
262 struct xfs_rmap_irec *irec;
263};
264
265/* For each rmap given, figure out if it matches the key we want. */
266STATIC int
267xfs_rmap_find_left_neighbor_helper(
268 struct xfs_btree_cur *cur,
269 const struct xfs_rmap_irec *rec,
270 void *priv)
271{
272 struct xfs_find_left_neighbor_info *info = priv;
273
274 trace_xfs_rmap_find_left_neighbor_candidate(cur->bc_mp,
275 cur->bc_ag.pag->pag_agno, rec->rm_startblock,
276 rec->rm_blockcount, rec->rm_owner, rec->rm_offset,
277 rec->rm_flags);
278
279 if (rec->rm_owner != info->high.rm_owner)
280 return 0;
281 if (!XFS_RMAP_NON_INODE_OWNER(rec->rm_owner) &&
282 !(rec->rm_flags & XFS_RMAP_BMBT_BLOCK) &&
283 rec->rm_offset + rec->rm_blockcount - 1 != info->high.rm_offset)
284 return 0;
285
286 *info->irec = *rec;
287 return -ECANCELED;
288}
289
290/*
291 * Find the record to the left of the given extent, being careful only to
292 * return a match with the same owner and adjacent physical and logical
293 * block ranges.
294 */
295STATIC int
296xfs_rmap_find_left_neighbor(
297 struct xfs_btree_cur *cur,
298 xfs_agblock_t bno,
299 uint64_t owner,
300 uint64_t offset,
301 unsigned int flags,
302 struct xfs_rmap_irec *irec,
303 int *stat)
304{
305 struct xfs_find_left_neighbor_info info;
306 int found = 0;
307 int error;
308
309 *stat = 0;
310 if (bno == 0)
311 return 0;
312 info.high.rm_startblock = bno - 1;
313 info.high.rm_owner = owner;
314 if (!XFS_RMAP_NON_INODE_OWNER(owner) &&
315 !(flags & XFS_RMAP_BMBT_BLOCK)) {
316 if (offset == 0)
317 return 0;
318 info.high.rm_offset = offset - 1;
319 } else
320 info.high.rm_offset = 0;
321 info.high.rm_flags = flags;
322 info.high.rm_blockcount = 0;
323 info.irec = irec;
324
325 trace_xfs_rmap_find_left_neighbor_query(cur->bc_mp,
326 cur->bc_ag.pag->pag_agno, bno, 0, owner, offset, flags);
327
328 /*
329 * Historically, we always used the range query to walk every reverse
330 * mapping that could possibly overlap the key that the caller asked
331 * for, and filter out the ones that don't. That is very slow when
332 * there are a lot of records.
333 *
334 * However, there are two scenarios where the classic btree search can
335 * produce correct results -- if the index contains a record that is an
336 * exact match for the lookup key; and if there are no other records
337 * between the record we want and the key we supplied.
338 *
339 * As an optimization, try a non-overlapped lookup first. This makes
340 * extent conversion and remap operations run a bit faster if the
341 * physical extents aren't being shared. If we don't find what we
342 * want, we fall back to the overlapped query.
343 */
344 error = xfs_rmap_lookup_le(cur, bno, owner, offset, flags, irec,
345 &found);
346 if (error)
347 return error;
348 if (found)
349 error = xfs_rmap_find_left_neighbor_helper(cur, irec, &info);
350 if (!error)
351 error = xfs_rmap_query_range(cur, &info.high, &info.high,
352 xfs_rmap_find_left_neighbor_helper, &info);
353 if (error != -ECANCELED)
354 return error;
355
356 *stat = 1;
357 trace_xfs_rmap_find_left_neighbor_result(cur->bc_mp,
358 cur->bc_ag.pag->pag_agno, irec->rm_startblock,
359 irec->rm_blockcount, irec->rm_owner, irec->rm_offset,
360 irec->rm_flags);
361 return 0;
362}
363
364/* For each rmap given, figure out if it matches the key we want. */
365STATIC int
366xfs_rmap_lookup_le_range_helper(
367 struct xfs_btree_cur *cur,
368 const struct xfs_rmap_irec *rec,
369 void *priv)
370{
371 struct xfs_find_left_neighbor_info *info = priv;
372
373 trace_xfs_rmap_lookup_le_range_candidate(cur->bc_mp,
374 cur->bc_ag.pag->pag_agno, rec->rm_startblock,
375 rec->rm_blockcount, rec->rm_owner, rec->rm_offset,
376 rec->rm_flags);
377
378 if (rec->rm_owner != info->high.rm_owner)
379 return 0;
380 if (!XFS_RMAP_NON_INODE_OWNER(rec->rm_owner) &&
381 !(rec->rm_flags & XFS_RMAP_BMBT_BLOCK) &&
382 (rec->rm_offset > info->high.rm_offset ||
383 rec->rm_offset + rec->rm_blockcount <= info->high.rm_offset))
384 return 0;
385
386 *info->irec = *rec;
387 return -ECANCELED;
388}
389
390/*
391 * Find the record to the left of the given extent, being careful only to
392 * return a match with the same owner and overlapping physical and logical
393 * block ranges. This is the overlapping-interval version of
394 * xfs_rmap_lookup_le.
395 */
396int
397xfs_rmap_lookup_le_range(
398 struct xfs_btree_cur *cur,
399 xfs_agblock_t bno,
400 uint64_t owner,
401 uint64_t offset,
402 unsigned int flags,
403 struct xfs_rmap_irec *irec,
404 int *stat)
405{
406 struct xfs_find_left_neighbor_info info;
407 int found = 0;
408 int error;
409
410 info.high.rm_startblock = bno;
411 info.high.rm_owner = owner;
412 if (!XFS_RMAP_NON_INODE_OWNER(owner) && !(flags & XFS_RMAP_BMBT_BLOCK))
413 info.high.rm_offset = offset;
414 else
415 info.high.rm_offset = 0;
416 info.high.rm_flags = flags;
417 info.high.rm_blockcount = 0;
418 *stat = 0;
419 info.irec = irec;
420
421 trace_xfs_rmap_lookup_le_range(cur->bc_mp, cur->bc_ag.pag->pag_agno,
422 bno, 0, owner, offset, flags);
423
424 /*
425 * Historically, we always used the range query to walk every reverse
426 * mapping that could possibly overlap the key that the caller asked
427 * for, and filter out the ones that don't. That is very slow when
428 * there are a lot of records.
429 *
430 * However, there are two scenarios where the classic btree search can
431 * produce correct results -- if the index contains a record that is an
432 * exact match for the lookup key; and if there are no other records
433 * between the record we want and the key we supplied.
434 *
435 * As an optimization, try a non-overlapped lookup first. This makes
436 * scrub run much faster on most filesystems because bmbt records are
437 * usually an exact match for rmap records. If we don't find what we
438 * want, we fall back to the overlapped query.
439 */
440 error = xfs_rmap_lookup_le(cur, bno, owner, offset, flags, irec,
441 &found);
442 if (error)
443 return error;
444 if (found)
445 error = xfs_rmap_lookup_le_range_helper(cur, irec, &info);
446 if (!error)
447 error = xfs_rmap_query_range(cur, &info.high, &info.high,
448 xfs_rmap_lookup_le_range_helper, &info);
449 if (error != -ECANCELED)
450 return error;
451
452 *stat = 1;
453 trace_xfs_rmap_lookup_le_range_result(cur->bc_mp,
454 cur->bc_ag.pag->pag_agno, irec->rm_startblock,
455 irec->rm_blockcount, irec->rm_owner, irec->rm_offset,
456 irec->rm_flags);
457 return 0;
458}
459
460/*
461 * Perform all the relevant owner checks for a removal op. If we're doing an
462 * unknown-owner removal then we have no owner information to check.
463 */
464static int
465xfs_rmap_free_check_owner(
466 struct xfs_mount *mp,
467 uint64_t ltoff,
468 struct xfs_rmap_irec *rec,
469 xfs_filblks_t len,
470 uint64_t owner,
471 uint64_t offset,
472 unsigned int flags)
473{
474 int error = 0;
475
476 if (owner == XFS_RMAP_OWN_UNKNOWN)
477 return 0;
478
479 /* Make sure the unwritten flag matches. */
480 if (XFS_IS_CORRUPT(mp,
481 (flags & XFS_RMAP_UNWRITTEN) !=
482 (rec->rm_flags & XFS_RMAP_UNWRITTEN))) {
483 error = -EFSCORRUPTED;
484 goto out;
485 }
486
487 /* Make sure the owner matches what we expect to find in the tree. */
488 if (XFS_IS_CORRUPT(mp, owner != rec->rm_owner)) {
489 error = -EFSCORRUPTED;
490 goto out;
491 }
492
493 /* Check the offset, if necessary. */
494 if (XFS_RMAP_NON_INODE_OWNER(owner))
495 goto out;
496
497 if (flags & XFS_RMAP_BMBT_BLOCK) {
498 if (XFS_IS_CORRUPT(mp,
499 !(rec->rm_flags & XFS_RMAP_BMBT_BLOCK))) {
500 error = -EFSCORRUPTED;
501 goto out;
502 }
503 } else {
504 if (XFS_IS_CORRUPT(mp, rec->rm_offset > offset)) {
505 error = -EFSCORRUPTED;
506 goto out;
507 }
508 if (XFS_IS_CORRUPT(mp,
509 offset + len > ltoff + rec->rm_blockcount)) {
510 error = -EFSCORRUPTED;
511 goto out;
512 }
513 }
514
515out:
516 return error;
517}
518
519/*
520 * Find the extent in the rmap btree and remove it.
521 *
522 * The record we find should always be an exact match for the extent that we're
523 * looking for, since we insert them into the btree without modification.
524 *
525 * Special Case #1: when growing the filesystem, we "free" an extent when
526 * growing the last AG. This extent is new space and so it is not tracked as
527 * used space in the btree. The growfs code will pass in an owner of
528 * XFS_RMAP_OWN_NULL to indicate that it expected that there is no owner of this
529 * extent. We verify that - the extent lookup result in a record that does not
530 * overlap.
531 *
532 * Special Case #2: EFIs do not record the owner of the extent, so when
533 * recovering EFIs from the log we pass in XFS_RMAP_OWN_UNKNOWN to tell the rmap
534 * btree to ignore the owner (i.e. wildcard match) so we don't trigger
535 * corruption checks during log recovery.
536 */
537STATIC int
538xfs_rmap_unmap(
539 struct xfs_btree_cur *cur,
540 xfs_agblock_t bno,
541 xfs_extlen_t len,
542 bool unwritten,
543 const struct xfs_owner_info *oinfo)
544{
545 struct xfs_mount *mp = cur->bc_mp;
546 struct xfs_rmap_irec ltrec;
547 uint64_t ltoff;
548 int error = 0;
549 int i;
550 uint64_t owner;
551 uint64_t offset;
552 unsigned int flags;
553 bool ignore_off;
554
555 xfs_owner_info_unpack(oinfo, &owner, &offset, &flags);
556 ignore_off = XFS_RMAP_NON_INODE_OWNER(owner) ||
557 (flags & XFS_RMAP_BMBT_BLOCK);
558 if (unwritten)
559 flags |= XFS_RMAP_UNWRITTEN;
560 trace_xfs_rmap_unmap(mp, cur->bc_ag.pag->pag_agno, bno, len,
561 unwritten, oinfo);
562
563 /*
564 * We should always have a left record because there's a static record
565 * for the AG headers at rm_startblock == 0 created by mkfs/growfs that
566 * will not ever be removed from the tree.
567 */
568 error = xfs_rmap_lookup_le(cur, bno, owner, offset, flags, <rec, &i);
569 if (error)
570 goto out_error;
571 if (XFS_IS_CORRUPT(mp, i != 1)) {
572 error = -EFSCORRUPTED;
573 goto out_error;
574 }
575
576 trace_xfs_rmap_lookup_le_range_result(cur->bc_mp,
577 cur->bc_ag.pag->pag_agno, ltrec.rm_startblock,
578 ltrec.rm_blockcount, ltrec.rm_owner,
579 ltrec.rm_offset, ltrec.rm_flags);
580 ltoff = ltrec.rm_offset;
581
582 /*
583 * For growfs, the incoming extent must be beyond the left record we
584 * just found as it is new space and won't be used by anyone. This is
585 * just a corruption check as we don't actually do anything with this
586 * extent. Note that we need to use >= instead of > because it might
587 * be the case that the "left" extent goes all the way to EOFS.
588 */
589 if (owner == XFS_RMAP_OWN_NULL) {
590 if (XFS_IS_CORRUPT(mp,
591 bno <
592 ltrec.rm_startblock + ltrec.rm_blockcount)) {
593 error = -EFSCORRUPTED;
594 goto out_error;
595 }
596 goto out_done;
597 }
598
599 /*
600 * If we're doing an unknown-owner removal for EFI recovery, we expect
601 * to find the full range in the rmapbt or nothing at all. If we
602 * don't find any rmaps overlapping either end of the range, we're
603 * done. Hopefully this means that the EFI creator already queued
604 * (and finished) a RUI to remove the rmap.
605 */
606 if (owner == XFS_RMAP_OWN_UNKNOWN &&
607 ltrec.rm_startblock + ltrec.rm_blockcount <= bno) {
608 struct xfs_rmap_irec rtrec;
609
610 error = xfs_btree_increment(cur, 0, &i);
611 if (error)
612 goto out_error;
613 if (i == 0)
614 goto out_done;
615 error = xfs_rmap_get_rec(cur, &rtrec, &i);
616 if (error)
617 goto out_error;
618 if (XFS_IS_CORRUPT(mp, i != 1)) {
619 error = -EFSCORRUPTED;
620 goto out_error;
621 }
622 if (rtrec.rm_startblock >= bno + len)
623 goto out_done;
624 }
625
626 /* Make sure the extent we found covers the entire freeing range. */
627 if (XFS_IS_CORRUPT(mp,
628 ltrec.rm_startblock > bno ||
629 ltrec.rm_startblock + ltrec.rm_blockcount <
630 bno + len)) {
631 error = -EFSCORRUPTED;
632 goto out_error;
633 }
634
635 /* Check owner information. */
636 error = xfs_rmap_free_check_owner(mp, ltoff, <rec, len, owner,
637 offset, flags);
638 if (error)
639 goto out_error;
640
641 if (ltrec.rm_startblock == bno && ltrec.rm_blockcount == len) {
642 /* exact match, simply remove the record from rmap tree */
643 trace_xfs_rmap_delete(mp, cur->bc_ag.pag->pag_agno,
644 ltrec.rm_startblock, ltrec.rm_blockcount,
645 ltrec.rm_owner, ltrec.rm_offset,
646 ltrec.rm_flags);
647 error = xfs_btree_delete(cur, &i);
648 if (error)
649 goto out_error;
650 if (XFS_IS_CORRUPT(mp, i != 1)) {
651 error = -EFSCORRUPTED;
652 goto out_error;
653 }
654 } else if (ltrec.rm_startblock == bno) {
655 /*
656 * overlap left hand side of extent: move the start, trim the
657 * length and update the current record.
658 *
659 * ltbno ltlen
660 * Orig: |oooooooooooooooooooo|
661 * Freeing: |fffffffff|
662 * Result: |rrrrrrrrrr|
663 * bno len
664 */
665 ltrec.rm_startblock += len;
666 ltrec.rm_blockcount -= len;
667 if (!ignore_off)
668 ltrec.rm_offset += len;
669 error = xfs_rmap_update(cur, <rec);
670 if (error)
671 goto out_error;
672 } else if (ltrec.rm_startblock + ltrec.rm_blockcount == bno + len) {
673 /*
674 * overlap right hand side of extent: trim the length and update
675 * the current record.
676 *
677 * ltbno ltlen
678 * Orig: |oooooooooooooooooooo|
679 * Freeing: |fffffffff|
680 * Result: |rrrrrrrrrr|
681 * bno len
682 */
683 ltrec.rm_blockcount -= len;
684 error = xfs_rmap_update(cur, <rec);
685 if (error)
686 goto out_error;
687 } else {
688
689 /*
690 * overlap middle of extent: trim the length of the existing
691 * record to the length of the new left-extent size, increment
692 * the insertion position so we can insert a new record
693 * containing the remaining right-extent space.
694 *
695 * ltbno ltlen
696 * Orig: |oooooooooooooooooooo|
697 * Freeing: |fffffffff|
698 * Result: |rrrrr| |rrrr|
699 * bno len
700 */
701 xfs_extlen_t orig_len = ltrec.rm_blockcount;
702
703 ltrec.rm_blockcount = bno - ltrec.rm_startblock;
704 error = xfs_rmap_update(cur, <rec);
705 if (error)
706 goto out_error;
707
708 error = xfs_btree_increment(cur, 0, &i);
709 if (error)
710 goto out_error;
711
712 cur->bc_rec.r.rm_startblock = bno + len;
713 cur->bc_rec.r.rm_blockcount = orig_len - len -
714 ltrec.rm_blockcount;
715 cur->bc_rec.r.rm_owner = ltrec.rm_owner;
716 if (ignore_off)
717 cur->bc_rec.r.rm_offset = 0;
718 else
719 cur->bc_rec.r.rm_offset = offset + len;
720 cur->bc_rec.r.rm_flags = flags;
721 trace_xfs_rmap_insert(mp, cur->bc_ag.pag->pag_agno,
722 cur->bc_rec.r.rm_startblock,
723 cur->bc_rec.r.rm_blockcount,
724 cur->bc_rec.r.rm_owner,
725 cur->bc_rec.r.rm_offset,
726 cur->bc_rec.r.rm_flags);
727 error = xfs_btree_insert(cur, &i);
728 if (error)
729 goto out_error;
730 }
731
732out_done:
733 trace_xfs_rmap_unmap_done(mp, cur->bc_ag.pag->pag_agno, bno, len,
734 unwritten, oinfo);
735out_error:
736 if (error)
737 trace_xfs_rmap_unmap_error(mp, cur->bc_ag.pag->pag_agno,
738 error, _RET_IP_);
739 return error;
740}
741
742/*
743 * Remove a reference to an extent in the rmap btree.
744 */
745int
746xfs_rmap_free(
747 struct xfs_trans *tp,
748 struct xfs_buf *agbp,
749 struct xfs_perag *pag,
750 xfs_agblock_t bno,
751 xfs_extlen_t len,
752 const struct xfs_owner_info *oinfo)
753{
754 struct xfs_mount *mp = tp->t_mountp;
755 struct xfs_btree_cur *cur;
756 int error;
757
758 if (!xfs_has_rmapbt(mp))
759 return 0;
760
761 cur = xfs_rmapbt_init_cursor(mp, tp, agbp, pag);
762
763 error = xfs_rmap_unmap(cur, bno, len, false, oinfo);
764
765 xfs_btree_del_cursor(cur, error);
766 return error;
767}
768
769/*
770 * A mergeable rmap must have the same owner and the same values for
771 * the unwritten, attr_fork, and bmbt flags. The startblock and
772 * offset are checked separately.
773 */
774static bool
775xfs_rmap_is_mergeable(
776 struct xfs_rmap_irec *irec,
777 uint64_t owner,
778 unsigned int flags)
779{
780 if (irec->rm_owner == XFS_RMAP_OWN_NULL)
781 return false;
782 if (irec->rm_owner != owner)
783 return false;
784 if ((flags & XFS_RMAP_UNWRITTEN) ^
785 (irec->rm_flags & XFS_RMAP_UNWRITTEN))
786 return false;
787 if ((flags & XFS_RMAP_ATTR_FORK) ^
788 (irec->rm_flags & XFS_RMAP_ATTR_FORK))
789 return false;
790 if ((flags & XFS_RMAP_BMBT_BLOCK) ^
791 (irec->rm_flags & XFS_RMAP_BMBT_BLOCK))
792 return false;
793 return true;
794}
795
796/*
797 * When we allocate a new block, the first thing we do is add a reference to
798 * the extent in the rmap btree. This takes the form of a [agbno, length,
799 * owner, offset] record. Flags are encoded in the high bits of the offset
800 * field.
801 */
802STATIC int
803xfs_rmap_map(
804 struct xfs_btree_cur *cur,
805 xfs_agblock_t bno,
806 xfs_extlen_t len,
807 bool unwritten,
808 const struct xfs_owner_info *oinfo)
809{
810 struct xfs_mount *mp = cur->bc_mp;
811 struct xfs_rmap_irec ltrec;
812 struct xfs_rmap_irec gtrec;
813 int have_gt;
814 int have_lt;
815 int error = 0;
816 int i;
817 uint64_t owner;
818 uint64_t offset;
819 unsigned int flags = 0;
820 bool ignore_off;
821
822 xfs_owner_info_unpack(oinfo, &owner, &offset, &flags);
823 ASSERT(owner != 0);
824 ignore_off = XFS_RMAP_NON_INODE_OWNER(owner) ||
825 (flags & XFS_RMAP_BMBT_BLOCK);
826 if (unwritten)
827 flags |= XFS_RMAP_UNWRITTEN;
828 trace_xfs_rmap_map(mp, cur->bc_ag.pag->pag_agno, bno, len,
829 unwritten, oinfo);
830 ASSERT(!xfs_rmap_should_skip_owner_update(oinfo));
831
832 /*
833 * For the initial lookup, look for an exact match or the left-adjacent
834 * record for our insertion point. This will also give us the record for
835 * start block contiguity tests.
836 */
837 error = xfs_rmap_lookup_le(cur, bno, owner, offset, flags, <rec,
838 &have_lt);
839 if (error)
840 goto out_error;
841 if (have_lt) {
842 trace_xfs_rmap_lookup_le_range_result(cur->bc_mp,
843 cur->bc_ag.pag->pag_agno, ltrec.rm_startblock,
844 ltrec.rm_blockcount, ltrec.rm_owner,
845 ltrec.rm_offset, ltrec.rm_flags);
846
847 if (!xfs_rmap_is_mergeable(<rec, owner, flags))
848 have_lt = 0;
849 }
850
851 if (XFS_IS_CORRUPT(mp,
852 have_lt != 0 &&
853 ltrec.rm_startblock + ltrec.rm_blockcount > bno)) {
854 error = -EFSCORRUPTED;
855 goto out_error;
856 }
857
858 /*
859 * Increment the cursor to see if we have a right-adjacent record to our
860 * insertion point. This will give us the record for end block
861 * contiguity tests.
862 */
863 error = xfs_btree_increment(cur, 0, &have_gt);
864 if (error)
865 goto out_error;
866 if (have_gt) {
867 error = xfs_rmap_get_rec(cur, >rec, &have_gt);
868 if (error)
869 goto out_error;
870 if (XFS_IS_CORRUPT(mp, have_gt != 1)) {
871 error = -EFSCORRUPTED;
872 goto out_error;
873 }
874 if (XFS_IS_CORRUPT(mp, bno + len > gtrec.rm_startblock)) {
875 error = -EFSCORRUPTED;
876 goto out_error;
877 }
878 trace_xfs_rmap_find_right_neighbor_result(cur->bc_mp,
879 cur->bc_ag.pag->pag_agno, gtrec.rm_startblock,
880 gtrec.rm_blockcount, gtrec.rm_owner,
881 gtrec.rm_offset, gtrec.rm_flags);
882 if (!xfs_rmap_is_mergeable(>rec, owner, flags))
883 have_gt = 0;
884 }
885
886 /*
887 * Note: cursor currently points one record to the right of ltrec, even
888 * if there is no record in the tree to the right.
889 */
890 if (have_lt &&
891 ltrec.rm_startblock + ltrec.rm_blockcount == bno &&
892 (ignore_off || ltrec.rm_offset + ltrec.rm_blockcount == offset)) {
893 /*
894 * left edge contiguous, merge into left record.
895 *
896 * ltbno ltlen
897 * orig: |ooooooooo|
898 * adding: |aaaaaaaaa|
899 * result: |rrrrrrrrrrrrrrrrrrr|
900 * bno len
901 */
902 ltrec.rm_blockcount += len;
903 if (have_gt &&
904 bno + len == gtrec.rm_startblock &&
905 (ignore_off || offset + len == gtrec.rm_offset) &&
906 (unsigned long)ltrec.rm_blockcount + len +
907 gtrec.rm_blockcount <= XFS_RMAP_LEN_MAX) {
908 /*
909 * right edge also contiguous, delete right record
910 * and merge into left record.
911 *
912 * ltbno ltlen gtbno gtlen
913 * orig: |ooooooooo| |ooooooooo|
914 * adding: |aaaaaaaaa|
915 * result: |rrrrrrrrrrrrrrrrrrrrrrrrrrrrr|
916 */
917 ltrec.rm_blockcount += gtrec.rm_blockcount;
918 trace_xfs_rmap_delete(mp, cur->bc_ag.pag->pag_agno,
919 gtrec.rm_startblock,
920 gtrec.rm_blockcount,
921 gtrec.rm_owner,
922 gtrec.rm_offset,
923 gtrec.rm_flags);
924 error = xfs_btree_delete(cur, &i);
925 if (error)
926 goto out_error;
927 if (XFS_IS_CORRUPT(mp, i != 1)) {
928 error = -EFSCORRUPTED;
929 goto out_error;
930 }
931 }
932
933 /* point the cursor back to the left record and update */
934 error = xfs_btree_decrement(cur, 0, &have_gt);
935 if (error)
936 goto out_error;
937 error = xfs_rmap_update(cur, <rec);
938 if (error)
939 goto out_error;
940 } else if (have_gt &&
941 bno + len == gtrec.rm_startblock &&
942 (ignore_off || offset + len == gtrec.rm_offset)) {
943 /*
944 * right edge contiguous, merge into right record.
945 *
946 * gtbno gtlen
947 * Orig: |ooooooooo|
948 * adding: |aaaaaaaaa|
949 * Result: |rrrrrrrrrrrrrrrrrrr|
950 * bno len
951 */
952 gtrec.rm_startblock = bno;
953 gtrec.rm_blockcount += len;
954 if (!ignore_off)
955 gtrec.rm_offset = offset;
956 error = xfs_rmap_update(cur, >rec);
957 if (error)
958 goto out_error;
959 } else {
960 /*
961 * no contiguous edge with identical owner, insert
962 * new record at current cursor position.
963 */
964 cur->bc_rec.r.rm_startblock = bno;
965 cur->bc_rec.r.rm_blockcount = len;
966 cur->bc_rec.r.rm_owner = owner;
967 cur->bc_rec.r.rm_offset = offset;
968 cur->bc_rec.r.rm_flags = flags;
969 trace_xfs_rmap_insert(mp, cur->bc_ag.pag->pag_agno, bno, len,
970 owner, offset, flags);
971 error = xfs_btree_insert(cur, &i);
972 if (error)
973 goto out_error;
974 if (XFS_IS_CORRUPT(mp, i != 1)) {
975 error = -EFSCORRUPTED;
976 goto out_error;
977 }
978 }
979
980 trace_xfs_rmap_map_done(mp, cur->bc_ag.pag->pag_agno, bno, len,
981 unwritten, oinfo);
982out_error:
983 if (error)
984 trace_xfs_rmap_map_error(mp, cur->bc_ag.pag->pag_agno,
985 error, _RET_IP_);
986 return error;
987}
988
989/*
990 * Add a reference to an extent in the rmap btree.
991 */
992int
993xfs_rmap_alloc(
994 struct xfs_trans *tp,
995 struct xfs_buf *agbp,
996 struct xfs_perag *pag,
997 xfs_agblock_t bno,
998 xfs_extlen_t len,
999 const struct xfs_owner_info *oinfo)
1000{
1001 struct xfs_mount *mp = tp->t_mountp;
1002 struct xfs_btree_cur *cur;
1003 int error;
1004
1005 if (!xfs_has_rmapbt(mp))
1006 return 0;
1007
1008 cur = xfs_rmapbt_init_cursor(mp, tp, agbp, pag);
1009 error = xfs_rmap_map(cur, bno, len, false, oinfo);
1010
1011 xfs_btree_del_cursor(cur, error);
1012 return error;
1013}
1014
1015#define RMAP_LEFT_CONTIG (1 << 0)
1016#define RMAP_RIGHT_CONTIG (1 << 1)
1017#define RMAP_LEFT_FILLING (1 << 2)
1018#define RMAP_RIGHT_FILLING (1 << 3)
1019#define RMAP_LEFT_VALID (1 << 6)
1020#define RMAP_RIGHT_VALID (1 << 7)
1021
1022#define LEFT r[0]
1023#define RIGHT r[1]
1024#define PREV r[2]
1025#define NEW r[3]
1026
1027/*
1028 * Convert an unwritten extent to a real extent or vice versa.
1029 * Does not handle overlapping extents.
1030 */
1031STATIC int
1032xfs_rmap_convert(
1033 struct xfs_btree_cur *cur,
1034 xfs_agblock_t bno,
1035 xfs_extlen_t len,
1036 bool unwritten,
1037 const struct xfs_owner_info *oinfo)
1038{
1039 struct xfs_mount *mp = cur->bc_mp;
1040 struct xfs_rmap_irec r[4]; /* neighbor extent entries */
1041 /* left is 0, right is 1, */
1042 /* prev is 2, new is 3 */
1043 uint64_t owner;
1044 uint64_t offset;
1045 uint64_t new_endoff;
1046 unsigned int oldext;
1047 unsigned int newext;
1048 unsigned int flags = 0;
1049 int i;
1050 int state = 0;
1051 int error;
1052
1053 xfs_owner_info_unpack(oinfo, &owner, &offset, &flags);
1054 ASSERT(!(XFS_RMAP_NON_INODE_OWNER(owner) ||
1055 (flags & (XFS_RMAP_ATTR_FORK | XFS_RMAP_BMBT_BLOCK))));
1056 oldext = unwritten ? XFS_RMAP_UNWRITTEN : 0;
1057 new_endoff = offset + len;
1058 trace_xfs_rmap_convert(mp, cur->bc_ag.pag->pag_agno, bno, len,
1059 unwritten, oinfo);
1060
1061 /*
1062 * For the initial lookup, look for an exact match or the left-adjacent
1063 * record for our insertion point. This will also give us the record for
1064 * start block contiguity tests.
1065 */
1066 error = xfs_rmap_lookup_le(cur, bno, owner, offset, oldext, &PREV, &i);
1067 if (error)
1068 goto done;
1069 if (XFS_IS_CORRUPT(mp, i != 1)) {
1070 error = -EFSCORRUPTED;
1071 goto done;
1072 }
1073
1074 trace_xfs_rmap_lookup_le_range_result(cur->bc_mp,
1075 cur->bc_ag.pag->pag_agno, PREV.rm_startblock,
1076 PREV.rm_blockcount, PREV.rm_owner,
1077 PREV.rm_offset, PREV.rm_flags);
1078
1079 ASSERT(PREV.rm_offset <= offset);
1080 ASSERT(PREV.rm_offset + PREV.rm_blockcount >= new_endoff);
1081 ASSERT((PREV.rm_flags & XFS_RMAP_UNWRITTEN) == oldext);
1082 newext = ~oldext & XFS_RMAP_UNWRITTEN;
1083
1084 /*
1085 * Set flags determining what part of the previous oldext allocation
1086 * extent is being replaced by a newext allocation.
1087 */
1088 if (PREV.rm_offset == offset)
1089 state |= RMAP_LEFT_FILLING;
1090 if (PREV.rm_offset + PREV.rm_blockcount == new_endoff)
1091 state |= RMAP_RIGHT_FILLING;
1092
1093 /*
1094 * Decrement the cursor to see if we have a left-adjacent record to our
1095 * insertion point. This will give us the record for end block
1096 * contiguity tests.
1097 */
1098 error = xfs_btree_decrement(cur, 0, &i);
1099 if (error)
1100 goto done;
1101 if (i) {
1102 state |= RMAP_LEFT_VALID;
1103 error = xfs_rmap_get_rec(cur, &LEFT, &i);
1104 if (error)
1105 goto done;
1106 if (XFS_IS_CORRUPT(mp, i != 1)) {
1107 error = -EFSCORRUPTED;
1108 goto done;
1109 }
1110 if (XFS_IS_CORRUPT(mp,
1111 LEFT.rm_startblock + LEFT.rm_blockcount >
1112 bno)) {
1113 error = -EFSCORRUPTED;
1114 goto done;
1115 }
1116 trace_xfs_rmap_find_left_neighbor_result(cur->bc_mp,
1117 cur->bc_ag.pag->pag_agno, LEFT.rm_startblock,
1118 LEFT.rm_blockcount, LEFT.rm_owner,
1119 LEFT.rm_offset, LEFT.rm_flags);
1120 if (LEFT.rm_startblock + LEFT.rm_blockcount == bno &&
1121 LEFT.rm_offset + LEFT.rm_blockcount == offset &&
1122 xfs_rmap_is_mergeable(&LEFT, owner, newext))
1123 state |= RMAP_LEFT_CONTIG;
1124 }
1125
1126 /*
1127 * Increment the cursor to see if we have a right-adjacent record to our
1128 * insertion point. This will give us the record for end block
1129 * contiguity tests.
1130 */
1131 error = xfs_btree_increment(cur, 0, &i);
1132 if (error)
1133 goto done;
1134 if (XFS_IS_CORRUPT(mp, i != 1)) {
1135 error = -EFSCORRUPTED;
1136 goto done;
1137 }
1138 error = xfs_btree_increment(cur, 0, &i);
1139 if (error)
1140 goto done;
1141 if (i) {
1142 state |= RMAP_RIGHT_VALID;
1143 error = xfs_rmap_get_rec(cur, &RIGHT, &i);
1144 if (error)
1145 goto done;
1146 if (XFS_IS_CORRUPT(mp, i != 1)) {
1147 error = -EFSCORRUPTED;
1148 goto done;
1149 }
1150 if (XFS_IS_CORRUPT(mp, bno + len > RIGHT.rm_startblock)) {
1151 error = -EFSCORRUPTED;
1152 goto done;
1153 }
1154 trace_xfs_rmap_find_right_neighbor_result(cur->bc_mp,
1155 cur->bc_ag.pag->pag_agno, RIGHT.rm_startblock,
1156 RIGHT.rm_blockcount, RIGHT.rm_owner,
1157 RIGHT.rm_offset, RIGHT.rm_flags);
1158 if (bno + len == RIGHT.rm_startblock &&
1159 offset + len == RIGHT.rm_offset &&
1160 xfs_rmap_is_mergeable(&RIGHT, owner, newext))
1161 state |= RMAP_RIGHT_CONTIG;
1162 }
1163
1164 /* check that left + prev + right is not too long */
1165 if ((state & (RMAP_LEFT_FILLING | RMAP_LEFT_CONTIG |
1166 RMAP_RIGHT_FILLING | RMAP_RIGHT_CONTIG)) ==
1167 (RMAP_LEFT_FILLING | RMAP_LEFT_CONTIG |
1168 RMAP_RIGHT_FILLING | RMAP_RIGHT_CONTIG) &&
1169 (unsigned long)LEFT.rm_blockcount + len +
1170 RIGHT.rm_blockcount > XFS_RMAP_LEN_MAX)
1171 state &= ~RMAP_RIGHT_CONTIG;
1172
1173 trace_xfs_rmap_convert_state(mp, cur->bc_ag.pag->pag_agno, state,
1174 _RET_IP_);
1175
1176 /* reset the cursor back to PREV */
1177 error = xfs_rmap_lookup_le(cur, bno, owner, offset, oldext, NULL, &i);
1178 if (error)
1179 goto done;
1180 if (XFS_IS_CORRUPT(mp, i != 1)) {
1181 error = -EFSCORRUPTED;
1182 goto done;
1183 }
1184
1185 /*
1186 * Switch out based on the FILLING and CONTIG state bits.
1187 */
1188 switch (state & (RMAP_LEFT_FILLING | RMAP_LEFT_CONTIG |
1189 RMAP_RIGHT_FILLING | RMAP_RIGHT_CONTIG)) {
1190 case RMAP_LEFT_FILLING | RMAP_LEFT_CONTIG |
1191 RMAP_RIGHT_FILLING | RMAP_RIGHT_CONTIG:
1192 /*
1193 * Setting all of a previous oldext extent to newext.
1194 * The left and right neighbors are both contiguous with new.
1195 */
1196 error = xfs_btree_increment(cur, 0, &i);
1197 if (error)
1198 goto done;
1199 if (XFS_IS_CORRUPT(mp, i != 1)) {
1200 error = -EFSCORRUPTED;
1201 goto done;
1202 }
1203 trace_xfs_rmap_delete(mp, cur->bc_ag.pag->pag_agno,
1204 RIGHT.rm_startblock, RIGHT.rm_blockcount,
1205 RIGHT.rm_owner, RIGHT.rm_offset,
1206 RIGHT.rm_flags);
1207 error = xfs_btree_delete(cur, &i);
1208 if (error)
1209 goto done;
1210 if (XFS_IS_CORRUPT(mp, i != 1)) {
1211 error = -EFSCORRUPTED;
1212 goto done;
1213 }
1214 error = xfs_btree_decrement(cur, 0, &i);
1215 if (error)
1216 goto done;
1217 if (XFS_IS_CORRUPT(mp, i != 1)) {
1218 error = -EFSCORRUPTED;
1219 goto done;
1220 }
1221 trace_xfs_rmap_delete(mp, cur->bc_ag.pag->pag_agno,
1222 PREV.rm_startblock, PREV.rm_blockcount,
1223 PREV.rm_owner, PREV.rm_offset,
1224 PREV.rm_flags);
1225 error = xfs_btree_delete(cur, &i);
1226 if (error)
1227 goto done;
1228 if (XFS_IS_CORRUPT(mp, i != 1)) {
1229 error = -EFSCORRUPTED;
1230 goto done;
1231 }
1232 error = xfs_btree_decrement(cur, 0, &i);
1233 if (error)
1234 goto done;
1235 if (XFS_IS_CORRUPT(mp, i != 1)) {
1236 error = -EFSCORRUPTED;
1237 goto done;
1238 }
1239 NEW = LEFT;
1240 NEW.rm_blockcount += PREV.rm_blockcount + RIGHT.rm_blockcount;
1241 error = xfs_rmap_update(cur, &NEW);
1242 if (error)
1243 goto done;
1244 break;
1245
1246 case RMAP_LEFT_FILLING | RMAP_RIGHT_FILLING | RMAP_LEFT_CONTIG:
1247 /*
1248 * Setting all of a previous oldext extent to newext.
1249 * The left neighbor is contiguous, the right is not.
1250 */
1251 trace_xfs_rmap_delete(mp, cur->bc_ag.pag->pag_agno,
1252 PREV.rm_startblock, PREV.rm_blockcount,
1253 PREV.rm_owner, PREV.rm_offset,
1254 PREV.rm_flags);
1255 error = xfs_btree_delete(cur, &i);
1256 if (error)
1257 goto done;
1258 if (XFS_IS_CORRUPT(mp, i != 1)) {
1259 error = -EFSCORRUPTED;
1260 goto done;
1261 }
1262 error = xfs_btree_decrement(cur, 0, &i);
1263 if (error)
1264 goto done;
1265 if (XFS_IS_CORRUPT(mp, i != 1)) {
1266 error = -EFSCORRUPTED;
1267 goto done;
1268 }
1269 NEW = LEFT;
1270 NEW.rm_blockcount += PREV.rm_blockcount;
1271 error = xfs_rmap_update(cur, &NEW);
1272 if (error)
1273 goto done;
1274 break;
1275
1276 case RMAP_LEFT_FILLING | RMAP_RIGHT_FILLING | RMAP_RIGHT_CONTIG:
1277 /*
1278 * Setting all of a previous oldext extent to newext.
1279 * The right neighbor is contiguous, the left is not.
1280 */
1281 error = xfs_btree_increment(cur, 0, &i);
1282 if (error)
1283 goto done;
1284 if (XFS_IS_CORRUPT(mp, i != 1)) {
1285 error = -EFSCORRUPTED;
1286 goto done;
1287 }
1288 trace_xfs_rmap_delete(mp, cur->bc_ag.pag->pag_agno,
1289 RIGHT.rm_startblock, RIGHT.rm_blockcount,
1290 RIGHT.rm_owner, RIGHT.rm_offset,
1291 RIGHT.rm_flags);
1292 error = xfs_btree_delete(cur, &i);
1293 if (error)
1294 goto done;
1295 if (XFS_IS_CORRUPT(mp, i != 1)) {
1296 error = -EFSCORRUPTED;
1297 goto done;
1298 }
1299 error = xfs_btree_decrement(cur, 0, &i);
1300 if (error)
1301 goto done;
1302 if (XFS_IS_CORRUPT(mp, i != 1)) {
1303 error = -EFSCORRUPTED;
1304 goto done;
1305 }
1306 NEW = PREV;
1307 NEW.rm_blockcount = len + RIGHT.rm_blockcount;
1308 NEW.rm_flags = newext;
1309 error = xfs_rmap_update(cur, &NEW);
1310 if (error)
1311 goto done;
1312 break;
1313
1314 case RMAP_LEFT_FILLING | RMAP_RIGHT_FILLING:
1315 /*
1316 * Setting all of a previous oldext extent to newext.
1317 * Neither the left nor right neighbors are contiguous with
1318 * the new one.
1319 */
1320 NEW = PREV;
1321 NEW.rm_flags = newext;
1322 error = xfs_rmap_update(cur, &NEW);
1323 if (error)
1324 goto done;
1325 break;
1326
1327 case RMAP_LEFT_FILLING | RMAP_LEFT_CONTIG:
1328 /*
1329 * Setting the first part of a previous oldext extent to newext.
1330 * The left neighbor is contiguous.
1331 */
1332 NEW = PREV;
1333 NEW.rm_offset += len;
1334 NEW.rm_startblock += len;
1335 NEW.rm_blockcount -= len;
1336 error = xfs_rmap_update(cur, &NEW);
1337 if (error)
1338 goto done;
1339 error = xfs_btree_decrement(cur, 0, &i);
1340 if (error)
1341 goto done;
1342 NEW = LEFT;
1343 NEW.rm_blockcount += len;
1344 error = xfs_rmap_update(cur, &NEW);
1345 if (error)
1346 goto done;
1347 break;
1348
1349 case RMAP_LEFT_FILLING:
1350 /*
1351 * Setting the first part of a previous oldext extent to newext.
1352 * The left neighbor is not contiguous.
1353 */
1354 NEW = PREV;
1355 NEW.rm_startblock += len;
1356 NEW.rm_offset += len;
1357 NEW.rm_blockcount -= len;
1358 error = xfs_rmap_update(cur, &NEW);
1359 if (error)
1360 goto done;
1361 NEW.rm_startblock = bno;
1362 NEW.rm_owner = owner;
1363 NEW.rm_offset = offset;
1364 NEW.rm_blockcount = len;
1365 NEW.rm_flags = newext;
1366 cur->bc_rec.r = NEW;
1367 trace_xfs_rmap_insert(mp, cur->bc_ag.pag->pag_agno, bno,
1368 len, owner, offset, newext);
1369 error = xfs_btree_insert(cur, &i);
1370 if (error)
1371 goto done;
1372 if (XFS_IS_CORRUPT(mp, i != 1)) {
1373 error = -EFSCORRUPTED;
1374 goto done;
1375 }
1376 break;
1377
1378 case RMAP_RIGHT_FILLING | RMAP_RIGHT_CONTIG:
1379 /*
1380 * Setting the last part of a previous oldext extent to newext.
1381 * The right neighbor is contiguous with the new allocation.
1382 */
1383 NEW = PREV;
1384 NEW.rm_blockcount -= len;
1385 error = xfs_rmap_update(cur, &NEW);
1386 if (error)
1387 goto done;
1388 error = xfs_btree_increment(cur, 0, &i);
1389 if (error)
1390 goto done;
1391 NEW = RIGHT;
1392 NEW.rm_offset = offset;
1393 NEW.rm_startblock = bno;
1394 NEW.rm_blockcount += len;
1395 error = xfs_rmap_update(cur, &NEW);
1396 if (error)
1397 goto done;
1398 break;
1399
1400 case RMAP_RIGHT_FILLING:
1401 /*
1402 * Setting the last part of a previous oldext extent to newext.
1403 * The right neighbor is not contiguous.
1404 */
1405 NEW = PREV;
1406 NEW.rm_blockcount -= len;
1407 error = xfs_rmap_update(cur, &NEW);
1408 if (error)
1409 goto done;
1410 error = xfs_rmap_lookup_eq(cur, bno, len, owner, offset,
1411 oldext, &i);
1412 if (error)
1413 goto done;
1414 if (XFS_IS_CORRUPT(mp, i != 0)) {
1415 error = -EFSCORRUPTED;
1416 goto done;
1417 }
1418 NEW.rm_startblock = bno;
1419 NEW.rm_owner = owner;
1420 NEW.rm_offset = offset;
1421 NEW.rm_blockcount = len;
1422 NEW.rm_flags = newext;
1423 cur->bc_rec.r = NEW;
1424 trace_xfs_rmap_insert(mp, cur->bc_ag.pag->pag_agno, bno,
1425 len, owner, offset, newext);
1426 error = xfs_btree_insert(cur, &i);
1427 if (error)
1428 goto done;
1429 if (XFS_IS_CORRUPT(mp, i != 1)) {
1430 error = -EFSCORRUPTED;
1431 goto done;
1432 }
1433 break;
1434
1435 case 0:
1436 /*
1437 * Setting the middle part of a previous oldext extent to
1438 * newext. Contiguity is impossible here.
1439 * One extent becomes three extents.
1440 */
1441 /* new right extent - oldext */
1442 NEW.rm_startblock = bno + len;
1443 NEW.rm_owner = owner;
1444 NEW.rm_offset = new_endoff;
1445 NEW.rm_blockcount = PREV.rm_offset + PREV.rm_blockcount -
1446 new_endoff;
1447 NEW.rm_flags = PREV.rm_flags;
1448 error = xfs_rmap_update(cur, &NEW);
1449 if (error)
1450 goto done;
1451 /* new left extent - oldext */
1452 NEW = PREV;
1453 NEW.rm_blockcount = offset - PREV.rm_offset;
1454 cur->bc_rec.r = NEW;
1455 trace_xfs_rmap_insert(mp, cur->bc_ag.pag->pag_agno,
1456 NEW.rm_startblock, NEW.rm_blockcount,
1457 NEW.rm_owner, NEW.rm_offset,
1458 NEW.rm_flags);
1459 error = xfs_btree_insert(cur, &i);
1460 if (error)
1461 goto done;
1462 if (XFS_IS_CORRUPT(mp, i != 1)) {
1463 error = -EFSCORRUPTED;
1464 goto done;
1465 }
1466 /*
1467 * Reset the cursor to the position of the new extent
1468 * we are about to insert as we can't trust it after
1469 * the previous insert.
1470 */
1471 error = xfs_rmap_lookup_eq(cur, bno, len, owner, offset,
1472 oldext, &i);
1473 if (error)
1474 goto done;
1475 if (XFS_IS_CORRUPT(mp, i != 0)) {
1476 error = -EFSCORRUPTED;
1477 goto done;
1478 }
1479 /* new middle extent - newext */
1480 cur->bc_rec.r.rm_flags &= ~XFS_RMAP_UNWRITTEN;
1481 cur->bc_rec.r.rm_flags |= newext;
1482 trace_xfs_rmap_insert(mp, cur->bc_ag.pag->pag_agno, bno, len,
1483 owner, offset, newext);
1484 error = xfs_btree_insert(cur, &i);
1485 if (error)
1486 goto done;
1487 if (XFS_IS_CORRUPT(mp, i != 1)) {
1488 error = -EFSCORRUPTED;
1489 goto done;
1490 }
1491 break;
1492
1493 case RMAP_LEFT_FILLING | RMAP_LEFT_CONTIG | RMAP_RIGHT_CONTIG:
1494 case RMAP_RIGHT_FILLING | RMAP_LEFT_CONTIG | RMAP_RIGHT_CONTIG:
1495 case RMAP_LEFT_FILLING | RMAP_RIGHT_CONTIG:
1496 case RMAP_RIGHT_FILLING | RMAP_LEFT_CONTIG:
1497 case RMAP_LEFT_CONTIG | RMAP_RIGHT_CONTIG:
1498 case RMAP_LEFT_CONTIG:
1499 case RMAP_RIGHT_CONTIG:
1500 /*
1501 * These cases are all impossible.
1502 */
1503 ASSERT(0);
1504 }
1505
1506 trace_xfs_rmap_convert_done(mp, cur->bc_ag.pag->pag_agno, bno, len,
1507 unwritten, oinfo);
1508done:
1509 if (error)
1510 trace_xfs_rmap_convert_error(cur->bc_mp,
1511 cur->bc_ag.pag->pag_agno, error, _RET_IP_);
1512 return error;
1513}
1514
1515/*
1516 * Convert an unwritten extent to a real extent or vice versa. If there is no
1517 * possibility of overlapping extents, delegate to the simpler convert
1518 * function.
1519 */
1520STATIC int
1521xfs_rmap_convert_shared(
1522 struct xfs_btree_cur *cur,
1523 xfs_agblock_t bno,
1524 xfs_extlen_t len,
1525 bool unwritten,
1526 const struct xfs_owner_info *oinfo)
1527{
1528 struct xfs_mount *mp = cur->bc_mp;
1529 struct xfs_rmap_irec r[4]; /* neighbor extent entries */
1530 /* left is 0, right is 1, */
1531 /* prev is 2, new is 3 */
1532 uint64_t owner;
1533 uint64_t offset;
1534 uint64_t new_endoff;
1535 unsigned int oldext;
1536 unsigned int newext;
1537 unsigned int flags = 0;
1538 int i;
1539 int state = 0;
1540 int error;
1541
1542 xfs_owner_info_unpack(oinfo, &owner, &offset, &flags);
1543 ASSERT(!(XFS_RMAP_NON_INODE_OWNER(owner) ||
1544 (flags & (XFS_RMAP_ATTR_FORK | XFS_RMAP_BMBT_BLOCK))));
1545 oldext = unwritten ? XFS_RMAP_UNWRITTEN : 0;
1546 new_endoff = offset + len;
1547 trace_xfs_rmap_convert(mp, cur->bc_ag.pag->pag_agno, bno, len,
1548 unwritten, oinfo);
1549
1550 /*
1551 * For the initial lookup, look for and exact match or the left-adjacent
1552 * record for our insertion point. This will also give us the record for
1553 * start block contiguity tests.
1554 */
1555 error = xfs_rmap_lookup_le_range(cur, bno, owner, offset, oldext,
1556 &PREV, &i);
1557 if (error)
1558 goto done;
1559 if (XFS_IS_CORRUPT(mp, i != 1)) {
1560 error = -EFSCORRUPTED;
1561 goto done;
1562 }
1563
1564 ASSERT(PREV.rm_offset <= offset);
1565 ASSERT(PREV.rm_offset + PREV.rm_blockcount >= new_endoff);
1566 ASSERT((PREV.rm_flags & XFS_RMAP_UNWRITTEN) == oldext);
1567 newext = ~oldext & XFS_RMAP_UNWRITTEN;
1568
1569 /*
1570 * Set flags determining what part of the previous oldext allocation
1571 * extent is being replaced by a newext allocation.
1572 */
1573 if (PREV.rm_offset == offset)
1574 state |= RMAP_LEFT_FILLING;
1575 if (PREV.rm_offset + PREV.rm_blockcount == new_endoff)
1576 state |= RMAP_RIGHT_FILLING;
1577
1578 /* Is there a left record that abuts our range? */
1579 error = xfs_rmap_find_left_neighbor(cur, bno, owner, offset, newext,
1580 &LEFT, &i);
1581 if (error)
1582 goto done;
1583 if (i) {
1584 state |= RMAP_LEFT_VALID;
1585 if (XFS_IS_CORRUPT(mp,
1586 LEFT.rm_startblock + LEFT.rm_blockcount >
1587 bno)) {
1588 error = -EFSCORRUPTED;
1589 goto done;
1590 }
1591 if (xfs_rmap_is_mergeable(&LEFT, owner, newext))
1592 state |= RMAP_LEFT_CONTIG;
1593 }
1594
1595 /* Is there a right record that abuts our range? */
1596 error = xfs_rmap_lookup_eq(cur, bno + len, len, owner, offset + len,
1597 newext, &i);
1598 if (error)
1599 goto done;
1600 if (i) {
1601 state |= RMAP_RIGHT_VALID;
1602 error = xfs_rmap_get_rec(cur, &RIGHT, &i);
1603 if (error)
1604 goto done;
1605 if (XFS_IS_CORRUPT(mp, i != 1)) {
1606 error = -EFSCORRUPTED;
1607 goto done;
1608 }
1609 if (XFS_IS_CORRUPT(mp, bno + len > RIGHT.rm_startblock)) {
1610 error = -EFSCORRUPTED;
1611 goto done;
1612 }
1613 trace_xfs_rmap_find_right_neighbor_result(cur->bc_mp,
1614 cur->bc_ag.pag->pag_agno, RIGHT.rm_startblock,
1615 RIGHT.rm_blockcount, RIGHT.rm_owner,
1616 RIGHT.rm_offset, RIGHT.rm_flags);
1617 if (xfs_rmap_is_mergeable(&RIGHT, owner, newext))
1618 state |= RMAP_RIGHT_CONTIG;
1619 }
1620
1621 /* check that left + prev + right is not too long */
1622 if ((state & (RMAP_LEFT_FILLING | RMAP_LEFT_CONTIG |
1623 RMAP_RIGHT_FILLING | RMAP_RIGHT_CONTIG)) ==
1624 (RMAP_LEFT_FILLING | RMAP_LEFT_CONTIG |
1625 RMAP_RIGHT_FILLING | RMAP_RIGHT_CONTIG) &&
1626 (unsigned long)LEFT.rm_blockcount + len +
1627 RIGHT.rm_blockcount > XFS_RMAP_LEN_MAX)
1628 state &= ~RMAP_RIGHT_CONTIG;
1629
1630 trace_xfs_rmap_convert_state(mp, cur->bc_ag.pag->pag_agno, state,
1631 _RET_IP_);
1632 /*
1633 * Switch out based on the FILLING and CONTIG state bits.
1634 */
1635 switch (state & (RMAP_LEFT_FILLING | RMAP_LEFT_CONTIG |
1636 RMAP_RIGHT_FILLING | RMAP_RIGHT_CONTIG)) {
1637 case RMAP_LEFT_FILLING | RMAP_LEFT_CONTIG |
1638 RMAP_RIGHT_FILLING | RMAP_RIGHT_CONTIG:
1639 /*
1640 * Setting all of a previous oldext extent to newext.
1641 * The left and right neighbors are both contiguous with new.
1642 */
1643 error = xfs_rmap_delete(cur, RIGHT.rm_startblock,
1644 RIGHT.rm_blockcount, RIGHT.rm_owner,
1645 RIGHT.rm_offset, RIGHT.rm_flags);
1646 if (error)
1647 goto done;
1648 error = xfs_rmap_delete(cur, PREV.rm_startblock,
1649 PREV.rm_blockcount, PREV.rm_owner,
1650 PREV.rm_offset, PREV.rm_flags);
1651 if (error)
1652 goto done;
1653 NEW = LEFT;
1654 error = xfs_rmap_lookup_eq(cur, NEW.rm_startblock,
1655 NEW.rm_blockcount, NEW.rm_owner,
1656 NEW.rm_offset, NEW.rm_flags, &i);
1657 if (error)
1658 goto done;
1659 if (XFS_IS_CORRUPT(mp, i != 1)) {
1660 error = -EFSCORRUPTED;
1661 goto done;
1662 }
1663 NEW.rm_blockcount += PREV.rm_blockcount + RIGHT.rm_blockcount;
1664 error = xfs_rmap_update(cur, &NEW);
1665 if (error)
1666 goto done;
1667 break;
1668
1669 case RMAP_LEFT_FILLING | RMAP_RIGHT_FILLING | RMAP_LEFT_CONTIG:
1670 /*
1671 * Setting all of a previous oldext extent to newext.
1672 * The left neighbor is contiguous, the right is not.
1673 */
1674 error = xfs_rmap_delete(cur, PREV.rm_startblock,
1675 PREV.rm_blockcount, PREV.rm_owner,
1676 PREV.rm_offset, PREV.rm_flags);
1677 if (error)
1678 goto done;
1679 NEW = LEFT;
1680 error = xfs_rmap_lookup_eq(cur, NEW.rm_startblock,
1681 NEW.rm_blockcount, NEW.rm_owner,
1682 NEW.rm_offset, NEW.rm_flags, &i);
1683 if (error)
1684 goto done;
1685 if (XFS_IS_CORRUPT(mp, i != 1)) {
1686 error = -EFSCORRUPTED;
1687 goto done;
1688 }
1689 NEW.rm_blockcount += PREV.rm_blockcount;
1690 error = xfs_rmap_update(cur, &NEW);
1691 if (error)
1692 goto done;
1693 break;
1694
1695 case RMAP_LEFT_FILLING | RMAP_RIGHT_FILLING | RMAP_RIGHT_CONTIG:
1696 /*
1697 * Setting all of a previous oldext extent to newext.
1698 * The right neighbor is contiguous, the left is not.
1699 */
1700 error = xfs_rmap_delete(cur, RIGHT.rm_startblock,
1701 RIGHT.rm_blockcount, RIGHT.rm_owner,
1702 RIGHT.rm_offset, RIGHT.rm_flags);
1703 if (error)
1704 goto done;
1705 NEW = PREV;
1706 error = xfs_rmap_lookup_eq(cur, NEW.rm_startblock,
1707 NEW.rm_blockcount, NEW.rm_owner,
1708 NEW.rm_offset, NEW.rm_flags, &i);
1709 if (error)
1710 goto done;
1711 if (XFS_IS_CORRUPT(mp, i != 1)) {
1712 error = -EFSCORRUPTED;
1713 goto done;
1714 }
1715 NEW.rm_blockcount += RIGHT.rm_blockcount;
1716 NEW.rm_flags = RIGHT.rm_flags;
1717 error = xfs_rmap_update(cur, &NEW);
1718 if (error)
1719 goto done;
1720 break;
1721
1722 case RMAP_LEFT_FILLING | RMAP_RIGHT_FILLING:
1723 /*
1724 * Setting all of a previous oldext extent to newext.
1725 * Neither the left nor right neighbors are contiguous with
1726 * the new one.
1727 */
1728 NEW = PREV;
1729 error = xfs_rmap_lookup_eq(cur, NEW.rm_startblock,
1730 NEW.rm_blockcount, NEW.rm_owner,
1731 NEW.rm_offset, NEW.rm_flags, &i);
1732 if (error)
1733 goto done;
1734 if (XFS_IS_CORRUPT(mp, i != 1)) {
1735 error = -EFSCORRUPTED;
1736 goto done;
1737 }
1738 NEW.rm_flags = newext;
1739 error = xfs_rmap_update(cur, &NEW);
1740 if (error)
1741 goto done;
1742 break;
1743
1744 case RMAP_LEFT_FILLING | RMAP_LEFT_CONTIG:
1745 /*
1746 * Setting the first part of a previous oldext extent to newext.
1747 * The left neighbor is contiguous.
1748 */
1749 NEW = PREV;
1750 error = xfs_rmap_delete(cur, NEW.rm_startblock,
1751 NEW.rm_blockcount, NEW.rm_owner,
1752 NEW.rm_offset, NEW.rm_flags);
1753 if (error)
1754 goto done;
1755 NEW.rm_offset += len;
1756 NEW.rm_startblock += len;
1757 NEW.rm_blockcount -= len;
1758 error = xfs_rmap_insert(cur, NEW.rm_startblock,
1759 NEW.rm_blockcount, NEW.rm_owner,
1760 NEW.rm_offset, NEW.rm_flags);
1761 if (error)
1762 goto done;
1763 NEW = LEFT;
1764 error = xfs_rmap_lookup_eq(cur, NEW.rm_startblock,
1765 NEW.rm_blockcount, NEW.rm_owner,
1766 NEW.rm_offset, NEW.rm_flags, &i);
1767 if (error)
1768 goto done;
1769 if (XFS_IS_CORRUPT(mp, i != 1)) {
1770 error = -EFSCORRUPTED;
1771 goto done;
1772 }
1773 NEW.rm_blockcount += len;
1774 error = xfs_rmap_update(cur, &NEW);
1775 if (error)
1776 goto done;
1777 break;
1778
1779 case RMAP_LEFT_FILLING:
1780 /*
1781 * Setting the first part of a previous oldext extent to newext.
1782 * The left neighbor is not contiguous.
1783 */
1784 NEW = PREV;
1785 error = xfs_rmap_delete(cur, NEW.rm_startblock,
1786 NEW.rm_blockcount, NEW.rm_owner,
1787 NEW.rm_offset, NEW.rm_flags);
1788 if (error)
1789 goto done;
1790 NEW.rm_offset += len;
1791 NEW.rm_startblock += len;
1792 NEW.rm_blockcount -= len;
1793 error = xfs_rmap_insert(cur, NEW.rm_startblock,
1794 NEW.rm_blockcount, NEW.rm_owner,
1795 NEW.rm_offset, NEW.rm_flags);
1796 if (error)
1797 goto done;
1798 error = xfs_rmap_insert(cur, bno, len, owner, offset, newext);
1799 if (error)
1800 goto done;
1801 break;
1802
1803 case RMAP_RIGHT_FILLING | RMAP_RIGHT_CONTIG:
1804 /*
1805 * Setting the last part of a previous oldext extent to newext.
1806 * The right neighbor is contiguous with the new allocation.
1807 */
1808 NEW = PREV;
1809 error = xfs_rmap_lookup_eq(cur, NEW.rm_startblock,
1810 NEW.rm_blockcount, NEW.rm_owner,
1811 NEW.rm_offset, NEW.rm_flags, &i);
1812 if (error)
1813 goto done;
1814 if (XFS_IS_CORRUPT(mp, i != 1)) {
1815 error = -EFSCORRUPTED;
1816 goto done;
1817 }
1818 NEW.rm_blockcount = offset - NEW.rm_offset;
1819 error = xfs_rmap_update(cur, &NEW);
1820 if (error)
1821 goto done;
1822 NEW = RIGHT;
1823 error = xfs_rmap_delete(cur, NEW.rm_startblock,
1824 NEW.rm_blockcount, NEW.rm_owner,
1825 NEW.rm_offset, NEW.rm_flags);
1826 if (error)
1827 goto done;
1828 NEW.rm_offset = offset;
1829 NEW.rm_startblock = bno;
1830 NEW.rm_blockcount += len;
1831 error = xfs_rmap_insert(cur, NEW.rm_startblock,
1832 NEW.rm_blockcount, NEW.rm_owner,
1833 NEW.rm_offset, NEW.rm_flags);
1834 if (error)
1835 goto done;
1836 break;
1837
1838 case RMAP_RIGHT_FILLING:
1839 /*
1840 * Setting the last part of a previous oldext extent to newext.
1841 * The right neighbor is not contiguous.
1842 */
1843 NEW = PREV;
1844 error = xfs_rmap_lookup_eq(cur, NEW.rm_startblock,
1845 NEW.rm_blockcount, NEW.rm_owner,
1846 NEW.rm_offset, NEW.rm_flags, &i);
1847 if (error)
1848 goto done;
1849 if (XFS_IS_CORRUPT(mp, i != 1)) {
1850 error = -EFSCORRUPTED;
1851 goto done;
1852 }
1853 NEW.rm_blockcount -= len;
1854 error = xfs_rmap_update(cur, &NEW);
1855 if (error)
1856 goto done;
1857 error = xfs_rmap_insert(cur, bno, len, owner, offset, newext);
1858 if (error)
1859 goto done;
1860 break;
1861
1862 case 0:
1863 /*
1864 * Setting the middle part of a previous oldext extent to
1865 * newext. Contiguity is impossible here.
1866 * One extent becomes three extents.
1867 */
1868 /* new right extent - oldext */
1869 NEW.rm_startblock = bno + len;
1870 NEW.rm_owner = owner;
1871 NEW.rm_offset = new_endoff;
1872 NEW.rm_blockcount = PREV.rm_offset + PREV.rm_blockcount -
1873 new_endoff;
1874 NEW.rm_flags = PREV.rm_flags;
1875 error = xfs_rmap_insert(cur, NEW.rm_startblock,
1876 NEW.rm_blockcount, NEW.rm_owner, NEW.rm_offset,
1877 NEW.rm_flags);
1878 if (error)
1879 goto done;
1880 /* new left extent - oldext */
1881 NEW = PREV;
1882 error = xfs_rmap_lookup_eq(cur, NEW.rm_startblock,
1883 NEW.rm_blockcount, NEW.rm_owner,
1884 NEW.rm_offset, NEW.rm_flags, &i);
1885 if (error)
1886 goto done;
1887 if (XFS_IS_CORRUPT(mp, i != 1)) {
1888 error = -EFSCORRUPTED;
1889 goto done;
1890 }
1891 NEW.rm_blockcount = offset - NEW.rm_offset;
1892 error = xfs_rmap_update(cur, &NEW);
1893 if (error)
1894 goto done;
1895 /* new middle extent - newext */
1896 NEW.rm_startblock = bno;
1897 NEW.rm_blockcount = len;
1898 NEW.rm_owner = owner;
1899 NEW.rm_offset = offset;
1900 NEW.rm_flags = newext;
1901 error = xfs_rmap_insert(cur, NEW.rm_startblock,
1902 NEW.rm_blockcount, NEW.rm_owner, NEW.rm_offset,
1903 NEW.rm_flags);
1904 if (error)
1905 goto done;
1906 break;
1907
1908 case RMAP_LEFT_FILLING | RMAP_LEFT_CONTIG | RMAP_RIGHT_CONTIG:
1909 case RMAP_RIGHT_FILLING | RMAP_LEFT_CONTIG | RMAP_RIGHT_CONTIG:
1910 case RMAP_LEFT_FILLING | RMAP_RIGHT_CONTIG:
1911 case RMAP_RIGHT_FILLING | RMAP_LEFT_CONTIG:
1912 case RMAP_LEFT_CONTIG | RMAP_RIGHT_CONTIG:
1913 case RMAP_LEFT_CONTIG:
1914 case RMAP_RIGHT_CONTIG:
1915 /*
1916 * These cases are all impossible.
1917 */
1918 ASSERT(0);
1919 }
1920
1921 trace_xfs_rmap_convert_done(mp, cur->bc_ag.pag->pag_agno, bno, len,
1922 unwritten, oinfo);
1923done:
1924 if (error)
1925 trace_xfs_rmap_convert_error(cur->bc_mp,
1926 cur->bc_ag.pag->pag_agno, error, _RET_IP_);
1927 return error;
1928}
1929
1930#undef NEW
1931#undef LEFT
1932#undef RIGHT
1933#undef PREV
1934
1935/*
1936 * Find an extent in the rmap btree and unmap it. For rmap extent types that
1937 * can overlap (data fork rmaps on reflink filesystems) we must be careful
1938 * that the prev/next records in the btree might belong to another owner.
1939 * Therefore we must use delete+insert to alter any of the key fields.
1940 *
1941 * For every other situation there can only be one owner for a given extent,
1942 * so we can call the regular _free function.
1943 */
1944STATIC int
1945xfs_rmap_unmap_shared(
1946 struct xfs_btree_cur *cur,
1947 xfs_agblock_t bno,
1948 xfs_extlen_t len,
1949 bool unwritten,
1950 const struct xfs_owner_info *oinfo)
1951{
1952 struct xfs_mount *mp = cur->bc_mp;
1953 struct xfs_rmap_irec ltrec;
1954 uint64_t ltoff;
1955 int error = 0;
1956 int i;
1957 uint64_t owner;
1958 uint64_t offset;
1959 unsigned int flags;
1960
1961 xfs_owner_info_unpack(oinfo, &owner, &offset, &flags);
1962 if (unwritten)
1963 flags |= XFS_RMAP_UNWRITTEN;
1964 trace_xfs_rmap_unmap(mp, cur->bc_ag.pag->pag_agno, bno, len,
1965 unwritten, oinfo);
1966
1967 /*
1968 * We should always have a left record because there's a static record
1969 * for the AG headers at rm_startblock == 0 created by mkfs/growfs that
1970 * will not ever be removed from the tree.
1971 */
1972 error = xfs_rmap_lookup_le_range(cur, bno, owner, offset, flags,
1973 <rec, &i);
1974 if (error)
1975 goto out_error;
1976 if (XFS_IS_CORRUPT(mp, i != 1)) {
1977 error = -EFSCORRUPTED;
1978 goto out_error;
1979 }
1980 ltoff = ltrec.rm_offset;
1981
1982 /* Make sure the extent we found covers the entire freeing range. */
1983 if (XFS_IS_CORRUPT(mp,
1984 ltrec.rm_startblock > bno ||
1985 ltrec.rm_startblock + ltrec.rm_blockcount <
1986 bno + len)) {
1987 error = -EFSCORRUPTED;
1988 goto out_error;
1989 }
1990
1991 /* Make sure the owner matches what we expect to find in the tree. */
1992 if (XFS_IS_CORRUPT(mp, owner != ltrec.rm_owner)) {
1993 error = -EFSCORRUPTED;
1994 goto out_error;
1995 }
1996
1997 /* Make sure the unwritten flag matches. */
1998 if (XFS_IS_CORRUPT(mp,
1999 (flags & XFS_RMAP_UNWRITTEN) !=
2000 (ltrec.rm_flags & XFS_RMAP_UNWRITTEN))) {
2001 error = -EFSCORRUPTED;
2002 goto out_error;
2003 }
2004
2005 /* Check the offset. */
2006 if (XFS_IS_CORRUPT(mp, ltrec.rm_offset > offset)) {
2007 error = -EFSCORRUPTED;
2008 goto out_error;
2009 }
2010 if (XFS_IS_CORRUPT(mp, offset > ltoff + ltrec.rm_blockcount)) {
2011 error = -EFSCORRUPTED;
2012 goto out_error;
2013 }
2014
2015 if (ltrec.rm_startblock == bno && ltrec.rm_blockcount == len) {
2016 /* Exact match, simply remove the record from rmap tree. */
2017 error = xfs_rmap_delete(cur, ltrec.rm_startblock,
2018 ltrec.rm_blockcount, ltrec.rm_owner,
2019 ltrec.rm_offset, ltrec.rm_flags);
2020 if (error)
2021 goto out_error;
2022 } else if (ltrec.rm_startblock == bno) {
2023 /*
2024 * Overlap left hand side of extent: move the start, trim the
2025 * length and update the current record.
2026 *
2027 * ltbno ltlen
2028 * Orig: |oooooooooooooooooooo|
2029 * Freeing: |fffffffff|
2030 * Result: |rrrrrrrrrr|
2031 * bno len
2032 */
2033
2034 /* Delete prev rmap. */
2035 error = xfs_rmap_delete(cur, ltrec.rm_startblock,
2036 ltrec.rm_blockcount, ltrec.rm_owner,
2037 ltrec.rm_offset, ltrec.rm_flags);
2038 if (error)
2039 goto out_error;
2040
2041 /* Add an rmap at the new offset. */
2042 ltrec.rm_startblock += len;
2043 ltrec.rm_blockcount -= len;
2044 ltrec.rm_offset += len;
2045 error = xfs_rmap_insert(cur, ltrec.rm_startblock,
2046 ltrec.rm_blockcount, ltrec.rm_owner,
2047 ltrec.rm_offset, ltrec.rm_flags);
2048 if (error)
2049 goto out_error;
2050 } else if (ltrec.rm_startblock + ltrec.rm_blockcount == bno + len) {
2051 /*
2052 * Overlap right hand side of extent: trim the length and
2053 * update the current record.
2054 *
2055 * ltbno ltlen
2056 * Orig: |oooooooooooooooooooo|
2057 * Freeing: |fffffffff|
2058 * Result: |rrrrrrrrrr|
2059 * bno len
2060 */
2061 error = xfs_rmap_lookup_eq(cur, ltrec.rm_startblock,
2062 ltrec.rm_blockcount, ltrec.rm_owner,
2063 ltrec.rm_offset, ltrec.rm_flags, &i);
2064 if (error)
2065 goto out_error;
2066 if (XFS_IS_CORRUPT(mp, i != 1)) {
2067 error = -EFSCORRUPTED;
2068 goto out_error;
2069 }
2070 ltrec.rm_blockcount -= len;
2071 error = xfs_rmap_update(cur, <rec);
2072 if (error)
2073 goto out_error;
2074 } else {
2075 /*
2076 * Overlap middle of extent: trim the length of the existing
2077 * record to the length of the new left-extent size, increment
2078 * the insertion position so we can insert a new record
2079 * containing the remaining right-extent space.
2080 *
2081 * ltbno ltlen
2082 * Orig: |oooooooooooooooooooo|
2083 * Freeing: |fffffffff|
2084 * Result: |rrrrr| |rrrr|
2085 * bno len
2086 */
2087 xfs_extlen_t orig_len = ltrec.rm_blockcount;
2088
2089 /* Shrink the left side of the rmap */
2090 error = xfs_rmap_lookup_eq(cur, ltrec.rm_startblock,
2091 ltrec.rm_blockcount, ltrec.rm_owner,
2092 ltrec.rm_offset, ltrec.rm_flags, &i);
2093 if (error)
2094 goto out_error;
2095 if (XFS_IS_CORRUPT(mp, i != 1)) {
2096 error = -EFSCORRUPTED;
2097 goto out_error;
2098 }
2099 ltrec.rm_blockcount = bno - ltrec.rm_startblock;
2100 error = xfs_rmap_update(cur, <rec);
2101 if (error)
2102 goto out_error;
2103
2104 /* Add an rmap at the new offset */
2105 error = xfs_rmap_insert(cur, bno + len,
2106 orig_len - len - ltrec.rm_blockcount,
2107 ltrec.rm_owner, offset + len,
2108 ltrec.rm_flags);
2109 if (error)
2110 goto out_error;
2111 }
2112
2113 trace_xfs_rmap_unmap_done(mp, cur->bc_ag.pag->pag_agno, bno, len,
2114 unwritten, oinfo);
2115out_error:
2116 if (error)
2117 trace_xfs_rmap_unmap_error(cur->bc_mp,
2118 cur->bc_ag.pag->pag_agno, error, _RET_IP_);
2119 return error;
2120}
2121
2122/*
2123 * Find an extent in the rmap btree and map it. For rmap extent types that
2124 * can overlap (data fork rmaps on reflink filesystems) we must be careful
2125 * that the prev/next records in the btree might belong to another owner.
2126 * Therefore we must use delete+insert to alter any of the key fields.
2127 *
2128 * For every other situation there can only be one owner for a given extent,
2129 * so we can call the regular _alloc function.
2130 */
2131STATIC int
2132xfs_rmap_map_shared(
2133 struct xfs_btree_cur *cur,
2134 xfs_agblock_t bno,
2135 xfs_extlen_t len,
2136 bool unwritten,
2137 const struct xfs_owner_info *oinfo)
2138{
2139 struct xfs_mount *mp = cur->bc_mp;
2140 struct xfs_rmap_irec ltrec;
2141 struct xfs_rmap_irec gtrec;
2142 int have_gt;
2143 int have_lt;
2144 int error = 0;
2145 int i;
2146 uint64_t owner;
2147 uint64_t offset;
2148 unsigned int flags = 0;
2149
2150 xfs_owner_info_unpack(oinfo, &owner, &offset, &flags);
2151 if (unwritten)
2152 flags |= XFS_RMAP_UNWRITTEN;
2153 trace_xfs_rmap_map(mp, cur->bc_ag.pag->pag_agno, bno, len,
2154 unwritten, oinfo);
2155
2156 /* Is there a left record that abuts our range? */
2157 error = xfs_rmap_find_left_neighbor(cur, bno, owner, offset, flags,
2158 <rec, &have_lt);
2159 if (error)
2160 goto out_error;
2161 if (have_lt &&
2162 !xfs_rmap_is_mergeable(<rec, owner, flags))
2163 have_lt = 0;
2164
2165 /* Is there a right record that abuts our range? */
2166 error = xfs_rmap_lookup_eq(cur, bno + len, len, owner, offset + len,
2167 flags, &have_gt);
2168 if (error)
2169 goto out_error;
2170 if (have_gt) {
2171 error = xfs_rmap_get_rec(cur, >rec, &have_gt);
2172 if (error)
2173 goto out_error;
2174 if (XFS_IS_CORRUPT(mp, have_gt != 1)) {
2175 error = -EFSCORRUPTED;
2176 goto out_error;
2177 }
2178 trace_xfs_rmap_find_right_neighbor_result(cur->bc_mp,
2179 cur->bc_ag.pag->pag_agno, gtrec.rm_startblock,
2180 gtrec.rm_blockcount, gtrec.rm_owner,
2181 gtrec.rm_offset, gtrec.rm_flags);
2182
2183 if (!xfs_rmap_is_mergeable(>rec, owner, flags))
2184 have_gt = 0;
2185 }
2186
2187 if (have_lt &&
2188 ltrec.rm_startblock + ltrec.rm_blockcount == bno &&
2189 ltrec.rm_offset + ltrec.rm_blockcount == offset) {
2190 /*
2191 * Left edge contiguous, merge into left record.
2192 *
2193 * ltbno ltlen
2194 * orig: |ooooooooo|
2195 * adding: |aaaaaaaaa|
2196 * result: |rrrrrrrrrrrrrrrrrrr|
2197 * bno len
2198 */
2199 ltrec.rm_blockcount += len;
2200 if (have_gt &&
2201 bno + len == gtrec.rm_startblock &&
2202 offset + len == gtrec.rm_offset) {
2203 /*
2204 * Right edge also contiguous, delete right record
2205 * and merge into left record.
2206 *
2207 * ltbno ltlen gtbno gtlen
2208 * orig: |ooooooooo| |ooooooooo|
2209 * adding: |aaaaaaaaa|
2210 * result: |rrrrrrrrrrrrrrrrrrrrrrrrrrrrr|
2211 */
2212 ltrec.rm_blockcount += gtrec.rm_blockcount;
2213 error = xfs_rmap_delete(cur, gtrec.rm_startblock,
2214 gtrec.rm_blockcount, gtrec.rm_owner,
2215 gtrec.rm_offset, gtrec.rm_flags);
2216 if (error)
2217 goto out_error;
2218 }
2219
2220 /* Point the cursor back to the left record and update. */
2221 error = xfs_rmap_lookup_eq(cur, ltrec.rm_startblock,
2222 ltrec.rm_blockcount, ltrec.rm_owner,
2223 ltrec.rm_offset, ltrec.rm_flags, &i);
2224 if (error)
2225 goto out_error;
2226 if (XFS_IS_CORRUPT(mp, i != 1)) {
2227 error = -EFSCORRUPTED;
2228 goto out_error;
2229 }
2230
2231 error = xfs_rmap_update(cur, <rec);
2232 if (error)
2233 goto out_error;
2234 } else if (have_gt &&
2235 bno + len == gtrec.rm_startblock &&
2236 offset + len == gtrec.rm_offset) {
2237 /*
2238 * Right edge contiguous, merge into right record.
2239 *
2240 * gtbno gtlen
2241 * Orig: |ooooooooo|
2242 * adding: |aaaaaaaaa|
2243 * Result: |rrrrrrrrrrrrrrrrrrr|
2244 * bno len
2245 */
2246 /* Delete the old record. */
2247 error = xfs_rmap_delete(cur, gtrec.rm_startblock,
2248 gtrec.rm_blockcount, gtrec.rm_owner,
2249 gtrec.rm_offset, gtrec.rm_flags);
2250 if (error)
2251 goto out_error;
2252
2253 /* Move the start and re-add it. */
2254 gtrec.rm_startblock = bno;
2255 gtrec.rm_blockcount += len;
2256 gtrec.rm_offset = offset;
2257 error = xfs_rmap_insert(cur, gtrec.rm_startblock,
2258 gtrec.rm_blockcount, gtrec.rm_owner,
2259 gtrec.rm_offset, gtrec.rm_flags);
2260 if (error)
2261 goto out_error;
2262 } else {
2263 /*
2264 * No contiguous edge with identical owner, insert
2265 * new record at current cursor position.
2266 */
2267 error = xfs_rmap_insert(cur, bno, len, owner, offset, flags);
2268 if (error)
2269 goto out_error;
2270 }
2271
2272 trace_xfs_rmap_map_done(mp, cur->bc_ag.pag->pag_agno, bno, len,
2273 unwritten, oinfo);
2274out_error:
2275 if (error)
2276 trace_xfs_rmap_map_error(cur->bc_mp,
2277 cur->bc_ag.pag->pag_agno, error, _RET_IP_);
2278 return error;
2279}
2280
2281/* Insert a raw rmap into the rmapbt. */
2282int
2283xfs_rmap_map_raw(
2284 struct xfs_btree_cur *cur,
2285 struct xfs_rmap_irec *rmap)
2286{
2287 struct xfs_owner_info oinfo;
2288
2289 oinfo.oi_owner = rmap->rm_owner;
2290 oinfo.oi_offset = rmap->rm_offset;
2291 oinfo.oi_flags = 0;
2292 if (rmap->rm_flags & XFS_RMAP_ATTR_FORK)
2293 oinfo.oi_flags |= XFS_OWNER_INFO_ATTR_FORK;
2294 if (rmap->rm_flags & XFS_RMAP_BMBT_BLOCK)
2295 oinfo.oi_flags |= XFS_OWNER_INFO_BMBT_BLOCK;
2296
2297 if (rmap->rm_flags || XFS_RMAP_NON_INODE_OWNER(rmap->rm_owner))
2298 return xfs_rmap_map(cur, rmap->rm_startblock,
2299 rmap->rm_blockcount,
2300 rmap->rm_flags & XFS_RMAP_UNWRITTEN,
2301 &oinfo);
2302
2303 return xfs_rmap_map_shared(cur, rmap->rm_startblock,
2304 rmap->rm_blockcount,
2305 rmap->rm_flags & XFS_RMAP_UNWRITTEN,
2306 &oinfo);
2307}
2308
2309struct xfs_rmap_query_range_info {
2310 xfs_rmap_query_range_fn fn;
2311 void *priv;
2312};
2313
2314/* Format btree record and pass to our callback. */
2315STATIC int
2316xfs_rmap_query_range_helper(
2317 struct xfs_btree_cur *cur,
2318 const union xfs_btree_rec *rec,
2319 void *priv)
2320{
2321 struct xfs_rmap_query_range_info *query = priv;
2322 struct xfs_rmap_irec irec;
2323 int error;
2324
2325 error = xfs_rmap_btrec_to_irec(rec, &irec);
2326 if (error)
2327 return error;
2328 return query->fn(cur, &irec, query->priv);
2329}
2330
2331/* Find all rmaps between two keys. */
2332int
2333xfs_rmap_query_range(
2334 struct xfs_btree_cur *cur,
2335 const struct xfs_rmap_irec *low_rec,
2336 const struct xfs_rmap_irec *high_rec,
2337 xfs_rmap_query_range_fn fn,
2338 void *priv)
2339{
2340 union xfs_btree_irec low_brec;
2341 union xfs_btree_irec high_brec;
2342 struct xfs_rmap_query_range_info query;
2343
2344 low_brec.r = *low_rec;
2345 high_brec.r = *high_rec;
2346 query.priv = priv;
2347 query.fn = fn;
2348 return xfs_btree_query_range(cur, &low_brec, &high_brec,
2349 xfs_rmap_query_range_helper, &query);
2350}
2351
2352/* Find all rmaps. */
2353int
2354xfs_rmap_query_all(
2355 struct xfs_btree_cur *cur,
2356 xfs_rmap_query_range_fn fn,
2357 void *priv)
2358{
2359 struct xfs_rmap_query_range_info query;
2360
2361 query.priv = priv;
2362 query.fn = fn;
2363 return xfs_btree_query_all(cur, xfs_rmap_query_range_helper, &query);
2364}
2365
2366/* Clean up after calling xfs_rmap_finish_one. */
2367void
2368xfs_rmap_finish_one_cleanup(
2369 struct xfs_trans *tp,
2370 struct xfs_btree_cur *rcur,
2371 int error)
2372{
2373 struct xfs_buf *agbp;
2374
2375 if (rcur == NULL)
2376 return;
2377 agbp = rcur->bc_ag.agbp;
2378 xfs_btree_del_cursor(rcur, error);
2379 if (error)
2380 xfs_trans_brelse(tp, agbp);
2381}
2382
2383/*
2384 * Process one of the deferred rmap operations. We pass back the
2385 * btree cursor to maintain our lock on the rmapbt between calls.
2386 * This saves time and eliminates a buffer deadlock between the
2387 * superblock and the AGF because we'll always grab them in the same
2388 * order.
2389 */
2390int
2391xfs_rmap_finish_one(
2392 struct xfs_trans *tp,
2393 enum xfs_rmap_intent_type type,
2394 uint64_t owner,
2395 int whichfork,
2396 xfs_fileoff_t startoff,
2397 xfs_fsblock_t startblock,
2398 xfs_filblks_t blockcount,
2399 xfs_exntst_t state,
2400 struct xfs_btree_cur **pcur)
2401{
2402 struct xfs_mount *mp = tp->t_mountp;
2403 struct xfs_perag *pag;
2404 struct xfs_btree_cur *rcur;
2405 struct xfs_buf *agbp = NULL;
2406 int error = 0;
2407 struct xfs_owner_info oinfo;
2408 xfs_agblock_t bno;
2409 bool unwritten;
2410
2411 pag = xfs_perag_get(mp, XFS_FSB_TO_AGNO(mp, startblock));
2412 bno = XFS_FSB_TO_AGBNO(mp, startblock);
2413
2414 trace_xfs_rmap_deferred(mp, pag->pag_agno, type, bno, owner, whichfork,
2415 startoff, blockcount, state);
2416
2417 if (XFS_TEST_ERROR(false, mp, XFS_ERRTAG_RMAP_FINISH_ONE)) {
2418 error = -EIO;
2419 goto out_drop;
2420 }
2421
2422
2423 /*
2424 * If we haven't gotten a cursor or the cursor AG doesn't match
2425 * the startblock, get one now.
2426 */
2427 rcur = *pcur;
2428 if (rcur != NULL && rcur->bc_ag.pag != pag) {
2429 xfs_rmap_finish_one_cleanup(tp, rcur, 0);
2430 rcur = NULL;
2431 *pcur = NULL;
2432 }
2433 if (rcur == NULL) {
2434 /*
2435 * Refresh the freelist before we start changing the
2436 * rmapbt, because a shape change could cause us to
2437 * allocate blocks.
2438 */
2439 error = xfs_free_extent_fix_freelist(tp, pag, &agbp);
2440 if (error)
2441 goto out_drop;
2442 if (XFS_IS_CORRUPT(tp->t_mountp, !agbp)) {
2443 error = -EFSCORRUPTED;
2444 goto out_drop;
2445 }
2446
2447 rcur = xfs_rmapbt_init_cursor(mp, tp, agbp, pag);
2448 }
2449 *pcur = rcur;
2450
2451 xfs_rmap_ino_owner(&oinfo, owner, whichfork, startoff);
2452 unwritten = state == XFS_EXT_UNWRITTEN;
2453 bno = XFS_FSB_TO_AGBNO(rcur->bc_mp, startblock);
2454
2455 switch (type) {
2456 case XFS_RMAP_ALLOC:
2457 case XFS_RMAP_MAP:
2458 error = xfs_rmap_map(rcur, bno, blockcount, unwritten, &oinfo);
2459 break;
2460 case XFS_RMAP_MAP_SHARED:
2461 error = xfs_rmap_map_shared(rcur, bno, blockcount, unwritten,
2462 &oinfo);
2463 break;
2464 case XFS_RMAP_FREE:
2465 case XFS_RMAP_UNMAP:
2466 error = xfs_rmap_unmap(rcur, bno, blockcount, unwritten,
2467 &oinfo);
2468 break;
2469 case XFS_RMAP_UNMAP_SHARED:
2470 error = xfs_rmap_unmap_shared(rcur, bno, blockcount, unwritten,
2471 &oinfo);
2472 break;
2473 case XFS_RMAP_CONVERT:
2474 error = xfs_rmap_convert(rcur, bno, blockcount, !unwritten,
2475 &oinfo);
2476 break;
2477 case XFS_RMAP_CONVERT_SHARED:
2478 error = xfs_rmap_convert_shared(rcur, bno, blockcount,
2479 !unwritten, &oinfo);
2480 break;
2481 default:
2482 ASSERT(0);
2483 error = -EFSCORRUPTED;
2484 }
2485out_drop:
2486 xfs_perag_put(pag);
2487 return error;
2488}
2489
2490/*
2491 * Don't defer an rmap if we aren't an rmap filesystem.
2492 */
2493static bool
2494xfs_rmap_update_is_needed(
2495 struct xfs_mount *mp,
2496 int whichfork)
2497{
2498 return xfs_has_rmapbt(mp) && whichfork != XFS_COW_FORK;
2499}
2500
2501/*
2502 * Record a rmap intent; the list is kept sorted first by AG and then by
2503 * increasing age.
2504 */
2505static void
2506__xfs_rmap_add(
2507 struct xfs_trans *tp,
2508 enum xfs_rmap_intent_type type,
2509 uint64_t owner,
2510 int whichfork,
2511 struct xfs_bmbt_irec *bmap)
2512{
2513 struct xfs_rmap_intent *ri;
2514
2515 trace_xfs_rmap_defer(tp->t_mountp,
2516 XFS_FSB_TO_AGNO(tp->t_mountp, bmap->br_startblock),
2517 type,
2518 XFS_FSB_TO_AGBNO(tp->t_mountp, bmap->br_startblock),
2519 owner, whichfork,
2520 bmap->br_startoff,
2521 bmap->br_blockcount,
2522 bmap->br_state);
2523
2524 ri = kmem_cache_alloc(xfs_rmap_intent_cache, GFP_NOFS | __GFP_NOFAIL);
2525 INIT_LIST_HEAD(&ri->ri_list);
2526 ri->ri_type = type;
2527 ri->ri_owner = owner;
2528 ri->ri_whichfork = whichfork;
2529 ri->ri_bmap = *bmap;
2530
2531 xfs_defer_add(tp, XFS_DEFER_OPS_TYPE_RMAP, &ri->ri_list);
2532}
2533
2534/* Map an extent into a file. */
2535void
2536xfs_rmap_map_extent(
2537 struct xfs_trans *tp,
2538 struct xfs_inode *ip,
2539 int whichfork,
2540 struct xfs_bmbt_irec *PREV)
2541{
2542 enum xfs_rmap_intent_type type = XFS_RMAP_MAP;
2543
2544 if (!xfs_rmap_update_is_needed(tp->t_mountp, whichfork))
2545 return;
2546
2547 if (whichfork != XFS_ATTR_FORK && xfs_is_reflink_inode(ip))
2548 type = XFS_RMAP_MAP_SHARED;
2549
2550 __xfs_rmap_add(tp, type, ip->i_ino, whichfork, PREV);
2551}
2552
2553/* Unmap an extent out of a file. */
2554void
2555xfs_rmap_unmap_extent(
2556 struct xfs_trans *tp,
2557 struct xfs_inode *ip,
2558 int whichfork,
2559 struct xfs_bmbt_irec *PREV)
2560{
2561 enum xfs_rmap_intent_type type = XFS_RMAP_UNMAP;
2562
2563 if (!xfs_rmap_update_is_needed(tp->t_mountp, whichfork))
2564 return;
2565
2566 if (whichfork != XFS_ATTR_FORK && xfs_is_reflink_inode(ip))
2567 type = XFS_RMAP_UNMAP_SHARED;
2568
2569 __xfs_rmap_add(tp, type, ip->i_ino, whichfork, PREV);
2570}
2571
2572/*
2573 * Convert a data fork extent from unwritten to real or vice versa.
2574 *
2575 * Note that tp can be NULL here as no transaction is used for COW fork
2576 * unwritten conversion.
2577 */
2578void
2579xfs_rmap_convert_extent(
2580 struct xfs_mount *mp,
2581 struct xfs_trans *tp,
2582 struct xfs_inode *ip,
2583 int whichfork,
2584 struct xfs_bmbt_irec *PREV)
2585{
2586 enum xfs_rmap_intent_type type = XFS_RMAP_CONVERT;
2587
2588 if (!xfs_rmap_update_is_needed(mp, whichfork))
2589 return;
2590
2591 if (whichfork != XFS_ATTR_FORK && xfs_is_reflink_inode(ip))
2592 type = XFS_RMAP_CONVERT_SHARED;
2593
2594 __xfs_rmap_add(tp, type, ip->i_ino, whichfork, PREV);
2595}
2596
2597/* Schedule the creation of an rmap for non-file data. */
2598void
2599xfs_rmap_alloc_extent(
2600 struct xfs_trans *tp,
2601 xfs_agnumber_t agno,
2602 xfs_agblock_t bno,
2603 xfs_extlen_t len,
2604 uint64_t owner)
2605{
2606 struct xfs_bmbt_irec bmap;
2607
2608 if (!xfs_rmap_update_is_needed(tp->t_mountp, XFS_DATA_FORK))
2609 return;
2610
2611 bmap.br_startblock = XFS_AGB_TO_FSB(tp->t_mountp, agno, bno);
2612 bmap.br_blockcount = len;
2613 bmap.br_startoff = 0;
2614 bmap.br_state = XFS_EXT_NORM;
2615
2616 __xfs_rmap_add(tp, XFS_RMAP_ALLOC, owner, XFS_DATA_FORK, &bmap);
2617}
2618
2619/* Schedule the deletion of an rmap for non-file data. */
2620void
2621xfs_rmap_free_extent(
2622 struct xfs_trans *tp,
2623 xfs_agnumber_t agno,
2624 xfs_agblock_t bno,
2625 xfs_extlen_t len,
2626 uint64_t owner)
2627{
2628 struct xfs_bmbt_irec bmap;
2629
2630 if (!xfs_rmap_update_is_needed(tp->t_mountp, XFS_DATA_FORK))
2631 return;
2632
2633 bmap.br_startblock = XFS_AGB_TO_FSB(tp->t_mountp, agno, bno);
2634 bmap.br_blockcount = len;
2635 bmap.br_startoff = 0;
2636 bmap.br_state = XFS_EXT_NORM;
2637
2638 __xfs_rmap_add(tp, XFS_RMAP_FREE, owner, XFS_DATA_FORK, &bmap);
2639}
2640
2641/* Compare rmap records. Returns -1 if a < b, 1 if a > b, and 0 if equal. */
2642int
2643xfs_rmap_compare(
2644 const struct xfs_rmap_irec *a,
2645 const struct xfs_rmap_irec *b)
2646{
2647 __u64 oa;
2648 __u64 ob;
2649
2650 oa = xfs_rmap_irec_offset_pack(a);
2651 ob = xfs_rmap_irec_offset_pack(b);
2652
2653 if (a->rm_startblock < b->rm_startblock)
2654 return -1;
2655 else if (a->rm_startblock > b->rm_startblock)
2656 return 1;
2657 else if (a->rm_owner < b->rm_owner)
2658 return -1;
2659 else if (a->rm_owner > b->rm_owner)
2660 return 1;
2661 else if (oa < ob)
2662 return -1;
2663 else if (oa > ob)
2664 return 1;
2665 else
2666 return 0;
2667}
2668
2669/* Is there a record covering a given extent? */
2670int
2671xfs_rmap_has_record(
2672 struct xfs_btree_cur *cur,
2673 xfs_agblock_t bno,
2674 xfs_extlen_t len,
2675 bool *exists)
2676{
2677 union xfs_btree_irec low;
2678 union xfs_btree_irec high;
2679
2680 memset(&low, 0, sizeof(low));
2681 low.r.rm_startblock = bno;
2682 memset(&high, 0xFF, sizeof(high));
2683 high.r.rm_startblock = bno + len - 1;
2684
2685 return xfs_btree_has_record(cur, &low, &high, exists);
2686}
2687
2688/*
2689 * Is there a record for this owner completely covering a given physical
2690 * extent? If so, *has_rmap will be set to true. If there is no record
2691 * or the record only covers part of the range, we set *has_rmap to false.
2692 * This function doesn't perform range lookups or offset checks, so it is
2693 * not suitable for checking data fork blocks.
2694 */
2695int
2696xfs_rmap_record_exists(
2697 struct xfs_btree_cur *cur,
2698 xfs_agblock_t bno,
2699 xfs_extlen_t len,
2700 const struct xfs_owner_info *oinfo,
2701 bool *has_rmap)
2702{
2703 uint64_t owner;
2704 uint64_t offset;
2705 unsigned int flags;
2706 int has_record;
2707 struct xfs_rmap_irec irec;
2708 int error;
2709
2710 xfs_owner_info_unpack(oinfo, &owner, &offset, &flags);
2711 ASSERT(XFS_RMAP_NON_INODE_OWNER(owner) ||
2712 (flags & XFS_RMAP_BMBT_BLOCK));
2713
2714 error = xfs_rmap_lookup_le(cur, bno, owner, offset, flags, &irec,
2715 &has_record);
2716 if (error)
2717 return error;
2718 if (!has_record) {
2719 *has_rmap = false;
2720 return 0;
2721 }
2722
2723 *has_rmap = (irec.rm_owner == owner && irec.rm_startblock <= bno &&
2724 irec.rm_startblock + irec.rm_blockcount >= bno + len);
2725 return 0;
2726}
2727
2728struct xfs_rmap_key_state {
2729 uint64_t owner;
2730 uint64_t offset;
2731 unsigned int flags;
2732};
2733
2734/* For each rmap given, figure out if it doesn't match the key we want. */
2735STATIC int
2736xfs_rmap_has_other_keys_helper(
2737 struct xfs_btree_cur *cur,
2738 const struct xfs_rmap_irec *rec,
2739 void *priv)
2740{
2741 struct xfs_rmap_key_state *rks = priv;
2742
2743 if (rks->owner == rec->rm_owner && rks->offset == rec->rm_offset &&
2744 ((rks->flags & rec->rm_flags) & XFS_RMAP_KEY_FLAGS) == rks->flags)
2745 return 0;
2746 return -ECANCELED;
2747}
2748
2749/*
2750 * Given an extent and some owner info, can we find records overlapping
2751 * the extent whose owner info does not match the given owner?
2752 */
2753int
2754xfs_rmap_has_other_keys(
2755 struct xfs_btree_cur *cur,
2756 xfs_agblock_t bno,
2757 xfs_extlen_t len,
2758 const struct xfs_owner_info *oinfo,
2759 bool *has_rmap)
2760{
2761 struct xfs_rmap_irec low = {0};
2762 struct xfs_rmap_irec high;
2763 struct xfs_rmap_key_state rks;
2764 int error;
2765
2766 xfs_owner_info_unpack(oinfo, &rks.owner, &rks.offset, &rks.flags);
2767 *has_rmap = false;
2768
2769 low.rm_startblock = bno;
2770 memset(&high, 0xFF, sizeof(high));
2771 high.rm_startblock = bno + len - 1;
2772
2773 error = xfs_rmap_query_range(cur, &low, &high,
2774 xfs_rmap_has_other_keys_helper, &rks);
2775 if (error == -ECANCELED) {
2776 *has_rmap = true;
2777 return 0;
2778 }
2779
2780 return error;
2781}
2782
2783const struct xfs_owner_info XFS_RMAP_OINFO_SKIP_UPDATE = {
2784 .oi_owner = XFS_RMAP_OWN_NULL,
2785};
2786const struct xfs_owner_info XFS_RMAP_OINFO_ANY_OWNER = {
2787 .oi_owner = XFS_RMAP_OWN_UNKNOWN,
2788};
2789const struct xfs_owner_info XFS_RMAP_OINFO_FS = {
2790 .oi_owner = XFS_RMAP_OWN_FS,
2791};
2792const struct xfs_owner_info XFS_RMAP_OINFO_LOG = {
2793 .oi_owner = XFS_RMAP_OWN_LOG,
2794};
2795const struct xfs_owner_info XFS_RMAP_OINFO_AG = {
2796 .oi_owner = XFS_RMAP_OWN_AG,
2797};
2798const struct xfs_owner_info XFS_RMAP_OINFO_INOBT = {
2799 .oi_owner = XFS_RMAP_OWN_INOBT,
2800};
2801const struct xfs_owner_info XFS_RMAP_OINFO_INODES = {
2802 .oi_owner = XFS_RMAP_OWN_INODES,
2803};
2804const struct xfs_owner_info XFS_RMAP_OINFO_REFC = {
2805 .oi_owner = XFS_RMAP_OWN_REFC,
2806};
2807const struct xfs_owner_info XFS_RMAP_OINFO_COW = {
2808 .oi_owner = XFS_RMAP_OWN_COW,
2809};
2810
2811int __init
2812xfs_rmap_intent_init_cache(void)
2813{
2814 xfs_rmap_intent_cache = kmem_cache_create("xfs_rmap_intent",
2815 sizeof(struct xfs_rmap_intent),
2816 0, 0, NULL);
2817
2818 return xfs_rmap_intent_cache != NULL ? 0 : -ENOMEM;
2819}
2820
2821void
2822xfs_rmap_intent_destroy_cache(void)
2823{
2824 kmem_cache_destroy(xfs_rmap_intent_cache);
2825 xfs_rmap_intent_cache = NULL;
2826}