Merge tag 'm68knommu-for-v6.2' of git://git.kernel.org/pub/scm/linux/kernel/git/gerg...
[platform/kernel/linux-starfive.git] / fs / xfs / scrub / bmap.c
1 // SPDX-License-Identifier: GPL-2.0+
2 /*
3  * Copyright (C) 2017 Oracle.  All Rights Reserved.
4  * Author: Darrick J. Wong <darrick.wong@oracle.com>
5  */
6 #include "xfs.h"
7 #include "xfs_fs.h"
8 #include "xfs_shared.h"
9 #include "xfs_format.h"
10 #include "xfs_trans_resv.h"
11 #include "xfs_mount.h"
12 #include "xfs_btree.h"
13 #include "xfs_bit.h"
14 #include "xfs_log_format.h"
15 #include "xfs_trans.h"
16 #include "xfs_inode.h"
17 #include "xfs_alloc.h"
18 #include "xfs_bmap.h"
19 #include "xfs_bmap_btree.h"
20 #include "xfs_rmap.h"
21 #include "xfs_rmap_btree.h"
22 #include "scrub/scrub.h"
23 #include "scrub/common.h"
24 #include "scrub/btree.h"
25 #include "xfs_ag.h"
26
27 /* Set us up with an inode's bmap. */
28 int
29 xchk_setup_inode_bmap(
30         struct xfs_scrub        *sc)
31 {
32         int                     error;
33
34         error = xchk_get_inode(sc);
35         if (error)
36                 goto out;
37
38         sc->ilock_flags = XFS_IOLOCK_EXCL | XFS_MMAPLOCK_EXCL;
39         xfs_ilock(sc->ip, sc->ilock_flags);
40
41         /*
42          * We don't want any ephemeral data fork updates sitting around
43          * while we inspect block mappings, so wait for directio to finish
44          * and flush dirty data if we have delalloc reservations.
45          */
46         if (S_ISREG(VFS_I(sc->ip)->i_mode) &&
47             sc->sm->sm_type == XFS_SCRUB_TYPE_BMBTD) {
48                 struct address_space    *mapping = VFS_I(sc->ip)->i_mapping;
49
50                 inode_dio_wait(VFS_I(sc->ip));
51
52                 /*
53                  * Try to flush all incore state to disk before we examine the
54                  * space mappings for the data fork.  Leave accumulated errors
55                  * in the mapping for the writer threads to consume.
56                  *
57                  * On ENOSPC or EIO writeback errors, we continue into the
58                  * extent mapping checks because write failures do not
59                  * necessarily imply anything about the correctness of the file
60                  * metadata.  The metadata and the file data could be on
61                  * completely separate devices; a media failure might only
62                  * affect a subset of the disk, etc.  We can handle delalloc
63                  * extents in the scrubber, so leaving them in memory is fine.
64                  */
65                 error = filemap_fdatawrite(mapping);
66                 if (!error)
67                         error = filemap_fdatawait_keep_errors(mapping);
68                 if (error && (error != -ENOSPC && error != -EIO))
69                         goto out;
70         }
71
72         /* Got the inode, lock it and we're ready to go. */
73         error = xchk_trans_alloc(sc, 0);
74         if (error)
75                 goto out;
76         sc->ilock_flags |= XFS_ILOCK_EXCL;
77         xfs_ilock(sc->ip, XFS_ILOCK_EXCL);
78
79 out:
80         /* scrub teardown will unlock and release the inode */
81         return error;
82 }
83
84 /*
85  * Inode fork block mapping (BMBT) scrubber.
86  * More complex than the others because we have to scrub
87  * all the extents regardless of whether or not the fork
88  * is in btree format.
89  */
90
91 struct xchk_bmap_info {
92         struct xfs_scrub        *sc;
93         struct xfs_iext_cursor  icur;
94         xfs_fileoff_t           lastoff;
95         bool                    is_rt;
96         bool                    is_shared;
97         bool                    was_loaded;
98         int                     whichfork;
99 };
100
101 /* Look for a corresponding rmap for this irec. */
102 static inline bool
103 xchk_bmap_get_rmap(
104         struct xchk_bmap_info   *info,
105         struct xfs_bmbt_irec    *irec,
106         xfs_agblock_t           agbno,
107         uint64_t                owner,
108         struct xfs_rmap_irec    *rmap)
109 {
110         xfs_fileoff_t           offset;
111         unsigned int            rflags = 0;
112         int                     has_rmap;
113         int                     error;
114
115         if (info->whichfork == XFS_ATTR_FORK)
116                 rflags |= XFS_RMAP_ATTR_FORK;
117         if (irec->br_state == XFS_EXT_UNWRITTEN)
118                 rflags |= XFS_RMAP_UNWRITTEN;
119
120         /*
121          * CoW staging extents are owned (on disk) by the refcountbt, so
122          * their rmaps do not have offsets.
123          */
124         if (info->whichfork == XFS_COW_FORK)
125                 offset = 0;
126         else
127                 offset = irec->br_startoff;
128
129         /*
130          * If the caller thinks this could be a shared bmbt extent (IOWs,
131          * any data fork extent of a reflink inode) then we have to use the
132          * range rmap lookup to make sure we get the correct owner/offset.
133          */
134         if (info->is_shared) {
135                 error = xfs_rmap_lookup_le_range(info->sc->sa.rmap_cur, agbno,
136                                 owner, offset, rflags, rmap, &has_rmap);
137         } else {
138                 error = xfs_rmap_lookup_le(info->sc->sa.rmap_cur, agbno,
139                                 owner, offset, rflags, rmap, &has_rmap);
140         }
141         if (!xchk_should_check_xref(info->sc, &error, &info->sc->sa.rmap_cur))
142                 return false;
143
144         if (!has_rmap)
145                 xchk_fblock_xref_set_corrupt(info->sc, info->whichfork,
146                         irec->br_startoff);
147         return has_rmap;
148 }
149
150 static inline bool
151 xchk_bmap_has_prev(
152         struct xchk_bmap_info   *info,
153         struct xfs_bmbt_irec    *irec)
154 {
155         struct xfs_bmbt_irec    got;
156         struct xfs_ifork        *ifp;
157
158         ifp = xfs_ifork_ptr(info->sc->ip, info->whichfork);
159
160         if (!xfs_iext_peek_prev_extent(ifp, &info->icur, &got))
161                 return false;
162         if (got.br_startoff + got.br_blockcount != irec->br_startoff)
163                 return false;
164         if (got.br_startblock + got.br_blockcount != irec->br_startblock)
165                 return false;
166         if (got.br_state != irec->br_state)
167                 return false;
168         return true;
169 }
170
171 static inline bool
172 xchk_bmap_has_next(
173         struct xchk_bmap_info   *info,
174         struct xfs_bmbt_irec    *irec)
175 {
176         struct xfs_bmbt_irec    got;
177         struct xfs_ifork        *ifp;
178
179         ifp = xfs_ifork_ptr(info->sc->ip, info->whichfork);
180
181         if (!xfs_iext_peek_next_extent(ifp, &info->icur, &got))
182                 return false;
183         if (irec->br_startoff + irec->br_blockcount != got.br_startoff)
184                 return false;
185         if (irec->br_startblock + irec->br_blockcount != got.br_startblock)
186                 return false;
187         if (got.br_state != irec->br_state)
188                 return false;
189         return true;
190 }
191
192 /* Make sure that we have rmapbt records for this extent. */
193 STATIC void
194 xchk_bmap_xref_rmap(
195         struct xchk_bmap_info   *info,
196         struct xfs_bmbt_irec    *irec,
197         xfs_agblock_t           agbno)
198 {
199         struct xfs_rmap_irec    rmap;
200         unsigned long long      rmap_end;
201         uint64_t                owner;
202
203         if (!info->sc->sa.rmap_cur || xchk_skip_xref(info->sc->sm))
204                 return;
205
206         if (info->whichfork == XFS_COW_FORK)
207                 owner = XFS_RMAP_OWN_COW;
208         else
209                 owner = info->sc->ip->i_ino;
210
211         /* Find the rmap record for this irec. */
212         if (!xchk_bmap_get_rmap(info, irec, agbno, owner, &rmap))
213                 return;
214
215         /* Check the rmap. */
216         rmap_end = (unsigned long long)rmap.rm_startblock + rmap.rm_blockcount;
217         if (rmap.rm_startblock > agbno ||
218             agbno + irec->br_blockcount > rmap_end)
219                 xchk_fblock_xref_set_corrupt(info->sc, info->whichfork,
220                                 irec->br_startoff);
221
222         /*
223          * Check the logical offsets if applicable.  CoW staging extents
224          * don't track logical offsets since the mappings only exist in
225          * memory.
226          */
227         if (info->whichfork != XFS_COW_FORK) {
228                 rmap_end = (unsigned long long)rmap.rm_offset +
229                                 rmap.rm_blockcount;
230                 if (rmap.rm_offset > irec->br_startoff ||
231                     irec->br_startoff + irec->br_blockcount > rmap_end)
232                         xchk_fblock_xref_set_corrupt(info->sc,
233                                         info->whichfork, irec->br_startoff);
234         }
235
236         if (rmap.rm_owner != owner)
237                 xchk_fblock_xref_set_corrupt(info->sc, info->whichfork,
238                                 irec->br_startoff);
239
240         /*
241          * Check for discrepancies between the unwritten flag in the irec and
242          * the rmap.  Note that the (in-memory) CoW fork distinguishes between
243          * unwritten and written extents, but we don't track that in the rmap
244          * records because the blocks are owned (on-disk) by the refcountbt,
245          * which doesn't track unwritten state.
246          */
247         if (owner != XFS_RMAP_OWN_COW &&
248             !!(irec->br_state == XFS_EXT_UNWRITTEN) !=
249             !!(rmap.rm_flags & XFS_RMAP_UNWRITTEN))
250                 xchk_fblock_xref_set_corrupt(info->sc, info->whichfork,
251                                 irec->br_startoff);
252
253         if (!!(info->whichfork == XFS_ATTR_FORK) !=
254             !!(rmap.rm_flags & XFS_RMAP_ATTR_FORK))
255                 xchk_fblock_xref_set_corrupt(info->sc, info->whichfork,
256                                 irec->br_startoff);
257         if (rmap.rm_flags & XFS_RMAP_BMBT_BLOCK)
258                 xchk_fblock_xref_set_corrupt(info->sc, info->whichfork,
259                                 irec->br_startoff);
260
261         /*
262          * If the rmap starts before this bmbt record, make sure there's a bmbt
263          * record for the previous offset that is contiguous with this mapping.
264          * Skip this for CoW fork extents because the refcount btree (and not
265          * the inode) is the ondisk owner for those extents.
266          */
267         if (info->whichfork != XFS_COW_FORK && rmap.rm_startblock < agbno &&
268             !xchk_bmap_has_prev(info, irec)) {
269                 xchk_fblock_xref_set_corrupt(info->sc, info->whichfork,
270                                 irec->br_startoff);
271                 return;
272         }
273
274         /*
275          * If the rmap ends after this bmbt record, make sure there's a bmbt
276          * record for the next offset that is contiguous with this mapping.
277          * Skip this for CoW fork extents because the refcount btree (and not
278          * the inode) is the ondisk owner for those extents.
279          */
280         rmap_end = (unsigned long long)rmap.rm_startblock + rmap.rm_blockcount;
281         if (info->whichfork != XFS_COW_FORK &&
282             rmap_end > agbno + irec->br_blockcount &&
283             !xchk_bmap_has_next(info, irec)) {
284                 xchk_fblock_xref_set_corrupt(info->sc, info->whichfork,
285                                 irec->br_startoff);
286                 return;
287         }
288 }
289
290 /* Cross-reference a single rtdev extent record. */
291 STATIC void
292 xchk_bmap_rt_iextent_xref(
293         struct xfs_inode        *ip,
294         struct xchk_bmap_info   *info,
295         struct xfs_bmbt_irec    *irec)
296 {
297         xchk_xref_is_used_rt_space(info->sc, irec->br_startblock,
298                         irec->br_blockcount);
299 }
300
301 /* Cross-reference a single datadev extent record. */
302 STATIC void
303 xchk_bmap_iextent_xref(
304         struct xfs_inode        *ip,
305         struct xchk_bmap_info   *info,
306         struct xfs_bmbt_irec    *irec)
307 {
308         struct xfs_mount        *mp = info->sc->mp;
309         xfs_agnumber_t          agno;
310         xfs_agblock_t           agbno;
311         xfs_extlen_t            len;
312         int                     error;
313
314         agno = XFS_FSB_TO_AGNO(mp, irec->br_startblock);
315         agbno = XFS_FSB_TO_AGBNO(mp, irec->br_startblock);
316         len = irec->br_blockcount;
317
318         error = xchk_ag_init_existing(info->sc, agno, &info->sc->sa);
319         if (!xchk_fblock_process_error(info->sc, info->whichfork,
320                         irec->br_startoff, &error))
321                 goto out_free;
322
323         xchk_xref_is_used_space(info->sc, agbno, len);
324         xchk_xref_is_not_inode_chunk(info->sc, agbno, len);
325         xchk_bmap_xref_rmap(info, irec, agbno);
326         switch (info->whichfork) {
327         case XFS_DATA_FORK:
328                 if (xfs_is_reflink_inode(info->sc->ip))
329                         break;
330                 fallthrough;
331         case XFS_ATTR_FORK:
332                 xchk_xref_is_not_shared(info->sc, agbno,
333                                 irec->br_blockcount);
334                 break;
335         case XFS_COW_FORK:
336                 xchk_xref_is_cow_staging(info->sc, agbno,
337                                 irec->br_blockcount);
338                 xchk_xref_is_not_shared(info->sc, agbno,
339                                 irec->br_blockcount);
340                 break;
341         }
342
343 out_free:
344         xchk_ag_free(info->sc, &info->sc->sa);
345 }
346
347 /*
348  * Directories and attr forks should never have blocks that can't be addressed
349  * by a xfs_dablk_t.
350  */
351 STATIC void
352 xchk_bmap_dirattr_extent(
353         struct xfs_inode        *ip,
354         struct xchk_bmap_info   *info,
355         struct xfs_bmbt_irec    *irec)
356 {
357         struct xfs_mount        *mp = ip->i_mount;
358         xfs_fileoff_t           off;
359
360         if (!S_ISDIR(VFS_I(ip)->i_mode) && info->whichfork != XFS_ATTR_FORK)
361                 return;
362
363         if (!xfs_verify_dablk(mp, irec->br_startoff))
364                 xchk_fblock_set_corrupt(info->sc, info->whichfork,
365                                 irec->br_startoff);
366
367         off = irec->br_startoff + irec->br_blockcount - 1;
368         if (!xfs_verify_dablk(mp, off))
369                 xchk_fblock_set_corrupt(info->sc, info->whichfork, off);
370 }
371
372 /* Scrub a single extent record. */
373 STATIC void
374 xchk_bmap_iextent(
375         struct xfs_inode        *ip,
376         struct xchk_bmap_info   *info,
377         struct xfs_bmbt_irec    *irec)
378 {
379         struct xfs_mount        *mp = info->sc->mp;
380
381         /*
382          * Check for out-of-order extents.  This record could have come
383          * from the incore list, for which there is no ordering check.
384          */
385         if (irec->br_startoff < info->lastoff)
386                 xchk_fblock_set_corrupt(info->sc, info->whichfork,
387                                 irec->br_startoff);
388
389         if (!xfs_verify_fileext(mp, irec->br_startoff, irec->br_blockcount))
390                 xchk_fblock_set_corrupt(info->sc, info->whichfork,
391                                 irec->br_startoff);
392
393         xchk_bmap_dirattr_extent(ip, info, irec);
394
395         /* There should never be a "hole" extent in either extent list. */
396         if (irec->br_startblock == HOLESTARTBLOCK)
397                 xchk_fblock_set_corrupt(info->sc, info->whichfork,
398                                 irec->br_startoff);
399
400         /* Make sure the extent points to a valid place. */
401         if (irec->br_blockcount > XFS_MAX_BMBT_EXTLEN)
402                 xchk_fblock_set_corrupt(info->sc, info->whichfork,
403                                 irec->br_startoff);
404         if (info->is_rt &&
405             !xfs_verify_rtext(mp, irec->br_startblock, irec->br_blockcount))
406                 xchk_fblock_set_corrupt(info->sc, info->whichfork,
407                                 irec->br_startoff);
408         if (!info->is_rt &&
409             !xfs_verify_fsbext(mp, irec->br_startblock, irec->br_blockcount))
410                 xchk_fblock_set_corrupt(info->sc, info->whichfork,
411                                 irec->br_startoff);
412
413         /* We don't allow unwritten extents on attr forks. */
414         if (irec->br_state == XFS_EXT_UNWRITTEN &&
415             info->whichfork == XFS_ATTR_FORK)
416                 xchk_fblock_set_corrupt(info->sc, info->whichfork,
417                                 irec->br_startoff);
418
419         if (info->sc->sm->sm_flags & XFS_SCRUB_OFLAG_CORRUPT)
420                 return;
421
422         if (info->is_rt)
423                 xchk_bmap_rt_iextent_xref(ip, info, irec);
424         else
425                 xchk_bmap_iextent_xref(ip, info, irec);
426 }
427
428 /* Scrub a bmbt record. */
429 STATIC int
430 xchk_bmapbt_rec(
431         struct xchk_btree       *bs,
432         const union xfs_btree_rec *rec)
433 {
434         struct xfs_bmbt_irec    irec;
435         struct xfs_bmbt_irec    iext_irec;
436         struct xfs_iext_cursor  icur;
437         struct xchk_bmap_info   *info = bs->private;
438         struct xfs_inode        *ip = bs->cur->bc_ino.ip;
439         struct xfs_buf          *bp = NULL;
440         struct xfs_btree_block  *block;
441         struct xfs_ifork        *ifp = xfs_ifork_ptr(ip, info->whichfork);
442         uint64_t                owner;
443         int                     i;
444
445         /*
446          * Check the owners of the btree blocks up to the level below
447          * the root since the verifiers don't do that.
448          */
449         if (xfs_has_crc(bs->cur->bc_mp) &&
450             bs->cur->bc_levels[0].ptr == 1) {
451                 for (i = 0; i < bs->cur->bc_nlevels - 1; i++) {
452                         block = xfs_btree_get_block(bs->cur, i, &bp);
453                         owner = be64_to_cpu(block->bb_u.l.bb_owner);
454                         if (owner != ip->i_ino)
455                                 xchk_fblock_set_corrupt(bs->sc,
456                                                 info->whichfork, 0);
457                 }
458         }
459
460         /*
461          * Check that the incore extent tree contains an extent that matches
462          * this one exactly.  We validate those cached bmaps later, so we don't
463          * need to check them here.  If the incore extent tree was just loaded
464          * from disk by the scrubber, we assume that its contents match what's
465          * on disk (we still hold the ILOCK) and skip the equivalence check.
466          */
467         if (!info->was_loaded)
468                 return 0;
469
470         xfs_bmbt_disk_get_all(&rec->bmbt, &irec);
471         if (!xfs_iext_lookup_extent(ip, ifp, irec.br_startoff, &icur,
472                                 &iext_irec) ||
473             irec.br_startoff != iext_irec.br_startoff ||
474             irec.br_startblock != iext_irec.br_startblock ||
475             irec.br_blockcount != iext_irec.br_blockcount ||
476             irec.br_state != iext_irec.br_state)
477                 xchk_fblock_set_corrupt(bs->sc, info->whichfork,
478                                 irec.br_startoff);
479         return 0;
480 }
481
482 /* Scan the btree records. */
483 STATIC int
484 xchk_bmap_btree(
485         struct xfs_scrub        *sc,
486         int                     whichfork,
487         struct xchk_bmap_info   *info)
488 {
489         struct xfs_owner_info   oinfo;
490         struct xfs_ifork        *ifp = xfs_ifork_ptr(sc->ip, whichfork);
491         struct xfs_mount        *mp = sc->mp;
492         struct xfs_inode        *ip = sc->ip;
493         struct xfs_btree_cur    *cur;
494         int                     error;
495
496         /* Load the incore bmap cache if it's not loaded. */
497         info->was_loaded = !xfs_need_iread_extents(ifp);
498
499         error = xfs_iread_extents(sc->tp, ip, whichfork);
500         if (!xchk_fblock_process_error(sc, whichfork, 0, &error))
501                 goto out;
502
503         /* Check the btree structure. */
504         cur = xfs_bmbt_init_cursor(mp, sc->tp, ip, whichfork);
505         xfs_rmap_ino_bmbt_owner(&oinfo, ip->i_ino, whichfork);
506         error = xchk_btree(sc, cur, xchk_bmapbt_rec, &oinfo, info);
507         xfs_btree_del_cursor(cur, error);
508 out:
509         return error;
510 }
511
512 struct xchk_bmap_check_rmap_info {
513         struct xfs_scrub        *sc;
514         int                     whichfork;
515         struct xfs_iext_cursor  icur;
516 };
517
518 /* Can we find bmaps that fit this rmap? */
519 STATIC int
520 xchk_bmap_check_rmap(
521         struct xfs_btree_cur            *cur,
522         const struct xfs_rmap_irec      *rec,
523         void                            *priv)
524 {
525         struct xfs_bmbt_irec            irec;
526         struct xfs_rmap_irec            check_rec;
527         struct xchk_bmap_check_rmap_info        *sbcri = priv;
528         struct xfs_ifork                *ifp;
529         struct xfs_scrub                *sc = sbcri->sc;
530         bool                            have_map;
531
532         /* Is this even the right fork? */
533         if (rec->rm_owner != sc->ip->i_ino)
534                 return 0;
535         if ((sbcri->whichfork == XFS_ATTR_FORK) ^
536             !!(rec->rm_flags & XFS_RMAP_ATTR_FORK))
537                 return 0;
538         if (rec->rm_flags & XFS_RMAP_BMBT_BLOCK)
539                 return 0;
540
541         /* Now look up the bmbt record. */
542         ifp = xfs_ifork_ptr(sc->ip, sbcri->whichfork);
543         if (!ifp) {
544                 xchk_fblock_set_corrupt(sc, sbcri->whichfork,
545                                 rec->rm_offset);
546                 goto out;
547         }
548         have_map = xfs_iext_lookup_extent(sc->ip, ifp, rec->rm_offset,
549                         &sbcri->icur, &irec);
550         if (!have_map)
551                 xchk_fblock_set_corrupt(sc, sbcri->whichfork,
552                                 rec->rm_offset);
553         /*
554          * bmap extent record lengths are constrained to 2^21 blocks in length
555          * because of space constraints in the on-disk metadata structure.
556          * However, rmap extent record lengths are constrained only by AG
557          * length, so we have to loop through the bmbt to make sure that the
558          * entire rmap is covered by bmbt records.
559          */
560         check_rec = *rec;
561         while (have_map) {
562                 if (irec.br_startoff != check_rec.rm_offset)
563                         xchk_fblock_set_corrupt(sc, sbcri->whichfork,
564                                         check_rec.rm_offset);
565                 if (irec.br_startblock != XFS_AGB_TO_FSB(sc->mp,
566                                 cur->bc_ag.pag->pag_agno,
567                                 check_rec.rm_startblock))
568                         xchk_fblock_set_corrupt(sc, sbcri->whichfork,
569                                         check_rec.rm_offset);
570                 if (irec.br_blockcount > check_rec.rm_blockcount)
571                         xchk_fblock_set_corrupt(sc, sbcri->whichfork,
572                                         check_rec.rm_offset);
573                 if (sc->sm->sm_flags & XFS_SCRUB_OFLAG_CORRUPT)
574                         break;
575                 check_rec.rm_startblock += irec.br_blockcount;
576                 check_rec.rm_offset += irec.br_blockcount;
577                 check_rec.rm_blockcount -= irec.br_blockcount;
578                 if (check_rec.rm_blockcount == 0)
579                         break;
580                 have_map = xfs_iext_next_extent(ifp, &sbcri->icur, &irec);
581                 if (!have_map)
582                         xchk_fblock_set_corrupt(sc, sbcri->whichfork,
583                                         check_rec.rm_offset);
584         }
585
586 out:
587         if (sc->sm->sm_flags & XFS_SCRUB_OFLAG_CORRUPT)
588                 return -ECANCELED;
589         return 0;
590 }
591
592 /* Make sure each rmap has a corresponding bmbt entry. */
593 STATIC int
594 xchk_bmap_check_ag_rmaps(
595         struct xfs_scrub                *sc,
596         int                             whichfork,
597         struct xfs_perag                *pag)
598 {
599         struct xchk_bmap_check_rmap_info        sbcri;
600         struct xfs_btree_cur            *cur;
601         struct xfs_buf                  *agf;
602         int                             error;
603
604         error = xfs_alloc_read_agf(pag, sc->tp, 0, &agf);
605         if (error)
606                 return error;
607
608         cur = xfs_rmapbt_init_cursor(sc->mp, sc->tp, agf, pag);
609
610         sbcri.sc = sc;
611         sbcri.whichfork = whichfork;
612         error = xfs_rmap_query_all(cur, xchk_bmap_check_rmap, &sbcri);
613         if (error == -ECANCELED)
614                 error = 0;
615
616         xfs_btree_del_cursor(cur, error);
617         xfs_trans_brelse(sc->tp, agf);
618         return error;
619 }
620
621 /* Make sure each rmap has a corresponding bmbt entry. */
622 STATIC int
623 xchk_bmap_check_rmaps(
624         struct xfs_scrub        *sc,
625         int                     whichfork)
626 {
627         struct xfs_ifork        *ifp = xfs_ifork_ptr(sc->ip, whichfork);
628         struct xfs_perag        *pag;
629         xfs_agnumber_t          agno;
630         bool                    zero_size;
631         int                     error;
632
633         if (!xfs_has_rmapbt(sc->mp) ||
634             whichfork == XFS_COW_FORK ||
635             (sc->sm->sm_flags & XFS_SCRUB_OFLAG_CORRUPT))
636                 return 0;
637
638         /* Don't support realtime rmap checks yet. */
639         if (XFS_IS_REALTIME_INODE(sc->ip) && whichfork == XFS_DATA_FORK)
640                 return 0;
641
642         ASSERT(xfs_ifork_ptr(sc->ip, whichfork) != NULL);
643
644         /*
645          * Only do this for complex maps that are in btree format, or for
646          * situations where we would seem to have a size but zero extents.
647          * The inode repair code can zap broken iforks, which means we have
648          * to flag this bmap as corrupt if there are rmaps that need to be
649          * reattached.
650          */
651
652         if (whichfork == XFS_DATA_FORK)
653                 zero_size = i_size_read(VFS_I(sc->ip)) == 0;
654         else
655                 zero_size = false;
656
657         if (ifp->if_format != XFS_DINODE_FMT_BTREE &&
658             (zero_size || ifp->if_nextents > 0))
659                 return 0;
660
661         for_each_perag(sc->mp, agno, pag) {
662                 error = xchk_bmap_check_ag_rmaps(sc, whichfork, pag);
663                 if (error ||
664                     (sc->sm->sm_flags & XFS_SCRUB_OFLAG_CORRUPT)) {
665                         xfs_perag_put(pag);
666                         return error;
667                 }
668         }
669
670         return 0;
671 }
672
673 /* Scrub a delalloc reservation from the incore extent map tree. */
674 STATIC void
675 xchk_bmap_iextent_delalloc(
676         struct xfs_inode        *ip,
677         struct xchk_bmap_info   *info,
678         struct xfs_bmbt_irec    *irec)
679 {
680         struct xfs_mount        *mp = info->sc->mp;
681
682         /*
683          * Check for out-of-order extents.  This record could have come
684          * from the incore list, for which there is no ordering check.
685          */
686         if (irec->br_startoff < info->lastoff)
687                 xchk_fblock_set_corrupt(info->sc, info->whichfork,
688                                 irec->br_startoff);
689
690         if (!xfs_verify_fileext(mp, irec->br_startoff, irec->br_blockcount))
691                 xchk_fblock_set_corrupt(info->sc, info->whichfork,
692                                 irec->br_startoff);
693
694         /* Make sure the extent points to a valid place. */
695         if (irec->br_blockcount > XFS_MAX_BMBT_EXTLEN)
696                 xchk_fblock_set_corrupt(info->sc, info->whichfork,
697                                 irec->br_startoff);
698 }
699
700 /*
701  * Scrub an inode fork's block mappings.
702  *
703  * First we scan every record in every btree block, if applicable.
704  * Then we unconditionally scan the incore extent cache.
705  */
706 STATIC int
707 xchk_bmap(
708         struct xfs_scrub        *sc,
709         int                     whichfork)
710 {
711         struct xfs_bmbt_irec    irec;
712         struct xchk_bmap_info   info = { NULL };
713         struct xfs_mount        *mp = sc->mp;
714         struct xfs_inode        *ip = sc->ip;
715         struct xfs_ifork        *ifp = xfs_ifork_ptr(ip, whichfork);
716         xfs_fileoff_t           endoff;
717         int                     error = 0;
718
719         /* Non-existent forks can be ignored. */
720         if (!ifp)
721                 goto out;
722
723         info.is_rt = whichfork == XFS_DATA_FORK && XFS_IS_REALTIME_INODE(ip);
724         info.whichfork = whichfork;
725         info.is_shared = whichfork == XFS_DATA_FORK && xfs_is_reflink_inode(ip);
726         info.sc = sc;
727
728         switch (whichfork) {
729         case XFS_COW_FORK:
730                 /* No CoW forks on non-reflink inodes/filesystems. */
731                 if (!xfs_is_reflink_inode(ip)) {
732                         xchk_ino_set_corrupt(sc, sc->ip->i_ino);
733                         goto out;
734                 }
735                 break;
736         case XFS_ATTR_FORK:
737                 if (!xfs_has_attr(mp) && !xfs_has_attr2(mp))
738                         xchk_ino_set_corrupt(sc, sc->ip->i_ino);
739                 break;
740         default:
741                 ASSERT(whichfork == XFS_DATA_FORK);
742                 break;
743         }
744
745         /* Check the fork values */
746         switch (ifp->if_format) {
747         case XFS_DINODE_FMT_UUID:
748         case XFS_DINODE_FMT_DEV:
749         case XFS_DINODE_FMT_LOCAL:
750                 /* No mappings to check. */
751                 if (whichfork == XFS_COW_FORK)
752                         xchk_fblock_set_corrupt(sc, whichfork, 0);
753                 goto out;
754         case XFS_DINODE_FMT_EXTENTS:
755                 break;
756         case XFS_DINODE_FMT_BTREE:
757                 if (whichfork == XFS_COW_FORK) {
758                         xchk_fblock_set_corrupt(sc, whichfork, 0);
759                         goto out;
760                 }
761
762                 error = xchk_bmap_btree(sc, whichfork, &info);
763                 if (error)
764                         goto out;
765                 break;
766         default:
767                 xchk_fblock_set_corrupt(sc, whichfork, 0);
768                 goto out;
769         }
770
771         if (sc->sm->sm_flags & XFS_SCRUB_OFLAG_CORRUPT)
772                 goto out;
773
774         /* Find the offset of the last extent in the mapping. */
775         error = xfs_bmap_last_offset(ip, &endoff, whichfork);
776         if (!xchk_fblock_process_error(sc, whichfork, 0, &error))
777                 goto out;
778
779         /* Scrub extent records. */
780         info.lastoff = 0;
781         ifp = xfs_ifork_ptr(ip, whichfork);
782         for_each_xfs_iext(ifp, &info.icur, &irec) {
783                 if (xchk_should_terminate(sc, &error) ||
784                     (sc->sm->sm_flags & XFS_SCRUB_OFLAG_CORRUPT))
785                         goto out;
786
787                 if (irec.br_startoff >= endoff) {
788                         xchk_fblock_set_corrupt(sc, whichfork,
789                                         irec.br_startoff);
790                         goto out;
791                 }
792
793                 if (isnullstartblock(irec.br_startblock))
794                         xchk_bmap_iextent_delalloc(ip, &info, &irec);
795                 else
796                         xchk_bmap_iextent(ip, &info, &irec);
797                 info.lastoff = irec.br_startoff + irec.br_blockcount;
798         }
799
800         error = xchk_bmap_check_rmaps(sc, whichfork);
801         if (!xchk_fblock_xref_process_error(sc, whichfork, 0, &error))
802                 goto out;
803 out:
804         return error;
805 }
806
807 /* Scrub an inode's data fork. */
808 int
809 xchk_bmap_data(
810         struct xfs_scrub        *sc)
811 {
812         return xchk_bmap(sc, XFS_DATA_FORK);
813 }
814
815 /* Scrub an inode's attr fork. */
816 int
817 xchk_bmap_attr(
818         struct xfs_scrub        *sc)
819 {
820         return xchk_bmap(sc, XFS_ATTR_FORK);
821 }
822
823 /* Scrub an inode's CoW fork. */
824 int
825 xchk_bmap_cow(
826         struct xfs_scrub        *sc)
827 {
828         if (!xfs_is_reflink_inode(sc->ip))
829                 return -ENOENT;
830
831         return xchk_bmap(sc, XFS_COW_FORK);
832 }