// SPDX-License-Identifier: GPL-2.0+
/*
 * Copyright (C) 2017 Oracle.  All Rights Reserved.
 * Author: Darrick J. Wong <darrick.wong@oracle.com>
 */
8 #include "xfs_shared.h"
9 #include "xfs_format.h"
10 #include "xfs_trans_resv.h"
11 #include "xfs_mount.h"
12 #include "xfs_log_format.h"
13 #include "xfs_trans.h"
14 #include "xfs_inode.h"
16 #include "xfs_dir2_priv.h"
17 #include "xfs_attr_leaf.h"
18 #include "scrub/scrub.h"
19 #include "scrub/common.h"
20 #include "scrub/trace.h"
21 #include "scrub/dabtree.h"
23 /* Directory/Attribute Btree */
26 * Check for da btree operation errors. See the section about handling
27 * operational errors in common.c.
30 xchk_da_process_error(
31 struct xchk_da_btree
*ds
,
35 struct xfs_scrub
*sc
= ds
->sc
;
42 /* Used to restart an op with deadlock avoidance. */
43 trace_xchk_deadlock_retry(sc
->ip
, sc
->sm
, *error
);
47 /* Note the badness but don't abort. */
48 sc
->sm
->sm_flags
|= XFS_SCRUB_OFLAG_CORRUPT
;
52 trace_xchk_file_op_error(sc
, ds
->dargs
.whichfork
,
53 xfs_dir2_da_to_db(ds
->dargs
.geo
,
54 ds
->state
->path
.blk
[level
].blkno
),
55 *error
, __return_address
);
62 * Check for da btree corruption. See the section about handling
63 * operational errors in common.c.
67 struct xchk_da_btree
*ds
,
70 struct xfs_scrub
*sc
= ds
->sc
;
72 sc
->sm
->sm_flags
|= XFS_SCRUB_OFLAG_CORRUPT
;
74 trace_xchk_fblock_error(sc
, ds
->dargs
.whichfork
,
75 xfs_dir2_da_to_db(ds
->dargs
.geo
,
76 ds
->state
->path
.blk
[level
].blkno
),
80 static struct xfs_da_node_entry
*
81 xchk_da_btree_node_entry(
82 struct xchk_da_btree
*ds
,
85 struct xfs_da_state_blk
*blk
= &ds
->state
->path
.blk
[level
];
86 struct xfs_da3_icnode_hdr hdr
;
88 ASSERT(blk
->magic
== XFS_DA_NODE_MAGIC
);
90 xfs_da3_node_hdr_from_disk(ds
->sc
->mp
, &hdr
, blk
->bp
->b_addr
);
91 return hdr
.btree
+ blk
->index
;
94 /* Scrub a da btree hash (key). */
97 struct xchk_da_btree
*ds
,
101 struct xfs_da_node_entry
*entry
;
103 xfs_dahash_t parent_hash
;
105 /* Is this hash in order? */
106 hash
= be32_to_cpu(*hashp
);
107 if (hash
< ds
->hashes
[level
])
108 xchk_da_set_corrupt(ds
, level
);
109 ds
->hashes
[level
] = hash
;
114 /* Is this hash no larger than the parent hash? */
115 entry
= xchk_da_btree_node_entry(ds
, level
- 1);
116 parent_hash
= be32_to_cpu(entry
->hashval
);
117 if (parent_hash
< hash
)
118 xchk_da_set_corrupt(ds
, level
);
124 * Check a da btree pointer. Returns true if it's ok to use this
128 xchk_da_btree_ptr_ok(
129 struct xchk_da_btree
*ds
,
133 if (blkno
< ds
->lowest
|| (ds
->highest
!= 0 && blkno
>= ds
->highest
)) {
134 xchk_da_set_corrupt(ds
, level
);
142 * The da btree scrubber can handle leaf1 blocks as a degenerate
143 * form of leafn blocks. Since the regular da code doesn't handle
144 * leaf1, we must multiplex the verifiers.
147 xchk_da_btree_read_verify(
150 struct xfs_da_blkinfo
*info
= bp
->b_addr
;
152 switch (be16_to_cpu(info
->magic
)) {
153 case XFS_DIR2_LEAF1_MAGIC
:
154 case XFS_DIR3_LEAF1_MAGIC
:
155 bp
->b_ops
= &xfs_dir3_leaf1_buf_ops
;
156 bp
->b_ops
->verify_read(bp
);
160 * xfs_da3_node_buf_ops already know how to handle
161 * DA*_NODE, ATTR*_LEAF, and DIR*_LEAFN blocks.
163 bp
->b_ops
= &xfs_da3_node_buf_ops
;
164 bp
->b_ops
->verify_read(bp
);
169 xchk_da_btree_write_verify(
172 struct xfs_da_blkinfo
*info
= bp
->b_addr
;
174 switch (be16_to_cpu(info
->magic
)) {
175 case XFS_DIR2_LEAF1_MAGIC
:
176 case XFS_DIR3_LEAF1_MAGIC
:
177 bp
->b_ops
= &xfs_dir3_leaf1_buf_ops
;
178 bp
->b_ops
->verify_write(bp
);
182 * xfs_da3_node_buf_ops already know how to handle
183 * DA*_NODE, ATTR*_LEAF, and DIR*_LEAFN blocks.
185 bp
->b_ops
= &xfs_da3_node_buf_ops
;
186 bp
->b_ops
->verify_write(bp
);
191 xchk_da_btree_verify(
194 struct xfs_da_blkinfo
*info
= bp
->b_addr
;
196 switch (be16_to_cpu(info
->magic
)) {
197 case XFS_DIR2_LEAF1_MAGIC
:
198 case XFS_DIR3_LEAF1_MAGIC
:
199 bp
->b_ops
= &xfs_dir3_leaf1_buf_ops
;
200 return bp
->b_ops
->verify_struct(bp
);
202 bp
->b_ops
= &xfs_da3_node_buf_ops
;
203 return bp
->b_ops
->verify_struct(bp
);
207 static const struct xfs_buf_ops xchk_da_btree_buf_ops
= {
208 .name
= "xchk_da_btree",
209 .verify_read
= xchk_da_btree_read_verify
,
210 .verify_write
= xchk_da_btree_write_verify
,
211 .verify_struct
= xchk_da_btree_verify
,
214 /* Check a block's sibling. */
216 xchk_da_btree_block_check_sibling(
217 struct xchk_da_btree
*ds
,
225 memcpy(&ds
->state
->altpath
, &ds
->state
->path
,
226 sizeof(ds
->state
->altpath
));
229 * If the pointer is null, we shouldn't be able to move the upper
230 * level pointer anywhere.
233 error
= xfs_da3_path_shift(ds
->state
, &ds
->state
->altpath
,
234 direction
, false, &retval
);
235 if (error
== 0 && retval
== 0)
236 xchk_da_set_corrupt(ds
, level
);
241 /* Move the alternate cursor one block in the direction given. */
242 error
= xfs_da3_path_shift(ds
->state
, &ds
->state
->altpath
,
243 direction
, false, &retval
);
244 if (!xchk_da_process_error(ds
, level
, &error
))
247 xchk_da_set_corrupt(ds
, level
);
250 if (ds
->state
->altpath
.blk
[level
].bp
)
251 xchk_buffer_recheck(ds
->sc
,
252 ds
->state
->altpath
.blk
[level
].bp
);
254 /* Compare upper level pointer to sibling pointer. */
255 if (ds
->state
->altpath
.blk
[level
].blkno
!= sibling
)
256 xchk_da_set_corrupt(ds
, level
);
257 if (ds
->state
->altpath
.blk
[level
].bp
) {
258 xfs_trans_brelse(ds
->dargs
.trans
,
259 ds
->state
->altpath
.blk
[level
].bp
);
260 ds
->state
->altpath
.blk
[level
].bp
= NULL
;
266 /* Check a block's sibling pointers. */
268 xchk_da_btree_block_check_siblings(
269 struct xchk_da_btree
*ds
,
271 struct xfs_da_blkinfo
*hdr
)
277 forw
= be32_to_cpu(hdr
->forw
);
278 back
= be32_to_cpu(hdr
->back
);
280 /* Top level blocks should not have sibling pointers. */
282 if (forw
!= 0 || back
!= 0)
283 xchk_da_set_corrupt(ds
, level
);
288 * Check back (left) and forw (right) pointers. These functions
289 * absorb error codes for us.
291 error
= xchk_da_btree_block_check_sibling(ds
, level
, 0, back
);
294 error
= xchk_da_btree_block_check_sibling(ds
, level
, 1, forw
);
297 memset(&ds
->state
->altpath
, 0, sizeof(ds
->state
->altpath
));
301 /* Load a dir/attribute block from a btree. */
304 struct xchk_da_btree
*ds
,
308 struct xfs_da_state_blk
*blk
;
309 struct xfs_da_intnode
*node
;
310 struct xfs_da_node_entry
*btree
;
311 struct xfs_da3_blkinfo
*hdr3
;
312 struct xfs_da_args
*dargs
= &ds
->dargs
;
313 struct xfs_inode
*ip
= ds
->dargs
.dp
;
316 struct xfs_da3_icnode_hdr nodehdr
;
319 blk
= &ds
->state
->path
.blk
[level
];
320 ds
->state
->path
.active
= level
+ 1;
322 /* Release old block. */
324 xfs_trans_brelse(dargs
->trans
, blk
->bp
);
328 /* Check the pointer. */
330 if (!xchk_da_btree_ptr_ok(ds
, level
, blkno
))
333 /* Read the buffer. */
334 error
= xfs_da_read_buf(dargs
->trans
, dargs
->dp
, blk
->blkno
,
335 XFS_DABUF_MAP_HOLE_OK
, &blk
->bp
, dargs
->whichfork
,
336 &xchk_da_btree_buf_ops
);
337 if (!xchk_da_process_error(ds
, level
, &error
))
340 xchk_buffer_recheck(ds
->sc
, blk
->bp
);
343 * We didn't find a dir btree root block, which means that
344 * there's no LEAF1/LEAFN tree (at least not where it's supposed
345 * to be), so jump out now.
347 if (ds
->dargs
.whichfork
== XFS_DATA_FORK
&& level
== 0 &&
351 /* It's /not/ ok for attr trees not to have a da btree. */
352 if (blk
->bp
== NULL
) {
353 xchk_da_set_corrupt(ds
, level
);
357 hdr3
= blk
->bp
->b_addr
;
358 blk
->magic
= be16_to_cpu(hdr3
->hdr
.magic
);
359 pmaxrecs
= &ds
->maxrecs
[level
];
361 /* We only started zeroing the header on v5 filesystems. */
362 if (xfs_sb_version_hascrc(&ds
->sc
->mp
->m_sb
) && hdr3
->hdr
.pad
)
363 xchk_da_set_corrupt(ds
, level
);
365 /* Check the owner. */
366 if (xfs_sb_version_hascrc(&ip
->i_mount
->m_sb
)) {
367 owner
= be64_to_cpu(hdr3
->owner
);
368 if (owner
!= ip
->i_ino
)
369 xchk_da_set_corrupt(ds
, level
);
372 /* Check the siblings. */
373 error
= xchk_da_btree_block_check_siblings(ds
, level
, &hdr3
->hdr
);
377 /* Interpret the buffer. */
378 switch (blk
->magic
) {
379 case XFS_ATTR_LEAF_MAGIC
:
380 case XFS_ATTR3_LEAF_MAGIC
:
381 xfs_trans_buf_set_type(dargs
->trans
, blk
->bp
,
382 XFS_BLFT_ATTR_LEAF_BUF
);
383 blk
->magic
= XFS_ATTR_LEAF_MAGIC
;
384 blk
->hashval
= xfs_attr_leaf_lasthash(blk
->bp
, pmaxrecs
);
385 if (ds
->tree_level
!= 0)
386 xchk_da_set_corrupt(ds
, level
);
388 case XFS_DIR2_LEAFN_MAGIC
:
389 case XFS_DIR3_LEAFN_MAGIC
:
390 xfs_trans_buf_set_type(dargs
->trans
, blk
->bp
,
391 XFS_BLFT_DIR_LEAFN_BUF
);
392 blk
->magic
= XFS_DIR2_LEAFN_MAGIC
;
393 blk
->hashval
= xfs_dir2_leaf_lasthash(ip
, blk
->bp
, pmaxrecs
);
394 if (ds
->tree_level
!= 0)
395 xchk_da_set_corrupt(ds
, level
);
397 case XFS_DIR2_LEAF1_MAGIC
:
398 case XFS_DIR3_LEAF1_MAGIC
:
399 xfs_trans_buf_set_type(dargs
->trans
, blk
->bp
,
400 XFS_BLFT_DIR_LEAF1_BUF
);
401 blk
->magic
= XFS_DIR2_LEAF1_MAGIC
;
402 blk
->hashval
= xfs_dir2_leaf_lasthash(ip
, blk
->bp
, pmaxrecs
);
403 if (ds
->tree_level
!= 0)
404 xchk_da_set_corrupt(ds
, level
);
406 case XFS_DA_NODE_MAGIC
:
407 case XFS_DA3_NODE_MAGIC
:
408 xfs_trans_buf_set_type(dargs
->trans
, blk
->bp
,
409 XFS_BLFT_DA_NODE_BUF
);
410 blk
->magic
= XFS_DA_NODE_MAGIC
;
411 node
= blk
->bp
->b_addr
;
412 xfs_da3_node_hdr_from_disk(ip
->i_mount
, &nodehdr
, node
);
413 btree
= nodehdr
.btree
;
414 *pmaxrecs
= nodehdr
.count
;
415 blk
->hashval
= be32_to_cpu(btree
[*pmaxrecs
- 1].hashval
);
417 if (nodehdr
.level
>= XFS_DA_NODE_MAXDEPTH
) {
418 xchk_da_set_corrupt(ds
, level
);
421 ds
->tree_level
= nodehdr
.level
;
423 if (ds
->tree_level
!= nodehdr
.level
) {
424 xchk_da_set_corrupt(ds
, level
);
429 /* XXX: Check hdr3.pad32 once we know how to fix it. */
432 xchk_da_set_corrupt(ds
, level
);
439 xfs_trans_brelse(dargs
->trans
, blk
->bp
);
446 /* Visit all nodes and leaves of a da btree. */
449 struct xfs_scrub
*sc
,
451 xchk_da_btree_rec_fn scrub_fn
,
454 struct xchk_da_btree ds
= {};
455 struct xfs_mount
*mp
= sc
->mp
;
456 struct xfs_da_state_blk
*blks
;
457 struct xfs_da_node_entry
*key
;
462 /* Skip short format data structures; no btree to scan. */
463 if (!xfs_ifork_has_extents(sc
->ip
, whichfork
))
466 /* Set up initial da state. */
467 ds
.dargs
.dp
= sc
->ip
;
468 ds
.dargs
.whichfork
= whichfork
;
469 ds
.dargs
.trans
= sc
->tp
;
470 ds
.dargs
.op_flags
= XFS_DA_OP_OKNOENT
;
471 ds
.state
= xfs_da_state_alloc();
472 ds
.state
->args
= &ds
.dargs
;
475 ds
.private = private;
476 if (whichfork
== XFS_ATTR_FORK
) {
477 ds
.dargs
.geo
= mp
->m_attr_geo
;
481 ds
.dargs
.geo
= mp
->m_dir_geo
;
482 ds
.lowest
= ds
.dargs
.geo
->leafblk
;
483 ds
.highest
= ds
.dargs
.geo
->freeblk
;
488 /* Find the root of the da tree, if present. */
489 blks
= ds
.state
->path
.blk
;
490 error
= xchk_da_btree_block(&ds
, level
, blkno
);
494 * We didn't find a block at ds.lowest, which means that there's
495 * no LEAF1/LEAFN tree (at least not where it's supposed to be),
498 if (blks
[level
].bp
== NULL
)
501 blks
[level
].index
= 0;
502 while (level
>= 0 && level
< XFS_DA_NODE_MAXDEPTH
) {
503 /* Handle leaf block. */
504 if (blks
[level
].magic
!= XFS_DA_NODE_MAGIC
) {
505 /* End of leaf, pop back towards the root. */
506 if (blks
[level
].index
>= ds
.maxrecs
[level
]) {
508 blks
[level
- 1].index
++;
514 /* Dispatch record scrubbing. */
515 error
= scrub_fn(&ds
, level
);
518 if (xchk_should_terminate(sc
, &error
) ||
519 (sc
->sm
->sm_flags
& XFS_SCRUB_OFLAG_CORRUPT
))
527 /* End of node, pop back towards the root. */
528 if (blks
[level
].index
>= ds
.maxrecs
[level
]) {
530 blks
[level
- 1].index
++;
536 /* Hashes in order for scrub? */
537 key
= xchk_da_btree_node_entry(&ds
, level
);
538 error
= xchk_da_btree_hash(&ds
, level
, &key
->hashval
);
542 /* Drill another level deeper. */
543 blkno
= be32_to_cpu(key
->before
);
545 if (level
>= XFS_DA_NODE_MAXDEPTH
) {
547 xchk_da_set_corrupt(&ds
, level
- 1);
551 error
= xchk_da_btree_block(&ds
, level
, blkno
);
554 if (blks
[level
].bp
== NULL
)
557 blks
[level
].index
= 0;
561 /* Release all the buffers we're tracking. */
562 for (level
= 0; level
< XFS_DA_NODE_MAXDEPTH
; level
++) {
563 if (blks
[level
].bp
== NULL
)
565 xfs_trans_brelse(sc
->tp
, blks
[level
].bp
);
566 blks
[level
].bp
= NULL
;
570 xfs_da_state_free(ds
.state
);