1 // SPDX-License-Identifier: GPL-2.0-or-later
3 * Copyright (C) 2017-2023 Oracle. All Rights Reserved.
4 * Author: Darrick J. Wong <djwong@kernel.org>
8 #include "xfs_shared.h"
9 #include "xfs_format.h"
10 #include "xfs_trans_resv.h"
11 #include "xfs_mount.h"
12 #include "xfs_btree.h"
13 #include "xfs_inode.h"
14 #include "xfs_log_format.h"
15 #include "xfs_trans.h"
16 #include "xfs_rtbitmap.h"
20 #include "xfs_exchmaps.h"
21 #include "xfs_rtgroup.h"
22 #include "scrub/scrub.h"
23 #include "scrub/common.h"
24 #include "scrub/trace.h"
25 #include "scrub/xfile.h"
26 #include "scrub/repair.h"
27 #include "scrub/tempexch.h"
28 #include "scrub/rtsummary.h"
/*
 * We check the realtime summary by scanning the realtime bitmap file to create
 * a new summary file incore, and then we compare the computed version against
 * the ondisk version. We use the 'xfile' functionality to store this
 * (potentially large) amount of data in pageable memory.
 */
40 /* Set us up to check the rtsummary file. */
/*
 * Steps visible in this listing, in order:
 *
 *  - If xchk_need_intent_drain() reports true, turn on XCHK_FSGATES_DRAIN.
 *  - Allocate the xchk_rtsummary context with kvzalloc().  struct_size()
 *    sizes it to hold mp->m_blockwsize trailing "words" entries.
 *  - Initialise the rtgroup selected by sc->sm->sm_agno into sc->sr.
 *  - When xchk_could_repair() is true, also run xrep_setup_rtsummary().
 *  - Create an xfile described as "realtime summary file"; the size passed
 *    is XFS_FSB_TO_B(mp, mp->m_rsumblocks).
 *  - Allocate a scrub transaction using rts->resblks.
 *  - Install the rtgroup's XFS_RTGI_SUMMARY inode via
 *    xchk_install_live_inode() and call xchk_ino_dqattach().
 *  - Take the rtgroup lock with XFS_RTGLOCK_BITMAP and, if the superblock
 *    reports a nonzero sb_rblocks, compute the expected geometry into rts
 *    (rextents, rbmblocks, rsumlevels).
 *
 * NOTE(review): this listing has lost lines: the function name and its
 * parameter list, some local declarations (descr, error), the tails of the
 * kvzalloc() and xfile_create() calls, and whatever follows each
 * "error = ..." assignment.  Confirm the error handling, the ownership of
 * descr, and the final return value against the complete file.
 *
 * NOTE(review): the destination of the xfs_rtsummary_blockcount() return
 * value is not visible here; presumably it is rts->rsumblocks, which the
 * scrubber later compares with mp->m_rsumblocks -- confirm.
 */
45 struct xfs_mount
*mp
= sc
->mp
;
47 struct xchk_rtsummary
*rts
;
50 if (xchk_need_intent_drain(sc
))
51 xchk_fsgates_enable(sc
, XCHK_FSGATES_DRAIN
);
/* One allocation carries the context plus the per-block word buffer. */
53 rts
= kvzalloc(struct_size(rts
, words
, mp
->m_blockwsize
),
59 error
= xchk_rtgroup_init(sc
, sc
->sm
->sm_agno
, &sc
->sr
);
63 if (xchk_could_repair(sc
)) {
64 error
= xrep_setup_rtsummary(sc
, rts
);
70 * Create an xfile to construct a new rtsummary file. The xfile allows
71 * us to avoid pinning kernel memory for this purpose.
73 descr
= xchk_xfile_descr(sc
, "realtime summary file");
74 error
= xfile_create(descr
, XFS_FSB_TO_B(mp
, mp
->m_rsumblocks
),
80 error
= xchk_trans_alloc(sc
, rts
->resblks
);
84 error
= xchk_install_live_inode(sc
,
85 sc
->sr
.rtg
->rtg_inodes
[XFS_RTGI_SUMMARY
]);
89 error
= xchk_ino_dqattach(sc
);
94 * Now that we've locked the rtbitmap and rtsummary, we can't race with
95 * growfsrt trying to expand the summary or change the size of the rt
96 * volume. Hence it is safe to compute and check the geometry values.
98 * Note that there is no strict requirement for an exclusive lock on the
99 * summary here, but to keep the locking APIs simple we lock both inodes
100 * exclusively here. If we ever start caring about running concurrent
101 * fsmap with scrub this could be changed.
103 xchk_rtgroup_lock(&sc
->sr
, XFS_RTGLOCK_BITMAP
);
/* Geometry is only computed when the filesystem has realtime blocks. */
104 if (mp
->m_sb
.sb_rblocks
) {
105 rts
->rextents
= xfs_blen_to_rtbxlen(mp
, mp
->m_sb
.sb_rblocks
);
106 rts
->rbmblocks
= xfs_rtbitmap_blockcount(mp
);
108 xfs_rtsummary_blockcount(mp
, &rts
->rsumlevels
);
114 /* Helper functions to record suminfo words in an xfile. */
/*
 * Read one summary counter out of the scrub xfile.
 *
 * sc:      scrub context; sc->xfile is the file that is read.
 * sumoff:  index of the counter, counted in summary words.
 * rawinfo: receives the single union xfs_suminfo_raw that is loaded.
 *
 * The word index is shifted left by XFS_WORDLOG before being handed to
 * xfile_load(), i.e. it is converted from a word count to a byte offset.
 * The return value is whatever xfile_load() returns.
 *
 * NOTE(review): the return-type and function-name lines are absent from
 * this listing.  The xfsum_load(sc, offs, &v) call further down the file
 * matches this parameter list -- confirm.
 */
118 struct xfs_scrub
*sc
,
119 xfs_rtsumoff_t sumoff
,
120 union xfs_suminfo_raw
*rawinfo
)
122 return xfile_load(sc
->xfile
, rawinfo
,
123 sizeof(union xfs_suminfo_raw
),
124 sumoff
<< XFS_WORDLOG
);
/*
 * Write one summary counter into the scrub xfile.
 *
 * sc:      scrub context; sc->xfile is the file that is written.
 * sumoff:  index of the counter, counted in summary words.
 * rawinfo: the counter value, passed by value; its address is what gets
 *          handed to xfile_store().
 *
 * Exactly sizeof(union xfs_suminfo_raw) bytes are stored at the offset
 * sumoff << XFS_WORDLOG.  The return value is whatever xfile_store()
 * returns.
 *
 * NOTE(review): the return-type and function-name lines are absent from
 * this listing.  The xfsum_store(sc, offs, v) call further down the file
 * matches this parameter list -- confirm.
 */
129 struct xfs_scrub
*sc
,
130 xfs_rtsumoff_t sumoff
,
131 const union xfs_suminfo_raw rawinfo
)
133 return xfile_store(sc
->xfile
, &rawinfo
,
134 sizeof(union xfs_suminfo_raw
),
135 sumoff
<< XFS_WORDLOG
);
/*
 * Bulk-read a run of summary counters out of the scrub xfile.
 *
 * sc:       scrub context; sc->xfile is the file that is read.
 * sumoff:   index of the first counter, counted in summary words.
 * rawinfo:  destination buffer; the caller must provide room for nr_words
 *           entries.
 * nr_words: number of counters to read.
 *
 * Both the length and the starting offset are shifted left by XFS_WORDLOG
 * before the xfile_load() call, converting word counts to byte counts.
 * The return value is whatever xfile_load() returns.
 *
 * NOTE(review): the return-type and function-name lines are absent from
 * this listing.  The xfsum_copyout(sc, sumoff, rts->words, ...) call in the
 * comparison loop matches this parameter list -- confirm.
 */
140 struct xfs_scrub
*sc
,
141 xfs_rtsumoff_t sumoff
,
142 union xfs_suminfo_raw
*rawinfo
,
143 unsigned int nr_words
)
145 return xfile_load(sc
->xfile
, rawinfo
, nr_words
<< XFS_WORDLOG
,
146 sumoff
<< XFS_WORDLOG
);
/*
 * Add one to a raw summary counter in place and return the new count.
 *
 * mp: mount; only consulted through xfs_has_rtgroups().
 * v:  counter to bump; modified through the pointer.
 *
 * When the filesystem has rtgroups, the counter is the big-endian v->rtg
 * member: be32_add_cpu() increments it and be32_to_cpu() converts the
 * updated value to CPU byte order for the return.
 *
 * NOTE(review): the function-name line and the path taken when
 * xfs_has_rtgroups() is false are absent from this listing; confirm how the
 * other member of union xfs_suminfo_raw is handled.
 */
149 static inline xfs_suminfo_t
151 struct xfs_mount
*mp
,
152 union xfs_suminfo_raw
*v
)
154 if (xfs_has_rtgroups(mp
)) {
155 be32_add_cpu(&v
->rtg
, 1);
156 return be32_to_cpu(v
->rtg
);
163 /* Update the summary file to reflect the free extent that we've accumulated. */
/*
 * Per-record callback: xchk_rtsum_compute() passes this function to
 * xfs_rtalloc_query_all() with the scrub context as the private pointer.
 *
 * rtg:  realtime group the record belongs to.
 * tp:   transaction handed in by the query; not referenced in the lines
 *       visible here.
 * rec:  free extent, as ar_startext / ar_extcount in rt extents.
 * priv: the struct xfs_scrub (assigned to sc below).
 *
 * For each record the function:
 *  - stops early if xchk_should_terminate() says so;
 *  - derives the summary slot: rbmoff is the bitmap block covering
 *    ar_startext, lenlog comes from xfs_highbit64(ar_extcount), and
 *    xfs_rtsumoffs() combines the two into offs;
 *  - converts the record to an rt block number and length and, if
 *    xfs_verify_rtbext() rejects it, marks the bitmap inode as a
 *    cross-reference corruption and returns -EFSCORRUPTED;
 *  - loads the counter at offs from the xfile, increments it, emits a
 *    tracepoint, and stores it back.
 *
 * Returns -EFSCORRUPTED for an invalid extent, otherwise the result of the
 * final xfsum_store().
 *
 * NOTE(review): this listing has lost the priv parameter line, several
 * local declarations (rtbno, rtlen, lenlog, offs, value, error) and the
 * statements that follow the terminate check and the xfsum_load() call;
 * confirm the error returns against the complete file.
 */
165 xchk_rtsum_record_free(
166 struct xfs_rtgroup
*rtg
,
167 struct xfs_trans
*tp
,
168 const struct xfs_rtalloc_rec
*rec
,
171 struct xfs_mount
*mp
= rtg_mount(rtg
);
172 struct xfs_scrub
*sc
= priv
;
173 xfs_fileoff_t rbmoff
;
178 union xfs_suminfo_raw v
;
182 if (xchk_should_terminate(sc
, &error
))
185 /* Compute the relevant location in the rtsum file. */
186 rbmoff
= xfs_rtx_to_rbmblock(mp
, rec
->ar_startext
);
/* presumably floor(log2(extent count)), hence the name -- TODO confirm */
187 lenlog
= xfs_highbit64(rec
->ar_extcount
);
188 offs
= xfs_rtsumoffs(mp
, lenlog
, rbmoff
);
/* Convert to rt block units so the extent can be range-checked. */
190 rtbno
= xfs_rtx_to_rtb(rtg
, rec
->ar_startext
);
191 rtlen
= xfs_rtxlen_to_extlen(mp
, rec
->ar_extcount
);
193 if (!xfs_verify_rtbext(mp
, rtbno
, rtlen
)) {
194 xchk_ino_xref_set_corrupt(sc
,
195 rtg
->rtg_inodes
[XFS_RTGI_BITMAP
]->i_ino
);
196 return -EFSCORRUPTED
;
199 /* Bump the summary count. */
200 error
= xfsum_load(sc
, offs
, &v
);
204 value
= xchk_rtsum_inc(sc
->mp
, &v
);
205 trace_xchk_rtsum_record_free(mp
, rec
->ar_startext
, rec
->ar_extcount
,
206 lenlog
, offs
, value
);
208 return xfsum_store(sc
, offs
, v
);
211 /* Compute the realtime summary from the realtime bitmap. */
/*
 * sc: scrub context; the rtgroup comes from sc->sr.rtg and the transaction
 *     from sc->tp.
 *
 * First sanity-checks the bitmap inode: its i_disk_size must equal the byte
 * size of xfs_rtbitmap_blockcount(mp) blocks, otherwise -EFSCORRUPTED is
 * returned without walking anything.  Then xfs_rtalloc_query_all() is run
 * with xchk_rtsum_record_free() as the callback and sc as its private data,
 * and that call's result is returned.
 *
 * NOTE(review): the return-type and function-name lines are absent from
 * this listing; the name used in the gr metadata is taken from the
 * xchk_rtsum_compute(sc) call in the scrubber -- confirm.
 */
214 struct xfs_scrub
*sc
)
216 struct xfs_mount
*mp
= sc
->mp
;
217 struct xfs_rtgroup
*rtg
= sc
->sr
.rtg
;
219 /* If the bitmap size doesn't match the computed size, bail. */
220 if (XFS_FSB_TO_B(mp
, xfs_rtbitmap_blockcount(mp
)) !=
221 rtg
->rtg_inodes
[XFS_RTGI_BITMAP
]->i_disk_size
)
222 return -EFSCORRUPTED
;
224 return xfs_rtalloc_query_all(rtg
, sc
->tp
, xchk_rtsum_record_free
, sc
);
227 /* Compare the rtsummary file against the one we computed. */
/*
 * sc: scrub context.  sc->ip is the inode being compared, sc->buf holds the
 *     xchk_rtsummary context, and sc->xfile holds the computed counters.
 *
 * Two passes over the file are visible in this listing:
 *
 * 1. Mapping check.  endoff is i_disk_size converted to filesystem blocks
 *    with XFS_B_TO_FSB().  If xfs_iext_lookup_extent() finds an extent when
 *    asked about endoff, the data fork is flagged corrupt at endoff.  Then,
 *    walking [0, endoff) with xfs_bmapi_read(), any step that does not
 *    return exactly one written extent is flagged corrupt at that offset.
 *    The walk advances by map.br_blockcount.
 *
 * 2. Content check.  For each file block below endoff the ondisk block is
 *    read with xfs_rtsummary_read_buf(), mp->m_blockwsize computed words
 *    are copied out of the xfile into rts->words, and the two are compared
 *    with memcmp() over m_blockwsize << XFS_WORDLOG bytes.  A mismatch is
 *    flagged corrupt at that block.  sumoff advances by m_blockwsize words
 *    per block so it tracks the xfile position of the current block.
 *
 * The rt buffer cache in rts->args is released with xfs_rtbuf_cache_relse()
 * on every path visible here after a block has been read.
 *
 * NOTE(review): this listing has lost the function-name line, several
 * declarations (error, nmap), the tail of the xfs_bmapi_read() call, and the
 * statements that follow each check (returns, breaks, closing braces).
 * Confirm which conditions end the loops early, and the final return value,
 * against the complete file.
 */
230 struct xfs_scrub
*sc
)
232 struct xfs_bmbt_irec map
;
233 struct xfs_iext_cursor icur
;
235 struct xfs_mount
*mp
= sc
->mp
;
236 struct xfs_inode
*ip
= sc
->ip
;
237 struct xchk_rtsummary
*rts
= sc
->buf
;
238 xfs_fileoff_t off
= 0;
239 xfs_fileoff_t endoff
;
240 xfs_rtsumoff_t sumoff
= 0;
/* Point the rt buffer helper arguments at the scrub transaction and rtgroup. */
244 rts
->args
.tp
= sc
->tp
;
245 rts
->args
.rtg
= sc
->sr
.rtg
;
247 /* Mappings may not cross or lie beyond EOF. */
248 endoff
= XFS_B_TO_FSB(mp
, ip
->i_disk_size
);
249 if (xfs_iext_lookup_extent(ip
, &ip
->i_df
, endoff
, &icur
, &map
)) {
250 xchk_fblock_set_corrupt(sc
, XFS_DATA_FORK
, endoff
);
254 while (off
< endoff
) {
257 if (xchk_should_terminate(sc
, &error
))
258 /* NOTE(review): the statement guarded by the test above is not visible. */
259 if (sc
->sm
->sm_flags
& XFS_SCRUB_OFLAG_CORRUPT
)
262 /* Make sure we have a written extent. */
263 error
= xfs_bmapi_read(ip
, off
, endoff
- off
, &map
, &nmap
,
265 if (!xchk_fblock_process_error(sc
, XFS_DATA_FORK
, off
, &error
))
268 if (nmap
!= 1 || !xfs_bmap_is_written_extent(&map
)) {
269 xchk_fblock_set_corrupt(sc
, XFS_DATA_FORK
, off
);
273 off
+= map
.br_blockcount
;
/* Second pass: compare contents one filesystem block at a time. */
276 for (off
= 0; off
< endoff
; off
++) {
277 union xfs_suminfo_raw
*ondisk_info
;
279 /* Read a block's worth of ondisk rtsummary file. */
280 error
= xfs_rtsummary_read_buf(&rts
->args
, off
);
281 if (!xchk_fblock_process_error(sc
, XFS_DATA_FORK
, off
, &error
))
284 /* Read a block's worth of computed rtsummary file. */
285 error
= xfsum_copyout(sc
, sumoff
, rts
->words
, mp
->m_blockwsize
);
287 xfs_rtbuf_cache_relse(&rts
->args
);
/* Word 0 of the cached block is where the block-sized comparison starts. */
291 ondisk_info
= xfs_rsumblock_infoptr(&rts
->args
, 0);
292 if (memcmp(ondisk_info
, rts
->words
,
293 mp
->m_blockwsize
<< XFS_WORDLOG
) != 0) {
294 xchk_fblock_set_corrupt(sc
, XFS_DATA_FORK
, off
);
295 xfs_rtbuf_cache_relse(&rts
->args
);
299 xfs_rtbuf_cache_relse(&rts
->args
);
300 sumoff
+= mp
->m_blockwsize
;
306 /* Scrub the realtime summary. */
/*
 * sc: scrub context.  The bitmap and summary inodes come from the rtgroup
 *     in sc->sr.rtg, and the expected geometry from the xchk_rtsummary
 *     context in sc->buf.
 *
 * Checks visible in this listing, in order:
 *  - sb_rextents against rts->rextents (mismatch is charged to the bitmap
 *    inode);
 *  - m_rsumlevels against rts->rsumlevels, and m_rsumblocks against
 *    rts->rsumblocks (both charged to the summary inode);
 *  - the summary inode size must have no bits set under mp->m_blockmask;
 *  - the summary inode size must be at least rts->rsumblocks blocks;
 *  - xchk_metadata_inode_forks(), after which an error or an already-set
 *    XFS_SCRUB_OFLAG_CORRUPT flag is tested;
 *  - xchk_rtsum_compute() rebuilds the summary in the xfile;
 *  - xchk_rtsum_compare() compares it with the ondisk file, and its result
 *    is returned.
 *
 * NOTE(review): on -EFSCORRUPTED from xchk_rtsum_compute() the code calls
 * xchk_ino_set_corrupt() on the bitmap inode, although the accompanying
 * comment describes this as an xref error; confirm that the non-xref helper
 * is intended.
 *
 * NOTE(review): this listing has lost the function-name line, the
 * declaration of error, and the statements that follow each failed check
 * (returns or gotos, closing braces); confirm the early-exit behaviour
 * against the complete file.
 */
309 struct xfs_scrub
*sc
)
311 struct xfs_mount
*mp
= sc
->mp
;
312 struct xfs_rtgroup
*rtg
= sc
->sr
.rtg
;
313 struct xfs_inode
*rbmip
= rtg
->rtg_inodes
[XFS_RTGI_BITMAP
];
314 struct xfs_inode
*rsumip
= rtg
->rtg_inodes
[XFS_RTGI_SUMMARY
];
315 struct xchk_rtsummary
*rts
= sc
->buf
;
318 /* Is sb_rextents correct? */
319 if (mp
->m_sb
.sb_rextents
!= rts
->rextents
) {
320 xchk_ino_set_corrupt(sc
, rbmip
->i_ino
);
324 /* Is m_rsumlevels correct? */
325 if (mp
->m_rsumlevels
!= rts
->rsumlevels
) {
326 xchk_ino_set_corrupt(sc
, rsumip
->i_ino
);
330 /* Is m_rsumblocks correct? */
331 if (mp
->m_rsumblocks
!= rts
->rsumblocks
) {
332 xchk_ino_set_corrupt(sc
, rsumip
->i_ino
);
336 /* The summary file length must be aligned to an fsblock. */
337 if (rsumip
->i_disk_size
& mp
->m_blockmask
) {
338 xchk_ino_set_corrupt(sc
, rsumip
->i_ino
);
343 * Is the summary file itself large enough to handle the rt volume?
344 * growfsrt expands the summary file before updating sb_rextents, so
345 * the file can be larger than rsumsize.
347 if (rsumip
->i_disk_size
< XFS_FSB_TO_B(mp
, rts
->rsumblocks
)) {
348 xchk_ino_set_corrupt(sc
, rsumip
->i_ino
);
352 /* Invoke the fork scrubber. */
353 error
= xchk_metadata_inode_forks(sc
);
354 if (error
|| (sc
->sm
->sm_flags
& XFS_SCRUB_OFLAG_CORRUPT
))
357 /* Construct the new summary file from the rtbitmap. */
358 error
= xchk_rtsum_compute(sc
);
359 if (error
== -EFSCORRUPTED
) {
361 * EFSCORRUPTED means the rtbitmap is corrupt, which is an xref
362 * error since we're checking the summary file.
364 xchk_ino_set_corrupt(sc
, rbmip
->i_ino
);
370 /* Does the computed summary file match the actual rtsummary file? */
371 return xchk_rtsum_compare(sc
);