blob: f7568a4b5fe58f5aecef931c3928d3c9ec0564fd [file] [log] [blame]
Dave Chinner0b61f8a2018-06-05 19:42:14 -07001// SPDX-License-Identifier: GPL-2.0+
Darrick J. Wongd25522f2018-05-29 22:18:12 -07002/*
3 * Copyright (C) 2018 Oracle. All Rights Reserved.
Darrick J. Wongd25522f2018-05-29 22:18:12 -07004 * Author: Darrick J. Wong <darrick.wong@oracle.com>
Darrick J. Wongd25522f2018-05-29 22:18:12 -07005 */
6#include "xfs.h"
7#include "xfs_fs.h"
8#include "xfs_shared.h"
9#include "xfs_format.h"
10#include "xfs_trans_resv.h"
11#include "xfs_mount.h"
12#include "xfs_defer.h"
13#include "xfs_btree.h"
14#include "xfs_bit.h"
15#include "xfs_log_format.h"
16#include "xfs_trans.h"
17#include "xfs_sb.h"
18#include "xfs_inode.h"
19#include "xfs_alloc.h"
Darrick J. Wongf9ed6de2018-08-09 22:42:53 -070020#include "xfs_alloc_btree.h"
Darrick J. Wongd25522f2018-05-29 22:18:12 -070021#include "xfs_ialloc.h"
Darrick J. Wongf9ed6de2018-08-09 22:42:53 -070022#include "xfs_ialloc_btree.h"
Darrick J. Wongd25522f2018-05-29 22:18:12 -070023#include "xfs_rmap.h"
Darrick J. Wongf9ed6de2018-08-09 22:42:53 -070024#include "xfs_rmap_btree.h"
25#include "xfs_refcount.h"
26#include "xfs_refcount_btree.h"
Darrick J. Wongd25522f2018-05-29 22:18:12 -070027#include "scrub/xfs_scrub.h"
28#include "scrub/scrub.h"
29#include "scrub/common.h"
30#include "scrub/trace.h"
Darrick J. Wongf9ed6de2018-08-09 22:42:53 -070031#include "scrub/repair.h"
32#include "scrub/bitmap.h"
Darrick J. Wongd25522f2018-05-29 22:18:12 -070033
34/* Superblock */
35
36/* Repair the superblock. */
37int
Darrick J. Wongb5e21962018-07-19 12:29:11 -070038xrep_superblock(
Darrick J. Wong1d8a7482018-07-19 12:29:12 -070039 struct xfs_scrub *sc)
Darrick J. Wongd25522f2018-05-29 22:18:12 -070040{
Darrick J. Wong032d91f2018-07-19 12:29:12 -070041 struct xfs_mount *mp = sc->mp;
42 struct xfs_buf *bp;
43 xfs_agnumber_t agno;
44 int error;
Darrick J. Wongd25522f2018-05-29 22:18:12 -070045
46 /* Don't try to repair AG 0's sb; let xfs_repair deal with it. */
47 agno = sc->sm->sm_agno;
48 if (agno == 0)
49 return -EOPNOTSUPP;
50
51 error = xfs_sb_get_secondary(mp, sc->tp, agno, &bp);
52 if (error)
53 return error;
54
55 /* Copy AG 0's superblock to this one. */
56 xfs_buf_zero(bp, 0, BBTOB(bp->b_length));
57 xfs_sb_to_disk(XFS_BUF_TO_SBP(bp), &mp->m_sb);
58
59 /* Write this to disk. */
60 xfs_trans_buf_set_type(sc->tp, bp, XFS_BLFT_SB_BUF);
61 xfs_trans_log_buf(sc->tp, bp, 0, BBTOB(bp->b_length) - 1);
62 return error;
63}
Darrick J. Wongf9ed6de2018-08-09 22:42:53 -070064
65/* AGF */
66
67struct xrep_agf_allocbt {
68 struct xfs_scrub *sc;
69 xfs_agblock_t freeblks;
70 xfs_agblock_t longest;
71};
72
73/* Record free space shape information. */
74STATIC int
75xrep_agf_walk_allocbt(
76 struct xfs_btree_cur *cur,
77 struct xfs_alloc_rec_incore *rec,
78 void *priv)
79{
80 struct xrep_agf_allocbt *raa = priv;
81 int error = 0;
82
83 if (xchk_should_terminate(raa->sc, &error))
84 return error;
85
86 raa->freeblks += rec->ar_blockcount;
87 if (rec->ar_blockcount > raa->longest)
88 raa->longest = rec->ar_blockcount;
89 return error;
90}
91
92/* Does this AGFL block look sane? */
93STATIC int
94xrep_agf_check_agfl_block(
95 struct xfs_mount *mp,
96 xfs_agblock_t agbno,
97 void *priv)
98{
99 struct xfs_scrub *sc = priv;
100
101 if (!xfs_verify_agbno(mp, sc->sa.agno, agbno))
102 return -EFSCORRUPTED;
103 return 0;
104}
105
106/*
107 * Offset within the xrep_find_ag_btree array for each btree type. Avoid the
108 * XFS_BTNUM_ names here to avoid creating a sparse array.
109 */
110enum {
111 XREP_AGF_BNOBT = 0,
112 XREP_AGF_CNTBT,
113 XREP_AGF_RMAPBT,
114 XREP_AGF_REFCOUNTBT,
115 XREP_AGF_END,
116 XREP_AGF_MAX
117};
118
119/* Check a btree root candidate. */
120static inline bool
121xrep_check_btree_root(
122 struct xfs_scrub *sc,
123 struct xrep_find_ag_btree *fab)
124{
125 struct xfs_mount *mp = sc->mp;
126 xfs_agnumber_t agno = sc->sm->sm_agno;
127
128 return xfs_verify_agbno(mp, agno, fab->root) &&
129 fab->height <= XFS_BTREE_MAXLEVELS;
130}
131
132/*
133 * Given the btree roots described by *fab, find the roots, check them for
134 * sanity, and pass the root data back out via *fab.
135 *
136 * This is /also/ a chicken and egg problem because we have to use the rmapbt
137 * (rooted in the AGF) to find the btrees rooted in the AGF. We also have no
138 * idea if the btrees make any sense. If we hit obvious corruptions in those
139 * btrees we'll bail out.
140 */
141STATIC int
142xrep_agf_find_btrees(
143 struct xfs_scrub *sc,
144 struct xfs_buf *agf_bp,
145 struct xrep_find_ag_btree *fab,
146 struct xfs_buf *agfl_bp)
147{
148 struct xfs_agf *old_agf = XFS_BUF_TO_AGF(agf_bp);
149 int error;
150
151 /* Go find the root data. */
152 error = xrep_find_ag_btree_roots(sc, agf_bp, fab, agfl_bp);
153 if (error)
154 return error;
155
156 /* We must find the bnobt, cntbt, and rmapbt roots. */
157 if (!xrep_check_btree_root(sc, &fab[XREP_AGF_BNOBT]) ||
158 !xrep_check_btree_root(sc, &fab[XREP_AGF_CNTBT]) ||
159 !xrep_check_btree_root(sc, &fab[XREP_AGF_RMAPBT]))
160 return -EFSCORRUPTED;
161
162 /*
163 * We relied on the rmapbt to reconstruct the AGF. If we get a
164 * different root then something's seriously wrong.
165 */
166 if (fab[XREP_AGF_RMAPBT].root !=
167 be32_to_cpu(old_agf->agf_roots[XFS_BTNUM_RMAPi]))
168 return -EFSCORRUPTED;
169
170 /* We must find the refcountbt root if that feature is enabled. */
171 if (xfs_sb_version_hasreflink(&sc->mp->m_sb) &&
172 !xrep_check_btree_root(sc, &fab[XREP_AGF_REFCOUNTBT]))
173 return -EFSCORRUPTED;
174
175 return 0;
176}
177
178/*
179 * Reinitialize the AGF header, making an in-core copy of the old contents so
180 * that we know which in-core state needs to be reinitialized.
181 */
182STATIC void
183xrep_agf_init_header(
184 struct xfs_scrub *sc,
185 struct xfs_buf *agf_bp,
186 struct xfs_agf *old_agf)
187{
188 struct xfs_mount *mp = sc->mp;
189 struct xfs_agf *agf = XFS_BUF_TO_AGF(agf_bp);
190
191 memcpy(old_agf, agf, sizeof(*old_agf));
192 memset(agf, 0, BBTOB(agf_bp->b_length));
193 agf->agf_magicnum = cpu_to_be32(XFS_AGF_MAGIC);
194 agf->agf_versionnum = cpu_to_be32(XFS_AGF_VERSION);
195 agf->agf_seqno = cpu_to_be32(sc->sa.agno);
196 agf->agf_length = cpu_to_be32(xfs_ag_block_count(mp, sc->sa.agno));
197 agf->agf_flfirst = old_agf->agf_flfirst;
198 agf->agf_fllast = old_agf->agf_fllast;
199 agf->agf_flcount = old_agf->agf_flcount;
200 if (xfs_sb_version_hascrc(&mp->m_sb))
201 uuid_copy(&agf->agf_uuid, &mp->m_sb.sb_meta_uuid);
202
203 /* Mark the incore AGF data stale until we're done fixing things. */
204 ASSERT(sc->sa.pag->pagf_init);
205 sc->sa.pag->pagf_init = 0;
206}
207
208/* Set btree root information in an AGF. */
209STATIC void
210xrep_agf_set_roots(
211 struct xfs_scrub *sc,
212 struct xfs_agf *agf,
213 struct xrep_find_ag_btree *fab)
214{
215 agf->agf_roots[XFS_BTNUM_BNOi] =
216 cpu_to_be32(fab[XREP_AGF_BNOBT].root);
217 agf->agf_levels[XFS_BTNUM_BNOi] =
218 cpu_to_be32(fab[XREP_AGF_BNOBT].height);
219
220 agf->agf_roots[XFS_BTNUM_CNTi] =
221 cpu_to_be32(fab[XREP_AGF_CNTBT].root);
222 agf->agf_levels[XFS_BTNUM_CNTi] =
223 cpu_to_be32(fab[XREP_AGF_CNTBT].height);
224
225 agf->agf_roots[XFS_BTNUM_RMAPi] =
226 cpu_to_be32(fab[XREP_AGF_RMAPBT].root);
227 agf->agf_levels[XFS_BTNUM_RMAPi] =
228 cpu_to_be32(fab[XREP_AGF_RMAPBT].height);
229
230 if (xfs_sb_version_hasreflink(&sc->mp->m_sb)) {
231 agf->agf_refcount_root =
232 cpu_to_be32(fab[XREP_AGF_REFCOUNTBT].root);
233 agf->agf_refcount_level =
234 cpu_to_be32(fab[XREP_AGF_REFCOUNTBT].height);
235 }
236}
237
238/* Update all AGF fields which derive from btree contents. */
239STATIC int
240xrep_agf_calc_from_btrees(
241 struct xfs_scrub *sc,
242 struct xfs_buf *agf_bp)
243{
244 struct xrep_agf_allocbt raa = { .sc = sc };
245 struct xfs_btree_cur *cur = NULL;
246 struct xfs_agf *agf = XFS_BUF_TO_AGF(agf_bp);
247 struct xfs_mount *mp = sc->mp;
248 xfs_agblock_t btreeblks;
249 xfs_agblock_t blocks;
250 int error;
251
252 /* Update the AGF counters from the bnobt. */
253 cur = xfs_allocbt_init_cursor(mp, sc->tp, agf_bp, sc->sa.agno,
254 XFS_BTNUM_BNO);
255 error = xfs_alloc_query_all(cur, xrep_agf_walk_allocbt, &raa);
256 if (error)
257 goto err;
258 error = xfs_btree_count_blocks(cur, &blocks);
259 if (error)
260 goto err;
261 xfs_btree_del_cursor(cur, error);
262 btreeblks = blocks - 1;
263 agf->agf_freeblks = cpu_to_be32(raa.freeblks);
264 agf->agf_longest = cpu_to_be32(raa.longest);
265
266 /* Update the AGF counters from the cntbt. */
267 cur = xfs_allocbt_init_cursor(mp, sc->tp, agf_bp, sc->sa.agno,
268 XFS_BTNUM_CNT);
269 error = xfs_btree_count_blocks(cur, &blocks);
270 if (error)
271 goto err;
272 xfs_btree_del_cursor(cur, error);
273 btreeblks += blocks - 1;
274
275 /* Update the AGF counters from the rmapbt. */
276 cur = xfs_rmapbt_init_cursor(mp, sc->tp, agf_bp, sc->sa.agno);
277 error = xfs_btree_count_blocks(cur, &blocks);
278 if (error)
279 goto err;
280 xfs_btree_del_cursor(cur, error);
281 agf->agf_rmap_blocks = cpu_to_be32(blocks);
282 btreeblks += blocks - 1;
283
284 agf->agf_btreeblks = cpu_to_be32(btreeblks);
285
286 /* Update the AGF counters from the refcountbt. */
287 if (xfs_sb_version_hasreflink(&mp->m_sb)) {
288 cur = xfs_refcountbt_init_cursor(mp, sc->tp, agf_bp,
289 sc->sa.agno);
290 error = xfs_btree_count_blocks(cur, &blocks);
291 if (error)
292 goto err;
293 xfs_btree_del_cursor(cur, error);
294 agf->agf_refcount_blocks = cpu_to_be32(blocks);
295 }
296
297 return 0;
298err:
299 xfs_btree_del_cursor(cur, error);
300 return error;
301}
302
303/* Commit the new AGF and reinitialize the incore state. */
304STATIC int
305xrep_agf_commit_new(
306 struct xfs_scrub *sc,
307 struct xfs_buf *agf_bp)
308{
309 struct xfs_perag *pag;
310 struct xfs_agf *agf = XFS_BUF_TO_AGF(agf_bp);
311
312 /* Trigger fdblocks recalculation */
313 xfs_force_summary_recalc(sc->mp);
314
315 /* Write this to disk. */
316 xfs_trans_buf_set_type(sc->tp, agf_bp, XFS_BLFT_AGF_BUF);
317 xfs_trans_log_buf(sc->tp, agf_bp, 0, BBTOB(agf_bp->b_length) - 1);
318
319 /* Now reinitialize the in-core counters we changed. */
320 pag = sc->sa.pag;
321 pag->pagf_btreeblks = be32_to_cpu(agf->agf_btreeblks);
322 pag->pagf_freeblks = be32_to_cpu(agf->agf_freeblks);
323 pag->pagf_longest = be32_to_cpu(agf->agf_longest);
324 pag->pagf_levels[XFS_BTNUM_BNOi] =
325 be32_to_cpu(agf->agf_levels[XFS_BTNUM_BNOi]);
326 pag->pagf_levels[XFS_BTNUM_CNTi] =
327 be32_to_cpu(agf->agf_levels[XFS_BTNUM_CNTi]);
328 pag->pagf_levels[XFS_BTNUM_RMAPi] =
329 be32_to_cpu(agf->agf_levels[XFS_BTNUM_RMAPi]);
330 pag->pagf_refcount_level = be32_to_cpu(agf->agf_refcount_level);
331 pag->pagf_init = 1;
332
333 return 0;
334}
335
336/* Repair the AGF. v5 filesystems only. */
337int
338xrep_agf(
339 struct xfs_scrub *sc)
340{
341 struct xrep_find_ag_btree fab[XREP_AGF_MAX] = {
342 [XREP_AGF_BNOBT] = {
343 .rmap_owner = XFS_RMAP_OWN_AG,
344 .buf_ops = &xfs_allocbt_buf_ops,
345 .magic = XFS_ABTB_CRC_MAGIC,
346 },
347 [XREP_AGF_CNTBT] = {
348 .rmap_owner = XFS_RMAP_OWN_AG,
349 .buf_ops = &xfs_allocbt_buf_ops,
350 .magic = XFS_ABTC_CRC_MAGIC,
351 },
352 [XREP_AGF_RMAPBT] = {
353 .rmap_owner = XFS_RMAP_OWN_AG,
354 .buf_ops = &xfs_rmapbt_buf_ops,
355 .magic = XFS_RMAP_CRC_MAGIC,
356 },
357 [XREP_AGF_REFCOUNTBT] = {
358 .rmap_owner = XFS_RMAP_OWN_REFC,
359 .buf_ops = &xfs_refcountbt_buf_ops,
360 .magic = XFS_REFC_CRC_MAGIC,
361 },
362 [XREP_AGF_END] = {
363 .buf_ops = NULL,
364 },
365 };
366 struct xfs_agf old_agf;
367 struct xfs_mount *mp = sc->mp;
368 struct xfs_buf *agf_bp;
369 struct xfs_buf *agfl_bp;
370 struct xfs_agf *agf;
371 int error;
372
373 /* We require the rmapbt to rebuild anything. */
374 if (!xfs_sb_version_hasrmapbt(&mp->m_sb))
375 return -EOPNOTSUPP;
376
377 xchk_perag_get(sc->mp, &sc->sa);
378 /*
379 * Make sure we have the AGF buffer, as scrub might have decided it
380 * was corrupt after xfs_alloc_read_agf failed with -EFSCORRUPTED.
381 */
382 error = xfs_trans_read_buf(mp, sc->tp, mp->m_ddev_targp,
383 XFS_AG_DADDR(mp, sc->sa.agno, XFS_AGF_DADDR(mp)),
384 XFS_FSS_TO_BB(mp, 1), 0, &agf_bp, NULL);
385 if (error)
386 return error;
387 agf_bp->b_ops = &xfs_agf_buf_ops;
388 agf = XFS_BUF_TO_AGF(agf_bp);
389
390 /*
391 * Load the AGFL so that we can screen out OWN_AG blocks that are on
392 * the AGFL now; these blocks might have once been part of the
393 * bno/cnt/rmap btrees but are not now. This is a chicken and egg
394 * problem: the AGF is corrupt, so we have to trust the AGFL contents
395 * because we can't do any serious cross-referencing with any of the
396 * btrees rooted in the AGF. If the AGFL contents are obviously bad
397 * then we'll bail out.
398 */
399 error = xfs_alloc_read_agfl(mp, sc->tp, sc->sa.agno, &agfl_bp);
400 if (error)
401 return error;
402
403 /*
404 * Spot-check the AGFL blocks; if they're obviously corrupt then
405 * there's nothing we can do but bail out.
406 */
407 error = xfs_agfl_walk(sc->mp, XFS_BUF_TO_AGF(agf_bp), agfl_bp,
408 xrep_agf_check_agfl_block, sc);
409 if (error)
410 return error;
411
412 /*
413 * Find the AGF btree roots. This is also a chicken-and-egg situation;
414 * see the function for more details.
415 */
416 error = xrep_agf_find_btrees(sc, agf_bp, fab, agfl_bp);
417 if (error)
418 return error;
419
420 /* Start rewriting the header and implant the btrees we found. */
421 xrep_agf_init_header(sc, agf_bp, &old_agf);
422 xrep_agf_set_roots(sc, agf, fab);
423 error = xrep_agf_calc_from_btrees(sc, agf_bp);
424 if (error)
425 goto out_revert;
426
427 /* Commit the changes and reinitialize incore state. */
428 return xrep_agf_commit_new(sc, agf_bp);
429
430out_revert:
431 /* Mark the incore AGF state stale and revert the AGF. */
432 sc->sa.pag->pagf_init = 0;
433 memcpy(agf, &old_agf, sizeof(old_agf));
434 return error;
435}
Darrick J. Wong0e93d3f2018-08-09 22:43:02 -0700436
437/* AGFL */
438
439struct xrep_agfl {
440 /* Bitmap of other OWN_AG metadata blocks. */
441 struct xfs_bitmap agmetablocks;
442
443 /* Bitmap of free space. */
444 struct xfs_bitmap *freesp;
445
446 struct xfs_scrub *sc;
447};
448
449/* Record all OWN_AG (free space btree) information from the rmap data. */
450STATIC int
451xrep_agfl_walk_rmap(
452 struct xfs_btree_cur *cur,
453 struct xfs_rmap_irec *rec,
454 void *priv)
455{
456 struct xrep_agfl *ra = priv;
457 xfs_fsblock_t fsb;
458 int error = 0;
459
460 if (xchk_should_terminate(ra->sc, &error))
461 return error;
462
463 /* Record all the OWN_AG blocks. */
464 if (rec->rm_owner == XFS_RMAP_OWN_AG) {
465 fsb = XFS_AGB_TO_FSB(cur->bc_mp, cur->bc_private.a.agno,
466 rec->rm_startblock);
467 error = xfs_bitmap_set(ra->freesp, fsb, rec->rm_blockcount);
468 if (error)
469 return error;
470 }
471
472 return xfs_bitmap_set_btcur_path(&ra->agmetablocks, cur);
473}
474
475/*
476 * Map out all the non-AGFL OWN_AG space in this AG so that we can deduce
477 * which blocks belong to the AGFL.
478 *
479 * Compute the set of old AGFL blocks by subtracting from the list of OWN_AG
480 * blocks the list of blocks owned by all other OWN_AG metadata (bnobt, cntbt,
481 * rmapbt). These are the old AGFL blocks, so return that list and the number
482 * of blocks we're actually going to put back on the AGFL.
483 */
484STATIC int
485xrep_agfl_collect_blocks(
486 struct xfs_scrub *sc,
487 struct xfs_buf *agf_bp,
488 struct xfs_bitmap *agfl_extents,
489 xfs_agblock_t *flcount)
490{
491 struct xrep_agfl ra;
492 struct xfs_mount *mp = sc->mp;
493 struct xfs_btree_cur *cur;
494 struct xfs_bitmap_range *br;
495 struct xfs_bitmap_range *n;
496 int error;
497
498 ra.sc = sc;
499 ra.freesp = agfl_extents;
500 xfs_bitmap_init(&ra.agmetablocks);
501
502 /* Find all space used by the free space btrees & rmapbt. */
503 cur = xfs_rmapbt_init_cursor(mp, sc->tp, agf_bp, sc->sa.agno);
504 error = xfs_rmap_query_all(cur, xrep_agfl_walk_rmap, &ra);
505 if (error)
506 goto err;
507 xfs_btree_del_cursor(cur, error);
508
509 /* Find all blocks currently being used by the bnobt. */
510 cur = xfs_allocbt_init_cursor(mp, sc->tp, agf_bp, sc->sa.agno,
511 XFS_BTNUM_BNO);
512 error = xfs_bitmap_set_btblocks(&ra.agmetablocks, cur);
513 if (error)
514 goto err;
515 xfs_btree_del_cursor(cur, error);
516
517 /* Find all blocks currently being used by the cntbt. */
518 cur = xfs_allocbt_init_cursor(mp, sc->tp, agf_bp, sc->sa.agno,
519 XFS_BTNUM_CNT);
520 error = xfs_bitmap_set_btblocks(&ra.agmetablocks, cur);
521 if (error)
522 goto err;
523
524 xfs_btree_del_cursor(cur, error);
525
526 /*
527 * Drop the freesp meta blocks that are in use by btrees.
528 * The remaining blocks /should/ be AGFL blocks.
529 */
530 error = xfs_bitmap_disunion(agfl_extents, &ra.agmetablocks);
531 xfs_bitmap_destroy(&ra.agmetablocks);
532 if (error)
533 return error;
534
535 /*
536 * Calculate the new AGFL size. If we found more blocks than fit in
537 * the AGFL we'll free them later.
538 */
539 *flcount = 0;
540 for_each_xfs_bitmap_extent(br, n, agfl_extents) {
541 *flcount += br->len;
542 if (*flcount > xfs_agfl_size(mp))
543 break;
544 }
545 if (*flcount > xfs_agfl_size(mp))
546 *flcount = xfs_agfl_size(mp);
547 return 0;
548
549err:
550 xfs_bitmap_destroy(&ra.agmetablocks);
551 xfs_btree_del_cursor(cur, error);
552 return error;
553}
554
555/* Update the AGF and reset the in-core state. */
556STATIC void
557xrep_agfl_update_agf(
558 struct xfs_scrub *sc,
559 struct xfs_buf *agf_bp,
560 xfs_agblock_t flcount)
561{
562 struct xfs_agf *agf = XFS_BUF_TO_AGF(agf_bp);
563
564 ASSERT(flcount <= xfs_agfl_size(sc->mp));
565
566 /* Trigger fdblocks recalculation */
567 xfs_force_summary_recalc(sc->mp);
568
569 /* Update the AGF counters. */
570 if (sc->sa.pag->pagf_init)
571 sc->sa.pag->pagf_flcount = flcount;
572 agf->agf_flfirst = cpu_to_be32(0);
573 agf->agf_flcount = cpu_to_be32(flcount);
574 agf->agf_fllast = cpu_to_be32(flcount - 1);
575
576 xfs_alloc_log_agf(sc->tp, agf_bp,
577 XFS_AGF_FLFIRST | XFS_AGF_FLLAST | XFS_AGF_FLCOUNT);
578}
579
580/* Write out a totally new AGFL. */
581STATIC void
582xrep_agfl_init_header(
583 struct xfs_scrub *sc,
584 struct xfs_buf *agfl_bp,
585 struct xfs_bitmap *agfl_extents,
586 xfs_agblock_t flcount)
587{
588 struct xfs_mount *mp = sc->mp;
589 __be32 *agfl_bno;
590 struct xfs_bitmap_range *br;
591 struct xfs_bitmap_range *n;
592 struct xfs_agfl *agfl;
593 xfs_agblock_t agbno;
594 unsigned int fl_off;
595
596 ASSERT(flcount <= xfs_agfl_size(mp));
597
598 /*
599 * Start rewriting the header by setting the bno[] array to
600 * NULLAGBLOCK, then setting AGFL header fields.
601 */
602 agfl = XFS_BUF_TO_AGFL(agfl_bp);
603 memset(agfl, 0xFF, BBTOB(agfl_bp->b_length));
604 agfl->agfl_magicnum = cpu_to_be32(XFS_AGFL_MAGIC);
605 agfl->agfl_seqno = cpu_to_be32(sc->sa.agno);
606 uuid_copy(&agfl->agfl_uuid, &mp->m_sb.sb_meta_uuid);
607
608 /*
609 * Fill the AGFL with the remaining blocks. If agfl_extents has more
610 * blocks than fit in the AGFL, they will be freed in a subsequent
611 * step.
612 */
613 fl_off = 0;
614 agfl_bno = XFS_BUF_TO_AGFL_BNO(mp, agfl_bp);
615 for_each_xfs_bitmap_extent(br, n, agfl_extents) {
616 agbno = XFS_FSB_TO_AGBNO(mp, br->start);
617
618 trace_xrep_agfl_insert(mp, sc->sa.agno, agbno, br->len);
619
620 while (br->len > 0 && fl_off < flcount) {
621 agfl_bno[fl_off] = cpu_to_be32(agbno);
622 fl_off++;
623 agbno++;
624
625 /*
626 * We've now used br->start by putting it in the AGFL,
627 * so bump br so that we don't reap the block later.
628 */
629 br->start++;
630 br->len--;
631 }
632
633 if (br->len)
634 break;
635 list_del(&br->list);
636 kmem_free(br);
637 }
638
639 /* Write new AGFL to disk. */
640 xfs_trans_buf_set_type(sc->tp, agfl_bp, XFS_BLFT_AGFL_BUF);
641 xfs_trans_log_buf(sc->tp, agfl_bp, 0, BBTOB(agfl_bp->b_length) - 1);
642}
643
644/* Repair the AGFL. */
645int
646xrep_agfl(
647 struct xfs_scrub *sc)
648{
649 struct xfs_owner_info oinfo;
650 struct xfs_bitmap agfl_extents;
651 struct xfs_mount *mp = sc->mp;
652 struct xfs_buf *agf_bp;
653 struct xfs_buf *agfl_bp;
654 xfs_agblock_t flcount;
655 int error;
656
657 /* We require the rmapbt to rebuild anything. */
658 if (!xfs_sb_version_hasrmapbt(&mp->m_sb))
659 return -EOPNOTSUPP;
660
661 xchk_perag_get(sc->mp, &sc->sa);
662 xfs_bitmap_init(&agfl_extents);
663
664 /*
665 * Read the AGF so that we can query the rmapbt. We hope that there's
666 * nothing wrong with the AGF, but all the AG header repair functions
667 * have this chicken-and-egg problem.
668 */
669 error = xfs_alloc_read_agf(mp, sc->tp, sc->sa.agno, 0, &agf_bp);
670 if (error)
671 return error;
672 if (!agf_bp)
673 return -ENOMEM;
674
675 /*
676 * Make sure we have the AGFL buffer, as scrub might have decided it
677 * was corrupt after xfs_alloc_read_agfl failed with -EFSCORRUPTED.
678 */
679 error = xfs_trans_read_buf(mp, sc->tp, mp->m_ddev_targp,
680 XFS_AG_DADDR(mp, sc->sa.agno, XFS_AGFL_DADDR(mp)),
681 XFS_FSS_TO_BB(mp, 1), 0, &agfl_bp, NULL);
682 if (error)
683 return error;
684 agfl_bp->b_ops = &xfs_agfl_buf_ops;
685
686 /* Gather all the extents we're going to put on the new AGFL. */
687 error = xrep_agfl_collect_blocks(sc, agf_bp, &agfl_extents, &flcount);
688 if (error)
689 goto err;
690
691 /*
692 * Update AGF and AGFL. We reset the global free block counter when
693 * we adjust the AGF flcount (which can fail) so avoid updating any
694 * buffers until we know that part works.
695 */
696 xrep_agfl_update_agf(sc, agf_bp, flcount);
697 xrep_agfl_init_header(sc, agfl_bp, &agfl_extents, flcount);
698
699 /*
700 * Ok, the AGFL should be ready to go now. Roll the transaction to
701 * make the new AGFL permanent before we start using it to return
702 * freespace overflow to the freespace btrees.
703 */
704 sc->sa.agf_bp = agf_bp;
705 sc->sa.agfl_bp = agfl_bp;
706 error = xrep_roll_ag_trans(sc);
707 if (error)
708 goto err;
709
710 /* Dump any AGFL overflow. */
711 xfs_rmap_ag_owner(&oinfo, XFS_RMAP_OWN_AG);
712 return xrep_reap_extents(sc, &agfl_extents, &oinfo, XFS_AG_RESV_AGFL);
713err:
714 xfs_bitmap_destroy(&agfl_extents);
715 return error;
716}
Darrick J. Wong13942aa2018-08-09 22:43:04 -0700717
718/* AGI */
719
720/*
721 * Offset within the xrep_find_ag_btree array for each btree type. Avoid the
722 * XFS_BTNUM_ names here to avoid creating a sparse array.
723 */
724enum {
725 XREP_AGI_INOBT = 0,
726 XREP_AGI_FINOBT,
727 XREP_AGI_END,
728 XREP_AGI_MAX
729};
730
731/*
732 * Given the inode btree roots described by *fab, find the roots, check them
733 * for sanity, and pass the root data back out via *fab.
734 */
735STATIC int
736xrep_agi_find_btrees(
737 struct xfs_scrub *sc,
738 struct xrep_find_ag_btree *fab)
739{
740 struct xfs_buf *agf_bp;
741 struct xfs_mount *mp = sc->mp;
742 int error;
743
744 /* Read the AGF. */
745 error = xfs_alloc_read_agf(mp, sc->tp, sc->sa.agno, 0, &agf_bp);
746 if (error)
747 return error;
748 if (!agf_bp)
749 return -ENOMEM;
750
751 /* Find the btree roots. */
752 error = xrep_find_ag_btree_roots(sc, agf_bp, fab, NULL);
753 if (error)
754 return error;
755
756 /* We must find the inobt root. */
757 if (!xrep_check_btree_root(sc, &fab[XREP_AGI_INOBT]))
758 return -EFSCORRUPTED;
759
760 /* We must find the finobt root if that feature is enabled. */
761 if (xfs_sb_version_hasfinobt(&mp->m_sb) &&
762 !xrep_check_btree_root(sc, &fab[XREP_AGI_FINOBT]))
763 return -EFSCORRUPTED;
764
765 return 0;
766}
767
768/*
769 * Reinitialize the AGI header, making an in-core copy of the old contents so
770 * that we know which in-core state needs to be reinitialized.
771 */
772STATIC void
773xrep_agi_init_header(
774 struct xfs_scrub *sc,
775 struct xfs_buf *agi_bp,
776 struct xfs_agi *old_agi)
777{
778 struct xfs_agi *agi = XFS_BUF_TO_AGI(agi_bp);
779 struct xfs_mount *mp = sc->mp;
780
781 memcpy(old_agi, agi, sizeof(*old_agi));
782 memset(agi, 0, BBTOB(agi_bp->b_length));
783 agi->agi_magicnum = cpu_to_be32(XFS_AGI_MAGIC);
784 agi->agi_versionnum = cpu_to_be32(XFS_AGI_VERSION);
785 agi->agi_seqno = cpu_to_be32(sc->sa.agno);
786 agi->agi_length = cpu_to_be32(xfs_ag_block_count(mp, sc->sa.agno));
787 agi->agi_newino = cpu_to_be32(NULLAGINO);
788 agi->agi_dirino = cpu_to_be32(NULLAGINO);
789 if (xfs_sb_version_hascrc(&mp->m_sb))
790 uuid_copy(&agi->agi_uuid, &mp->m_sb.sb_meta_uuid);
791
792 /* We don't know how to fix the unlinked list yet. */
793 memcpy(&agi->agi_unlinked, &old_agi->agi_unlinked,
794 sizeof(agi->agi_unlinked));
795
796 /* Mark the incore AGF data stale until we're done fixing things. */
797 ASSERT(sc->sa.pag->pagi_init);
798 sc->sa.pag->pagi_init = 0;
799}
800
801/* Set btree root information in an AGI. */
802STATIC void
803xrep_agi_set_roots(
804 struct xfs_scrub *sc,
805 struct xfs_agi *agi,
806 struct xrep_find_ag_btree *fab)
807{
808 agi->agi_root = cpu_to_be32(fab[XREP_AGI_INOBT].root);
809 agi->agi_level = cpu_to_be32(fab[XREP_AGI_INOBT].height);
810
811 if (xfs_sb_version_hasfinobt(&sc->mp->m_sb)) {
812 agi->agi_free_root = cpu_to_be32(fab[XREP_AGI_FINOBT].root);
813 agi->agi_free_level = cpu_to_be32(fab[XREP_AGI_FINOBT].height);
814 }
815}
816
817/* Update the AGI counters. */
818STATIC int
819xrep_agi_calc_from_btrees(
820 struct xfs_scrub *sc,
821 struct xfs_buf *agi_bp)
822{
823 struct xfs_btree_cur *cur;
824 struct xfs_agi *agi = XFS_BUF_TO_AGI(agi_bp);
825 struct xfs_mount *mp = sc->mp;
826 xfs_agino_t count;
827 xfs_agino_t freecount;
828 int error;
829
830 cur = xfs_inobt_init_cursor(mp, sc->tp, agi_bp, sc->sa.agno,
831 XFS_BTNUM_INO);
832 error = xfs_ialloc_count_inodes(cur, &count, &freecount);
833 if (error)
834 goto err;
835 xfs_btree_del_cursor(cur, error);
836
837 agi->agi_count = cpu_to_be32(count);
838 agi->agi_freecount = cpu_to_be32(freecount);
839 return 0;
840err:
841 xfs_btree_del_cursor(cur, error);
842 return error;
843}
844
845/* Trigger reinitialization of the in-core data. */
846STATIC int
847xrep_agi_commit_new(
848 struct xfs_scrub *sc,
849 struct xfs_buf *agi_bp)
850{
851 struct xfs_perag *pag;
852 struct xfs_agi *agi = XFS_BUF_TO_AGI(agi_bp);
853
854 /* Trigger inode count recalculation */
855 xfs_force_summary_recalc(sc->mp);
856
857 /* Write this to disk. */
858 xfs_trans_buf_set_type(sc->tp, agi_bp, XFS_BLFT_AGI_BUF);
859 xfs_trans_log_buf(sc->tp, agi_bp, 0, BBTOB(agi_bp->b_length) - 1);
860
861 /* Now reinitialize the in-core counters if necessary. */
862 pag = sc->sa.pag;
863 pag->pagi_count = be32_to_cpu(agi->agi_count);
864 pag->pagi_freecount = be32_to_cpu(agi->agi_freecount);
865 pag->pagi_init = 1;
866
867 return 0;
868}
869
870/* Repair the AGI. */
871int
872xrep_agi(
873 struct xfs_scrub *sc)
874{
875 struct xrep_find_ag_btree fab[XREP_AGI_MAX] = {
876 [XREP_AGI_INOBT] = {
877 .rmap_owner = XFS_RMAP_OWN_INOBT,
878 .buf_ops = &xfs_inobt_buf_ops,
879 .magic = XFS_IBT_CRC_MAGIC,
880 },
881 [XREP_AGI_FINOBT] = {
882 .rmap_owner = XFS_RMAP_OWN_INOBT,
883 .buf_ops = &xfs_inobt_buf_ops,
884 .magic = XFS_FIBT_CRC_MAGIC,
885 },
886 [XREP_AGI_END] = {
887 .buf_ops = NULL
888 },
889 };
890 struct xfs_agi old_agi;
891 struct xfs_mount *mp = sc->mp;
892 struct xfs_buf *agi_bp;
893 struct xfs_agi *agi;
894 int error;
895
896 /* We require the rmapbt to rebuild anything. */
897 if (!xfs_sb_version_hasrmapbt(&mp->m_sb))
898 return -EOPNOTSUPP;
899
900 xchk_perag_get(sc->mp, &sc->sa);
901 /*
902 * Make sure we have the AGI buffer, as scrub might have decided it
903 * was corrupt after xfs_ialloc_read_agi failed with -EFSCORRUPTED.
904 */
905 error = xfs_trans_read_buf(mp, sc->tp, mp->m_ddev_targp,
906 XFS_AG_DADDR(mp, sc->sa.agno, XFS_AGI_DADDR(mp)),
907 XFS_FSS_TO_BB(mp, 1), 0, &agi_bp, NULL);
908 if (error)
909 return error;
910 agi_bp->b_ops = &xfs_agi_buf_ops;
911 agi = XFS_BUF_TO_AGI(agi_bp);
912
913 /* Find the AGI btree roots. */
914 error = xrep_agi_find_btrees(sc, fab);
915 if (error)
916 return error;
917
918 /* Start rewriting the header and implant the btrees we found. */
919 xrep_agi_init_header(sc, agi_bp, &old_agi);
920 xrep_agi_set_roots(sc, agi, fab);
921 error = xrep_agi_calc_from_btrees(sc, agi_bp);
922 if (error)
923 goto out_revert;
924
925 /* Reinitialize in-core state. */
926 return xrep_agi_commit_new(sc, agi_bp);
927
928out_revert:
929 /* Mark the incore AGI state stale and revert the AGI. */
930 sc->sa.pag->pagi_init = 0;
931 memcpy(agi, &old_agi, sizeof(old_agi));
932 return error;
933}