Fix scrub resume from newly created hole

It may happen that scan bookmark points to a block that was turned
into a part of a big hole.  In such case dsl_scan_visitbp() may skip
it and dsl_scan_check_resume() will not be called for it.  As result
new scan suspend won't be possible until the end of the object, that
may take hours if the object is a multi-terabyte ZVOL on a slow HDD
pool, stretching TXG to all that time, creating all sorts of problems.

This patch changes the resume condition to any greater or equal block,
so even if we miss the bookmarked block, the next one we find will
delete the bookmark, allowing new suspend.

Reviewed-by: Brian Behlendorf <behlendorf1@llnl.gov>
Reviewed-by: Ryan Moeller <ryan@iXsystems.com>
Signed-off-by: Alexander Motin <mav@FreeBSD.org>
Sponsored-By: iXsystems, Inc.
Closes #13643
This commit is contained in:
Alexander Motin 2022-07-20 20:02:36 -04:00 committed by GitHub
parent 97fd1ea42a
commit 33dba8c792
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
3 changed files with 23 additions and 7 deletions

View File

@ -696,6 +696,8 @@ extern void spa_handle_ignored_writes(spa_t *spa);
/* zbookmark_phys functions */ /* zbookmark_phys functions */
boolean_t zbookmark_subtree_completed(const struct dnode_phys *dnp, boolean_t zbookmark_subtree_completed(const struct dnode_phys *dnp,
const zbookmark_phys_t *subtree_root, const zbookmark_phys_t *last_block); const zbookmark_phys_t *subtree_root, const zbookmark_phys_t *last_block);
boolean_t zbookmark_subtree_tbd(const struct dnode_phys *dnp,
const zbookmark_phys_t *subtree_root, const zbookmark_phys_t *last_block);
int zbookmark_compare(uint16_t dbss1, uint8_t ibs1, uint16_t dbss2, int zbookmark_compare(uint16_t dbss1, uint8_t ibs1, uint16_t dbss2,
uint8_t ibs2, const zbookmark_phys_t *zb1, const zbookmark_phys_t *zb2); uint8_t ibs2, const zbookmark_phys_t *zb1, const zbookmark_phys_t *zb2);

View File

@ -1802,13 +1802,11 @@ dsl_scan_check_resume(dsl_scan_t *scn, const dnode_phys_t *dnp,
/* /*
* If we found the block we're trying to resume from, or * If we found the block we're trying to resume from, or
* we went past it to a different object, zero it out to * we went past it, zero it out to indicate that it's OK
* indicate that it's OK to start checking for suspending * to start checking for suspending again.
* again.
*/ */
if (memcmp(zb, &scn->scn_phys.scn_bookmark, if (zbookmark_subtree_tbd(dnp, zb,
sizeof (*zb)) == 0 || &scn->scn_phys.scn_bookmark)) {
zb->zb_object > scn->scn_phys.scn_bookmark.zb_object) {
dprintf("resuming at %llx/%llx/%llx/%llx\n", dprintf("resuming at %llx/%llx/%llx/%llx\n",
(longlong_t)zb->zb_objset, (longlong_t)zb->zb_objset,
(longlong_t)zb->zb_object, (longlong_t)zb->zb_object,

View File

@ -4997,7 +4997,7 @@ zbookmark_subtree_completed(const dnode_phys_t *dnp,
{ {
zbookmark_phys_t mod_zb = *subtree_root; zbookmark_phys_t mod_zb = *subtree_root;
mod_zb.zb_blkid++; mod_zb.zb_blkid++;
ASSERT(last_block->zb_level == 0); ASSERT0(last_block->zb_level);
/* The objset_phys_t isn't before anything. */ /* The objset_phys_t isn't before anything. */
if (dnp == NULL) if (dnp == NULL)
@ -5023,6 +5023,22 @@ zbookmark_subtree_completed(const dnode_phys_t *dnp,
last_block) <= 0); last_block) <= 0);
} }
/*
* This function is similar to zbookmark_subtree_completed(), but returns true
* if subtree_root is equal or ahead of last_block, i.e. still to be done.
*/
boolean_t
zbookmark_subtree_tbd(const dnode_phys_t *dnp,
const zbookmark_phys_t *subtree_root, const zbookmark_phys_t *last_block)
{
ASSERT0(last_block->zb_level);
if (dnp == NULL)
return (B_FALSE);
return (zbookmark_compare(dnp->dn_datablkszsec, dnp->dn_indblkshift,
1ULL << (DNODE_BLOCK_SHIFT - SPA_MINBLOCKSHIFT), 0, subtree_root,
last_block) >= 0);
}
EXPORT_SYMBOL(zio_type_name); EXPORT_SYMBOL(zio_type_name);
EXPORT_SYMBOL(zio_buf_alloc); EXPORT_SYMBOL(zio_buf_alloc);
EXPORT_SYMBOL(zio_data_buf_alloc); EXPORT_SYMBOL(zio_data_buf_alloc);