Only send earliest mismatched ancestor to replay (#31842)

Ashwin Sekar 2023-07-06 21:31:12 -07:00 committed by GitHub
parent 282e043177
commit c172dfd268
5 changed files with 261 additions and 198 deletions


@@ -487,18 +487,16 @@ impl AncestorHashesService {
                 // another ancestor repair request from the earliest returned
                 // ancestor from this search.
-                let potential_slots_to_repair = ancestor_request_decision.slots_to_repair();
-                // Now signal ReplayStage about the new updated slots. It's important to do this
+                let potential_slot_to_repair = ancestor_request_decision.slot_to_repair();
+                // Now signal ReplayStage about the new updated slot. It's important to do this
                 // AFTER we've removed the ancestor_hashes_status_ref in case replay
                 // then sends us another dead slot signal based on the updates we are
                 // about to send.
-                if let Some(slots_to_repair) = potential_slots_to_repair {
-                    if !slots_to_repair.is_empty() {
-                        // Signal ReplayStage to dump the fork that is descended from
-                        // `earliest_mismatched_slot_to_dump`.
-                        let _ = ancestor_duplicate_slots_sender.send(slots_to_repair);
-                    }
+                if let Some(slot_to_repair) = potential_slot_to_repair {
+                    // Signal ReplayStage to dump the fork that is descended from
+                    // `earliest_mismatched_slot_to_dump`.
+                    let _ = ancestor_duplicate_slots_sender.send(slot_to_repair);
                 }
             }
@@ -1233,9 +1231,12 @@ mod test {
         // Set up blockstore for responses
         let blockstore = Arc::new(Blockstore::open(&ledger_path).unwrap());
-        // Create slots [slot, slot + MAX_ANCESTOR_RESPONSES) with 5 shreds apiece
-        let (shreds, _) =
-            make_many_slot_entries(slot_to_query, MAX_ANCESTOR_RESPONSES as u64, 5);
+        // Create slots [slot - MAX_ANCESTOR_RESPONSES, slot) with 5 shreds apiece
+        let (shreds, _) = make_many_slot_entries(
+            slot_to_query - MAX_ANCESTOR_RESPONSES as Slot + 1,
+            MAX_ANCESTOR_RESPONSES as u64,
+            5,
+        );
         blockstore
             .insert_shreds(shreds, None, false)
             .expect("Expect successful ledger write");
@@ -1346,6 +1347,9 @@ mod test {
         }
     }

+    /// Creates valid fork up to `dead_slot - 1`
+    /// For `dead_slot - 1` insert the wrong `bank_hash`
+    /// Mark `dead_slot` as dead
     fn setup_dead_slot(
         dead_slot: Slot,
         correct_bank_hashes: &HashMap<Slot, Hash>,
@@ -1377,13 +1381,15 @@ mod test {
         blockstore
             .insert_shreds(shreds, None, false)
             .expect("Expect successful ledger write");
-        for duplicate_confirmed_slot in 0..dead_slot {
+        for duplicate_confirmed_slot in 0..(dead_slot - 1) {
             let bank_hash = correct_bank_hashes
                 .get(&duplicate_confirmed_slot)
                 .cloned()
                 .unwrap_or_else(Hash::new_unique);
             blockstore.insert_bank_hash(duplicate_confirmed_slot, bank_hash, true);
         }
+        // Insert wrong hash for `dead_slot - 1`
+        blockstore.insert_bank_hash(dead_slot - 1, Hash::new_unique(), false);
         blockstore.set_dead_slot(dead_slot).unwrap();
         replay_blockstore_components
     }
@@ -1532,16 +1538,16 @@ mod test {
         assert_eq!(slot, dead_slot);
         assert_eq!(
-            decision
-                .repair_status()
-                .unwrap()
-                .correct_ancestors_to_repair,
-            vec![(dead_slot, *correct_bank_hashes.get(&dead_slot).unwrap())]
+            decision.repair_status().unwrap().correct_ancestor_to_repair,
+            (
+                dead_slot - 1,
+                *correct_bank_hashes.get(&(dead_slot - 1)).unwrap()
+            )
         );
         assert_matches!(
             (decision, request_type),
             (
-                DuplicateAncestorDecision::EarliestAncestorNotFrozen(_),
+                DuplicateAncestorDecision::EarliestMismatchFound(_),
                 AncestorRequestType::DeadDuplicateConfirmed,
             )
         );
@@ -1567,7 +1573,7 @@ mod test {
         assert_eq!(ancestor_hashes_request_statuses.len(), 1);
         assert!(ancestor_hashes_request_statuses.contains_key(&dead_slot));
-        // Should have received valid response since pruned doesn't check hashes
+        // Should have received valid response
         let mut response_packet = response_receiver
             .recv_timeout(Duration::from_millis(10_000))
             .unwrap();
@@ -1591,10 +1597,17 @@ mod test {
             .unwrap();
         assert_eq!(slot, dead_slot);
+        assert_eq!(
+            decision.repair_status().unwrap().correct_ancestor_to_repair,
+            (
+                dead_slot - 1,
+                *correct_bank_hashes.get(&(dead_slot - 1)).unwrap()
+            )
+        );
         assert_matches!(
             (decision, request_type),
             (
-                DuplicateAncestorDecision::AncestorsAllMatch,
+                DuplicateAncestorDecision::EarliestMismatchFound(_),
                 AncestorRequestType::PopularPruned,
             )
        );
@@ -2024,16 +2037,16 @@ mod test {
         assert_eq!(slot, dead_slot);
         assert_eq!(
-            decision
-                .repair_status()
-                .unwrap()
-                .correct_ancestors_to_repair,
-            vec![(dead_slot, *correct_bank_hashes.get(&dead_slot).unwrap())]
+            decision.repair_status().unwrap().correct_ancestor_to_repair,
+            (
+                dead_slot - 1,
+                *correct_bank_hashes.get(&(dead_slot - 1)).unwrap()
+            )
         );
         assert_matches!(
             (decision, request_type),
             (
-                DuplicateAncestorDecision::EarliestAncestorNotFrozen(_),
+                DuplicateAncestorDecision::EarliestMismatchFound(_),
                 AncestorRequestType::DeadDuplicateConfirmed
             )
         );


@@ -35,10 +35,8 @@ const RETRY_INTERVAL_SECONDS: usize = 5;
 #[derive(Debug, PartialEq, Eq, Clone)]
 pub enum DuplicateAncestorDecision {
     InvalidSample,
-    AncestorsAllMatch,
     SampleNotDuplicateConfirmed,
     ContinueSearch(DuplicateSlotRepairStatus),
-    EarliestAncestorNotFrozen(DuplicateSlotRepairStatus),
     EarliestMismatchFound(DuplicateSlotRepairStatus),
     EarliestPrunedMismatchFound(DuplicateSlotRepairStatus),
 }
@@ -52,10 +50,7 @@ impl DuplicateAncestorDecision {
             // so retry
             | DuplicateAncestorDecision::SampleNotDuplicateConfirmed => true,
-            DuplicateAncestorDecision::AncestorsAllMatch => false,
             DuplicateAncestorDecision::ContinueSearch(_status)
-            | DuplicateAncestorDecision::EarliestAncestorNotFrozen(_status)
             | DuplicateAncestorDecision::EarliestMismatchFound(_status)
             | DuplicateAncestorDecision::EarliestPrunedMismatchFound(_status) => false,
         }
@@ -64,11 +59,9 @@ impl DuplicateAncestorDecision {
     pub fn repair_status(&self) -> Option<&DuplicateSlotRepairStatus> {
         match self {
             DuplicateAncestorDecision::InvalidSample
-            | DuplicateAncestorDecision::AncestorsAllMatch
             | DuplicateAncestorDecision::SampleNotDuplicateConfirmed => None,
             DuplicateAncestorDecision::ContinueSearch(status)
-            | DuplicateAncestorDecision::EarliestAncestorNotFrozen(status)
             | DuplicateAncestorDecision::EarliestMismatchFound(status)
             | DuplicateAncestorDecision::EarliestPrunedMismatchFound(status) => Some(status),
         }
@@ -77,11 +70,9 @@ impl DuplicateAncestorDecision {
     pub fn repair_status_mut(&mut self) -> Option<&mut DuplicateSlotRepairStatus> {
         match self {
             DuplicateAncestorDecision::InvalidSample
-            | DuplicateAncestorDecision::AncestorsAllMatch
             | DuplicateAncestorDecision::SampleNotDuplicateConfirmed => None,
             DuplicateAncestorDecision::ContinueSearch(status)
-            | DuplicateAncestorDecision::EarliestAncestorNotFrozen(status)
             | DuplicateAncestorDecision::EarliestMismatchFound(status)
             | DuplicateAncestorDecision::EarliestPrunedMismatchFound(status) => Some(status),
         }
@@ -90,25 +81,21 @@ impl DuplicateAncestorDecision {
 #[derive(Debug, Default, Clone, PartialEq, Eq)]
 pub struct DuplicateSlotRepairStatus {
-    // Any ancestor slots that are either missing or are mismatched.
+    // The first ancestor slot that is mismatched.
     // A mismatched ancestor slot is one that has been replayed (frozen)
     // that has a different hash than the one agreed upon by the sampled peers.
     //
     //
-    // These are the slots that need to be dumped in order to repair the correct
-    // versions. The hash is None if the slot is not frozen, because it's:
-    // 1) Dead
-    // 2) Hasn't been replayed
-    // 3) We don't have the slot in our Ledger
-    pub correct_ancestors_to_repair: Vec<(Slot, Hash)>,
+    // This is the slot that needs to be dumped in order to replay the originally requested slot.
+    pub correct_ancestor_to_repair: (Slot, Hash),
     pub repair_pubkey_and_addr: Option<(Pubkey, SocketAddr)>,
     pub start_ts: u64,
 }
 impl DuplicateSlotRepairStatus {
-    fn new(correct_ancestors_to_repair: Vec<(Slot, Hash)>) -> Self {
+    fn new(correct_ancestor_to_repair: (Slot, Hash)) -> Self {
         Self {
-            correct_ancestors_to_repair,
+            correct_ancestor_to_repair,
             repair_pubkey_and_addr: None,
             start_ts: timestamp(),
         }
@@ -128,19 +115,13 @@ impl AncestorRequestType {
     }
 }
-pub struct AncestorDuplicateSlotsToRepair {
-    // Slots that `ancestor_hashes_service` found that need to be repaired
-    pub slots_to_repair: Vec<(Slot, Hash)>,
+pub struct AncestorDuplicateSlotToRepair {
+    // Slot that `ancestor_hashes_service` found that needs to be repaired
+    pub slot_to_repair: (Slot, Hash),
     // Condition that initiated this request
     pub request_type: AncestorRequestType,
 }
-impl AncestorDuplicateSlotsToRepair {
-    pub fn is_empty(&self) -> bool {
-        self.slots_to_repair.is_empty()
-    }
-}
 #[derive(Debug, PartialEq, Eq)]
 pub struct AncestorRequestDecision {
     // The slot that initiated this request
@@ -152,7 +133,7 @@ pub struct AncestorRequestDecision {
 }
 impl AncestorRequestDecision {
-    pub fn slots_to_repair(self) -> Option<AncestorDuplicateSlotsToRepair> {
+    pub fn slot_to_repair(self) -> Option<AncestorDuplicateSlotToRepair> {
         let Self {
             request_type,
             mut decision,
@@ -160,8 +141,8 @@ impl AncestorRequestDecision {
         } = self;
         decision
             .repair_status_mut()
-            .map(|status| AncestorDuplicateSlotsToRepair {
-                slots_to_repair: std::mem::take(&mut status.correct_ancestors_to_repair),
+            .map(|status| AncestorDuplicateSlotToRepair {
+                slot_to_repair: std::mem::take(&mut status.correct_ancestor_to_repair),
                 request_type,
             })
     }
@@ -276,7 +257,7 @@ impl AncestorRequestStatus {
     fn handle_sampled_validators_reached_agreement(
         &mut self,
         blockstore: &Blockstore,
-        mut agreed_response: Vec<(Slot, Hash)>,
+        agreed_response: Vec<(Slot, Hash)>,
     ) -> DuplicateAncestorDecision {
         if agreed_response.is_empty() {
             info!(
@@ -350,15 +331,18 @@ impl AncestorRequestStatus {
                 return DuplicateAncestorDecision::InvalidSample;
             }
             (
-                Some((mismatch_i, DuplicateAncestorDecision::EarliestAncestorNotFrozen(_))),
+                Some((
+                    mismatch_i,
+                    DuplicateAncestorDecision::EarliestPrunedMismatchFound(_),
+                )),
                 true,
             ) => {
                 // In this case an earlier ancestor was not frozen in our blockstore,
                 // however this later ancestor is matching with our version. This most
                 // likely should never happen however it could happen if we initiate an
-                // ancestor_hashes request immediately after startup from snapshot, we will
-                // have a match for the snapshot bank, however we don't have any of the
-                // ancestors frozen
+                // ancestor_hashes request immediately after startup from snapshot on a
+                // pruned branch, we will have a match for the snapshot bank, however we
+                // don't have any of the ancestors frozen
                 let (mismatch_slot, mismatch_agreed_upon_hash) =
                     agreed_response[*mismatch_i];
                 info!(
@@ -366,8 +350,9 @@ impl AncestorRequestStatus {
                     was agreed upon by the cluster with hash {mismatch_agreed_upon_hash} but not
                     frozen in our blockstore. However for a later ancestor {ancestor_slot} we have
                     agreement on {our_frozen_hash} as the bank hash. This should only be possible if
-                    we have just started from snapshot and immediately encountered a duplicate block,
-                    otherwise something is seriously wrong. Continuing with the repair",
+                    we have just started from snapshot and immediately encountered a duplicate block on
+                    a popular pruned fork, otherwise something is seriously wrong. Continuing with the
+                    repair",
                     self.requested_mismatched_slot
                 );
             }
@@ -425,14 +410,14 @@ impl AncestorRequestStatus {
             // ancestors of our version of `self.requested_mismatched_slot`
             //
             // ```
-            //    1 - 2 - 3 - 5' - 6' (our current fork)
+            //    1 - 2 - 3 - 5' - 6 (our current fork)
             //   /
             // 0
             //   \
             //    1 - 2 - 4 - 5 - 6 (cluster agreed fork)
             // ```
             //
-            // In this case, if we make a AncestorsHashes(6) request for our dead slot 6', we may
+            // In this case, if we make a AncestorsHashes(6) request for our dead slot 6, we may
             // get a response with slot `4` in it, which is a slot that doesn't have a frozen
             // hash in blockstore yet because either:
             //
@@ -451,25 +436,47 @@ impl AncestorRequestStatus {
            // There are two cases:
            // 1) The first such mismatch `first_mismatch` appears somewhere BEFORE the slot `4` that is
            //    missing from our blockstore.
-            // 2) The first such mismatch `first_mismatch` appears immediately AFTER the slot `4` that is
+            // 2) The first such mismatch `first_mismatch` appears AFTER the slot `4` that is
            //    missing from our blockstore.
            //
-            // Because we know any mismatches will also trigger the mismatch casing earlier in
-            // the function, we will return `EarliestMismatchFound(first_mismatch)`. This will
-            // cause us to dump and repair `first_mismatch` and all its descendants, which should
-            // be the right behavior in both above cases.
+            // For (1), the earlier cases in this function will cause us to detect the
+            // mismatch, and stop until that slot is dumped and repaired.
+            // For (2), we continue searching until we find the mismatch. There must be a
+            // mismatch for us to have played the requested slot, and that mismatch will be
+            // found, or, if no mismatch is found, the last slot (the requested slot) will be
+            // dumped and repaired.
+            //
+            // In the rare case of multiple incorrect ancestors, where multiple cases of (1) and
+            // (2) are present, the accompanying code in replay `dump_then_repair` dumps
+            // descendants of the earliest mismatch that also have frozen hashes. Failing that,
+            // in extreme cases another round of ancestor or replay dump then repair will be
+            // necessary to fix the fork.
+            //
+            // One example of an extreme case requiring multiple rounds of dump then repair is as follows:
+            //
+            // ```
+            //    1 - 2 - 3 - 5' - 6' (our current fork)
+            //   /
+            // 0
+            //   \
+            //    1 - 2 - 4 - 5 - 6 (cluster agreed fork)
+            // ```
+            //
+            // In this case suppose we have the wrong version of 5, the correct version is
+            // supposed to chain to 4, and we also have the wrong version of 6; both versions
+            // chain to 5, however ours is the duplicate.
+            //
+            // The first round of ancestor repair will detect 5' using case (2) above, and
+            // replay will dump then repair it. Upon successful replay of 5, we see that 6 is
+            // still dead or has an incorrect hash. This will require another round of ancestor
+            // or replay dump then repair to fix.
             warn!(
                 "Blockstore is missing frozen hash for slot {},
                 which the cluster claims is an ancestor of dead slot {}. Potentially
                 our version of the dead slot chains to the wrong fork!",
                 ancestor_slot, self.requested_mismatched_slot
             );
-            earliest_erroring_ancestor = Some((
-                agreed_response.len() - i - 1,
-                DuplicateAncestorDecision::EarliestAncestorNotFrozen(
-                    DuplicateSlotRepairStatus::default(),
-                ),
-            ));
         }
         last_ancestor = *ancestor_slot;
     }
@@ -481,20 +488,26 @@ impl AncestorRequestStatus {
             if earliest_erroring_ancestor_index == agreed_response.len() - 1 {
                 // If the earliest ancestor is missing or a mismatch, then we need to keep searching
                 // for earlier mismatches
-                let repair_status = DuplicateSlotRepairStatus::new(agreed_response);
+                let repair_status =
+                    DuplicateSlotRepairStatus::new(*agreed_response.last().unwrap());
                 DuplicateAncestorDecision::ContinueSearch(repair_status)
             } else {
-                // We only need to look through the first `earliest_erroring_ancestor_index + 1`
-                // elements and dump/repair any mismatches.
-                agreed_response.truncate(earliest_erroring_ancestor_index + 1);
+                // We only need to dump and repair the earliest mismatching ancestor.
                 let repair_status = decision.repair_status_mut().unwrap();
-                repair_status.correct_ancestors_to_repair = agreed_response;
+                repair_status.correct_ancestor_to_repair =
+                    agreed_response[earliest_erroring_ancestor_index];
                 decision
             }
         } else {
             // If we haven't returned by now, this implies all the ancestors matched our versions
-            // of those ancestors. Only slot to dump and repair is `self.requested_mismatched_slot`
-            DuplicateAncestorDecision::AncestorsAllMatch
+            // of those ancestors, or are missing or incomplete. Only slot to dump and repair is
+            // `self.requested_mismatched_slot`
+            let repair_status = DuplicateSlotRepairStatus::new(*agreed_response.first().unwrap());
+            if self.request_type.is_pruned() {
+                DuplicateAncestorDecision::EarliestPrunedMismatchFound(repair_status)
+            } else {
+                DuplicateAncestorDecision::EarliestMismatchFound(repair_status)
+            }
         }
     }
@@ -869,18 +882,44 @@ pub mod tests {
                 .insert_bank_hash(slot, correct_hash, false);
         }
+        // We don't have the earlier ancestors because we just started up, however sample should
+        // not be rejected as invalid.
+        let DuplicateAncestorDecision::EarliestMismatchFound(repair_status) = run_add_multiple_correct_and_incorrect_responses(
+            vec![],
+            &mut test_setup,
+        ) else {
+            panic!("Incorrect decision")
+        };
+        assert_eq!(
+            repair_status.correct_ancestor_to_repair,
+            *test_setup.correct_ancestors_response.first().unwrap()
+        );
+    }
+
+    #[test]
+    fn test_add_multiple_responses_start_from_snapshot_missing_then_mismatch() {
+        let request_slot = 100;
+        let mut test_setup = setup_add_response_test(request_slot, 10);
+        // Only insert the later half in our blockstore, however make mistakes
+        for &(slot, _) in test_setup.correct_ancestors_response.iter().take(5) {
+            test_setup
+                .blockstore
+                .insert_bank_hash(slot, Hash::new_unique(), false);
+        }
         // We don't have the earlier ancestors because we just started up, however sample should
         // not be rejected as invalid.
         let repair_status =
             match run_add_multiple_correct_and_incorrect_responses(vec![], &mut test_setup) {
-                DuplicateAncestorDecision::ContinueSearch(repair_status) => repair_status,
+                DuplicateAncestorDecision::EarliestMismatchFound(repair_status) => repair_status,
                 x => panic!("Incorrect decision {x:?}"),
             };
-        // Expect to find everything in the `correct_ancestors_to_repair`.
+        // Expect to find the first mismatch that is present
         assert_eq!(
-            repair_status.correct_ancestors_to_repair,
-            test_setup.correct_ancestors_response
+            repair_status.correct_ancestor_to_repair,
+            test_setup.correct_ancestors_response[4]
         );
     }
@@ -899,18 +938,16 @@ pub mod tests {
         )];
         // We have no entries in the blockstore, so all the ancestors will be missing
-        match run_add_multiple_correct_and_incorrect_responses(
+        let DuplicateAncestorDecision::EarliestMismatchFound(repair_status) = run_add_multiple_correct_and_incorrect_responses(
             desired_incorrect_responses,
             &mut test_setup,
-        ) {
-            DuplicateAncestorDecision::ContinueSearch(repair_status) => {
-                assert_eq!(
-                    repair_status.correct_ancestors_to_repair,
-                    test_setup.correct_ancestors_response
-                );
-            }
-            x => panic!("Incorrect decision {x:?}"),
+        ) else {
+            panic!("Incorrect decision")
         };
+        assert_eq!(
+            repair_status.correct_ancestor_to_repair,
+            *test_setup.correct_ancestors_response.first().unwrap()
+        );
     }

     #[test]
@@ -939,11 +976,11 @@ pub mod tests {
         //
         // 1) If we skip slot 93, and insert mismatched slot 94 we're testing the order of
         //    events `Not frozen -> Mismatched hash` which should return
-        //    `EarliestAncestorNotFrozen`
+        //    `EarliestMismatchFound(94)`
         //
         // 2) If we insert mismatched slot 93, and skip slot 94 we're testing the order of
         //    events `Mismatched hash -> Not frozen`, which should return
-        //    `EarliestMismatchFound`
+        //    `EarliestMismatchFound(93)`
         test_setup
             .blockstore
             .insert_bank_hash(slot, Hash::new_unique(), false);
@@ -952,28 +989,19 @@ pub mod tests {
         let repair_status =
             match run_add_multiple_correct_and_incorrect_responses(vec![], &mut test_setup) {
-                DuplicateAncestorDecision::EarliestMismatchFound(repair_status)
-                    if insert_even_or_odds == 1 =>
-                {
-                    repair_status
-                }
-                DuplicateAncestorDecision::EarliestAncestorNotFrozen(repair_status)
-                    if insert_even_or_odds == 0 =>
-                {
-                    repair_status
-                }
+                DuplicateAncestorDecision::EarliestMismatchFound(repair_status) => repair_status,
                 x => panic!("Incorrect decision {x:?}"),
             };
-        // Expect to find everything after 92 in the `correct_ancestors_to_repair`.
-        let expected_mismatched_slots: Vec<(Slot, Hash)> = test_setup
+        // Expect to find 93 or 94 (see comment above)
+        let expected_mismatched = test_setup
             .correct_ancestors_response
             .into_iter()
-            .filter(|(slot, _)| *slot > 92)
-            .collect();
+            .find(|(slot, _)| *slot == if insert_even_or_odds == 0 { 94 } else { 93 })
+            .unwrap();
         assert_eq!(
-            repair_status.correct_ancestors_to_repair,
-            expected_mismatched_slots
+            repair_status.correct_ancestor_to_repair,
+            expected_mismatched
         );
     }
@@ -993,8 +1021,8 @@ pub mod tests {
         match run_add_multiple_correct_and_incorrect_responses(vec![], &mut test_setup) {
             DuplicateAncestorDecision::ContinueSearch(repair_status) => {
                 assert_eq!(
-                    repair_status.correct_ancestors_to_repair,
-                    test_setup.correct_ancestors_response
+                    repair_status.correct_ancestor_to_repair,
+                    *test_setup.correct_ancestors_response.last().unwrap()
                 );
             }
             x => panic!("Incorrect decision {x:?}"),
@@ -1032,15 +1060,16 @@ pub mod tests {
         // All the ancestors are mismatched, so we need to continue the search
         match run_add_multiple_correct_and_incorrect_responses(vec![], &mut test_setup) {
             DuplicateAncestorDecision::EarliestMismatchFound(repair_status) => {
-                // Expect to find everything after 92 in the `correct_ancestors_to_repair`.
-                let expected_mismatched_slots: Vec<(Slot, Hash)> = test_setup
+                // Expect to find the first slot after 92 in the `correct_ancestor_to_repair`.
+                let expected_mismatched = test_setup
                     .correct_ancestors_response
                     .into_iter()
-                    .filter(|(slot, _)| *slot > 92)
-                    .collect();
+                    .rev()
+                    .find(|(slot, _)| *slot > 92)
+                    .unwrap();
                 assert_eq!(
-                    repair_status.correct_ancestors_to_repair,
-                    expected_mismatched_slots
+                    repair_status.correct_ancestor_to_repair,
+                    expected_mismatched,
                 );
             }
             x => panic!("Incorrect decision {x:?}"),
@@ -1059,10 +1088,16 @@ pub mod tests {
                 .insert_bank_hash(slot, correct_hash, false);
         }
-        // All the ancestors matched
+        // All the ancestors matched, only the requested slot should be dumped
+        let DuplicateAncestorDecision::EarliestMismatchFound(repair_status) = run_add_multiple_correct_and_incorrect_responses(
+            vec![],
+            &mut test_setup,
+        ) else {
+            panic!("Incorrect decision")
+        };
         assert_eq!(
-            run_add_multiple_correct_and_incorrect_responses(vec![], &mut test_setup),
-            DuplicateAncestorDecision::AncestorsAllMatch
+            repair_status.correct_ancestor_to_repair,
+            *test_setup.correct_ancestors_response.first().unwrap()
         );
     }
@@ -1075,8 +1110,8 @@ pub mod tests {
         match run_add_multiple_correct_and_incorrect_responses(vec![], &mut test_setup) {
             DuplicateAncestorDecision::ContinueSearch(repair_status) => {
                 assert_eq!(
-                    repair_status.correct_ancestors_to_repair,
-                    test_setup.correct_ancestors_response
+                    repair_status.correct_ancestor_to_repair,
+                    *test_setup.correct_ancestors_response.last().unwrap()
                 );
             }
             x => panic!("Incorrect decision {x:?}"),
@@ -1097,10 +1132,16 @@ pub mod tests {
             .blockstore
             .add_tree(tree, true, true, 2, Hash::default());
-        // All the ancestors matched
+        // All the ancestors matched, only the requested slot should be dumped
+        let DuplicateAncestorDecision::EarliestPrunedMismatchFound(repair_status) = run_add_multiple_correct_and_incorrect_responses(
+            vec![],
+            &mut test_setup,
+        ) else {
+            panic!("Incorrect decision")
+        };
         assert_eq!(
-            run_add_multiple_correct_and_incorrect_responses(vec![], &mut test_setup),
-            DuplicateAncestorDecision::AncestorsAllMatch
+            repair_status.correct_ancestor_to_repair,
+            *test_setup.correct_ancestors_response.first().unwrap()
         );
     }
@@ -1135,15 +1176,16 @@ pub mod tests {
             x => panic!("Incorrect decision {x:?}"),
         };
-        // Expect to find everything after 93 in the `correct_ancestors_to_repair`.
-        let expected_mismatched_slots: Vec<(Slot, Hash)> = test_setup
+        // Expect to find first slot after 93 in the `correct_ancestor_to_repair`.
+        let expected_mismatched = test_setup
            .correct_ancestors_response
            .into_iter()
-            .filter(|(slot, _)| *slot > 93)
-            .collect();
+            .rev()
+            .find(|(slot, _)| *slot > 93)
+            .unwrap();
        assert_eq!(
-            repair_status.correct_ancestors_to_repair,
-            expected_mismatched_slots
+            repair_status.correct_ancestor_to_repair,
+            expected_mismatched,
        );
    }
@@ -1183,15 +1225,16 @@ pub mod tests {
             x => panic!("Incorrect decision {x:?}"),
         };
-        // Expect to find everything after 92 in the `correct_ancestors_to_repair`.
-        let expected_mismatched_slots: Vec<(Slot, Hash)> = test_setup
+        // Expect to find first slot after 92 in the `correct_ancestor_to_repair`.
+        let expected_mismatched = test_setup
             .correct_ancestors_response
             .into_iter()
-            .filter(|(slot, _)| *slot >= 93)
-            .collect();
+            .rev()
+            .find(|(slot, _)| *slot >= 93)
+            .unwrap();
         assert_eq!(
-            repair_status.correct_ancestors_to_repair,
-            expected_mismatched_slots
+            repair_status.correct_ancestor_to_repair,
+            expected_mismatched,
         );
     }
 }
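
To make the selection rule encoded by the hunks above concrete, here is a simplified, self-contained sketch. It is an illustration, not the upstream implementation: `Slot`, `Hash`, and the `Decision` enum are local stand-ins, the missing-vs-frozen distinction the real code tracks is collapsed into a single "disagrees" check, and the pruned variant (`EarliestPrunedMismatchFound`) is omitted.

```rust
use std::collections::HashMap;

// Local stand-ins for solana_sdk types; illustrative only.
type Slot = u64;
type Hash = [u8; 32];

enum Decision {
    // Even the earliest returned ancestor disagrees: ask for more ancestors below it.
    ContinueSearch(Slot),
    // Dump and repair exactly this one ancestor (or the requested slot itself).
    EarliestMismatchFound((Slot, Hash)),
}

// `agreed_response` is ordered from the requested slot down to the earliest returned
// ancestor, mirroring the ancestor hashes response handled above.
fn pick_earliest_mismatch(
    agreed_response: &[(Slot, Hash)],
    our_frozen_hashes: &HashMap<Slot, Hash>,
) -> Decision {
    assert!(!agreed_response.is_empty(), "empty samples are rejected upstream");
    // Walk from the earliest returned ancestor upward and stop at the first slot whose
    // local hash is absent or different from the cluster-agreed hash.
    let earliest_mismatch = agreed_response
        .iter()
        .rev()
        .find(|(slot, agreed_hash)| our_frozen_hashes.get(slot) != Some(agreed_hash));
    match earliest_mismatch {
        // Every returned ancestor matches: only the requested slot itself needs repair.
        None => Decision::EarliestMismatchFound(agreed_response[0]),
        Some(&(slot, hash)) => {
            if slot == agreed_response.last().unwrap().0 {
                // The earliest slot we were given already disagrees; search deeper.
                Decision::ContinueSearch(slot)
            } else {
                Decision::EarliestMismatchFound((slot, hash))
            }
        }
    }
}

fn main() {
    // Requested slot 6 is dead; we froze a wrong version of 5, so 5 is the single slot
    // that gets handed to dump-then-repair.
    let agreed: Vec<(Slot, Hash)> = vec![(6, [6; 32]), (5, [5; 32]), (4, [4; 32])];
    let ours: HashMap<Slot, Hash> = HashMap::from([(4, [4; 32]), (5, [55; 32])]);
    match pick_earliest_mismatch(&agreed, &ours) {
        Decision::EarliestMismatchFound((slot, _)) => println!("dump and repair only slot {slot}"),
        Decision::ContinueSearch(slot) => println!("request more ancestors below slot {slot}"),
    }
}
```

Under these assumptions, `ContinueSearch` corresponds to issuing another ancestor request from the earliest returned slot, while `EarliestMismatchFound` hands exactly one `(Slot, Hash)` to replay's dump-then-repair path, which is the behavioral change this commit makes.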


@@ -11,7 +11,7 @@ use {
     cluster_slots_service::cluster_slots::ClusterSlots,
     repair::{
         ancestor_hashes_service::{AncestorHashesReplayUpdateReceiver, AncestorHashesService},
-        duplicate_repair_status::AncestorDuplicateSlotsToRepair,
+        duplicate_repair_status::AncestorDuplicateSlotToRepair,
         outstanding_requests::OutstandingRequests,
         repair_weight::RepairWeight,
         serve_repair::{ServeRepair, ShredRepairType, REPAIR_PEERS_CACHE_CAPACITY},
@@ -52,8 +52,8 @@ use {
 const DEFER_REPAIR_THRESHOLD: Duration = Duration::from_millis(200);
 const DEFER_REPAIR_THRESHOLD_TICKS: u64 = DEFER_REPAIR_THRESHOLD.as_millis() as u64 / MS_PER_TICK;
-pub type AncestorDuplicateSlotsSender = CrossbeamSender<AncestorDuplicateSlotsToRepair>;
-pub type AncestorDuplicateSlotsReceiver = CrossbeamReceiver<AncestorDuplicateSlotsToRepair>;
+pub type AncestorDuplicateSlotsSender = CrossbeamSender<AncestorDuplicateSlotToRepair>;
+pub type AncestorDuplicateSlotsReceiver = CrossbeamReceiver<AncestorDuplicateSlotToRepair>;
 pub type ConfirmedSlotsSender = CrossbeamSender<Vec<Slot>>;
 pub type ConfirmedSlotsReceiver = CrossbeamReceiver<Vec<Slot>>;
 pub type DumpedSlotsSender = CrossbeamSender<Vec<(Slot, Hash)>>;
@@ -822,7 +822,7 @@ impl RepairService {
             .repair_request_duplicate_compute_best_peer(slot, cluster_slots, repair_validators)
             .ok();
         let new_duplicate_slot_repair_status = DuplicateSlotRepairStatus {
-            correct_ancestors_to_repair: vec![(slot, Hash::default())],
+            correct_ancestor_to_repair: (slot, Hash::default()),
             repair_pubkey_and_addr,
             start_ts: timestamp(),
         };
@@ -1206,7 +1206,7 @@ mod test {
         let dead_slot = 9;
         let receive_socket = &UdpSocket::bind("0.0.0.0:0").unwrap();
         let duplicate_status = DuplicateSlotRepairStatus {
-            correct_ancestors_to_repair: vec![(dead_slot, Hash::default())],
+            correct_ancestor_to_repair: (dead_slot, Hash::default()),
             start_ts: std::u64::MAX,
             repair_pubkey_and_addr: None,
         };
@@ -1313,7 +1313,7 @@ mod test {
         // Not enough time has passed, should not update the
         // address
         let mut duplicate_status = DuplicateSlotRepairStatus {
-            correct_ancestors_to_repair: vec![(dead_slot, Hash::default())],
+            correct_ancestor_to_repair: (dead_slot, Hash::default()),
             start_ts: std::u64::MAX,
             repair_pubkey_and_addr: dummy_addr,
         };
@@ -1328,7 +1328,7 @@ mod test {
         // If the repair address is None, should try to update
         let mut duplicate_status = DuplicateSlotRepairStatus {
-            correct_ancestors_to_repair: vec![(dead_slot, Hash::default())],
+            correct_ancestor_to_repair: (dead_slot, Hash::default()),
             start_ts: std::u64::MAX,
             repair_pubkey_and_addr: None,
         };
@@ -1343,7 +1343,7 @@ mod test {
         // If sufficient time has passed, should try to update
         let mut duplicate_status = DuplicateSlotRepairStatus {
-            correct_ancestors_to_repair: vec![(dead_slot, Hash::default())],
+            correct_ancestor_to_repair: (dead_slot, Hash::default()),
             start_ts: timestamp() - MAX_DUPLICATE_WAIT_MS as u64,
             repair_pubkey_and_addr: dummy_addr,
         };


@@ -22,7 +22,7 @@ use {
     repair::{
         ancestor_hashes_service::AncestorHashesReplayUpdateSender,
         cluster_slot_state_verifier::*,
-        duplicate_repair_status::AncestorDuplicateSlotsToRepair,
+        duplicate_repair_status::AncestorDuplicateSlotToRepair,
         repair_service::{
             AncestorDuplicateSlotsReceiver, DumpedSlotsSender, PopularPrunedForksReceiver,
         },
@@ -1416,46 +1416,42 @@ impl ReplayStage {
         purge_repair_slot_counter: &mut PurgeRepairSlotCounter,
     ) {
         let root = bank_forks.read().unwrap().root();
-        for AncestorDuplicateSlotsToRepair {
-            slots_to_repair: maybe_repairable_duplicate_slots,
+        for AncestorDuplicateSlotToRepair {
+            slot_to_repair: (epoch_slots_frozen_slot, epoch_slots_frozen_hash),
             request_type,
         } in ancestor_duplicate_slots_receiver.try_iter()
         {
             warn!(
-                "{} ReplayStage notified of duplicate slots from ancestor hashes service but we observed as {}: {:?}",
-                pubkey, if request_type.is_pruned() {"pruned"} else {"dead"}, maybe_repairable_duplicate_slots,
+                "{} ReplayStage notified of duplicate slot from ancestor hashes service but we observed as {}: {:?}",
+                pubkey, if request_type.is_pruned() {"pruned"} else {"dead"}, (epoch_slots_frozen_slot, epoch_slots_frozen_hash),
+            );
+            let epoch_slots_frozen_state = EpochSlotsFrozenState::new_from_state(
+                epoch_slots_frozen_slot,
+                epoch_slots_frozen_hash,
+                gossip_duplicate_confirmed_slots,
+                fork_choice,
+                || progress.is_dead(epoch_slots_frozen_slot).unwrap_or(false),
+                || {
+                    bank_forks
+                        .read()
+                        .unwrap()
+                        .get(epoch_slots_frozen_slot)
+                        .map(|b| b.hash())
+                },
+                request_type.is_pruned(),
+            );
+            check_slot_agrees_with_cluster(
+                epoch_slots_frozen_slot,
+                root,
+                blockstore,
+                duplicate_slots_tracker,
+                epoch_slots_frozen_slots,
+                fork_choice,
+                duplicate_slots_to_repair,
+                ancestor_hashes_replay_update_sender,
+                purge_repair_slot_counter,
+                SlotStateUpdate::EpochSlotsFrozen(epoch_slots_frozen_state),
             );
-            for (epoch_slots_frozen_slot, epoch_slots_frozen_hash) in
-                maybe_repairable_duplicate_slots.into_iter()
-            {
-                let epoch_slots_frozen_state = EpochSlotsFrozenState::new_from_state(
-                    epoch_slots_frozen_slot,
-                    epoch_slots_frozen_hash,
-                    gossip_duplicate_confirmed_slots,
-                    fork_choice,
-                    || progress.is_dead(epoch_slots_frozen_slot).unwrap_or(false),
-                    || {
-                        bank_forks
-                            .read()
-                            .unwrap()
-                            .get(epoch_slots_frozen_slot)
-                            .map(|b| b.hash())
-                    },
-                    request_type.is_pruned(),
-                );
-                check_slot_agrees_with_cluster(
-                    epoch_slots_frozen_slot,
-                    root,
-                    blockstore,
-                    duplicate_slots_tracker,
-                    epoch_slots_frozen_slots,
-                    fork_choice,
-                    duplicate_slots_to_repair,
-                    ancestor_hashes_replay_update_sender,
-                    purge_repair_slot_counter,
-                    SlotStateUpdate::EpochSlotsFrozen(epoch_slots_frozen_state),
-                );
-            }
         }
     }
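
Downstream of this diff, the handoff from the ancestor hashes service to replay is now one `(Slot, Hash)` per message instead of a `Vec`. The sketch below is a hypothetical, self-contained illustration of that contract: the struct and field names mirror the diff, but `std::sync::mpsc` and local type aliases stand in for the crossbeam-based `AncestorDuplicateSlotsSender`/`AncestorDuplicateSlotsReceiver` aliases shown earlier.

```rust
use std::sync::mpsc::channel;

// Local stand-ins for solana_sdk types; illustrative only.
type Slot = u64;
type Hash = [u8; 32];

#[allow(dead_code)]
#[derive(Debug)]
enum AncestorRequestType {
    DeadDuplicateConfirmed,
    PopularPruned,
}

// Mirrors the struct in the diff: exactly one (Slot, Hash) per message.
struct AncestorDuplicateSlotToRepair {
    slot_to_repair: (Slot, Hash),
    request_type: AncestorRequestType,
}

fn main() {
    let (sender, receiver) = channel::<AncestorDuplicateSlotToRepair>();

    // Ancestor hashes service side: send the single earliest mismatched ancestor.
    sender
        .send(AncestorDuplicateSlotToRepair {
            slot_to_repair: (5, [0u8; 32]),
            request_type: AncestorRequestType::DeadDuplicateConfirmed,
        })
        .unwrap();
    drop(sender);

    // Replay side: destructure the single slot directly; no inner loop over a Vec.
    for AncestorDuplicateSlotToRepair {
        slot_to_repair: (slot, _hash),
        request_type,
    } in receiver.try_iter()
    {
        println!("would dump and repair slot {slot} (request type: {request_type:?})");
    }
}
```

The point of the change is visible in the consumer loop: there is nothing left to iterate inside a message, so the inner `for` loop the old replay code needed is gone.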


@@ -16,10 +16,14 @@ use {
         validator::ValidatorConfig,
     },
     solana_download_utils::download_snapshot_archive,
+    solana_entry::entry::create_ticks,
     solana_gossip::{contact_info::LegacyContactInfo, gossip_service::discover_cluster},
     solana_ledger::{
-        ancestor_iterator::AncestorIterator, bank_forks_utils, blockstore::Blockstore,
-        blockstore_processor::ProcessOptions, leader_schedule::FixedSchedule,
+        ancestor_iterator::AncestorIterator,
+        bank_forks_utils,
+        blockstore::{entries_to_test_shreds, Blockstore},
+        blockstore_processor::ProcessOptions,
+        leader_schedule::FixedSchedule,
         use_snapshot_archives_at_startup::UseSnapshotArchivesAtStartup,
     },
     solana_local_cluster::{
@@ -80,7 +84,6 @@ use {
         thread::{sleep, Builder, JoinHandle},
         time::{Duration, Instant},
     },
-    trees::tr,
 };
 mod common;
@@ -4542,7 +4545,6 @@ fn test_duplicate_with_pruned_ancestor() {
         "28bN3xyvrP4E8LwEgtLjhnkb7cY4amQb6DrYAbAYjgRV4GAGgkVM2K7wnxnAS7WDneuavza7x21MiafLu1HkwQt4",
         "2saHBBoTkLMmttmPQP8KfBkcCw45S5cwtV3wTdGCscRC8uxdgvHxpHiWXKx4LvJjNJtnNcbSv5NdheokFFqnNDt8",
         "4mx9yoFBeYasDKBGDWCTWGJdWuJCKbgqmuP8bN9umybCh5Jzngw7KQxe99Rf5uzfyzgba1i65rJW4Wqk7Ab5S8ye",
-        "3zsEPEDsjfEay7te9XqNjRTCE7vwuT6u4DHzBJC19yp7GS8BuNRMRjnpVrKCBzb3d44kxc4KPGSHkCmk6tEfswCg",
     ]
     .iter()
     .map(|s| (Arc::new(Keypair::from_base58_string(s)), true))
@@ -4568,7 +4570,6 @@ fn test_duplicate_with_pruned_ancestor() {
     });
     let mut validator_configs = make_identical_validator_configs(&default_config, num_nodes);
-    validator_configs[3].voting_disabled = true;
     // Don't let majority produce anything past the fork by tricking its leader schedule
     validator_configs[0].fixed_leader_schedule = Some(FixedSchedule {
         leader_schedule: Arc::new(create_custom_leader_schedule(
@@ -4704,7 +4705,10 @@ fn test_duplicate_with_pruned_ancestor() {
     let last_majority_vote =
         wait_for_last_vote_in_tower_to_land_in_ledger(&majority_ledger_path, &majority_pubkey);
-    info!("Creating duplicate block built off of pruned branch for our node. Last majority vote {last_majority_vote}, Last minority vote {last_minority_vote}");
+    info!(
+        "Creating duplicate block built off of pruned branch for our node.
+        Last majority vote {last_majority_vote}, Last minority vote {last_minority_vote}"
+    );
     {
         {
             // Copy majority fork
@@ -4723,14 +4727,21 @@ fn test_duplicate_with_pruned_ancestor() {
             // Change last block parent to chain off of (purged) minority fork
             info!("For our node, changing parent of {last_majority_vote} to {last_minority_vote}");
-            purge_slots_with_count(&our_blockstore, last_majority_vote, 1);
-            our_blockstore.add_tree(
-                tr(last_minority_vote) / tr(last_majority_vote),
-                false,
-                true,
-                64,
+            our_blockstore.clear_unconfirmed_slot(last_majority_vote);
+            let entries = create_ticks(
+                64 * (std::cmp::max(1, last_majority_vote - last_minority_vote)),
+                0,
                 Hash::default(),
             );
+            let shreds = entries_to_test_shreds(
+                &entries,
+                last_majority_vote,
+                last_minority_vote,
+                true,
+                0,
+                true, // merkle_variant
+            );
+            our_blockstore.insert_shreds(shreds, None, false).unwrap();
             // Update the root to set minority fork back as pruned
             our_blockstore.set_last_root(fork_slot + fork_length);