Fix duplicate column reconstruction race in reprocessing queue

This commit is contained in:
Jimmy Chen
2026-03-02 16:52:40 +11:00
parent 2f43d234d8
commit 4ad036a281

View File

@@ -257,7 +257,9 @@ struct ReprocessQueue<S> {
/// Light Client Updates per parent_root.
awaiting_lc_updates_per_parent_root: HashMap<Hash256, Vec<QueuedLightClientUpdateId>>,
/// Column reconstruction per block root.
queued_column_reconstructions: HashMap<Hash256, DelayKey>,
/// `Some(key)` = active timer in the delay queue.
/// `None` = reconstruction already fired, reject late messages.
queued_column_reconstructions: HashMap<Hash256, Option<DelayKey>>,
/// Queued backfill batches
queued_backfill_batches: Vec<QueuedBackfillBatch>,
@@ -772,15 +774,18 @@ impl<S: SlotClock> ReprocessQueue<S> {
reconstruction_delay = Duration::from_secs(0);
}
match self.queued_column_reconstructions.entry(request.block_root) {
Entry::Occupied(key) => {
self.column_reconstructions_delay_queue
.reset(key.get(), reconstruction_delay);
Entry::Occupied(entry) => {
if let Some(delay_key) = entry.get() {
self.column_reconstructions_delay_queue
.reset(delay_key, reconstruction_delay);
}
// `None`: reconstruction already fired for this block root, so the late request is dropped.
}
Entry::Vacant(vacant) => {
let delay_key = self
.column_reconstructions_delay_queue
.insert(request, reconstruction_delay);
vacant.insert(delay_key);
vacant.insert(Some(delay_key));
}
}
}
@@ -921,8 +926,12 @@ impl<S: SlotClock> ReprocessQueue<S> {
}
}
InboundEvent::ReadyColumnReconstruction(column_reconstruction) => {
let block_root = column_reconstruction.block_root;
// Drop `None` markers left by previously fired reconstructions (pending `Some` timers are kept) before marking the current one.
self.queued_column_reconstructions
.remove(&column_reconstruction.block_root);
.retain(|_, v| v.is_some());
// Mark as fired (prevents duplicate reconstruction from late messages)
self.queued_column_reconstructions.insert(block_root, None);
if self
.ready_work_tx
.try_send(ReadyWork::ColumnReconstruction(column_reconstruction))