320 lines
12 KiB
Rust
320 lines
12 KiB
Rust
|
//! Import attestations and publish them to the network.
|
||
|
//!
|
||
|
//! This module gracefully handles attestations to unknown blocks by requeuing them and then
|
||
|
//! efficiently waiting for them to finish reprocessing (using an async yield).
|
||
|
//!
|
||
|
//! The following comments relate to the handling of duplicate attestations (relocated here during
|
||
|
//! refactoring):
|
||
|
//!
|
||
|
//! Skip to the next attestation since an attestation for this
|
||
|
//! validator is already known in this epoch.
|
||
|
//!
|
||
|
//! There's little value for the network in validating a second
|
||
|
//! attestation for another validator since it is either:
|
||
|
//!
|
||
|
//! 1. A duplicate.
|
||
|
//! 2. Slashable.
|
||
|
//! 3. Invalid.
|
||
|
//!
|
||
|
//! We are likely to get duplicates in the case where a VC is using
|
||
|
//! fallback BNs. If the first BN actually publishes some/all of a
|
||
|
//! batch of attestations but fails to respond in a timely fashion,
|
||
|
//! the VC is likely to try publishing the attestations on another
|
||
|
//! BN. That second BN may have already seen the attestations from
|
||
|
//! the first BN and therefore indicate that the attestations are
|
||
|
//! "already seen". An attestation that has already been seen has
|
||
|
//! been published on the network so there's no actual error from
|
||
|
//! the perspective of the user.
|
||
|
//!
|
||
|
//! It's better to prevent slashable attestations from ever
|
||
|
//! appearing on the network than trying to slash validators,
|
||
|
//! especially those validators connected to the local API.
|
||
|
//!
|
||
|
//! There might be *some* value in determining that this attestation
|
||
|
//! is invalid, but since a valid attestation already it exists it
|
||
|
//! appears that this validator is capable of producing valid
|
||
|
//! attestations and there's no immediate cause for concern.
|
||
|
use crate::task_spawner::{Priority, TaskSpawner};
|
||
|
use beacon_chain::{
|
||
|
validator_monitor::timestamp_now, AttestationError, BeaconChain, BeaconChainError,
|
||
|
BeaconChainTypes,
|
||
|
};
|
||
|
use beacon_processor::work_reprocessing_queue::{QueuedUnaggregate, ReprocessQueueMessage};
|
||
|
use eth2::types::Failure;
|
||
|
use lighthouse_network::PubsubMessage;
|
||
|
use network::NetworkMessage;
|
||
|
use slog::{debug, error, warn, Logger};
|
||
|
use std::sync::Arc;
|
||
|
use std::time::Duration;
|
||
|
use tokio::sync::{
|
||
|
mpsc::{Sender, UnboundedSender},
|
||
|
oneshot,
|
||
|
};
|
||
|
use types::Attestation;
|
||
|
|
||
|
// Error variants are only used in `Debug` and considered `dead_code` by the compiler.
|
||
|
#[derive(Debug)]
|
||
|
enum Error {
|
||
|
Validation(AttestationError),
|
||
|
Publication,
|
||
|
ForkChoice(#[allow(dead_code)] BeaconChainError),
|
||
|
AggregationPool(#[allow(dead_code)] AttestationError),
|
||
|
ReprocessDisabled,
|
||
|
ReprocessFull,
|
||
|
ReprocessTimeout,
|
||
|
}
|
||
|
|
||
|
enum PublishAttestationResult {
|
||
|
Success,
|
||
|
AlreadyKnown,
|
||
|
Reprocessing(oneshot::Receiver<Result<(), Error>>),
|
||
|
Failure(Error),
|
||
|
}
|
||
|
|
||
|
fn verify_and_publish_attestation<T: BeaconChainTypes>(
|
||
|
chain: &Arc<BeaconChain<T>>,
|
||
|
attestation: &Attestation<T::EthSpec>,
|
||
|
seen_timestamp: Duration,
|
||
|
network_tx: &UnboundedSender<NetworkMessage<T::EthSpec>>,
|
||
|
log: &Logger,
|
||
|
) -> Result<(), Error> {
|
||
|
let attestation = chain
|
||
|
.verify_unaggregated_attestation_for_gossip(attestation, None)
|
||
|
.map_err(Error::Validation)?;
|
||
|
|
||
|
// Publish.
|
||
|
network_tx
|
||
|
.send(NetworkMessage::Publish {
|
||
|
messages: vec![PubsubMessage::Attestation(Box::new((
|
||
|
attestation.subnet_id(),
|
||
|
attestation.attestation().clone(),
|
||
|
)))],
|
||
|
})
|
||
|
.map_err(|_| Error::Publication)?;
|
||
|
|
||
|
// Notify the validator monitor.
|
||
|
chain
|
||
|
.validator_monitor
|
||
|
.read()
|
||
|
.register_api_unaggregated_attestation(
|
||
|
seen_timestamp,
|
||
|
attestation.indexed_attestation(),
|
||
|
&chain.slot_clock,
|
||
|
);
|
||
|
|
||
|
let fc_result = chain.apply_attestation_to_fork_choice(&attestation);
|
||
|
let naive_aggregation_result = chain.add_to_naive_aggregation_pool(&attestation);
|
||
|
|
||
|
if let Err(e) = &fc_result {
|
||
|
warn!(
|
||
|
log,
|
||
|
"Attestation invalid for fork choice";
|
||
|
"err" => ?e,
|
||
|
);
|
||
|
}
|
||
|
if let Err(e) = &naive_aggregation_result {
|
||
|
warn!(
|
||
|
log,
|
||
|
"Attestation invalid for aggregation";
|
||
|
"err" => ?e
|
||
|
);
|
||
|
}
|
||
|
|
||
|
if let Err(e) = fc_result {
|
||
|
Err(Error::ForkChoice(e))
|
||
|
} else if let Err(e) = naive_aggregation_result {
|
||
|
Err(Error::AggregationPool(e))
|
||
|
} else {
|
||
|
Ok(())
|
||
|
}
|
||
|
}
|
||
|
|
||
|
pub async fn publish_attestations<T: BeaconChainTypes>(
|
||
|
task_spawner: TaskSpawner<T::EthSpec>,
|
||
|
chain: Arc<BeaconChain<T>>,
|
||
|
attestations: Vec<Attestation<T::EthSpec>>,
|
||
|
network_tx: UnboundedSender<NetworkMessage<T::EthSpec>>,
|
||
|
reprocess_send: Option<Sender<ReprocessQueueMessage>>,
|
||
|
log: Logger,
|
||
|
) -> Result<(), warp::Rejection> {
|
||
|
// Collect metadata about attestations which we'll use to report failures. We need to
|
||
|
// move the `attestations` vec into the blocking task, so this small overhead is unavoidable.
|
||
|
let attestation_metadata = attestations
|
||
|
.iter()
|
||
|
.map(|att| (att.data.slot, att.data.index))
|
||
|
.collect::<Vec<_>>();
|
||
|
|
||
|
// Gossip validate and publish attestations that can be immediately processed.
|
||
|
let seen_timestamp = timestamp_now();
|
||
|
let inner_log = log.clone();
|
||
|
let mut prelim_results = task_spawner
|
||
|
.blocking_task(Priority::P0, move || {
|
||
|
Ok(attestations
|
||
|
.into_iter()
|
||
|
.map(|attestation| {
|
||
|
match verify_and_publish_attestation(
|
||
|
&chain,
|
||
|
&attestation,
|
||
|
seen_timestamp,
|
||
|
&network_tx,
|
||
|
&inner_log,
|
||
|
) {
|
||
|
Ok(()) => PublishAttestationResult::Success,
|
||
|
Err(Error::Validation(AttestationError::UnknownHeadBlock {
|
||
|
beacon_block_root,
|
||
|
})) => {
|
||
|
let Some(reprocess_tx) = &reprocess_send else {
|
||
|
return PublishAttestationResult::Failure(Error::ReprocessDisabled);
|
||
|
};
|
||
|
// Re-process.
|
||
|
let (tx, rx) = oneshot::channel();
|
||
|
let reprocess_chain = chain.clone();
|
||
|
let reprocess_network_tx = network_tx.clone();
|
||
|
let reprocess_log = inner_log.clone();
|
||
|
let reprocess_fn = move || {
|
||
|
let result = verify_and_publish_attestation(
|
||
|
&reprocess_chain,
|
||
|
&attestation,
|
||
|
seen_timestamp,
|
||
|
&reprocess_network_tx,
|
||
|
&reprocess_log,
|
||
|
);
|
||
|
// Ignore failure on the oneshot that reports the result. This
|
||
|
// shouldn't happen unless some catastrophe befalls the waiting
|
||
|
// thread which causes it to drop.
|
||
|
let _ = tx.send(result);
|
||
|
};
|
||
|
let reprocess_msg =
|
||
|
ReprocessQueueMessage::UnknownBlockUnaggregate(QueuedUnaggregate {
|
||
|
beacon_block_root,
|
||
|
process_fn: Box::new(reprocess_fn),
|
||
|
});
|
||
|
if reprocess_tx.try_send(reprocess_msg).is_err() {
|
||
|
PublishAttestationResult::Failure(Error::ReprocessFull)
|
||
|
} else {
|
||
|
PublishAttestationResult::Reprocessing(rx)
|
||
|
}
|
||
|
}
|
||
|
Err(Error::Validation(AttestationError::PriorAttestationKnown {
|
||
|
..
|
||
|
})) => PublishAttestationResult::AlreadyKnown,
|
||
|
Err(e) => PublishAttestationResult::Failure(e),
|
||
|
}
|
||
|
})
|
||
|
.map(Some)
|
||
|
.collect::<Vec<_>>())
|
||
|
})
|
||
|
.await?;
|
||
|
|
||
|
// Asynchronously wait for re-processing of attestations to unknown blocks. This avoids blocking
|
||
|
// any of the beacon processor workers while we wait for reprocessing.
|
||
|
let (reprocess_indices, reprocess_futures): (Vec<_>, Vec<_>) = prelim_results
|
||
|
.iter_mut()
|
||
|
.enumerate()
|
||
|
.filter_map(|(i, opt_result)| {
|
||
|
if let Some(PublishAttestationResult::Reprocessing(..)) = &opt_result {
|
||
|
let PublishAttestationResult::Reprocessing(rx) = opt_result.take()? else {
|
||
|
// Unreachable.
|
||
|
return None;
|
||
|
};
|
||
|
Some((i, rx))
|
||
|
} else {
|
||
|
None
|
||
|
}
|
||
|
})
|
||
|
.unzip();
|
||
|
let reprocess_results = futures::future::join_all(reprocess_futures).await;
|
||
|
|
||
|
// Join everything back together and construct a response.
|
||
|
// This part should be quick so we just stay in the Tokio executor's async task.
|
||
|
for (i, reprocess_result) in reprocess_indices.into_iter().zip(reprocess_results) {
|
||
|
let Some(result_entry) = prelim_results.get_mut(i) else {
|
||
|
error!(
|
||
|
log,
|
||
|
"Unreachable case in attestation publishing";
|
||
|
"case" => "prelim out of bounds",
|
||
|
"request_index" => i,
|
||
|
);
|
||
|
continue;
|
||
|
};
|
||
|
*result_entry = Some(match reprocess_result {
|
||
|
Ok(Ok(())) => PublishAttestationResult::Success,
|
||
|
// Attestation failed processing on re-process.
|
||
|
Ok(Err(Error::Validation(AttestationError::PriorAttestationKnown { .. }))) => {
|
||
|
PublishAttestationResult::AlreadyKnown
|
||
|
}
|
||
|
Ok(Err(e)) => PublishAttestationResult::Failure(e),
|
||
|
// Oneshot was dropped, indicating that the attestation either timed out in the
|
||
|
// reprocess queue or was dropped due to some error.
|
||
|
Err(_) => PublishAttestationResult::Failure(Error::ReprocessTimeout),
|
||
|
});
|
||
|
}
|
||
|
|
||
|
// Construct the response.
|
||
|
let mut failures = vec![];
|
||
|
let mut num_already_known = 0;
|
||
|
|
||
|
for (index, result) in prelim_results.iter().enumerate() {
|
||
|
match result {
|
||
|
Some(PublishAttestationResult::Success) => {}
|
||
|
Some(PublishAttestationResult::AlreadyKnown) => num_already_known += 1,
|
||
|
Some(PublishAttestationResult::Failure(e)) => {
|
||
|
if let Some((slot, committee_index)) = attestation_metadata.get(index) {
|
||
|
error!(
|
||
|
log,
|
||
|
"Failure verifying attestation for gossip";
|
||
|
"error" => ?e,
|
||
|
"request_index" => index,
|
||
|
"committee_index" => committee_index,
|
||
|
"attestation_slot" => slot,
|
||
|
);
|
||
|
failures.push(Failure::new(index, format!("{e:?}")));
|
||
|
} else {
|
||
|
error!(
|
||
|
log,
|
||
|
"Unreachable case in attestation publishing";
|
||
|
"case" => "out of bounds",
|
||
|
"request_index" => index
|
||
|
);
|
||
|
failures.push(Failure::new(index, "metadata logic error".into()));
|
||
|
}
|
||
|
}
|
||
|
Some(PublishAttestationResult::Reprocessing(_)) => {
|
||
|
error!(
|
||
|
log,
|
||
|
"Unreachable case in attestation publishing";
|
||
|
"case" => "reprocessing",
|
||
|
"request_index" => index
|
||
|
);
|
||
|
failures.push(Failure::new(index, "reprocess logic error".into()));
|
||
|
}
|
||
|
None => {
|
||
|
error!(
|
||
|
log,
|
||
|
"Unreachable case in attestation publishing";
|
||
|
"case" => "result is None",
|
||
|
"request_index" => index
|
||
|
);
|
||
|
failures.push(Failure::new(index, "result logic error".into()));
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
|
||
|
if num_already_known > 0 {
|
||
|
debug!(
|
||
|
log,
|
||
|
"Some unagg attestations already known";
|
||
|
"count" => num_already_known
|
||
|
);
|
||
|
}
|
||
|
|
||
|
if failures.is_empty() {
|
||
|
Ok(())
|
||
|
} else {
|
||
|
Err(warp_utils::reject::indexed_bad_request(
|
||
|
"error processing attestations".to_string(),
|
||
|
failures,
|
||
|
))
|
||
|
}
|
||
|
}
|