Upgrade the parent lookup logic (#895)
* Upgrade the parent lookup logic
This commit is contained in:
parent
6b2e9ff246
commit
5d8a085880
@ -43,6 +43,7 @@ use eth2_libp2p::rpc::RequestId;
|
|||||||
use eth2_libp2p::PeerId;
|
use eth2_libp2p::PeerId;
|
||||||
use fnv::FnvHashMap;
|
use fnv::FnvHashMap;
|
||||||
use futures::prelude::*;
|
use futures::prelude::*;
|
||||||
|
use rand::seq::SliceRandom;
|
||||||
use slog::{crit, debug, error, info, trace, warn, Logger};
|
use slog::{crit, debug, error, info, trace, warn, Logger};
|
||||||
use smallvec::SmallVec;
|
use smallvec::SmallVec;
|
||||||
use std::boxed::Box;
|
use std::boxed::Box;
|
||||||
@ -160,8 +161,11 @@ pub struct SyncManager<T: BeaconChainTypes> {
|
|||||||
/// A collection of parent block lookups.
|
/// A collection of parent block lookups.
|
||||||
parent_queue: SmallVec<[ParentRequests<T::EthSpec>; 3]>,
|
parent_queue: SmallVec<[ParentRequests<T::EthSpec>; 3]>,
|
||||||
|
|
||||||
/// A collection of block hashes being searched for
|
/// A collection of block hashes being searched for and a flag indicating if a result has been
|
||||||
single_block_lookups: FnvHashMap<RequestId, Hash256>,
|
/// received or not.
|
||||||
|
///
|
||||||
|
/// The flag allows us to determine if the peer returned data or sent us nothing.
|
||||||
|
single_block_lookups: FnvHashMap<RequestId, (Hash256, bool)>,
|
||||||
|
|
||||||
/// The collection of known, connected, fully-sync'd peers.
|
/// The collection of known, connected, fully-sync'd peers.
|
||||||
full_peers: HashSet<PeerId>,
|
full_peers: HashSet<PeerId>,
|
||||||
@ -292,44 +296,74 @@ impl<T: BeaconChainTypes> SyncManager<T> {
|
|||||||
request_id: RequestId,
|
request_id: RequestId,
|
||||||
block: Option<SignedBeaconBlock<T::EthSpec>>,
|
block: Option<SignedBeaconBlock<T::EthSpec>>,
|
||||||
) {
|
) {
|
||||||
// check if this is a single block lookup - i.e we were searching for a specific hash
|
|
||||||
if block.is_some() {
|
|
||||||
if let Some(block_hash) = self.single_block_lookups.remove(&request_id) {
|
|
||||||
self.single_block_lookup_response(
|
|
||||||
peer_id,
|
|
||||||
block.expect("block exists"),
|
|
||||||
block_hash,
|
|
||||||
);
|
|
||||||
return;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
// this should be a response to a parent request search
|
|
||||||
// find the request
|
|
||||||
let mut parent_request = match self
|
|
||||||
.parent_queue
|
|
||||||
.iter()
|
|
||||||
.position(|request| request.pending == Some(request_id))
|
|
||||||
{
|
|
||||||
Some(pos) => self.parent_queue.remove(pos),
|
|
||||||
None => {
|
|
||||||
if block.is_some() {
|
|
||||||
// No pending request, invalid request_id or coding error
|
|
||||||
warn!(self.log, "BlocksByRoot response unknown"; "request_id" => request_id);
|
|
||||||
}
|
|
||||||
// it could be a stream termination None, in which case we just ignore it
|
|
||||||
return;
|
|
||||||
}
|
|
||||||
};
|
|
||||||
|
|
||||||
match block {
|
match block {
|
||||||
Some(block) => {
|
Some(block) => {
|
||||||
|
// data was returned, not just a stream termination
|
||||||
|
|
||||||
|
// check if this is a single block lookup - i.e we were searching for a specific hash
|
||||||
|
let mut single_block_hash = None;
|
||||||
|
if let Some((block_hash, data_received)) =
|
||||||
|
self.single_block_lookups.get_mut(&request_id)
|
||||||
|
{
|
||||||
|
// update the state of the lookup indicating a block was received from the peer
|
||||||
|
*data_received = true;
|
||||||
|
single_block_hash = Some(block_hash.clone());
|
||||||
|
}
|
||||||
|
if let Some(block_hash) = single_block_hash {
|
||||||
|
self.single_block_lookup_response(peer_id, block, block_hash);
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
|
||||||
|
// This wasn't a single block lookup request, it must be a response to a parent request search
|
||||||
|
// find the request
|
||||||
|
let mut parent_request = match self
|
||||||
|
.parent_queue
|
||||||
|
.iter()
|
||||||
|
.position(|request| request.pending == Some(request_id))
|
||||||
|
{
|
||||||
|
// we remove from the queue and process it. It will get re-added if required
|
||||||
|
Some(pos) => self.parent_queue.remove(pos),
|
||||||
|
None => {
|
||||||
|
// No pending request, invalid request_id or coding error
|
||||||
|
warn!(self.log, "BlocksByRoot response unknown"; "request_id" => request_id);
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
};
|
||||||
// add the block to response
|
// add the block to response
|
||||||
parent_request.downloaded_blocks.push(block);
|
parent_request.downloaded_blocks.push(block);
|
||||||
// queue for processing
|
// queue for processing
|
||||||
self.process_parent_request(parent_request);
|
self.process_parent_request(parent_request);
|
||||||
}
|
}
|
||||||
None => {
|
None => {
|
||||||
|
// this is a stream termination
|
||||||
|
|
||||||
|
// stream termination for a single block lookup, remove the key
|
||||||
|
if let Some((block_hash, data_received)) =
|
||||||
|
self.single_block_lookups.remove(&request_id)
|
||||||
|
{
|
||||||
|
// the peer didn't respond with a block that it referenced
|
||||||
|
if !data_received {
|
||||||
|
warn!(self.log, "Peer didn't respond with a block it referenced"; "referenced_block_hash" => format!("{}", block_hash), "peer_id" => format!("{}", peer_id));
|
||||||
|
self.network.downvote_peer(peer_id);
|
||||||
|
}
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
|
||||||
|
// This wasn't a single block lookup request, it must be a response to a parent request search
|
||||||
|
// find the request and remove it
|
||||||
|
let mut parent_request = match self
|
||||||
|
.parent_queue
|
||||||
|
.iter()
|
||||||
|
.position(|request| request.pending == Some(request_id))
|
||||||
|
{
|
||||||
|
Some(pos) => self.parent_queue.remove(pos),
|
||||||
|
None => {
|
||||||
|
// No pending request, the parent request has been processed and this is
|
||||||
|
// the resulting stream termination.
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
};
|
||||||
|
// An empty response has been returned to a parent request
|
||||||
// if an empty response is given, the peer didn't have the requested block, try again
|
// if an empty response is given, the peer didn't have the requested block, try again
|
||||||
parent_request.failed_attempts += 1;
|
parent_request.failed_attempts += 1;
|
||||||
parent_request.last_submitted_peer = peer_id;
|
parent_request.last_submitted_peer = peer_id;
|
||||||
@ -350,6 +384,7 @@ impl<T: BeaconChainTypes> SyncManager<T> {
|
|||||||
// verify the hash is correct and try and process the block
|
// verify the hash is correct and try and process the block
|
||||||
if expected_block_hash != block.canonical_root() {
|
if expected_block_hash != block.canonical_root() {
|
||||||
// the peer that sent this, sent us the wrong block
|
// the peer that sent this, sent us the wrong block
|
||||||
|
warn!(self.log, "Peer sent incorrect block for single block lookup"; "peer_id" => format!("{}", peer_id));
|
||||||
self.network.downvote_peer(peer_id);
|
self.network.downvote_peer(peer_id);
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
@ -405,7 +440,7 @@ impl<T: BeaconChainTypes> SyncManager<T> {
|
|||||||
}
|
}
|
||||||
|
|
||||||
// Make sure this block is not already being searched for
|
// Make sure this block is not already being searched for
|
||||||
// TODO: Potentially store a hashset of blocks for O(1) lookups
|
// NOTE: Potentially store a hashset of blocks for O(1) lookups
|
||||||
for parent_req in self.parent_queue.iter() {
|
for parent_req in self.parent_queue.iter() {
|
||||||
if parent_req
|
if parent_req
|
||||||
.downloaded_blocks
|
.downloaded_blocks
|
||||||
@ -440,18 +475,18 @@ impl<T: BeaconChainTypes> SyncManager<T> {
|
|||||||
};
|
};
|
||||||
|
|
||||||
if let Ok(request_id) = self.network.blocks_by_root_request(peer_id, request) {
|
if let Ok(request_id) = self.network.blocks_by_root_request(peer_id, request) {
|
||||||
self.single_block_lookups.insert(request_id, block_hash);
|
self.single_block_lookups
|
||||||
|
.insert(request_id, (block_hash, false));
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
fn inject_error(&mut self, peer_id: PeerId, request_id: RequestId) {
|
fn inject_error(&mut self, peer_id: PeerId, request_id: RequestId) {
|
||||||
trace!(self.log, "Sync manager received a failed RPC");
|
trace!(self.log, "Sync manager received a failed RPC");
|
||||||
// remove any single block lookups
|
// remove any single block lookups
|
||||||
self.single_block_lookups.remove(&request_id);
|
if self.single_block_lookups.remove(&request_id).is_some() {
|
||||||
|
// this was a single block request lookup, look no further
|
||||||
// notify the range sync
|
return;
|
||||||
self.range_sync
|
}
|
||||||
.inject_error(&mut self.network, peer_id.clone(), request_id);
|
|
||||||
|
|
||||||
// increment the failure of a parent lookup if the request matches a parent search
|
// increment the failure of a parent lookup if the request matches a parent search
|
||||||
if let Some(pos) = self
|
if let Some(pos) = self
|
||||||
@ -463,7 +498,12 @@ impl<T: BeaconChainTypes> SyncManager<T> {
|
|||||||
parent_request.failed_attempts += 1;
|
parent_request.failed_attempts += 1;
|
||||||
parent_request.last_submitted_peer = peer_id;
|
parent_request.last_submitted_peer = peer_id;
|
||||||
self.request_parent(parent_request);
|
self.request_parent(parent_request);
|
||||||
|
return;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// otherwise, this is a range sync issue, notify the range sync
|
||||||
|
self.range_sync
|
||||||
|
.inject_error(&mut self.network, peer_id.clone(), request_id);
|
||||||
}
|
}
|
||||||
|
|
||||||
fn peer_disconnect(&mut self, peer_id: &PeerId) {
|
fn peer_disconnect(&mut self, peer_id: &PeerId) {
|
||||||
@ -504,6 +544,7 @@ impl<T: BeaconChainTypes> SyncManager<T> {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/// A new block has been received for a parent lookup query, process it.
|
||||||
fn process_parent_request(&mut self, mut parent_request: ParentRequests<T::EthSpec>) {
|
fn process_parent_request(&mut self, mut parent_request: ParentRequests<T::EthSpec>) {
|
||||||
// verify the last added block is the parent of the last requested block
|
// verify the last added block is the parent of the last requested block
|
||||||
|
|
||||||
@ -512,7 +553,7 @@ impl<T: BeaconChainTypes> SyncManager<T> {
|
|||||||
self.log,
|
self.log,
|
||||||
"There must be at least two blocks in a parent request lookup at all times"
|
"There must be at least two blocks in a parent request lookup at all times"
|
||||||
);
|
);
|
||||||
panic!("There must be at least two blocks in parent request lookup at all time");
|
panic!("There must be at least two blocks in parent request lookup at all times");
|
||||||
// fail loudly
|
// fail loudly
|
||||||
}
|
}
|
||||||
let previous_index = parent_request.downloaded_blocks.len() - 2;
|
let previous_index = parent_request.downloaded_blocks.len() - 2;
|
||||||
@ -530,87 +571,135 @@ impl<T: BeaconChainTypes> SyncManager<T> {
|
|||||||
let _ = parent_request.downloaded_blocks.pop();
|
let _ = parent_request.downloaded_blocks.pop();
|
||||||
let peer = parent_request.last_submitted_peer.clone();
|
let peer = parent_request.last_submitted_peer.clone();
|
||||||
|
|
||||||
debug!(self.log, "Peer sent invalid parent.";
|
warn!(self.log, "Peer sent invalid parent.";
|
||||||
"peer_id" => format!("{:?}",peer),
|
"peer_id" => format!("{:?}",peer),
|
||||||
"received_block" => format!("{}", block_hash),
|
"received_block" => format!("{}", block_hash),
|
||||||
"expected_parent" => format!("{}", expected_hash),
|
"expected_parent" => format!("{}", expected_hash),
|
||||||
);
|
);
|
||||||
|
|
||||||
self.request_parent(parent_request);
|
self.request_parent(parent_request);
|
||||||
self.network.downvote_peer(peer);
|
self.network.downvote_peer(peer);
|
||||||
} else {
|
} else {
|
||||||
let mut successes = 0;
|
// The last block in the queue is the only one that has not attempted to be processed yet.
|
||||||
|
//
|
||||||
|
// The logic here attempts to process the last block. If it can be processed, the rest
|
||||||
|
// of the blocks must have known parents. If any of them cannot be processed, we
|
||||||
|
// consider the entire chain corrupt and drop it, notifying the user.
|
||||||
|
//
|
||||||
|
// If the last block in the queue cannot be processed, we also drop the entire queue.
|
||||||
|
// If the last block in the queue has an unknown parent, we continue the parent
|
||||||
|
// lookup-search.
|
||||||
|
|
||||||
// try and process the list of blocks up to the requested block
|
let total_blocks_to_process = parent_request.downloaded_blocks.len();
|
||||||
|
|
||||||
|
if let Some(chain) = self.chain.upgrade() {
|
||||||
|
let newest_block = parent_request
|
||||||
|
.downloaded_blocks
|
||||||
|
.pop()
|
||||||
|
.expect("There is always at least one block in the queue");
|
||||||
|
match chain.process_block(newest_block.clone()) {
|
||||||
|
Ok(BlockProcessingOutcome::ParentUnknown { .. }) => {
|
||||||
|
// need to keep looking for parents
|
||||||
|
// add the block back to the queue and continue the search
|
||||||
|
parent_request.downloaded_blocks.push(newest_block);
|
||||||
|
self.request_parent(parent_request);
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
Ok(BlockProcessingOutcome::Processed { .. })
|
||||||
|
| Ok(BlockProcessingOutcome::BlockIsAlreadyKnown { .. }) => {}
|
||||||
|
Ok(outcome) => {
|
||||||
|
// all else we consider the chain a failure and downvote the peer that sent
|
||||||
|
// us the last block
|
||||||
|
warn!(
|
||||||
|
self.log, "Invalid parent chain. Downvoting peer";
|
||||||
|
"outcome" => format!("{:?}", outcome),
|
||||||
|
"last_peer" => format!("{:?}", parent_request.last_submitted_peer),
|
||||||
|
);
|
||||||
|
self.network
|
||||||
|
.downvote_peer(parent_request.last_submitted_peer.clone());
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
Err(e) => {
|
||||||
|
warn!(
|
||||||
|
self.log, "Parent chain processing error. Downvoting peer";
|
||||||
|
"error" => format!("{:?}", e),
|
||||||
|
"last_peer" => format!("{:?}", parent_request.last_submitted_peer),
|
||||||
|
);
|
||||||
|
self.network
|
||||||
|
.downvote_peer(parent_request.last_submitted_peer.clone());
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
} else {
|
||||||
|
// chain doesn't exist, drop the parent queue and return
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
|
||||||
|
//TODO: Shift this to a block processing thread
|
||||||
|
|
||||||
|
// the last received block has been successfully processed, process all other blocks in the
|
||||||
|
// chain
|
||||||
while let Some(block) = parent_request.downloaded_blocks.pop() {
|
while let Some(block) = parent_request.downloaded_blocks.pop() {
|
||||||
// check if the chain exists
|
// check if the chain exists
|
||||||
if let Some(chain) = self.chain.upgrade() {
|
if let Some(chain) = self.chain.upgrade() {
|
||||||
match chain.process_block(block.clone()) {
|
match chain.process_block(block) {
|
||||||
Ok(BlockProcessingOutcome::ParentUnknown { .. }) => {
|
Ok(BlockProcessingOutcome::Processed { .. })
|
||||||
// need to keep looking for parents
|
| Ok(BlockProcessingOutcome::BlockIsAlreadyKnown { .. }) => {} // continue to the next block
|
||||||
parent_request.downloaded_blocks.push(block);
|
|
||||||
self.request_parent(parent_request);
|
// all else is considered a failure
|
||||||
break;
|
|
||||||
}
|
|
||||||
Ok(BlockProcessingOutcome::Processed { .. }) => successes += 1,
|
|
||||||
Ok(BlockProcessingOutcome::BlockIsAlreadyKnown { .. }) => {}
|
|
||||||
Ok(outcome) => {
|
Ok(outcome) => {
|
||||||
// it's a future slot or an invalid block, remove it and try again
|
// the previous blocks have failed, notify the user the chain lookup has
|
||||||
parent_request.failed_attempts += 1;
|
// failed and drop the parent queue
|
||||||
debug!(
|
debug!(
|
||||||
self.log, "Invalid parent block";
|
self.log, "Invalid parent chain. Past blocks failure";
|
||||||
"outcome" => format!("{:?}", outcome),
|
"outcome" => format!("{:?}", outcome),
|
||||||
"peer" => format!("{:?}", parent_request.last_submitted_peer),
|
"peer" => format!("{:?}", parent_request.last_submitted_peer),
|
||||||
);
|
);
|
||||||
self.network
|
self.network
|
||||||
.downvote_peer(parent_request.last_submitted_peer.clone());
|
.downvote_peer(parent_request.last_submitted_peer.clone());
|
||||||
self.request_parent(parent_request);
|
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
Err(e) => {
|
Err(e) => {
|
||||||
parent_request.failed_attempts += 1;
|
|
||||||
warn!(
|
warn!(
|
||||||
self.log, "Parent processing error";
|
self.log, "Parent chain processing error.";
|
||||||
"error" => format!("{:?}", e)
|
"error" => format!("{:?}", e)
|
||||||
);
|
);
|
||||||
self.network
|
self.network
|
||||||
.downvote_peer(parent_request.last_submitted_peer.clone());
|
.downvote_peer(parent_request.last_submitted_peer.clone());
|
||||||
self.request_parent(parent_request);
|
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
} else {
|
} else {
|
||||||
|
// chain doesn't exist, end the processing
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
if successes > 0 {
|
// at least one block has been processed, run fork-choice
|
||||||
if let Some(chain) = self.chain.upgrade() {
|
if let Some(chain) = self.chain.upgrade() {
|
||||||
match chain.fork_choice() {
|
match chain.fork_choice() {
|
||||||
Ok(()) => trace!(
|
Ok(()) => trace!(
|
||||||
self.log,
|
self.log,
|
||||||
"Fork choice success";
|
"Fork choice success";
|
||||||
"block_imports" => successes,
|
"block_imports" => total_blocks_to_process - parent_request.downloaded_blocks.len(),
|
||||||
"location" => "parent request"
|
"location" => "parent request"
|
||||||
),
|
),
|
||||||
Err(e) => error!(
|
Err(e) => error!(
|
||||||
self.log,
|
self.log,
|
||||||
"Fork choice failed";
|
"Fork choice failed";
|
||||||
"error" => format!("{:?}", e),
|
"error" => format!("{:?}", e),
|
||||||
"location" => "parent request"
|
"location" => "parent request"
|
||||||
),
|
),
|
||||||
};
|
};
|
||||||
}
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/// Progresses a parent request query.
|
||||||
|
///
|
||||||
|
/// This checks to ensure there a peers to progress the query, checks for failures and
|
||||||
|
/// initiates requests.
|
||||||
fn request_parent(&mut self, mut parent_request: ParentRequests<T::EthSpec>) {
|
fn request_parent(&mut self, mut parent_request: ParentRequests<T::EthSpec>) {
|
||||||
// check to make sure there are peers to search for the parent from
|
|
||||||
if self.full_peers.is_empty() {
|
|
||||||
return;
|
|
||||||
}
|
|
||||||
|
|
||||||
// check to make sure this request hasn't failed
|
// check to make sure this request hasn't failed
|
||||||
if parent_request.failed_attempts >= PARENT_FAIL_TOLERANCE
|
if parent_request.failed_attempts >= PARENT_FAIL_TOLERANCE
|
||||||
|| parent_request.downloaded_blocks.len() >= PARENT_DEPTH_TOLERANCE
|
|| parent_request.downloaded_blocks.len() >= PARENT_DEPTH_TOLERANCE
|
||||||
@ -622,21 +711,26 @@ impl<T: BeaconChainTypes> SyncManager<T> {
|
|||||||
return; // drop the request
|
return; // drop the request
|
||||||
}
|
}
|
||||||
|
|
||||||
let parent_hash = parent_request
|
let parent_hash = if let Some(block) = parent_request.downloaded_blocks.last() {
|
||||||
.downloaded_blocks
|
block.parent_root()
|
||||||
.last()
|
} else {
|
||||||
.expect("The parent queue should never be empty")
|
crit!(self.log, "Parent queue is empty. This should never happen");
|
||||||
.parent_root();
|
return;
|
||||||
|
};
|
||||||
|
|
||||||
let request = BlocksByRootRequest {
|
let request = BlocksByRootRequest {
|
||||||
block_roots: vec![parent_hash],
|
block_roots: vec![parent_hash],
|
||||||
};
|
};
|
||||||
// select a random fully synced peer to attempt to download the parent block
|
// select a random fully synced peer to attempt to download the parent block
|
||||||
let peer_id = self.full_peers.iter().next().expect("List is not empty");
|
let available_peers = self.full_peers.iter().collect::<Vec<_>>();
|
||||||
|
let peer_id = if let Some(peer_id) = available_peers.choose(&mut rand::thread_rng()) {
|
||||||
|
(**peer_id).clone()
|
||||||
|
} else {
|
||||||
|
// there were no peers to choose from. We drop the lookup request
|
||||||
|
return;
|
||||||
|
};
|
||||||
|
|
||||||
if let Ok(request_id) = self
|
if let Ok(request_id) = self.network.blocks_by_root_request(peer_id, request) {
|
||||||
.network
|
|
||||||
.blocks_by_root_request(peer_id.clone(), request)
|
|
||||||
{
|
|
||||||
// if the request was successful add the queue back into self
|
// if the request was successful add the queue back into self
|
||||||
parent_request.pending = Some(request_id);
|
parent_request.pending = Some(request_id);
|
||||||
self.parent_queue.push(parent_request);
|
self.parent_queue.push(parent_request);
|
||||||
|
Loading…
Reference in New Issue
Block a user