Miscellaneous fixes to syncing, RPC, and responding to peers' sync-related requests (#3827)

- There was a bug in responding to blob range requests where we would incorrectly label the first slot of an epoch as non-skipped when it had in fact been skipped. This bug did not exist in the code for responding to block range requests because the logic error was mitigated by defensive coding elsewhere (see the sketch following this list).
- There was a bug where a block received during range sync without a corresponding blob (and vice versa) was incorrectly interpreted as a stream termination.
- RPC size limit fixes.
- Our blob cache was deadlocking, so I removed its use for now.
- Because we changed the finalized sync batch size from 2 to 1 and moved to exact epoch boundaries for batches (rather than one slot past the epoch boundary), finalized sync now needs to target 2 epochs + 1 slot past our peer's finalized slot in order to finalize the chain locally (a worked example follows the SyncingChain diff below).
- Use fork context bytes in RPC methods on both the server and client side.
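To make the first bullet concrete (this sketch is editorial and not part of the diff): the range handlers detect skipped slots by comparing each block root yielded by the forwards root iterator against the last root seen, because a skipped slot repeats the root of the most recent non-skipped block. A minimal Rust sketch of that filtering, with stand-in types instead of the real Hash256 and Slot:

// Stand-ins for the real types::Hash256 and types::Slot.
type Hash256 = [u8; 32];
type Slot = u64;

/// Map skipped slots to None. A skipped slot yields the same root as the slot
/// before it, so it is detected by comparing against the last root seen.
///
/// `last_block_root` should be seeded with the root at start_slot - 1 (the fix
/// in this commit). If it starts out as None, a skipped first slot can never
/// match anything and is mislabelled as non-skipped.
fn filter_skip_slots(
    roots: Vec<(Hash256, Slot)>,
    mut last_block_root: Option<Hash256>,
) -> Vec<Option<Hash256>> {
    roots
        .into_iter()
        .map(|(root, _slot)| {
            if Some(root) == last_block_root {
                None // repeated root: this slot was skipped
            } else {
                last_block_root = Some(root);
                Some(root)
            }
        })
        .collect()
}

With last_block_root seeded from the slot just before the request's start slot (as the BlocksByRange and BlobsByRange hunks below now do), a skipped first slot correctly maps to None instead of being treated as a block.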
realbigsean 2022-12-21 15:50:51 -05:00 committed by GitHub
parent cc420caaa5
commit 33d01a7911
6 changed files with 78 additions and 20 deletions


@ -298,8 +298,8 @@ impl<TSpec: EthSpec> Decoder for SSZSnappyOutboundCodec<TSpec> {
.rpc_response_limits::<TSpec>(&self.fork_context);
if ssz_limits.is_out_of_bounds(length, self.max_packet_size) {
return Err(RPCError::InvalidData(format!(
"RPC response length is out of bounds, length {}",
length
"RPC response length is out of bounds, length {}, max {}, min {}",
length, ssz_limits.max, ssz_limits.min
)));
}
// Calculate worst case compression length for given uncompressed length
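For context on the expanded error message, the bounds check compares the declared length against both the per-message SSZ limits and the overall packet size cap. A sketch of the shape of that check (the real RpcLimits lives in protocol.rs; treat the body as illustrative rather than a verbatim copy):

struct RpcLimits {
    min: usize,
    max: usize,
}

impl RpcLimits {
    /// True if `length` exceeds the smaller of the SSZ maximum and the
    /// transport's packet size cap, or is below the smallest valid encoding.
    fn is_out_of_bounds(&self, length: usize, max_packet_size: usize) -> bool {
        length > std::cmp::min(self.max, max_packet_size) || length < self.min
    }
}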
@ -439,6 +439,9 @@ fn context_bytes<T: EthSpec>(
SignedBeaconBlock::Base { .. } => Some(fork_context.genesis_context_bytes()),
};
}
if let RPCResponse::BlobsByRange(_) | RPCResponse::BlobsByRoot(_) = rpc_variant {
return fork_context.to_context_bytes(ForkName::Eip4844);
}
}
}
None


@ -107,6 +107,12 @@ lazy_static! {
.as_ssz_bytes()
.len();
pub static ref BLOBS_SIDECAR_MIN: usize = BlobsSidecar::<MainnetEthSpec>::empty().as_ssz_bytes().len();
pub static ref BLOBS_SIDECAR_MAX: usize = BlobsSidecar::<MainnetEthSpec>::max_size();
//FIXME(sean) these are underestimates
pub static ref SIGNED_BLOCK_AND_BLOBS_MIN: usize = *BLOBS_SIDECAR_MIN + *SIGNED_BEACON_BLOCK_BASE_MIN;
pub static ref SIGNED_BLOCK_AND_BLOBS_MAX: usize =*BLOBS_SIDECAR_MAX + *SIGNED_BEACON_BLOCK_EIP4844_MAX;
}
/// The maximum bytes that can be sent across the RPC pre-merge.
@ -358,11 +364,10 @@ impl ProtocolId {
Protocol::Goodbye => RpcLimits::new(0, 0), // Goodbye request has no response
Protocol::BlocksByRange => rpc_block_limits_by_fork(fork_context.current_fork()),
Protocol::BlocksByRoot => rpc_block_limits_by_fork(fork_context.current_fork()),
//FIXME(sean) add blob sizes
Protocol::BlobsByRange => rpc_block_limits_by_fork(fork_context.current_fork()),
Protocol::BlobsByRoot => rpc_block_limits_by_fork(fork_context.current_fork()),
Protocol::BlobsByRange => RpcLimits::new(*BLOBS_SIDECAR_MIN, *BLOBS_SIDECAR_MAX),
Protocol::BlobsByRoot => {
RpcLimits::new(*SIGNED_BLOCK_AND_BLOBS_MIN, *SIGNED_BLOCK_AND_BLOBS_MAX)
}
Protocol::Ping => RpcLimits::new(
<Ping as Encode>::ssz_fixed_len(),
<Ping as Encode>::ssz_fixed_len(),
@ -381,13 +386,16 @@ impl ProtocolId {
/// Returns `true` if the given `ProtocolId` should expect `context_bytes` in the
/// beginning of the stream, else returns `false`.
pub fn has_context_bytes(&self) -> bool {
if self.version == Version::V2 {
match self.message_name {
match self.version {
Version::V2 => match self.message_name {
Protocol::BlocksByRange | Protocol::BlocksByRoot => return true,
_ => return false,
}
},
Version::V1 => match self.message_name {
Protocol::BlobsByRange | Protocol::BlobsByRoot => return true,
_ => return false,
},
}
false
}
}
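With this change the V1 blob protocols also expect a 4-byte fork digest (the context bytes) at the start of each response chunk, matching what context_bytes now emits for BlobsByRange and BlobsByRoot on the encoding side. A simplified sketch of what the reading side does when has_context_bytes() is true (a hypothetical helper, not the codec's actual API):

/// Split the 4-byte fork digest off the front of a response chunk when the
/// protocol expects context bytes. The real codec reads this from the stream
/// and maps the digest back to a ForkName via the ForkContext.
fn split_context_bytes(
    has_context_bytes: bool,
    chunk: &[u8],
) -> Result<(Option<[u8; 4]>, &[u8]), &'static str> {
    if !has_context_bytes {
        return Ok((None, chunk));
    }
    if chunk.len() < 4 {
        return Err("chunk ended before the fork digest was read");
    }
    let mut digest = [0u8; 4];
    digest.copy_from_slice(&chunk[..4]);
    Ok((Some(digest), &chunk[4..]))
}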


@ -433,7 +433,17 @@ impl<T: BeaconChainTypes> Worker<T> {
};
// Pick out the required blocks, ignoring skip-slots.
let mut last_block_root = None;
let mut last_block_root = req
.start_slot
.checked_sub(1)
.map(|prev_slot| {
self.chain
.block_root_at_slot(Slot::new(prev_slot), WhenSlotSkipped::Prev)
})
.transpose()
.ok()
.flatten()
.flatten();
let maybe_block_roots = process_results(forwards_block_root_iter, |iter| {
iter.take_while(|(_, slot)| slot.as_u64() < req.start_slot.saturating_add(req.count))
// map skip slots to None
@ -602,7 +612,17 @@ impl<T: BeaconChainTypes> Worker<T> {
};
// Pick out the required blocks, ignoring skip-slots.
let mut last_block_root = None;
let mut last_block_root = req
.start_slot
.checked_sub(1)
.map(|prev_slot| {
self.chain
.block_root_at_slot(Slot::new(prev_slot), WhenSlotSkipped::Prev)
})
.transpose()
.ok()
.flatten()
.flatten();
let maybe_block_roots = process_results(forwards_block_root_iter, |iter| {
iter.take_while(|(_, slot)| slot.as_u64() < req.start_slot.saturating_add(req.count))
// map skip slots to None
@ -669,7 +689,7 @@ impl<T: BeaconChainTypes> Worker<T> {
self.log,
"BlobsByRange Response processed";
"peer" => %peer_id,
"msg" => "Failed to return all requested blocks",
"msg" => "Failed to return all requested blobs",
"start_slot" => req.start_slot,
"current_slot" => current_slot,
"requested" => req.count,


@ -314,14 +314,24 @@ impl<T: BeaconChainTypes> SyncNetworkContext<T> {
let (chain_id, batch_id, info) = entry.get_mut();
let chain_id = chain_id.clone();
let batch_id = batch_id.clone();
let stream_terminator = maybe_block.is_none();
info.add_block_response(maybe_block);
let maybe_block = info.pop_response().map(|block_sidecar_pair| {
let maybe_block_wrapped = info.pop_response().map(|block_sidecar_pair| {
BlockWrapper::BlockAndBlob { block_sidecar_pair }
});
if stream_terminator && !info.is_finished() {
return None;
}
if !stream_terminator && maybe_block_wrapped.is_none() {
return None;
}
if info.is_finished() {
entry.remove();
}
Some((chain_id, batch_id, maybe_block))
Some((chain_id, batch_id, maybe_block_wrapped))
}
Entry::Vacant(_) => None,
}
@ -356,13 +366,24 @@ impl<T: BeaconChainTypes> SyncNetworkContext<T> {
let (chain_id, batch_id, info) = entry.get_mut();
let chain_id = chain_id.clone();
let batch_id = batch_id.clone();
let stream_terminator = maybe_sidecar.is_none();
info.add_sidecar_response(maybe_sidecar);
let maybe_block = info
.pop_response()
.map(|block_sidecar_pair| BlockWrapper::BlockAndBlob { block_sidecar_pair });
if stream_terminator && !info.is_finished() {
return None;
}
if !stream_terminator && maybe_block.is_none() {
return None;
}
if info.is_finished() {
entry.remove();
}
Some((chain_id, batch_id, maybe_block))
}
Entry::Vacant(_) => None,
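The two hunks above implement the same decision for blocks and for sidecars: forward a coupled block-and-blobs item, wait for the other half of the pair, or treat the message as the end of the stream. The fix is that an empty response is only treated as a terminator, and only ends the request once both halves have finished, while a non-empty response that cannot yet be paired simply waits. A minimal sketch of that rule with hypothetical names (not the real SyncNetworkContext API):

/// What to do after receiving one half of a coupled block/blob response.
enum PairingOutcome<T> {
    /// Forward a fully paired item to the batch processor.
    Forward(T),
    /// Nothing to forward yet: the other half of the pair has not arrived.
    Wait,
    /// Both streams have terminated; the request is complete.
    Finished,
}

fn on_response<T>(
    is_stream_terminator: bool,
    popped_pair: Option<T>,
    both_sides_finished: bool,
) -> PairingOutcome<T> {
    match (is_stream_terminator, popped_pair) {
        // A terminator only ends the request once the block and blob streams
        // have both finished; otherwise keep waiting for the other side.
        (true, None) if both_sides_finished => PairingOutcome::Finished,
        (true, None) => PairingOutcome::Wait,
        // A block (or blob) with no pair to pop is NOT a termination: this
        // was the bug, which previously ended the stream early.
        (false, None) => PairingOutcome::Wait,
        // A completed pair is always forwarded.
        (_, Some(pair)) => PairingOutcome::Forward(pair),
    }
}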


@ -137,10 +137,16 @@ impl<T: BeaconChainTypes> SyncingChain<T> {
let id = SyncingChain::<T>::id(&target_head_root, &target_head_slot);
let target_slot = if is_finalized_segment {
target_head_slot + (2 * T::EthSpec::slots_per_epoch()) + 1
} else {
target_head_slot
};
SyncingChain {
id,
start_epoch,
target_head_slot,
target_head_slot: target_slot,
target_head_root,
batches: BTreeMap::new(),
peers,
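A worked example of the target adjustment above, assuming mainnet's 32 slots per epoch: if a peer reports a finalized slot of 6400 (the boundary of epoch 200), a finalized chain must now target slot 6400 + 2 * 32 + 1 = 6465 so that importing the final batch lets the local chain finalize.

/// Target slot for a finalized syncing chain, per the hunk above.
fn finalized_sync_target(peer_finalized_slot: u64, slots_per_epoch: u64) -> u64 {
    peer_finalized_slot + 2 * slots_per_epoch + 1
}

fn main() {
    // Peer finalized at slot 6400 (epoch 200) => sync target is slot 6465.
    assert_eq!(finalized_sync_target(6400, 32), 6465);
}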


@ -503,9 +503,9 @@ impl<E: EthSpec, Hot: ItemStore<E>, Cold: ItemStore<E>> HotColdDB<E, Hot, Cold>
}
pub fn get_blobs(&self, block_root: &Hash256) -> Result<Option<BlobsSidecar<E>>, Error> {
if let Some(blobs) = self.blob_cache.lock().get(block_root) {
Ok(Some(blobs.clone()))
} else if let Some(bytes) = self
// FIXME(sean) I was attempting to use a blob cache here but was getting deadlocks,
// may want to attempt to use one again
if let Some(bytes) = self
.hot_db
.get_bytes(DBColumn::BeaconBlob.into(), block_root.as_bytes())?
{