2021-08-04 01:44:57 +00:00
|
|
|
use beacon_chain::{
|
|
|
|
attestation_verification::Error as AttnError,
|
|
|
|
sync_committee_verification::Error as SyncCommitteeError,
|
|
|
|
};
|
2020-11-28 05:30:57 +00:00
|
|
|
use fnv::FnvHashMap;
|
2020-05-17 11:16:48 +00:00
|
|
|
pub use lighthouse_metrics::*;
|
Rename eth2_libp2p to lighthouse_network (#2702)
## Description
The `eth2_libp2p` crate was originally named and designed to incorporate a simple libp2p integration into lighthouse. Since its origins the crate's purpose has expanded dramatically. It now houses a lot more sophistication that is specific to lighthouse and is no longer just a libp2p integration.
As of this writing it currently houses the following high-level lighthouse-specific logic:
- Lighthouse's implementation of the eth2 RPC protocol and specific encodings/decodings
- Integration and handling of ENRs with respect to libp2p and eth2
- Lighthouse's discovery logic, its integration with discv5 and logic about searching and handling peers.
- Lighthouse's peer manager - This is a large module handling various aspects of Lighthouse's network, such as peer scoring, handling pings and metadata, connection maintenance and recording, etc.
- Lighthouse's peer database - This is a collection of information stored for each individual peer which is specific to lighthouse. We store connection state, sync state, last seen ips and scores etc. The data stored for each peer is designed for various elements of the lighthouse code base such as syncing and the http api.
- Gossipsub scoring - This stores a collection of gossipsub 1.1 scoring mechanisms that are continuously analysed and updated based on the ethereum 2 networks and how Lighthouse performs on these networks.
- Lighthouse specific types for managing gossipsub topics, sync status and ENR fields
- Lighthouse's network HTTP API metrics - A collection of metrics for lighthouse network monitoring
- Lighthouse's custom configuration of all networking protocols, RPC, gossipsub, discovery, identify and libp2p.
Therefore it makes sense to rename the crate to be more akin to its current purposes, simply that it manages the majority of Lighthouse's network stack. This PR renames this crate to `lighthouse_network`
Co-authored-by: Paul Hauner <paul@paulhauner.com>
2021-10-19 00:30:39 +00:00
|
|
|
use lighthouse_network::{
|
2022-03-01 01:49:22 +00:00
|
|
|
peer_manager::peerdb::client::ClientKind, types::GossipKind, BandwidthSinks, GossipTopic,
|
|
|
|
Gossipsub, NetworkGlobals,
|
Rename eth2_libp2p to lighthouse_network (#2702)
## Description
The `eth2_libp2p` crate was originally named and designed to incorporate a simple libp2p integration into lighthouse. Since its origins the crate's purpose has expanded dramatically. It now houses a lot more sophistication that is specific to lighthouse and is no longer just a libp2p integration.
As of this writing it currently houses the following high-level lighthouse-specific logic:
- Lighthouse's implementation of the eth2 RPC protocol and specific encodings/decodings
- Integration and handling of ENRs with respect to libp2p and eth2
- Lighthouse's discovery logic, its integration with discv5 and logic about searching and handling peers.
- Lighthouse's peer manager - This is a large module handling various aspects of Lighthouse's network, such as peer scoring, handling pings and metadata, connection maintenance and recording, etc.
- Lighthouse's peer database - This is a collection of information stored for each individual peer which is specific to lighthouse. We store connection state, sync state, last seen ips and scores etc. The data stored for each peer is designed for various elements of the lighthouse code base such as syncing and the http api.
- Gossipsub scoring - This stores a collection of gossipsub 1.1 scoring mechanisms that are continuously analysed and updated based on the ethereum 2 networks and how Lighthouse performs on these networks.
- Lighthouse specific types for managing gossipsub topics, sync status and ENR fields
- Lighthouse's network HTTP API metrics - A collection of metrics for lighthouse network monitoring
- Lighthouse's custom configuration of all networking protocols, RPC, gossipsub, discovery, identify and libp2p.
Therefore it makes sense to rename the crate to be more akin to its current purposes, simply that it manages the majority of Lighthouse's network stack. This PR renames this crate to `lighthouse_network`
Co-authored-by: Paul Hauner <paul@paulhauner.com>
2021-10-19 00:30:39 +00:00
|
|
|
};
|
2021-12-22 06:17:14 +00:00
|
|
|
use std::sync::Arc;
|
2022-03-01 01:49:22 +00:00
|
|
|
use strum::IntoEnumIterator;
|
2021-12-22 06:17:14 +00:00
|
|
|
use types::EthSpec;
|
2020-05-17 11:16:48 +00:00
|
|
|
|
2020-09-01 06:59:14 +00:00
|
|
|
lazy_static! {
|
|
|
|
|
2021-12-22 06:17:14 +00:00
|
|
|
pub static ref BEACON_BLOCK_MESH_PEERS_PER_CLIENT: Result<IntGaugeVec> =
|
|
|
|
try_create_int_gauge_vec(
|
|
|
|
"block_mesh_peers_per_client",
|
|
|
|
"Number of mesh peers for BeaconBlock topic per client",
|
2020-11-12 01:48:28 +00:00
|
|
|
&["Client"]
|
|
|
|
);
|
|
|
|
|
|
|
|
pub static ref BEACON_AGGREGATE_AND_PROOF_MESH_PEERS_PER_CLIENT: Result<IntGaugeVec> =
|
|
|
|
try_create_int_gauge_vec(
|
|
|
|
"beacon_aggregate_and_proof_mesh_peers_per_client",
|
|
|
|
"Number of mesh peers for BeaconAggregateAndProof topic per client",
|
|
|
|
&["Client"]
|
|
|
|
);
|
2020-06-28 00:47:03 +00:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Attestation subnet subscriptions
|
|
|
|
*/
|
|
|
|
pub static ref SUBNET_SUBSCRIPTION_REQUESTS: Result<IntCounter> = try_create_int_counter(
|
2021-12-22 06:17:14 +00:00
|
|
|
"validator_attestation_subnet_subscriptions_total",
|
2021-08-04 01:44:57 +00:00
|
|
|
"Count of validator attestation subscription requests."
|
2020-06-28 00:47:03 +00:00
|
|
|
);
|
|
|
|
pub static ref SUBNET_SUBSCRIPTION_AGGREGATOR_REQUESTS: Result<IntCounter> = try_create_int_counter(
|
2021-12-22 06:17:14 +00:00
|
|
|
"validator_subnet_subscriptions_aggregator_total",
|
2020-06-28 00:47:03 +00:00
|
|
|
"Count of validator subscription requests where the subscriber is an aggregator."
|
|
|
|
);
|
2021-12-22 06:17:14 +00:00
|
|
|
pub static ref SYNC_COMMITTEE_SUBSCRIPTION_REQUESTS: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"validator_sync_committee_subnet_subscriptions_total",
|
2021-08-04 01:44:57 +00:00
|
|
|
"Count of validator sync committee subscription requests."
|
|
|
|
);
|
|
|
|
|
2020-08-14 04:38:45 +00:00
|
|
|
/*
|
|
|
|
* Gossip processor
|
|
|
|
*/
|
2020-08-17 09:20:27 +00:00
|
|
|
pub static ref BEACON_PROCESSOR_WORK_EVENTS_RX_COUNT: Result<IntCounterVec> = try_create_int_counter_vec(
|
|
|
|
"beacon_processor_work_events_rx_count",
|
|
|
|
"Count of work events received (but not necessarily processed)",
|
|
|
|
&["type"]
|
|
|
|
);
|
|
|
|
pub static ref BEACON_PROCESSOR_WORK_EVENTS_IGNORED_COUNT: Result<IntCounterVec> = try_create_int_counter_vec(
|
|
|
|
"beacon_processor_work_events_ignored_count",
|
|
|
|
"Count of work events purposefully ignored",
|
|
|
|
&["type"]
|
|
|
|
);
|
|
|
|
pub static ref BEACON_PROCESSOR_WORK_EVENTS_STARTED_COUNT: Result<IntCounterVec> = try_create_int_counter_vec(
|
|
|
|
"beacon_processor_work_events_started_count",
|
|
|
|
"Count of work events which have been started by a worker",
|
|
|
|
&["type"]
|
|
|
|
);
|
|
|
|
pub static ref BEACON_PROCESSOR_WORKER_TIME: Result<HistogramVec> = try_create_histogram_vec(
|
|
|
|
"beacon_processor_worker_time",
|
|
|
|
"Time taken for a worker to fully process some parcel of work.",
|
|
|
|
&["type"]
|
|
|
|
);
|
|
|
|
pub static ref BEACON_PROCESSOR_WORKERS_SPAWNED_TOTAL: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"beacon_processor_workers_spawned_total",
|
2020-08-14 04:38:45 +00:00
|
|
|
"The number of workers ever spawned by the gossip processing pool."
|
|
|
|
);
|
2020-08-17 09:20:27 +00:00
|
|
|
pub static ref BEACON_PROCESSOR_WORKERS_ACTIVE_TOTAL: Result<IntGauge> = try_create_int_gauge(
|
|
|
|
"beacon_processor_workers_active_total",
|
2020-08-14 04:38:45 +00:00
|
|
|
"Count of active workers in the gossip processing pool."
|
|
|
|
);
|
2020-08-17 09:20:27 +00:00
|
|
|
pub static ref BEACON_PROCESSOR_IDLE_EVENTS_TOTAL: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"beacon_processor_idle_events_total",
|
2020-08-14 04:38:45 +00:00
|
|
|
"Count of idle events processed by the gossip processor manager."
|
|
|
|
);
|
2020-08-17 09:20:27 +00:00
|
|
|
pub static ref BEACON_PROCESSOR_EVENT_HANDLING_SECONDS: Result<Histogram> = try_create_histogram(
|
|
|
|
"beacon_processor_event_handling_seconds",
|
2020-08-14 04:38:45 +00:00
|
|
|
"Time spent handling a new message and allocating it to a queue or worker."
|
|
|
|
);
|
2020-08-17 09:20:27 +00:00
|
|
|
// Gossip blocks.
|
|
|
|
pub static ref BEACON_PROCESSOR_GOSSIP_BLOCK_QUEUE_TOTAL: Result<IntGauge> = try_create_int_gauge(
|
|
|
|
"beacon_processor_gossip_block_queue_total",
|
|
|
|
"Count of blocks from gossip waiting to be verified."
|
2020-08-14 04:38:45 +00:00
|
|
|
);
|
2020-08-17 09:20:27 +00:00
|
|
|
pub static ref BEACON_PROCESSOR_GOSSIP_BLOCK_VERIFIED_TOTAL: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"beacon_processor_gossip_block_verified_total",
|
|
|
|
"Total number of gossip blocks verified for propagation."
|
|
|
|
);
|
|
|
|
pub static ref BEACON_PROCESSOR_GOSSIP_BLOCK_IMPORTED_TOTAL: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"beacon_processor_gossip_block_imported_total",
|
|
|
|
"Total number of gossip blocks imported to fork choice, etc."
|
|
|
|
);
|
Handle early blocks (#2155)
## Issue Addressed
NA
## Problem this PR addresses
There's an issue where Lighthouse is banning a lot of peers due to the following sequence of events:
1. Gossip block 0xabc arrives ~200ms early
- It is propagated across the network, with respect to [`MAXIMUM_GOSSIP_CLOCK_DISPARITY`](https://github.com/ethereum/eth2.0-specs/blob/v1.0.0/specs/phase0/p2p-interface.md#why-is-there-maximum_gossip_clock_disparity-when-validating-slot-ranges-of-messages-in-gossip-subnets).
- However, it is not imported to our database since the block is early.
2. Attestations for 0xabc arrive, but the block was not imported.
- The peer that sent the attestation is down-voted.
- Each unknown-block attestation causes a score loss of 1, the peer is banned at -100.
- When the peer is on an attestation subnet there can be hundreds of attestations, so the peer is banned quickly (before the missed block can be obtained via rpc).
## Potential solutions
I can think of three solutions to this:
1. Wait for attestation-queuing (#635) to arrive and solve this.
- Easy
- Not immediate fix.
- Whilst this would work, I don't think it's a perfect solution for this particular issue, rather (3) is better.
1. Allow importing blocks with a tolerance of `MAXIMUM_GOSSIP_CLOCK_DISPARITY`.
- Easy
- ~~I have implemented this, for now.~~
1. If a block is verified for gossip propagation (i.e., signature verified) and it's within `MAXIMUM_GOSSIP_CLOCK_DISPARITY`, then queue it to be processed at the start of the appropriate slot.
- More difficult
- Feels like the best solution, I will try to implement this.
**This PR takes approach (3).**
## Changes included
- Implement the `block_delay_queue`, based upon a [`DelayQueue`](https://docs.rs/tokio-util/0.6.3/tokio_util/time/delay_queue/struct.DelayQueue.html) which can store blocks until it's time to import them.
- Add a new `DelayedImportBlock` variant to the `beacon_processor::WorkEvent` enum to handle this new event.
- In the `BeaconProcessor`, refactor a `tokio::select!` to a struct with an explicit `Stream` implementation. I experienced some issues with `tokio::select!` in the block delay queue and I also found it hard to debug. I think this explicit implementation is nicer and functionally equivalent (apart from the fact that `tokio::select!` randomly chooses futures to poll, whereas now we're deterministic).
- Add a testing framework to the `beacon_processor` module that tests this new block delay logic. I also tested a handful of other operations in the beacon processor (attns, slashings, exits) since it was super easy to copy-pasta the code from the `http_api` tester.
- To implement these tests I added the concept of an optional `work_journal_tx` to the `BeaconProcessor` which will spit out a log of events. I used this in the tests to ensure that things were happening as I expect.
- The tests are a little racey, but it's hard to avoid that when testing timing-based code. If we see CI failures I can revise. I haven't observed *any* failures due to races on my machine or on CI yet.
- To assist with testing I allowed for directly setting the time on the `ManualSlotClock`.
- I gave the `beacon_processor::Worker` a `Toolbox` for two reasons; (a) it avoids changing tons of function sigs when you want to pass a new object to the worker and (b) it seemed cute.
2021-02-24 03:08:52 +00:00
|
|
|
pub static ref BEACON_PROCESSOR_GOSSIP_BLOCK_REQUEUED_TOTAL: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"beacon_processor_gossip_block_requeued_total",
|
|
|
|
"Total number of gossip blocks that arrived early and were re-queued for later processing."
|
|
|
|
);
|
|
|
|
pub static ref BEACON_PROCESSOR_GOSSIP_BLOCK_EARLY_SECONDS: Result<Histogram> = try_create_histogram(
|
|
|
|
"beacon_processor_gossip_block_early_seconds",
|
|
|
|
"Whenever a gossip block is received early this metrics is set to how early that block was."
|
|
|
|
);
|
2020-08-19 05:09:53 +00:00
|
|
|
// Gossip Exits.
|
|
|
|
pub static ref BEACON_PROCESSOR_EXIT_QUEUE_TOTAL: Result<IntGauge> = try_create_int_gauge(
|
|
|
|
"beacon_processor_exit_queue_total",
|
|
|
|
"Count of exits from gossip waiting to be verified."
|
|
|
|
);
|
|
|
|
pub static ref BEACON_PROCESSOR_EXIT_VERIFIED_TOTAL: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"beacon_processor_exit_verified_total",
|
|
|
|
"Total number of voluntary exits verified for propagation."
|
|
|
|
);
|
|
|
|
pub static ref BEACON_PROCESSOR_EXIT_IMPORTED_TOTAL: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"beacon_processor_exit_imported_total",
|
|
|
|
"Total number of voluntary exits imported to the op pool."
|
|
|
|
);
|
|
|
|
// Gossip proposer slashings.
|
|
|
|
pub static ref BEACON_PROCESSOR_PROPOSER_SLASHING_QUEUE_TOTAL: Result<IntGauge> = try_create_int_gauge(
|
|
|
|
"beacon_processor_proposer_slashing_queue_total",
|
|
|
|
"Count of proposer slashings from gossip waiting to be verified."
|
|
|
|
);
|
|
|
|
pub static ref BEACON_PROCESSOR_PROPOSER_SLASHING_VERIFIED_TOTAL: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"beacon_processor_proposer_slashing_verified_total",
|
|
|
|
"Total number of proposer slashings verified for propagation."
|
|
|
|
);
|
|
|
|
pub static ref BEACON_PROCESSOR_PROPOSER_SLASHING_IMPORTED_TOTAL: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"beacon_processor_proposer_slashing_imported_total",
|
|
|
|
"Total number of proposer slashings imported to the op pool."
|
|
|
|
);
|
|
|
|
// Gossip attester slashings.
|
|
|
|
pub static ref BEACON_PROCESSOR_ATTESTER_SLASHING_QUEUE_TOTAL: Result<IntGauge> = try_create_int_gauge(
|
|
|
|
"beacon_processor_attester_slashing_queue_total",
|
|
|
|
"Count of attester slashings from gossip waiting to be verified."
|
|
|
|
);
|
|
|
|
pub static ref BEACON_PROCESSOR_ATTESTER_SLASHING_VERIFIED_TOTAL: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"beacon_processor_attester_slashing_verified_total",
|
|
|
|
"Total number of attester slashings verified for propagation."
|
|
|
|
);
|
|
|
|
pub static ref BEACON_PROCESSOR_ATTESTER_SLASHING_IMPORTED_TOTAL: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"beacon_processor_attester_slashing_imported_total",
|
|
|
|
"Total number of attester slashings imported to the op pool."
|
|
|
|
);
|
2020-08-17 09:20:27 +00:00
|
|
|
// Rpc blocks.
|
|
|
|
pub static ref BEACON_PROCESSOR_RPC_BLOCK_QUEUE_TOTAL: Result<IntGauge> = try_create_int_gauge(
|
|
|
|
"beacon_processor_rpc_block_queue_total",
|
|
|
|
"Count of blocks from the rpc waiting to be verified."
|
|
|
|
);
|
|
|
|
pub static ref BEACON_PROCESSOR_RPC_BLOCK_IMPORTED_TOTAL: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"beacon_processor_rpc_block_imported_total",
|
|
|
|
"Total number of gossip blocks imported to fork choice, etc."
|
2020-08-14 04:38:45 +00:00
|
|
|
);
|
2020-08-17 09:20:27 +00:00
|
|
|
// Chain segments.
|
|
|
|
pub static ref BEACON_PROCESSOR_CHAIN_SEGMENT_QUEUE_TOTAL: Result<IntGauge> = try_create_int_gauge(
|
|
|
|
"beacon_processor_chain_segment_queue_total",
|
|
|
|
"Count of chain segments from the rpc waiting to be verified."
|
2020-08-14 04:38:45 +00:00
|
|
|
);
|
2022-05-26 02:05:17 +00:00
|
|
|
pub static ref BEACON_PROCESSOR_BACKFILL_CHAIN_SEGMENT_QUEUE_TOTAL: Result<IntGauge> = try_create_int_gauge(
|
|
|
|
"beacon_processor_backfill_chain_segment_queue_total",
|
|
|
|
"Count of backfill chain segments from the rpc waiting to be verified."
|
|
|
|
);
|
2020-08-17 09:20:27 +00:00
|
|
|
pub static ref BEACON_PROCESSOR_CHAIN_SEGMENT_SUCCESS_TOTAL: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"beacon_processor_chain_segment_success_total",
|
|
|
|
"Total number of chain segments successfully processed."
|
|
|
|
);
|
2021-09-22 00:37:28 +00:00
|
|
|
pub static ref BEACON_PROCESSOR_BACKFILL_CHAIN_SEGMENT_SUCCESS_TOTAL: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"beacon_processor_backfill_chain_segment_success_total",
|
|
|
|
"Total number of chain segments successfully processed."
|
|
|
|
);
|
2020-08-17 09:20:27 +00:00
|
|
|
pub static ref BEACON_PROCESSOR_CHAIN_SEGMENT_FAILED_TOTAL: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"beacon_processor_chain_segment_failed_total",
|
|
|
|
"Total number of chain segments that failed processing."
|
|
|
|
);
|
2021-09-22 00:37:28 +00:00
|
|
|
pub static ref BEACON_PROCESSOR_BACKFILL_CHAIN_SEGMENT_FAILED_TOTAL: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"beacon_processor_backfill_chain_segment_failed_total",
|
|
|
|
"Total number of backfill chain segments that failed processing."
|
|
|
|
);
|
2020-08-17 09:20:27 +00:00
|
|
|
// Unaggregated attestations.
|
|
|
|
pub static ref BEACON_PROCESSOR_UNAGGREGATED_ATTESTATION_QUEUE_TOTAL: Result<IntGauge> = try_create_int_gauge(
|
|
|
|
"beacon_processor_unaggregated_attestation_queue_total",
|
|
|
|
"Count of unagg. attestations waiting to be processed."
|
|
|
|
);
|
|
|
|
pub static ref BEACON_PROCESSOR_UNAGGREGATED_ATTESTATION_VERIFIED_TOTAL: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"beacon_processor_unaggregated_attestation_verified_total",
|
2020-08-14 04:38:45 +00:00
|
|
|
"Total number of unaggregated attestations verified for gossip."
|
|
|
|
);
|
2020-08-17 09:20:27 +00:00
|
|
|
pub static ref BEACON_PROCESSOR_UNAGGREGATED_ATTESTATION_IMPORTED_TOTAL: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"beacon_processor_unaggregated_attestation_imported_total",
|
2020-08-14 04:38:45 +00:00
|
|
|
"Total number of unaggregated attestations imported to fork choice, etc."
|
|
|
|
);
|
2021-07-14 05:24:08 +00:00
|
|
|
pub static ref BEACON_PROCESSOR_UNAGGREGATED_ATTESTATION_REQUEUED_TOTAL: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"beacon_processor_unaggregated_attestation_requeued_total",
|
|
|
|
"Total number of unaggregated attestations that referenced an unknown block and were re-queued."
|
|
|
|
);
|
2020-08-17 09:20:27 +00:00
|
|
|
// Aggregated attestations.
|
|
|
|
pub static ref BEACON_PROCESSOR_AGGREGATED_ATTESTATION_QUEUE_TOTAL: Result<IntGauge> = try_create_int_gauge(
|
|
|
|
"beacon_processor_aggregated_attestation_queue_total",
|
2020-08-14 04:38:45 +00:00
|
|
|
"Count of agg. attestations waiting to be processed."
|
|
|
|
);
|
2020-08-17 09:20:27 +00:00
|
|
|
pub static ref BEACON_PROCESSOR_AGGREGATED_ATTESTATION_VERIFIED_TOTAL: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"beacon_processor_aggregated_attestation_verified_total",
|
2020-08-14 04:38:45 +00:00
|
|
|
"Total number of aggregated attestations verified for gossip."
|
|
|
|
);
|
2020-08-17 09:20:27 +00:00
|
|
|
pub static ref BEACON_PROCESSOR_AGGREGATED_ATTESTATION_IMPORTED_TOTAL: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"beacon_processor_aggregated_attestation_imported_total",
|
2020-08-14 04:38:45 +00:00
|
|
|
"Total number of aggregated attestations imported to fork choice, etc."
|
|
|
|
);
|
2021-07-14 05:24:08 +00:00
|
|
|
pub static ref BEACON_PROCESSOR_AGGREGATED_ATTESTATION_REQUEUED_TOTAL: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"beacon_processor_aggregated_attestation_requeued_total",
|
|
|
|
"Total number of aggregated attestations that referenced an unknown block and were re-queued."
|
|
|
|
);
|
2021-08-04 01:44:57 +00:00
|
|
|
// Sync committee messages.
|
|
|
|
pub static ref BEACON_PROCESSOR_SYNC_MESSAGE_QUEUE_TOTAL: Result<IntGauge> = try_create_int_gauge(
|
|
|
|
"beacon_processor_sync_message_queue_total",
|
|
|
|
"Count of sync committee messages waiting to be processed."
|
|
|
|
);
|
|
|
|
pub static ref BEACON_PROCESSOR_SYNC_MESSAGE_VERIFIED_TOTAL: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"beacon_processor_sync_message_verified_total",
|
|
|
|
"Total number of sync committee messages verified for gossip."
|
|
|
|
);
|
|
|
|
pub static ref BEACON_PROCESSOR_SYNC_MESSAGE_IMPORTED_TOTAL: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"beacon_processor_sync_message_imported_total",
|
|
|
|
"Total number of sync committee messages imported to fork choice, etc."
|
|
|
|
);
|
|
|
|
// Sync contribution.
|
|
|
|
pub static ref BEACON_PROCESSOR_SYNC_CONTRIBUTION_QUEUE_TOTAL: Result<IntGauge> = try_create_int_gauge(
|
|
|
|
"beacon_processor_sync_contribution_queue_total",
|
|
|
|
"Count of sync committee contributions waiting to be processed."
|
|
|
|
);
|
|
|
|
pub static ref BEACON_PROCESSOR_SYNC_CONTRIBUTION_VERIFIED_TOTAL: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"beacon_processor_sync_contribution_verified_total",
|
|
|
|
"Total number of sync committee contributions verified for gossip."
|
|
|
|
);
|
2021-12-22 06:17:14 +00:00
|
|
|
|
2021-08-04 01:44:57 +00:00
|
|
|
pub static ref BEACON_PROCESSOR_SYNC_CONTRIBUTION_IMPORTED_TOTAL: Result<IntCounter> = try_create_int_counter(
|
|
|
|
"beacon_processor_sync_contribution_imported_total",
|
|
|
|
"Total number of sync committee contributions imported to fork choice, etc."
|
|
|
|
);
|
|
|
|
|
2021-12-22 06:17:14 +00:00
|
|
|
/// Errors and Debugging Stats
|
2021-01-19 06:33:58 +00:00
|
|
|
pub static ref GOSSIP_ATTESTATION_ERRORS_PER_TYPE: Result<IntCounterVec> =
|
|
|
|
try_create_int_counter_vec(
|
|
|
|
"gossipsub_attestation_errors_per_type",
|
|
|
|
"Gossipsub attestation errors per error type",
|
|
|
|
&["type"]
|
|
|
|
);
|
2021-08-04 01:44:57 +00:00
|
|
|
pub static ref GOSSIP_SYNC_COMMITTEE_ERRORS_PER_TYPE: Result<IntCounterVec> =
|
|
|
|
try_create_int_counter_vec(
|
|
|
|
"gossipsub_sync_committee_errors_per_type",
|
|
|
|
"Gossipsub sync_committee errors per error type",
|
|
|
|
&["type"]
|
|
|
|
);
|
2022-08-30 05:47:31 +00:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Network queue metrics
|
|
|
|
*/
|
|
|
|
pub static ref NETWORK_RECEIVE_EVENTS: Result<IntCounterVec> = try_create_int_counter_vec(
|
|
|
|
"network_receive_events",
|
|
|
|
"Count of events received by the channel to the network service",
|
|
|
|
&["type"]
|
|
|
|
);
|
|
|
|
pub static ref NETWORK_RECEIVE_TIMES: Result<HistogramVec> = try_create_histogram_vec(
|
|
|
|
"network_receive_times",
|
|
|
|
"Time taken for network to handle an event sent to the network service.",
|
|
|
|
&["type"]
|
|
|
|
);
|
2021-12-22 06:17:14 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// Metrics for libp2p bandwidth, sync state, gossip block delays and the attestation reprocessing
// queue. Every static holds the `Result` of registering the metric.
lazy_static! {

    /*
     * Bandwidth metrics
     */
    pub static ref INBOUND_LIBP2P_BYTES: Result<IntGauge> =
        try_create_int_gauge("libp2p_inbound_bytes", "The inbound bandwidth over libp2p");

    pub static ref OUTBOUND_LIBP2P_BYTES: Result<IntGauge> = try_create_int_gauge(
        "libp2p_outbound_bytes",
        "The outbound bandwidth over libp2p"
    );
    pub static ref TOTAL_LIBP2P_BANDWIDTH: Result<IntGauge> = try_create_int_gauge(
        "libp2p_total_bandwidth",
        "The total inbound/outbound bandwidth over libp2p"
    );

    /*
     * Sync related metrics
     */
    pub static ref PEERS_PER_SYNC_TYPE: Result<IntGaugeVec> = try_create_int_gauge_vec(
        "sync_peers_per_status",
        "Number of connected peers per sync status type",
        &["sync_status"]
    );
    pub static ref SYNCING_CHAINS_COUNT: Result<IntGaugeVec> = try_create_int_gauge_vec(
        "sync_range_chains",
        "Number of Syncing chains in range, per range type",
        &["range_type"]
    );
    pub static ref SYNC_SINGLE_BLOCK_LOOKUPS: Result<IntGauge> = try_create_int_gauge(
        "sync_single_block_lookups",
        "Number of single block lookups underway"
    );
    pub static ref SYNC_PARENT_BLOCK_LOOKUPS: Result<IntGauge> = try_create_int_gauge(
        "sync_parent_block_lookups",
        "Number of parent block lookups underway"
    );

    /*
     * Block Delay Metrics
     */
    pub static ref BEACON_BLOCK_GOSSIP_PROPAGATION_VERIFICATION_DELAY_TIME: Result<Histogram> = try_create_histogram(
        "beacon_block_gossip_propagation_verification_delay_time",
        "Duration between when the block is received and when it is verified for propagation.",
    );
    pub static ref BEACON_BLOCK_GOSSIP_SLOT_START_DELAY_TIME: Result<Histogram> = try_create_histogram(
        "beacon_block_gossip_slot_start_delay_time",
        "Duration between when the block is received and the start of the slot it belongs to.",
    );
    pub static ref BEACON_BLOCK_GOSSIP_ARRIVED_LATE_TOTAL: Result<IntCounter> = try_create_int_counter(
        "beacon_block_gossip_arrived_late_total",
        "Count of times when a gossip block arrived from the network later than the attestation deadline.",
    );

    /*
     * Attestation reprocessing queue metrics.
     */
    pub static ref BEACON_PROCESSOR_REPROCESSING_QUEUE_TOTAL: Result<IntGaugeVec> =
        try_create_int_gauge_vec(
            "beacon_processor_reprocessing_queue_total",
            "Count of items in a reprocessing queue.",
            &["type"]
        );
    pub static ref BEACON_PROCESSOR_REPROCESSING_QUEUE_EXPIRED_ATTESTATIONS: Result<IntCounter> = try_create_int_counter(
        "beacon_processor_reprocessing_queue_expired_attestations",
        "Number of queued attestations which have expired before a matching block has been found."
    );
    // Help text corrected from "where as matching block".
    pub static ref BEACON_PROCESSOR_REPROCESSING_QUEUE_MATCHED_ATTESTATIONS: Result<IntCounter> = try_create_int_counter(
        "beacon_processor_reprocessing_queue_matched_attestations",
        "Number of queued attestations where a matching block has been imported."
    );

}
|
|
|
|
|
|
|
|
pub fn update_bandwidth_metrics(bandwidth: Arc<BandwidthSinks>) {
|
|
|
|
set_gauge(&INBOUND_LIBP2P_BYTES, bandwidth.total_inbound() as i64);
|
|
|
|
set_gauge(&OUTBOUND_LIBP2P_BYTES, bandwidth.total_outbound() as i64);
|
|
|
|
set_gauge(
|
|
|
|
&TOTAL_LIBP2P_BANDWIDTH,
|
|
|
|
(bandwidth.total_inbound() + bandwidth.total_outbound()) as i64,
|
2021-07-14 05:24:08 +00:00
|
|
|
);
|
2020-11-26 05:23:17 +00:00
|
|
|
}
|
|
|
|
|
2020-08-14 04:38:45 +00:00
|
|
|
pub fn register_attestation_error(error: &AttnError) {
|
2021-01-19 06:33:58 +00:00
|
|
|
inc_counter_vec(&GOSSIP_ATTESTATION_ERRORS_PER_TYPE, &[error.as_ref()]);
|
2020-05-17 11:16:48 +00:00
|
|
|
}
|
2020-11-28 05:30:57 +00:00
|
|
|
|
2021-08-04 01:44:57 +00:00
|
|
|
/// Increments the gossip sync committee error counter, using the string form of `error` as the
/// `type` label.
pub fn register_sync_committee_error(error: &SyncCommitteeError) {
    let error_type: &str = error.as_ref();
    inc_counter_vec(&GOSSIP_SYNC_COMMITTEE_ERRORS_PER_TYPE, &[error_type]);
}
|
|
|
|
|
2020-11-28 05:30:57 +00:00
|
|
|
pub fn update_gossip_metrics<T: EthSpec>(
|
|
|
|
gossipsub: &Gossipsub,
|
|
|
|
network_globals: &Arc<NetworkGlobals<T>>,
|
|
|
|
) {
|
2021-12-22 06:17:14 +00:00
|
|
|
// Mesh peers per client
|
2022-03-01 01:49:22 +00:00
|
|
|
// Reset the gauges
|
|
|
|
for client_kind in ClientKind::iter() {
|
|
|
|
set_gauge_vec(
|
|
|
|
&BEACON_BLOCK_MESH_PEERS_PER_CLIENT,
|
2022-04-01 00:58:59 +00:00
|
|
|
&[client_kind.as_ref()],
|
2022-03-01 01:49:22 +00:00
|
|
|
0_i64,
|
|
|
|
);
|
|
|
|
set_gauge_vec(
|
|
|
|
&BEACON_AGGREGATE_AND_PROOF_MESH_PEERS_PER_CLIENT,
|
2022-04-01 00:58:59 +00:00
|
|
|
&[client_kind.as_ref()],
|
2022-03-01 01:49:22 +00:00
|
|
|
0_i64,
|
|
|
|
);
|
|
|
|
}
|
|
|
|
|
2020-11-28 05:30:57 +00:00
|
|
|
for topic_hash in gossipsub.topics() {
|
|
|
|
if let Ok(topic) = GossipTopic::decode(topic_hash.as_str()) {
|
2021-12-22 06:17:14 +00:00
|
|
|
match topic.kind() {
|
|
|
|
GossipKind::Attestation(_subnet_id) => {}
|
|
|
|
GossipKind::BeaconBlock => {
|
|
|
|
for peer_id in gossipsub.mesh_peers(topic_hash) {
|
|
|
|
let client = network_globals
|
|
|
|
.peers
|
|
|
|
.read()
|
|
|
|
.peer_info(peer_id)
|
2022-04-01 00:58:59 +00:00
|
|
|
.map(|peer_info| peer_info.client().kind.into())
|
2021-12-22 06:17:14 +00:00
|
|
|
.unwrap_or_else(|| "Unknown");
|
|
|
|
if let Some(v) =
|
|
|
|
get_int_gauge(&BEACON_BLOCK_MESH_PEERS_PER_CLIENT, &[client])
|
|
|
|
{
|
2020-11-28 05:30:57 +00:00
|
|
|
v.inc()
|
|
|
|
};
|
|
|
|
}
|
2021-12-22 06:17:14 +00:00
|
|
|
}
|
|
|
|
GossipKind::BeaconAggregateAndProof => {
|
|
|
|
for peer_id in gossipsub.mesh_peers(topic_hash) {
|
|
|
|
let client = network_globals
|
|
|
|
.peers
|
|
|
|
.read()
|
|
|
|
.peer_info(peer_id)
|
2022-04-01 00:58:59 +00:00
|
|
|
.map(|peer_info| peer_info.client().kind.into())
|
2021-12-22 06:17:14 +00:00
|
|
|
.unwrap_or_else(|| "Unknown");
|
2021-08-04 01:44:57 +00:00
|
|
|
if let Some(v) = get_int_gauge(
|
2021-12-22 06:17:14 +00:00
|
|
|
&BEACON_AGGREGATE_AND_PROOF_MESH_PEERS_PER_CLIENT,
|
|
|
|
&[client],
|
2021-08-04 01:44:57 +00:00
|
|
|
) {
|
|
|
|
v.inc()
|
|
|
|
};
|
2020-11-28 05:30:57 +00:00
|
|
|
}
|
|
|
|
}
|
2021-12-22 06:17:14 +00:00
|
|
|
GossipKind::SyncCommitteeMessage(_subnet_id) => {}
|
|
|
|
_kind => {}
|
2020-11-28 05:30:57 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn update_sync_metrics<T: EthSpec>(network_globals: &Arc<NetworkGlobals<T>>) {
|
|
|
|
// reset the counts
|
|
|
|
if PEERS_PER_SYNC_TYPE
|
|
|
|
.as_ref()
|
|
|
|
.map(|metric| metric.reset())
|
|
|
|
.is_err()
|
|
|
|
{
|
|
|
|
return;
|
|
|
|
};
|
|
|
|
|
|
|
|
// count per sync status, the number of connected peers
|
|
|
|
let mut peers_per_sync_type = FnvHashMap::default();
|
|
|
|
for sync_type in network_globals
|
2021-11-25 03:45:52 +00:00
|
|
|
.peers
|
|
|
|
.read()
|
2020-11-28 05:30:57 +00:00
|
|
|
.connected_peers()
|
2021-10-11 02:45:06 +00:00
|
|
|
.map(|(_peer_id, info)| info.sync_status().as_str())
|
2020-11-28 05:30:57 +00:00
|
|
|
{
|
|
|
|
*peers_per_sync_type.entry(sync_type).or_default() += 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
for (sync_type, peer_count) in peers_per_sync_type {
|
|
|
|
set_gauge_entry(&PEERS_PER_SYNC_TYPE, &[sync_type], peer_count);
|
|
|
|
}
|
|
|
|
}
|