Use external head for subgraph alerts and show blockProcessingOffset on watcher dashboard #861

Open
prathamesh wants to merge 4 commits from deep-stack/stack-orchestrator:pm-update-monitoring into main
5 changed files with 179 additions and 79 deletions

View File

@ -1,5 +1,6 @@
services: services:
graph-node: graph-node:
restart: unless-stopped
image: cerc/graph-node:local image: cerc/graph-node:local
depends_on: depends_on:
db: db:
@ -40,6 +41,7 @@ services:
retries: 10 retries: 10
start_period: 3s start_period: 3s
ipfs: ipfs:
restart: unless-stopped
image: ipfs/kubo:master-2023-02-20-714a968 image: ipfs/kubo:master-2023-02-20-714a968
volumes: volumes:
- ipfs-import:/import - ipfs-import:/import
@ -49,6 +51,7 @@ services:
- "4001" - "4001"
- "5001" - "5001"
db: db:
restart: unless-stopped
image: postgres:14-alpine image: postgres:14-alpine
volumes: volumes:
- db-data:/var/lib/postgresql/data - db-data:/var/lib/postgresql/data

View File

@ -2866,6 +2866,19 @@
"legendFormat": "{{field}}", "legendFormat": "{{field}}",
"range": true, "range": true,
"refId": "E" "refId": "E"
},
{
"datasource": {
"type": "prometheus",
"uid": "PBFA97CFB590B2093"
},
"editorMode": "code",
"expr": "watcher_config_info{job=~\"$job\", instance=~\"$watcher\", category=\"jobqueue\", field=\"block_processing_offset\"}",
"hide": false,
"instant": false,
"legendFormat": "{{field}}",
"range": true,
"refId": "F"
} }
], ],
"title": "Watcher config (job queue)", "title": "Watcher config (job queue)",
@ -3284,6 +3297,6 @@
"timepicker": {}, "timepicker": {},
"timezone": "", "timezone": "",
"title": "Watchers", "title": "Watchers",
"version": 5, "version": 6,
"weekStart": "" "weekStart": ""
} }

View File

@ -49,6 +49,10 @@ scrape_configs:
labels: labels:
instance: 'external' instance: 'external'
chain: 'ethereum' chain: 'ethereum'
- targets: ['sepolia-chain-head-exporter:5000']
labels:
instance: 'external'
chain: 'sepolia'
- targets: ['filecoin-chain-head-exporter:5000'] - targets: ['filecoin-chain-head-exporter:5000']
labels: labels:
instance: 'external' instance: 'external'

View File

@ -19,7 +19,7 @@ groups:
type: prometheus type: prometheus
uid: PBFA97CFB590B2093 uid: PBFA97CFB590B2093
editorMode: code editorMode: code
expr: ethereum_chain_head_number - on(network) group_right deployment_head{deployment=~"REPLACE_WITH_SUBGRAPH_IDS"} expr: label_replace(latest_block_number{instance="external"}, "network", "$1", "chain", "(.*)") - on(network) group_right deployment_head{deployment=~"REPLACE_WITH_SUBGRAPH_IDS"}
instant: true instant: true
intervalMs: 1000 intervalMs: 1000
legendFormat: __auto legendFormat: __auto

View File

@ -695,82 +695,6 @@ groups:
annotations: annotations:
summary: Watcher {{ index $labels "instance" }} of group {{ index $labels "job" }} is falling behind external head by {{ index $values "diff" }} summary: Watcher {{ index $labels "instance" }} of group {{ index $labels "job" }} is falling behind external head by {{ index $values "diff" }}
isPaused: false isPaused: false
- uid: merkl_sushiswap_diff_external
title: merkl_sushiswap_watcher_head_tracking
condition: condition
data:
- refId: diff
relativeTimeRange:
from: 600
to: 0
datasourceUid: PBFA97CFB590B2093
model:
datasource:
type: prometheus
uid: PBFA97CFB590B2093
disableTextWrap: false
editorMode: code
expr: latest_block_number{instance="external"} - on(chain) group_right sync_status_block_number{job="sushi", instance="merkl_sushiswap", kind="latest_indexed"}
fullMetaSearch: false
includeNullMetadata: true
instant: true
intervalMs: 1000
legendFormat: __auto
maxDataPoints: 43200
range: false
refId: diff
useBackend: false
- refId: latest_external
relativeTimeRange:
from: 600
to: 0
datasourceUid: PBFA97CFB590B2093
model:
datasource:
type: prometheus
uid: PBFA97CFB590B2093
editorMode: code
expr: latest_block_number{chain="filecoin"}
hide: false
instant: true
legendFormat: __auto
range: false
refId: latest_external
- refId: condition
relativeTimeRange:
from: 600
to: 0
datasourceUid: __expr__
model:
conditions:
- evaluator:
params:
- 0
- 0
type: gt
operator:
type: and
query:
params: []
reducer:
params: []
type: avg
type: query
datasource:
name: Expression
type: __expr__
uid: __expr__
expression: ${diff} >= 16
intervalMs: 1000
maxDataPoints: 43200
refId: condition
type: math
noDataState: Alerting
execErrState: Alerting
for: 15m
annotations:
summary: Watcher {{ index $labels "instance" }} of group {{ index $labels "job" }} is falling behind external head by {{ index $values "diff" }}
isPaused: false
# Ajna # Ajna
- uid: ajna_diff_external - uid: ajna_diff_external
@ -927,3 +851,159 @@ groups:
annotations: annotations:
summary: Watcher {{ index $labels "instance" }} of group {{ index $labels "job" }} is falling behind external head by {{ index $values "diff" }} summary: Watcher {{ index $labels "instance" }} of group {{ index $labels "job" }} is falling behind external head by {{ index $values "diff" }}
isPaused: false isPaused: false
# Borg
- uid: borg_diff_external
title: borg_watcher_head_tracking
condition: condition
data:
- refId: diff
relativeTimeRange:
from: 600
to: 0
datasourceUid: PBFA97CFB590B2093
model:
datasource:
type: prometheus
uid: PBFA97CFB590B2093
disableTextWrap: false
editorMode: code
expr: latest_block_number{instance="external"} - on(chain) group_right sync_status_block_number{job="borg", instance="borg", kind="latest_indexed"}
fullMetaSearch: false
includeNullMetadata: true
instant: true
intervalMs: 1000
legendFormat: __auto
maxDataPoints: 43200
range: false
refId: diff
useBackend: false
- refId: latest_external
relativeTimeRange:
from: 600
to: 0
datasourceUid: PBFA97CFB590B2093
model:
datasource:
type: prometheus
uid: PBFA97CFB590B2093
editorMode: code
expr: latest_block_number{chain="sepolia"}
hide: false
instant: true
legendFormat: __auto
range: false
refId: latest_external
- refId: condition
relativeTimeRange:
from: 600
to: 0
datasourceUid: __expr__
model:
conditions:
- evaluator:
params:
- 0
- 0
type: gt
operator:
type: and
query:
params: []
reducer:
params: []
type: avg
type: query
datasource:
name: Expression
type: __expr__
uid: __expr__
expression: ${diff} >= 16
intervalMs: 1000
maxDataPoints: 43200
refId: condition
type: math
noDataState: Alerting
execErrState: Alerting
for: 15m
annotations:
summary: Watcher {{ index $labels "instance" }} of group {{ index $labels "job" }} is falling behind external head by {{ index $values "diff" }}
isPaused: false
# Steer Protocol
- uid: steer_protocol_diff_external
title: steer_protocol_watcher_head_tracking
condition: condition
data:
- refId: diff
relativeTimeRange:
from: 600
to: 0
datasourceUid: PBFA97CFB590B2093
model:
datasource:
type: prometheus
uid: PBFA97CFB590B2093
disableTextWrap: false
editorMode: code
expr: latest_block_number{instance="external"} - on(chain) group_right sync_status_block_number{job="steer-protocol", instance="steer-protocol", kind="latest_indexed"}
fullMetaSearch: false
includeNullMetadata: true
instant: true
intervalMs: 1000
legendFormat: __auto
maxDataPoints: 43200
range: false
refId: diff
useBackend: false
- refId: latest_external
relativeTimeRange:
from: 600
to: 0
datasourceUid: PBFA97CFB590B2093
model:
datasource:
type: prometheus
uid: PBFA97CFB590B2093
editorMode: code
expr: latest_block_number{chain="filecoin"}
hide: false
instant: true
legendFormat: __auto
range: false
refId: latest_external
- refId: condition
relativeTimeRange:
from: 600
to: 0
datasourceUid: __expr__
model:
conditions:
- evaluator:
params:
- 0
- 0
type: gt
operator:
type: and
query:
params: []
reducer:
params: []
type: avg
type: query
datasource:
name: Expression
type: __expr__
uid: __expr__
expression: ${diff} >= 16
intervalMs: 1000
maxDataPoints: 43200
refId: condition
type: math
noDataState: Alerting
execErrState: Alerting
for: 15m
annotations:
summary: Watcher {{ index $labels "instance" }} of group {{ index $labels "job" }} is falling behind external head by {{ index $values "diff" }}
isPaused: false