amb-monitor/prometheus/rules.yml

90 lines
3.3 KiB
YAML

groups:
- name: StuckMessage
rules:
- alert: StuckMessage
expr: max_over_time(alert_monitor_stuck_message_confirmation[5m]) > 3600
annotations:
age: '{{ humanizeDuration $value }}'
- name: UnknownMessageConfirmation
rules:
- alert: UnknownMessageConfirmation
expr: max_over_time(alert_monitor_unknown_message_confirmation[5m]) > 0
annotations:
age: '{{ humanizeDuration $value }}'
- name: UnknownMessageExecution
rules:
- alert: UnknownMessageExecution
expr: max_over_time(alert_monitor_unknown_message_execution[5m]) > 0
annotations:
age: '{{ humanizeDuration $value }}'
- name: FailedMessageExecution
rules:
- alert: FailedMessageExecution
expr: max_over_time(alert_monitor_failed_message_execution[5m]) > 0
annotations:
age: '{{ humanizeDuration $value }}'
- name: StuckInformationRequest
rules:
- alert: StuckInformationRequest
expr: max_over_time(alert_monitor_stuck_information_request[5m]) > 3600
annotations:
age: '{{ humanizeDuration $value }}'
- name: UnknownInformationSignature
rules:
- alert: UnknownInformationSignature
expr: max_over_time(alert_monitor_unknown_information_signature[5m]) > 0
annotations:
age: '{{ humanizeDuration $value }}'
- name: UnknownInformationExecution
rules:
- alert: UnknownInformationExecution
expr: max_over_time(alert_monitor_unknown_information_execution[5m]) > 0
annotations:
age: '{{ humanizeDuration $value }}'
- name: FailedInformationRequest
rules:
- alert: FailedInformationRequest
expr: max_over_time(alert_monitor_failed_information_request[5m]) > 0
annotations:
age: '{{ humanizeDuration $value }}'
- name: DifferentInformationSignatures
rules:
- alert: DifferentInformationSignatures
expr: max_over_time(alert_monitor_different_information_signatures[5m]) > 0
annotations:
age: '{{ humanizeDuration $value }}'
- name: StuckErcToNativeMessage
rules:
- alert: StuckErcToNativeMessage
expr: max_over_time(alert_monitor_stuck_erc_to_native_message_confirmation[5m]) > 3600
annotations:
age: '{{ humanizeDuration $value }}'
- name: UnknownErcToNativeMessageConfirmation
rules:
- alert: UnknownErcToNativeMessageConfirmation
expr: max_over_time(alert_monitor_unknown_erc_to_native_message_confirmation[5m]) > 0
annotations:
age: '{{ humanizeDuration $value }}'
- name: UnknownErcToNativeMessageExecution
rules:
- alert: UnknownErcToNativeMessageExecution
expr: max_over_time(alert_monitor_unknown_erc_to_native_message_execution[5m]) > 0
annotations:
age: '{{ humanizeDuration $value }}'
- name: ValidatorOffline
rules:
- alert: ValidatorOffline
expr: max_over_time(alert_monitor_last_validator_activity[5m]) > 43200
annotations:
age: '{{ humanizeDuration $value }}'
- name: StuckContractProgress
rules:
- alert: StuckContractProgress
expr: increase(monitor_contract_latest_processed_block[10m]) < 10
for: 5m
- name: InstanceIsDown
rules:
- alert: InstanceIsDown
expr: up < 1
for: 2m