Rule | State | Error | Last Evaluation | Evaluation Time |
alert: InstanceDown
expr: up == 0
for: 10s
labels:
severity: critical
annotations:
description: '{{ $labels.instance }} of job {{ $labels.job }} has been down for more than 10 seconds.'
summary: Endpoint {{ $labels.instance }} down
| ok | | 50.123s ago | 831.8us |
alert: PrometheusConfigurationReloadFailure
expr: prometheus_config_last_reload_successful != 1
for: 1m
labels:
severity: warning
annotations:
description: |-
Prometheus configuration reload error
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: Prometheus configuration reload failure (instance {{ $labels.instance }})
| ok | | 50.122s ago | 144.4us |
alert: PrometheusTooManyRestarts
expr: changes(process_start_time_seconds{job=~"prometheus|pushgateway|alertmanager"}[15m]) > 2
for: 5m
labels:
severity: warning
annotations:
description: |-
Prometheus has restarted more than twice in the last 15 minutes. It might be crashlooping.
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: Prometheus too many restarts (instance {{ $labels.instance }})
| ok | | 50.122s ago | 250.5us |
alert: HostMemoryUnderMemoryPressure
expr: rate(node_vmstat_pgmajfault[2m]) > 8
labels:
severity: warning
annotations:
description: |-
The node is under heavy memory pressure. High rate of major page faults
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: Host memory under memory pressure (instance {{ $labels.instance }})
| ok | | 50.122s ago | 173.6us |
alert: HostOutOfMemory
expr: (node_memory_MemAvailable_bytes / node_memory_MemTotal_bytes) * 100 < 30
labels:
severity: warning
annotations:
description: |-
Node memory is filling up (< 30% left)
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: Host out of memory (instance {{ $labels.instance }})
| ok | | 50.123s ago | 304.7us |
alert: HostOutOfMemoryCritical
expr: (node_memory_MemAvailable_bytes / node_memory_MemTotal_bytes) * 100 < 10
labels:
severity: critical
annotations:
description: |-
Node memory is filling up (< 10% left)
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: Host critically out of memory (instance {{ $labels.instance }})
| ok | | 50.123s ago | 271.5us |
alert: HostUnusualNetworkThroughputIn
expr: (sum by(instance) (irate(node_network_receive_bytes_total[2m]))) / (1024 * 1024) > 1
for: 2m
labels:
severity: warning
annotations:
description: |-
Host network interfaces are probably receiving too much data (> 1 MB/s)
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: Host unusual network throughput in (instance {{ $labels.instance }})
| ok | | 50.123s ago | 962.9us |
alert: HostUnusualNetworkThroughputOut
expr: (sum by(instance) (irate(node_network_transmit_bytes_total[2m]))) / (1024 * 1024) > 1
for: 2m
labels:
severity: warning
annotations:
description: |-
Host network interfaces are probably sending too much data (> 1 MB/s)
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: Host unusual network throughput out (instance {{ $labels.instance }})
| ok | | 50.122s ago | 911.3us |
alert: HostOutOfDiskSpace
expr: (node_filesystem_avail_bytes / node_filesystem_size_bytes) * 100 < 30
labels:
severity: warning
annotations:
description: |-
Disk is almost full (< 30% left)
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: Host out of disk space (instance {{ $labels.instance }})
| ok | | 50.121s ago | 291.3us |
alert: HostDiskWillFillIn48Hours
expr: predict_linear(node_filesystem_avail_bytes[1h], 48 * 3600) < 0
for: 5m
labels:
severity: warning
annotations:
description: |-
Disk will fill in 48 hours at current write rate
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: Host disk will fill in 48 hours (instance {{ $labels.instance }})
| ok | | 50.121s ago | 198.7us |
alert: HostOutOfDiskInodes
expr: (node_filesystem_files_free / node_filesystem_files) * 100 < 50
labels:
severity: warning
annotations:
description: |-
Disk is running low on free inodes (< 50% left)
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: Host out of disk inodes (instance {{ $labels.instance }})
| ok | | 50.121s ago | 306us |
alert: HostHighCpuLoad
expr: 100 - (avg by(instance) (irate(node_cpu_seconds_total{mode="idle"}[2m])) * 100) > 60
labels:
severity: warning
annotations:
description: |-
CPU load is > 60%
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: Host high CPU load (instance {{ $labels.instance }})
| ok | | 50.121s ago | 346.1us |
alert: containerStatusLastTerminatedReason
expr: increase(kube_pod_container_status_last_terminated_reason[1d]) > 0
labels:
severity: warning
annotations:
description: |-
A container has terminated within the last 24 hours.
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: Container {{ $labels.instance }} down
| ok | | 50.121s ago | 69.73ms |
alert: RaftLeaderChanges
expr: changes(consensus_etcdraft_is_leader[2h]) > 0
labels:
severity: warning
annotations:
description: |2-
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: Raft leader changed (instance {{ $labels.instance }})
| ok | | 50.051s ago | 1.336ms |
alert: ledgerTransactionCountPerMinuteWarning
expr: rate(ledger_transaction_count[1m]) * 60 > 16
labels:
severity: warning
annotations:
description: |2-
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: ledger_transaction_count more than 16 per minute (instance {{ $labels.instance }})
| ok | | 50.05s ago | 396.2us |
alert: ledgerTransactionCountPerMinuteCritical
expr: rate(ledger_transaction_count[1m]) * 60 > 60
labels:
severity: critical
annotations:
description: |2-
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: ledger_transaction_count more than 60 per minute (instance {{ $labels.instance }})
| ok | | 50.049s ago | 445.6us |
alert: chaincodeExecuteTimeouts
expr: rate(chaincode_execute_timeouts[30s]) * 30 > 0
labels:
severity: critical
annotations:
description: |2-
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: chaincodeExecuteTimeouts per minute (instance {{ $labels.instance }})
| ok | | 50.049s ago | 182.3us |
alert: chaincodeLaunchFailures
expr: rate(chaincode_launch_failures[30s]) * 30 > 0
labels:
severity: critical
annotations:
description: |2-
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: chaincodeLaunchFailures per minute (instance {{ $labels.instance }})
| ok | | 50.049s ago | 487.4us |
alert: chaincodeLaunchTimeouts
expr: rate(chaincode_launch_timeouts[30s]) * 30 > 0
labels:
severity: critical
annotations:
description: |2-
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: chaincodeLaunchTimeouts per minute (instance {{ $labels.instance }})
| ok | | 50.049s ago | 137.4us |
alert: endorserChaincodeInstantiationFailures
expr: rate(endorser_chaincode_instantiation_failures[30s]) * 30 > 0
labels:
severity: critical
annotations:
description: |2-
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: endorserChaincodeInstantiationFailures (instance {{ $labels.instance }})
| ok | | 50.049s ago | 343.1us |
alert: endorserDuplicateTransactionFailures
expr: rate(endorser_duplicate_transaction_failures[30s]) * 30 > 0
labels:
severity: critical
annotations:
description: |2-
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: endorserDuplicateTransactionFailures (instance {{ $labels.instance }})
| ok | | 50.048s ago | 193us |
alert: endorserEndorsementFailures
expr: rate(endorser_endorsement_failures[30s]) * 30 > 0
labels:
severity: critical
annotations:
description: |2-
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: endorser_endorsement_failures (instance {{ $labels.instance }})
| ok | | 50.048s ago | 146us |
alert: endorserProposalAclFailures
expr: rate(endorser_proposal_acl_failures[30s]) * 30 > 0
labels:
severity: critical
annotations:
description: |2-
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: endorserProposalAclFailures (instance {{ $labels.instance }})
| ok | | 50.049s ago | 199.6us |
alert: endorserProposalValidationFailures
expr: rate(endorser_proposal_validation_failures[30s]) * 30 > 0
labels:
severity: critical
annotations:
description: |2-
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: endorserProposalValidationFailures (instance {{ $labels.instance }})
| ok | | 50.049s ago | 171us |
alert: peerMemoryUsage
expr: container_memory_working_set_bytes{container="peer",pod=~"peer.*"} / (1204 * 1024) > 600
labels:
severity: medium
annotations:
description: |2-
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: peerMemoryUsage greater than 600 MB (instance {{ $labels.instance }})
| ok | | 50.049s ago | 304.8us |
alert: couchDbMemoryUsage
expr: container_memory_working_set_bytes{container="couchdb",pod=~"peer.*"} / (1204 * 1024) > 1200
labels:
severity: medium
annotations:
description: |2-
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: couchDbMemoryUsage greater than 1200 MB (instance {{ $labels.instance }})
| ok | | 50.049s ago | 266.5us |
alert: ordererMemoryUsage
expr: container_memory_working_set_bytes{container=~"orderer."} / (1204 * 1024) > 100
labels:
severity: medium
annotations:
description: |2-
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: ordererMemoryUsage greater than 100 MB (instance {{ $labels.instance }})
| ok | | 50.048s ago | 588.1us |
alert: chainCodeMemoryUsage
expr: container_memory_working_set_bytes{name=~"pr.-peer..pr..gouze.io-.*"} / (1024 * 1024) > 25
labels:
severity: medium
annotations:
description: |2-
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: chainCodeMemoryUsage greater than 25 MB (instance {{ $labels.instance }})
| ok | | 50.048s ago | 452.3us |
alert: fabricUsedDisk
expr: kubelet_volume_stats_used_bytes{persistentvolumeclaim=~"production-.*|database-.*"} / kubelet_volume_stats_capacity_bytes{persistentvolumeclaim=~"production-.*|database-.*"} * 100 > 60
labels:
severity: medium
annotations:
description: |2-
VALUE = {{ $value }}
LABELS: {{ $labels }}
summary: fabricUsedDisk greater than 60% (instance {{ $labels.instance }})
| ok | | 50.048s ago | 1.346ms |
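The rule definitions shown in this table normally live in a Prometheus rule-group file that prometheus.yml loads through rule_files. A minimal sketch reusing the InstanceDown rule from the table is given below; the file name and group name are assumptions chosen for illustration, not taken from the deployment above.

# fabric-alerts.rules.yml -- hypothetical file name
groups:
  - name: instance-health          # hypothetical group name
    rules:
      - alert: InstanceDown
        expr: up == 0
        for: 10s
        labels:
          severity: critical
        annotations:
          summary: Endpoint {{ $labels.instance }} down
          description: '{{ $labels.instance }} of job {{ $labels.job }} has been down for more than 10 seconds.'

# prometheus.yml -- only the stanza that loads the rule file
rule_files:
  - fabric-alerts.rules.yml

Such a file can be sanity-checked with promtool check rules fabric-alerts.rules.yml before reloading; if a reload ever fails and Prometheus keeps running on its previous configuration, the PrometheusConfigurationReloadFailure rule above will fire.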