Alerts

ExporterDown (4 active)
# ExporterDown: matches any series where `up` equals 0; the condition must
# hold for 5 minutes before the alert fires.
# This rule declares no `labels:` block, so it attaches no extra labels.
alert: ExporterDown
expr: 'up == 0'
for: 5m
annotations:
  description: 'Exporter {{ $labels.instance }} has been down for more than 5 minutes.'
  summary: 'Exporter {{ $labels.instance }} down'
Labels State Active Since Value
alertname="ExporterDown" instance="localhost:9113" job="nginx" firing 2024-10-29 04:57:41.811792528 +0000 UTC 0
alertname="ExporterDown" instance="ap01:5556" job="jmx" firing 2024-10-30 03:40:41.8138731 +0000 UTC 0
alertname="ExporterDown" instance="ap02:5556" job="jmx" firing 2025-01-22 04:50:41.813852095 +0000 UTC 0
alertname="ExporterDown" instance="db01:9104" job="mysql_master" firing 2025-02-06 00:02:41.81385913 +0000 UTC 0
DBNotEnoughStrage (0 active)
# DBNotEnoughStrage: available filesystem bytes on job "dbserver" below
# 2.147483648e+09 (2 * 1024^3 bytes) for 5 minutes.
alert: DBNotEnoughStrage
expr: node_filesystem_avail_bytes{job=~"dbserver"} < 2.147483648e+09
for: 5m
labels:
  severity: page
annotations:
  description: 'Instance {{ $labels.instance }} not enough strage less than 2GB'
  summary: 'Instance {{ $labels.instance }} not enough strage.'
DBNotEnoughStrageForSystem (0 active)
# DBNotEnoughStrageForSystem: (free bytes - available bytes) below
# 5.24288e+08 (500 * 1024^2 bytes) for 5 minutes.
# `-` binds tighter than `<` in PromQL, so the subtraction is evaluated first.
# Only the right-hand operand carries the job="dbserver" matcher.
# NOTE(review): free minus avail is presumably the root-reserved space;
# confirm that is the intended "system" quantity.
alert: DBNotEnoughStrageForSystem
expr: node_filesystem_free_bytes - node_filesystem_avail_bytes{job=~"dbserver"} < 5.24288e+08
for: 5m
labels:
  severity: page
annotations:
  description: 'Instance {{ $labels.instance }} not enough strage less than 500MB'
  summary: 'Instance {{ $labels.instance }} not enough strage.'
InstanceDown (0 active)
# InstanceDown: `nginx_up` equal to 0 for 5 minutes.
alert: InstanceDown
expr: 'nginx_up == 0'
for: 5m
labels:
  severity: page
annotations:
  # Folded block scalar; renders as a single line without a trailing newline.
  description: >-
    {{ $labels.instance }} of job {{ $labels.job }} has been down for
    more than 5 minutes.
  summary: 'Instance {{ $labels.instance }} down'
JVMUseMetaspaceOver1GB (0 active)
# JVMUseMetaspaceOver1GB: JVM non-heap memory "used" above 1.073741824e+09
# (1024^3 bytes) for 5 minutes.
# NOTE(review): the metric is total non-heap usage, which presumably includes
# more than Metaspace alone; confirm the name/description match the intent.
alert: JVMUseMetaspaceOver1GB
expr: java_lang_Memory_NonHeapMemoryUsage_used > 1.073741824e+09
for: 5m
labels:
  severity: page
annotations:
  description: 'Instance {{ $labels.instance }} use Metaspace over 1GB'
  summary: 'Instance {{ $labels.instance }} use Metaspace over 1GB'
NotEnoughMemory (0 active)
# NotEnoughMemory (gateway / webserver / apserver jobs): available memory
# below 1.048576e+08 (100 * 1024^2 bytes) for 5 minutes.
# NOTE(review): the metric name has no `_bytes` suffix; node_exporter >= 0.16
# exposes `node_memory_MemAvailable_bytes` instead. Confirm the exporter
# version running on these jobs, otherwise this rule can never match.
alert: NotEnoughMemory
expr: node_memory_MemAvailable{job=~"gateway|webserver|apserver"} < 1.048576e+08
for: 5m
labels:
  severity: page
annotations:
  description: 'Instance {{ $labels.instance }} not enough memory less than 100MB'
  summary: 'Instance {{ $labels.instance }} not enough memory.'
NotEnoughMemory (0 active)
# NotEnoughMemory (dbserver job): available memory below 5.24288e+08
# (500 * 1024^2 bytes) for 5 minutes.
alert: NotEnoughMemory
expr: node_memory_MemAvailable_bytes{job=~"dbserver"} < 5.24288e+08
for: 5m
labels:
  severity: page
annotations:
  description: 'Instance {{ $labels.instance }} not enough memory less than 500MB'
  summary: 'Instance {{ $labels.instance }} not enough memory.'
OverNginxConnectionsActive (0 active)
# OverNginxConnectionsActive: more than 40 active nginx connections for
# 5 minutes.
alert: OverNginxConnectionsActive
expr: 'nginx_connections_active > 40'
for: 5m
labels:
  severity: page
annotations:
  description: 'Instance {{ $labels.instance }} over 40 nginx connections'
  summary: 'Instance {{ $labels.instance }} over 40 nginx connections'
OverWork (0 active)
# OverWork (dbserver job): 1-minute load average above 3 for 5 minutes.
# The description previously said "over 2", contradicting the `> 3` threshold
# in the expression; the text now reports the value the rule actually tests.
alert: OverWork
expr: node_load1{job=~"dbserver"} > 3
for: 5m
labels:
  severity: page
annotations:
  description: 'Instance {{ $labels.instance }} node_load over 3 for more than 5 minutes.'
  summary: 'Instance {{ $labels.instance }} over working.'
OverWork (0 active)
# OverWork (gateway job): 1-minute load average above 2 for 5 minutes.
# The description previously said "over 1", contradicting the `> 2` threshold
# in the expression; the text now reports the value the rule actually tests.
alert: OverWork
expr: node_load1{job="gateway"} > 2
for: 5m
labels:
  severity: page
annotations:
  description: 'Instance {{ $labels.instance }} node_load over 2 for more than 5 minutes.'
  summary: 'Instance {{ $labels.instance }} over working.'
OverWork (0 active)
# OverWork (webserver / apserver jobs): 1-minute load average above 2 for
# 5 minutes.
alert: OverWork
expr: node_load1{job=~"webserver|apserver"} > 2
for: 5m
labels:
  severity: page
annotations:
  description: 'Instance {{ $labels.instance }} node_load over 2 for more than 5 minutes.'
  summary: 'Instance {{ $labels.instance }} over working.'
RedisUsageMemOver (0 active)
# RedisUsageMemOver: used memory as a percentage of the configured maximum
# above 80 for 5 minutes.
# NOTE(review): if redis_memory_max_bytes is 0 (presumably "no limit"), the
# division yields +Inf and the comparison is true; confirm maxmemory is set.
alert: RedisUsageMemOver
expr: 100 * redis_memory_used_bytes / redis_memory_max_bytes > 80
for: 5m
labels:
  severity: page
annotations:
  description: 'redis is using 80% of the maximum value'
  summary: 'redis is using 80% of the maximum value'
ServerNotEnoughStrage (0 active)
# ServerNotEnoughStrage (gateway / webserver / apserver jobs): available
# filesystem space below 2.147483648e+09 (2 * 1024^3 bytes) for 5 minutes.
# NOTE(review): `node_filesystem_avail` is the pre-0.16 node_exporter name;
# newer exporters expose `node_filesystem_avail_bytes`. Confirm the exporter
# version on these jobs, otherwise this rule can never match.
alert: ServerNotEnoughStrage
expr: node_filesystem_avail{job=~"gateway|webserver|apserver"} < 2.147483648e+09
for: 5m
labels:
  severity: page
annotations:
  description: 'Instance {{ $labels.instance }} not enough strage less than 2GB'
  summary: 'Instance {{ $labels.instance }} not enough strage.'
ServerNotEnoughStrageForSystem (0 active)
# ServerNotEnoughStrageForSystem: (free - available) filesystem space below
# 5.24288e+08 (500 * 1024^2 bytes) for 5 minutes.
# `-` binds tighter than `<` in PromQL, so the subtraction is evaluated first.
# Only the right-hand operand carries the job matcher.
# NOTE(review): both metric names are the pre-0.16 node_exporter forms (no
# `_bytes` suffix); confirm the exporter version on these jobs.
alert: ServerNotEnoughStrageForSystem
expr: node_filesystem_free - node_filesystem_avail{job=~"gateway|webserver|apserver"} < 5.24288e+08
for: 5m
labels:
  severity: page
annotations:
  description: 'Instance {{ $labels.instance }} not enough strage less than 500MB'
  summary: 'Instance {{ $labels.instance }} not enough strage.'
SlaveBehindMaster (0 active)
# SlaveBehindMaster: replication delay (seconds behind master) on job
# "mysql_slave" greater than 0 for 5 minutes.
alert: SlaveBehindMaster
expr: mysql_slave_status_seconds_behind_master{job=~"mysql_slave"} > 0
for: 5m
labels:
  severity: page
annotations:
  description: 'Instance {{ $labels.instance }} behind master'
  summary: 'Instance {{ $labels.instance }} behind master'
StopSlaveIO (0 active)
# StopSlaveIO: slave IO "running" metric on job "mysql_slave" below 1 for
# 1 minute.
alert: StopSlaveIO
expr: mysql_slave_status_slave_io_running{job=~"mysql_slave"} < 1
for: 1m
labels:
  severity: page
annotations:
  description: 'Instance {{ $labels.instance }} stop slave io'
  summary: 'Instance {{ $labels.instance }} stop slave io'
StopSlaveSQL (0 active)
# StopSlaveSQL: slave SQL "running" metric on job "mysql_slave" below 1 for
# 1 minute.
alert: StopSlaveSQL
expr: mysql_slave_status_slave_sql_running{job=~"mysql_slave"} < 1
for: 1m
labels:
  severity: page
annotations:
  description: 'Instance {{ $labels.instance }} stop slave SQL'
  summary: 'Instance {{ $labels.instance }} stop slave SQL'
UserHeapMemOver1GB (0 active)
# UserHeapMemOver1GB: JVM heap "used" above 1.073741824e+09 (1024^3 bytes)
# for 5 minutes.
# The annotations previously said "900MB", contradicting both the alert name
# and the 1 GiB threshold in the expression; they now state the tested value.
alert: UserHeapMemOver1GB
expr: java_lang_Memory_HeapMemoryUsage_used > 1.073741824e+09
for: 5m
labels:
  severity: page
annotations:
  description: 'Instance {{ $labels.instance }} use heap memory over 1GB'
  summary: 'Instance {{ $labels.instance }} use heap memory over 1GB'
UserOldMemOver800MB (0 active)
# UserOldMemOver800MB: G1 old-generation "used" above 8.388608e+08
# (800 * 1024^2 bytes) for 5 minutes.
alert: UserOldMemOver800MB
expr: java_lang_G1_Old_Gen_Usage_used > 8.388608e+08
for: 5m
labels:
  severity: page
annotations:
  description: 'Instance {{ $labels.instance }} use old over 800MB'
  summary: 'Instance {{ $labels.instance }} use old  over 800MB'