infrastructure |
19.739s ago |
2.135ms |
||
| Rule | State | Error | Last Evaluation | Evaluation Time |
| --- | --- | --- | --- | --- |
| alert: NodeDown expr: up{job="node"} == 0 for: 2m labels: severity: critical annotations: description: '{{ $labels.instance }} is down' summary: Node exporter down | ok | | 19.745s ago | 449.3us |
| alert: HighCPUUsage expr: 100 - (avg by (instance) (rate(node_cpu_seconds_total{mode="idle"}[5m])) * 100) > 80 for: 10m labels: severity: warning annotations: description: CPU usage > 80% on {{ $labels.instance }} summary: High CPU usage | ok | | 19.745s ago | 626.3us |
| alert: HighMemoryUsage expr: (1 - (node_memory_MemAvailable_bytes / node_memory_MemTotal_bytes)) * 100 > 85 for: 5m labels: severity: warning annotations: description: Memory usage > 85% on {{ $labels.instance }} summary: High memory usage | ok | | 19.744s ago | 376.3us |
| alert: DiskSpaceLow expr: (node_filesystem_avail_bytes{mountpoint="/"} / node_filesystem_size_bytes{mountpoint="/"}) * 100 < 15 for: 5m labels: severity: warning annotations: description: Disk space < 15% on {{ $labels.instance }} summary: Low disk space | ok | | 19.744s ago | 355.7us |
| alert: DiskSpaceCritical expr: (node_filesystem_avail_bytes{mountpoint="/"} / node_filesystem_size_bytes{mountpoint="/"}) * 100 < 5 for: 2m labels: severity: critical annotations: description: Disk space < 5% on {{ $labels.instance }} summary: Critical disk space | ok | | 19.744s ago | 282.9us |
postgresql |
28.368s ago |
1.346ms |
||
| Rule | State | Error | Last Evaluation | Evaluation Time |
| --- | --- | --- | --- | --- |
| alert: PostgreSQLDown expr: pg_up == 0 for: 1m labels: severity: critical annotations: description: PostgreSQL on {{ $labels.instance }} is down summary: PostgreSQL is down | ok | | 28.368s ago | 958.9us |
| alert: PostgreSQLTooManyConnections expr: pg_stat_activity_count > 80 for: 5m labels: severity: warning annotations: description: '{{ $value }} connections (>80)' summary: PostgreSQL connections high | ok | | 28.367s ago | 106.7us |
| alert: PostgreSQLDeadlocks expr: increase(pg_stat_database_deadlocks[5m]) > 0 for: 1m labels: severity: warning annotations: description: Deadlocks detected on {{ $labels.datname }} summary: PostgreSQL deadlocks | ok | | 28.367s ago | 127us |
| alert: PostgreSQLSlowQueries expr: rate(pg_stat_statements_seconds_total[5m]) > 1 for: 10m labels: severity: warning annotations: description: High query time on {{ $labels.instance }} summary: Slow queries detected | ok | | 28.367s ago | 89.63us |
services |
18.933s ago |
1.872ms |
||
| Rule | State | Error | Last Evaluation | Evaluation Time |
| --- | --- | --- | --- | --- |
| alert: ServiceDown expr: probe_success == 0 for: 3m labels: severity: critical annotations: description: '{{ $labels.instance }} is not responding' summary: Service unreachable | ok | | 18.933s ago | 388.9us |
| alert: APIDown expr: up{job="api"} == 0 for: 2m labels: severity: critical annotations: description: ProbatioVault API is not responding summary: API Backend down | ok | | 18.933s ago | 549.5us |
| alert: GrafanaDown expr: probe_success{instance=~".*grafana.*"} == 0 for: 3m labels: severity: warning annotations: description: Grafana dashboard is not responding summary: Grafana unreachable | ok | | 18.933s ago | 330us |
| alert: PrometheusDown expr: up{job="prometheus"} == 0 for: 1m labels: severity: critical annotations: description: Prometheus monitoring is down summary: Prometheus down | ok | | 18.933s ago | 243.6us |
| alert: SonarQubeDown expr: probe_success{instance=~".*sonar.*"} == 0 for: 5m labels: severity: warning annotations: description: SonarQube is not responding summary: SonarQube unreachable | ok | | 18.932s ago | 333.6us |
ssl |
27.323s ago |
1.592ms |
||
| Rule | State | Error | Last Evaluation | Evaluation Time |
| --- | --- | --- | --- | --- |
| alert: SSLCertExpiringSoon expr: probe_ssl_earliest_cert_expiry - time() < 86400 * 14 for: 1h labels: severity: warning annotations: description: Certificate for {{ $labels.instance }} expires in < 14 days summary: SSL certificate expiring soon | ok | | 27.324s ago | 730.6us |
| alert: SSLCertExpired expr: probe_ssl_earliest_cert_expiry - time() < 0 for: 1m labels: severity: critical annotations: description: Certificate for {{ $labels.instance }} has expired summary: SSL certificate expired | ok | | 27.323s ago | 807.3us |