chore: full stack stability and migration fixes, plus react UI progress
This commit is contained in:
26
config/alerts.yml
Normal file
26
config/alerts.yml
Normal file
@@ -0,0 +1,26 @@
|
||||
# Prometheus alerting rules for the madbase stack.
# Structure restored from a flattened diff view: indentation rebuilt and the
# stray `|` / `||||` separator rows removed so the file parses as YAML again.
# Expressions, durations, labels and annotation text are unchanged.
groups:
  - name: madbase
    rules:
      # Fires when a scrape target has reported `up == 0` for a full minute.
      - alert: ServiceDown
        expr: up == 0
        for: 1m
        labels:
          severity: critical
        annotations:
          summary: "Service {{ $labels.instance }} down"

      # Fires when the per-second rate of requests with a 5xx status, taken
      # over a 5-minute window, stays above 0.1 for five minutes.
      # NOTE(review): this is an absolute rate per series, not a fraction of
      # total traffic -- confirm that is the intended threshold.
      - alert: HighErrorRate
        expr: rate(http_requests_total{status=~"5.."}[5m]) > 0.1
        for: 5m
        labels:
          severity: warning
        annotations:
          summary: "High error rate on {{ $labels.instance }}"

      # Fires when the 0.95 quantile estimated from the request-duration
      # histogram buckets stays above 2 for five minutes.
      # NOTE(review): the metric name suggests the unit is seconds -- confirm.
      - alert: HighLatency
        expr: histogram_quantile(0.95, rate(http_request_duration_seconds_bucket[5m])) > 2
        for: 5m
        labels:
          severity: warning
        annotations:
          summary: "High latency on {{ $labels.instance }}"
|
||||
@@ -2,17 +2,9 @@ global:
|
||||
   scrape_interval: 15s
 
 scrape_configs:
-  - job_name: 'madbase-worker'
+  - job_name: 'madbase'
     static_configs:
-      - targets: ['worker:8002']
-    metrics_path: /metrics
-
-  - job_name: 'madbase-control'
-    static_configs:
-      - targets: ['control:8001']
-    metrics_path: /metrics
-
-  - job_name: 'madbase-proxy'
-    static_configs:
-      - targets: ['proxy:8000']
-    metrics_path: /metrics
+      - targets:
+          - 'worker:8002'
+          - 'system:8001'
+          - 'proxy:8000'
|
||||
|
||||
Reference in New Issue
Block a user