update alert

This commit is contained in:
llitfkitfk 2017-11-10 17:03:57 +08:00
parent 35673af98d
commit 806d49c002
3 changed files with 20 additions and 11 deletions

View File

@@ -17,8 +17,7 @@ services:
- prometheus_data:/prometheus - prometheus_data:/prometheus
command: command:
- '--config.file=/etc/prometheus/prometheus.yml' - '--config.file=/etc/prometheus/prometheus.yml'
- '--storage.local.path=/prometheus' - '--storage.tsdb.path=/prometheus'
- '--alertmanager.url=http://alertmanager:9093'
- '--web.console.libraries=/usr/share/prometheus/console_libraries' - '--web.console.libraries=/usr/share/prometheus/console_libraries'
- '--web.console.templates=/usr/share/prometheus/consoles' - '--web.console.templates=/usr/share/prometheus/consoles'
ports: ports:

View File

@@ -1,9 +1,11 @@
ALERT service_down groups:
IF up == 0 - name: example
rules:
ALERT high_load - alert: InstanceDown
IF node_load1 > 0.5 expr: up == 0
ANNOTATIONS { for: 5m
summary = "Instance {{ $labels.instance }} under high load", labels:
description = "{{ $labels.instance }} of job {{ $labels.job }} is under high load.", severity: page
} annotations:
summary: "Instance {{ $labels.instance }} down"
description: "{{ $labels.instance }} of job {{ $labels.job }} has been down for more than 5 minutes."

View File

@@ -15,6 +15,14 @@ rule_files:
# - "first.rules" # - "first.rules"
# - "second.rules" # - "second.rules"
# alert
alerting:
alertmanagers:
- scheme: http
static_configs:
- targets:
- "alertmanager:9093"
# A scrape configuration containing exactly one endpoint to scrape: # A scrape configuration containing exactly one endpoint to scrape:
# Here it's Prometheus itself. # Here it's Prometheus itself.
scrape_configs: scrape_configs: