https://prometheus.io/download/
1.原理图

2.安装
mkdir -p /usr/local/alertmanager
tar xf alertmanager-0.19.0.linux-amd64.tar.gz -C /usr/local/alertmanager --strip-components=1
cd /usr/local/alertmanager
修改配置:
[root@zabbix-proxy alertmanager]# cat alertmanager.yml
global:
  resolve_timeout: 5m
  smtp_smarthost: 'smtp.163.com:25'
  smtp_from: 'ww673004768@163.com'
  smtp_auth_username: 'ww673004768@163.com'
  smtp_auth_password: '123456'
  smtp_require_tls: false
route:
  group_by: ['alertname']
  group_wait: 10s
  group_interval: 10s
  repeat_interval: 1h
  receiver: 'email'
receivers:
- name: 'email'
  email_configs:
  - to: 'w673004768@163.com'
inhibit_rules:
  - source_match:
      severity: 'critical'
    target_match:
      severity: 'warning'
    equal: ['alertname', 'dev', 'instance']
[root@zabbix-proxy alertmanager]#
校验配置:
[root@zabbix-proxy alertmanager]# ./amtool check-config ./alertmanager.yml
Checking './alertmanager.yml' SUCCESS
Found:
- global config
- route
- 1 inhibit rules
- 1 receivers
- 0 templates
[root@zabbix-proxy alertmanager]# pwd
/usr/local/alertmanager
[root@zabbix-proxy alertmanager]#
3.systemd管理 alertmanager
[root@zabbix-proxy alertmanager]# cat /usr/lib/systemd/system/alertmanager.service
[Unit]
Description=Alertmanager
After=network.target
[Service]
Type=simple
User=root
ExecStart=/usr/local/alertmanager/alertmanager --config.file=/usr/local/alertmanager/alertmanager.yml --storage.path=/usr/local/alertmanager/data
Restart=on-failure
[Install]
WantedBy=multi-user.target
You have new mail in /var/spool/mail/root
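加载 unit 文件并启动服务:
[root@zabbix-proxy alertmanager]# systemctl daemon-reload
[root@zabbix-proxy alertmanager]# systemctl enable alertmanager
[root@zabbix-proxy alertmanager]# systemctl start alertmanager
[root@zabbix-proxy alertmanager]#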
4.设置prometheus的配置
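vim prometheus.yml
在 prometheus.yml 中加入 alertmanager 地址和报警规则文件路径, 例如 (alertmanager 默认监听 9093 端口):
alerting:
  alertmanagers:
  - static_configs:
    - targets: ['127.0.0.1:9093']
rule_files:
  - "rules/*.yml"
校验配置文件, 校验通过后重启 prometheus:
./promtool check config prometheus.yml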
5.查看报警配置rule
[root@zabbix-proxy rules]# cat general.yml
groups:
- name: general
  rules:
  - alert: InstanceDown
    expr: up == 0
    for: 1m
    labels:
      severity: error
    annotations:
      summary: "Instance {{ $labels.instance }} down"
      description: "{{ $labels.instance }} of job {{ $labels.job }} has been down for more than 1 minutes."
[root@zabbix-proxy rules]# pwd
/usr/local/prometheus/rules
[root@zabbix-proxy rules]#
6.测试



