Compare commits

..

No commits in common. "79699ed2c610a74c4603b975573a0a22b53a633c" and "52eece85e43e662d5a48fa00da03493fc560dd7d" have entirely different histories.

2 changed files with 44 additions and 43 deletions

View File

@ -1,5 +0,0 @@
---
extends: default
rules:
line-length: disable

View File

@ -19,30 +19,30 @@ prometheus_config:
alerting: alerting:
alertmanagers: alertmanagers:
- static_configs: - static_configs:
- targets: - targets:
- localhost:9093 - localhost:9093
scrape_configs: scrape_configs:
- job_name: prometheus - job_name: prometheus
scrape_interval: 5s scrape_interval: 5s
static_configs: static_configs:
- targets: - targets:
- localhost:9090 - localhost:9090
- job_name: alertmanager - job_name: alertmanager
scrape_interval: 5s scrape_interval: 5s
static_configs: static_configs:
- targets: - targets:
- localhost:9093 - localhost:9093
- job_name: pushgateway - job_name: pushgateway
scrape_interval: 5s scrape_interval: 5s
static_configs: static_configs:
- targets: - targets:
- jump0.kill0.net:9091 - jump0.kill0.net:9091
- job_name: node - job_name: node
scrape_interval: 5s scrape_interval: 5s
static_configs: static_configs:
- targets: - targets:
- jump0.kill0.net:9100 - jump0.kill0.net:9100
- mine0.kill0.net:9100 - mine0.kill0.net:9100
relabel_configs: relabel_configs:
- source_labels: [__address__] - source_labels: [__address__]
target_label: instance target_label: instance
@ -52,8 +52,8 @@ prometheus_config:
scrape_interval: 5s scrape_interval: 5s
static_configs: static_configs:
- targets: - targets:
- jump0.kill0.net:3903 - jump0.kill0.net:3903
- mine0.kill0.net:3903 - mine0.kill0.net:3903
relabel_configs: relabel_configs:
- source_labels: [__address__] - source_labels: [__address__]
target_label: instance target_label: instance
@ -63,8 +63,8 @@ prometheus_config:
scrape_interval: 5s scrape_interval: 5s
static_configs: static_configs:
- targets: - targets:
- jump0.kill0.net:9115 - jump0.kill0.net:9115
- mine0.kill0.net:9115 - mine0.kill0.net:9115
- job_name: blackbox-icmp4 - job_name: blackbox-icmp4
metrics_path: /probe metrics_path: /probe
params: params:
@ -72,13 +72,13 @@ prometheus_config:
- icmpv4 - icmpv4
static_configs: static_configs:
- targets: - targets:
- dns.google - dns.google
- vpn-home.kill0.net - vpn-home.kill0.net
- ping-home.kill0.net - ping-home.kill0.net
- 10.255.0.16 - 10.255.0.16
- vpn1-sch.corp.nmi.com - vpn1-sch.corp.nmi.com
- vpn-chi.ops.nmi.com - vpn-chi.ops.nmi.com
- vpn-ash.ops.nmi.com - vpn-ash.ops.nmi.com
relabel_configs: relabel_configs:
- source_labels: [__address__] - source_labels: [__address__]
target_label: __param_target target_label: __param_target
@ -93,8 +93,8 @@ prometheus_config:
- icmpv6 - icmpv6
static_configs: static_configs:
- targets: - targets:
- dns.google - dns.google
- ping-home.kill0.net - ping-home.kill0.net
relabel_configs: relabel_configs:
- source_labels: [__address__] - source_labels: [__address__]
target_label: __param_target target_label: __param_target
@ -109,7 +109,7 @@ prometheus_config:
- tcp_connect4 - tcp_connect4
static_configs: static_configs:
- targets: - targets:
- mine0.kill0.net:25565 - mine0.kill0.net:25565
relabel_configs: relabel_configs:
- source_labels: [__address__] - source_labels: [__address__]
target_label: __param_target target_label: __param_target
@ -124,7 +124,7 @@ prometheus_config:
- tcp_connect6 - tcp_connect6
static_configs: static_configs:
- targets: - targets:
- mine0.kill0.net:25565 - mine0.kill0.net:25565
relabel_configs: relabel_configs:
- source_labels: [__address__] - source_labels: [__address__]
target_label: __param_target target_label: __param_target
@ -139,9 +139,9 @@ prometheus_config:
- http_2xx - http_2xx
static_configs: static_configs:
- targets: - targets:
- https://cavi.cc - https://cavi.cc
- https://git.kill0.net - https://git.kill0.net
- https://stats.kill0.net - https://stats.kill0.net
relabel_configs: relabel_configs:
- source_labels: [__address__] - source_labels: [__address__]
target_label: __param_target target_label: __param_target
@ -152,23 +152,23 @@ prometheus_config:
- job_name: thanos-sidecar - job_name: thanos-sidecar
scrape_interval: 5s scrape_interval: 5s
static_configs: static_configs:
- targets: - targets:
- "localhost:10902" - "localhost:10902"
- job_name: thanos-query - job_name: thanos-query
scrape_interval: 5s scrape_interval: 5s
static_configs: static_configs:
- targets: - targets:
- "localhost:10904" - "localhost:10904"
- job_name: thanos-store - job_name: thanos-store
scrape_interval: 5s scrape_interval: 5s
static_configs: static_configs:
- targets: - targets:
- "localhost:10902" - "localhost:10902"
- job_name: thanos-compact - job_name: thanos-compact
scrape_interval: 5s scrape_interval: 5s
static_configs: static_configs:
- targets: - targets:
- "localhost:10912" - "localhost:10912"
rule_files: rule_files:
- rules.yaml - rules.yaml
@ -238,20 +238,23 @@ prometheus_rules_config:
expr: (time() - node_restic_last_run_time{restic_job=~"minecraft"}) > 86400 expr: (time() - node_restic_last_run_time{restic_job=~"minecraft"}) > 86400
for: 2h for: 2h
- alert: MinecraftUnitInactive - alert: MinecraftUnitInactive
expr: node_systemd_unit_state{name="minecraft.service",state="inactive"} == 1 expr: node_systemd_unit_state{name="minecraft.service",state="inactive"} == 1
for: 15m for: 15m
- alert: GiteaUnitInactive - alert: GiteaUnitInactive
expr: node_systemd_unit_state{name="gitea.service",state="inactive"} == 1 expr: node_systemd_unit_state{name="gitea.service",state="inactive"} == 1
for: 15m for: 15m
- alert: MaintenanceMode - alert: MaintenanceMode
expr: maintenance_mode == 1 expr: maintenance_mode == 1
for: 1m for: 1m
#- alert: QuietHours
# expr: america_chicago_hour >= 22 or america_chicago_hour < 10
# for: 1m
- name: blackbox.rules - name: blackbox.rules
rules: rules:
- alert: ServiceDown - alert: ServiceDown
expr: probe_success{job!~"blackbox-icmp[0-9]"} == 0 expr: probe_success{job!~"blackbox-icmp[0-9]"} == 0
for: 1m for: 1m
- alert: PingDown - alert: PingDown
expr: probe_success{job=~"blackbox-icmp[0-9]"} == 0 expr: probe_success{job=~"blackbox-icmp[0-9]"} == 0
for: 15s for: 15s
- alert: CertExpiry - alert: CertExpiry
@ -263,7 +266,7 @@ prometheus_rules_config:
# summary: Certificates expiring in < 30 days # summary: Certificates expiring in < 30 days
summary: "{% raw %}Blackbox SSL certificate will expire soon (instance {{ $labels.instance }}){% endraw %}" summary: "{% raw %}Blackbox SSL certificate will expire soon (instance {{ $labels.instance }}){% endraw %}"
description: "{% raw %}SSL certificate expires in 30 days\n VALUE = {{ $value }}\n LABELS = {{ $labels }}{% endraw %}" description: "{% raw %}SSL certificate expires in 30 days\n VALUE = {{ $value }}\n LABELS = {{ $labels }}{% endraw %}"
- alert: CertExpiry - alert: CertExpiry
expr: ((probe_ssl_earliest_cert_expiry{job="blackbox-http"} - time()) / 86400) < 14 expr: ((probe_ssl_earliest_cert_expiry{job="blackbox-http"} - time()) / 86400) < 14
for: 15s for: 15s
labels: labels:
@ -357,7 +360,7 @@ alertmanager_config:
- times: - times:
- start_time: "03:00" - start_time: "03:00"
end_time: "15:00" end_time: "15:00"
node_exporter_du_directories: node_exporter_du_directories:
- /var/log/syslog - /var/log/syslog
- /var/spool/rsyslog - /var/spool/rsyslog
@ -407,6 +410,9 @@ karma_config:
color: "#ff220c" color: "#ff220c"
alertAcknowledgement: alertAcknowledgement:
enabled: true enabled: true
#duration: 15m0s
#author: karma
#comment: ACK! This alert was acknowledged using karma on %NOW%
thanos_bucket_config: "{{ vault_thanos_bucket_config }}" thanos_bucket_config: "{{ vault_thanos_bucket_config }}"