DEV-873 added custom node exporter polling for EXT stage

qa
Ketelsen, Sven 3 years ago committed by Hoan To
parent 47c801f5e1
commit e4a391be7f

@ -204,16 +204,6 @@ logstash_certificate: "{{ stage }}-elastic-stack-logstash-01"
backup_directory: "/backups" backup_directory: "/backups"
blackbox_exporter_fqdn: "dev-blackbox-01.{{ domain }}"
blackbox_http_2xx_targets:
- 'https://{{ stage }}-keycloak-01.smardigo.digital/auth/'
- 'https://{{ stage }}-kube-awx.smardigo.digital'
#- 'https://{{ stage }}-management-01-connect.smardigo.digital/'
blackbox_http_2xx_additional_targets: []
prometheus_federation_enabled: true
kubernetes_prometheus_endpoint: "{{ stage }}-kube-prometheus.{{ domain }}"
get_current_date: "{{ lookup('pipe','date +%Y-%m-%d') }}" get_current_date: "{{ lookup('pipe','date +%Y-%m-%d') }}"
get_current_date_time: "{{ lookup('pipe','date +%Y-%m-%d_%H:%M') }}" get_current_date_time: "{{ lookup('pipe','date +%Y-%m-%d_%H:%M') }}"
@ -227,9 +217,6 @@ k8s_basic_services:
selfsigned_ca_private_key_passphrase: '{{ selfsigned_ca_private_key_passphrase_vault }}' selfsigned_ca_private_key_passphrase: '{{ selfsigned_ca_private_key_passphrase_vault }}'
prometheus_alert_diskspaceusage_warning: 85
prometheus_alert_pg_replication_lag: 120
# hetzner upstream DNSservers # hetzner upstream DNSservers
upstream_dns_servers: upstream_dns_servers:
- 185.12.64.1 - 185.12.64.1

@ -0,0 +1,19 @@
---
# The node exporter exposes data only into the private network.
node_exporter_listen_address: '{{ stage_private_server_ip }}'

# TODO the blackbox exporter shouldn't be DEV tagged at all
blackbox_exporter_fqdn: 'dev-blackbox-01.{{ domain }}'

# URLs listed for the blackbox exporter; the key name suggests an HTTP 2xx
# probe -- confirm against the role that consumes it.
blackbox_http_2xx_targets:
  - "https://{{ stage }}-keycloak-01.smardigo.digital/auth/"
  - "https://{{ stage }}-kube-awx.smardigo.digital"
  # - "https://{{ stage }}-management-01-connect.smardigo.digital/"
blackbox_http_2xx_additional_targets: []

prometheus_federation_enabled: true
kubernetes_prometheus_endpoint: '{{ stage }}-kube-prometheus.{{ domain }}'

# Alert thresholds; the units are not visible here (presumably percent and
# seconds -- TODO confirm against the alert rules).
prometheus_alert_diskspaceusage_warning: 85
prometheus_alert_pg_replication_lag: 120

@ -8,8 +8,11 @@ docker_enabled: true
docker_config_enabled: false docker_config_enabled: false
traefik_enabled: true traefik_enabled: true
filebeat_enabled: false filebeat_enabled: false
node_exporter_enabled: false node_exporter_enabled: true
shared_service_hosts: [] shared_service_hosts: []
# An ext server has no private network, so the node exporter listens on all
# interfaces. NOTE(review): access presumably has to be limited by the
# firewall -- confirm.
node_exporter_listen_address: '0.0.0.0'
shared_service_harbor_hostname: "prodnso-harbor-01.smardigo.digital" shared_service_harbor_hostname: "prodnso-harbor-01.smardigo.digital"

@ -7,3 +7,7 @@ prometheus_tsdb_rentention_time: '90d'
# check firewall settings # check firewall settings
smardigo_connect_extra_servers: smardigo_connect_extra_servers:
- ext-bdev-mpmexec-02-connect.smardigo.digital - ext-bdev-mpmexec-02-connect.smardigo.digital
# Additional hosts whose node exporter is scraped by the 'node-exporter-extra'
# Prometheus job; check firewall settings.
node_exporter_extra_servers:
  - 'ext-bdev-mpmexec-02.smardigo.digital'

@ -27,7 +27,7 @@
lineinfile: lineinfile:
path: /etc/default/prometheus-node-exporter path: /etc/default/prometheus-node-exporter
regex: "^ARGS=" regex: "^ARGS="
line: "ARGS=\"--web.listen-address='{{ stage_private_server_ip }}:{{ monitor_port_system }}'\"" line: "ARGS=\"--web.listen-address='{{ node_exporter_listen_address }}:{{ monitor_port_system }}'\""
notify: restart node-exporter notify: restart node-exporter
- name: "Ensure prometheus-node-exporter is running" - name: "Ensure prometheus-node-exporter is running"

@ -398,6 +398,31 @@ scrape_configs:
target_label: __address__ target_label: __address__
replacement: $1 replacement: $1
# Scrapes the node exporter on every host listed in node_exporter_extra_servers.
# Targets are rendered as plain 'host:port' entries; when the variable is
# undefined the loop renders nothing and the target list stays empty.
- job_name: 'node-exporter-extra'
  scheme: http
  metrics_path: '/metrics'
  static_configs:
    - targets: [
{% for server in node_exporter_extra_servers | default([]) %}
        '{{ server }}:{{ monitor_port_system }}',
{% endfor %}
      ]
      labels:
        # Quoted so the rendered stage value is always read as a string.
        env: '{{ stage }}'
        project: servers
  relabel_configs:
    # Rewrite the job label so these series carry job='node-exporter'.
    - source_labels: [job]
      target_label: job
      replacement: 'node-exporter'
    # The two '!'-separator rules on __address__ were removed: targets here
    # contain no '!', so the anchored regexes never matched and the rules had
    # no effect. The instance label keeps its default (the target address).
    # NOTE(review): add an explicit rule if a port-less instance label is wanted.
- job_name: 'node-exporter-external-monitoring(digitalocean)' - job_name: 'node-exporter-external-monitoring(digitalocean)'
scheme: http scheme: http
metrics_path: '/metrics' metrics_path: '/metrics'

Loading…
Cancel
Save