Explorar el Código

Merge "Add bond member status monitoring."

pull/122/head
Ales Komarek hace 7 años
padre
commit
3dad1dba67
Se han modificado 3 ficheros con 35 adiciones y 0 borrados
  1. +7
    -0
      linux/files/collectd_bond_status.conf
  2. +9
    -0
      linux/meta/collectd.yml
  3. +19
    -0
      linux/meta/heka.yml

+ 7
- 0
linux/files/collectd_bond_status.conf Ver fichero

@@ -0,0 +1,7 @@
# Imports the "bond_status" module and configures it with one Bond entry per
# name in the plugin's `interfaces` setting (no entries when it is unset).
Import "bond_status"

<Module "bond_status">
{%- for interface in plugin.get('interfaces', []) %}
Bond "{{ interface }}"
{%- endfor %}
</Module>

+ 9
- 0
linux/meta/collectd.yml Ver fichero

@@ -51,3 +51,12 @@ local_plugin:
plugin: swap
template: linux/files/collectd_swap.conf
report_bytes: True
# Bond status plugin entry: rendered only when monitoring.bond_status.interfaces
# is defined and passes the `list` test; every configured interface name is
# copied into the entry's `interfaces` list for collectd_bond_status.conf.
# NOTE(review): `list` is not one of Jinja2's built-in tests - confirm the
# rendering environment registers it.
{%- if monitoring.bond_status.interfaces is defined and monitoring.bond_status.interfaces is list %}
linux_bond_status:
plugin: python
template: linux/files/collectd_bond_status.conf
interfaces:
{%- for interface in monitoring.bond_status.interfaces %}
- {{ interface }}
{%- endfor %}
{%- endif %}

+ 19
- 0
linux/meta/heka.yml Ver fichero

@@ -1,3 +1,4 @@
{%- from "linux/map.jinja" import monitoring with context %}
metric_collector:
trigger:
linux_system_cpu_critical:
@@ -136,6 +137,18 @@ metric_collector:
window: 60
periods: 0
function: max
# Critical trigger for bond members: its single rule applies the `last`
# function to the bond_status_links_down metric and matches when the value
# is > 0. Rendered only when monitoring.bond_status.interfaces is defined and
# passes the `list` test.
# NOTE(review): `list` is not one of Jinja2's built-in tests - confirm the
# rendering environment registers it.
{%- if monitoring.bond_status.interfaces is defined and monitoring.bond_status.interfaces is list %}
linux_bond_status_critical:
description: Bond members are down.
rules:
- function: last
metric: bond_status_links_down
periods: 0
relational_operator: '>'
threshold: 0
window: 120
severity: critical
{%- endif %}
alarm:
linux_system_cpu:
alerting: enabled
@@ -167,3 +180,9 @@ metric_collector:
alerting: enabled_with_notification
triggers:
- linux_system_hdd_errors_critical
# Bond status entry with alerting enabled; it references the
# linux_bond_status_critical trigger and is guarded by the same
# monitoring.bond_status.interfaces condition as that trigger.
# NOTE(review): `list` is not one of Jinja2's built-in tests - confirm the
# rendering environment registers it.
{%- if monitoring.bond_status.interfaces is defined and monitoring.bond_status.interfaces is list %}
linux_bond_status:
alerting: enabled
triggers:
- linux_bond_status_critical
{%- endif %}

Cargando…
Cancelar
Guardar