Browse Source

Merge "Tune default thresholds for the nstat_time_squeeze based alerts"

pull/173/head
mcp-jenkins 6 years ago
parent
commit
af661e7ac1
2 changed files with 6 additions and 6 deletions
  1. +2 -2 linux/map.jinja
  2. +4 -4 linux/meta/prometheus.yml

+2 -2 linux/map.jinja View File

'warn': 5, 'warn': 5,
}, },
'net_rx_action_per_cpu_threshold': { 'net_rx_action_per_cpu_threshold': {
'warning': '0',
'minor': '100'
'warning': '500',
'minor': '5000'
}, },
'packets_dropped_per_cpu_threshold': { 'packets_dropped_per_cpu_threshold': {
'minor': '0', 'minor': '0',

+4 -4 linux/meta/prometheus.yml View File

{%- endraw %} {%- endraw %}
{%- set net_rx_action_warning_threshold = monitoring.net_rx_action_per_cpu_threshold.warning %} {%- set net_rx_action_warning_threshold = monitoring.net_rx_action_per_cpu_threshold.warning %}
if: >- if: >-
floor(increase(nstat_time_squeeze[24h])) > {{ net_rx_action_warning_threshold }}
floor(increase(nstat_time_squeeze[1d])) > {{ net_rx_action_warning_threshold }}
labels: labels:
severity: warning severity: warning
service: system service: system
annotations: annotations:
summary: "CPU terminated {{ net_rx_action_warning_threshold }}{%- raw %} net_rx_action loops" summary: "CPU terminated {{ net_rx_action_warning_threshold }}{%- raw %} net_rx_action loops"
description: "The {{ $labels.cpu }} CPU on the {{ $labels.host }} node terminated {{ $value }} net_rx_action loops during the last 24 hours."
description: "The {{ $labels.cpu }} CPU on the {{ $labels.host }} node terminated {{ $value }} net_rx_action loops during the last 24 hours. Modify the net.core.netdev_budget kernel parameter."
NetRxActionByCpuMinor: NetRxActionByCpuMinor:
{%- endraw %} {%- endraw %}
{%- set net_rx_action_minor_threshold = monitoring.net_rx_action_per_cpu_threshold.minor %} {%- set net_rx_action_minor_threshold = monitoring.net_rx_action_per_cpu_threshold.minor %}
if: >- if: >-
floor(increase(nstat_time_squeeze[24h])) > {{ net_rx_action_minor_threshold }}
floor(increase(nstat_time_squeeze[1d])) > {{ net_rx_action_minor_threshold }}
labels: labels:
severity: minor severity: minor
service: system service: system
annotations: annotations:
summary: "CPU terminated {{ net_rx_action_minor_threshold }}{%- raw %} net_rx_action loops" summary: "CPU terminated {{ net_rx_action_minor_threshold }}{%- raw %} net_rx_action loops"
description: "The {{ $labels.cpu }} CPU on the {{ $labels.host }} node terminated {{ $value }} net_rx_action loops during the last 24 hours."
description: "The {{ $labels.cpu }} CPU on the {{ $labels.host }} node terminated {{ $value }} net_rx_action loops during the last 24 hours. Modify the net.core.netdev_budget kernel parameter."
{%- endraw %} {%- endraw %}
{%- if monitoring.bond_status.interfaces is defined and monitoring.bond_status.interfaces %} {%- if monitoring.bond_status.interfaces is defined and monitoring.bond_status.interfaces %}
{%- raw %} {%- raw %}

Loading…
Cancel
Save