Skip to content

Commit

Permalink
Merge pull request #2346 from newrelic/release
Browse files Browse the repository at this point in the history
Release 20240328
  • Loading branch information
stevula authored Mar 28, 2024
2 parents 5a552cc + a88c92c commit b04c4d5
Show file tree
Hide file tree
Showing 31 changed files with 1,508 additions and 19 deletions.
32 changes: 32 additions & 0 deletions alert-policies/envoy/ClusterBindErrors.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,32 @@
# Name of the alert
name: Cluster bind errors

# Description and details
# NOTE: `|+` keeps trailing blank lines as part of the value, so the next
# comment must follow the text directly (no blank line in between).
description: |+
  This alert is triggered when at least one cluster bind error is reported for 5 minutes.
# Type of alert
type: STATIC

# NRQL query
nrql:
  # Reads the most recent value of the envoy_cluster_bind_errors metric
  query: "SELECT latest(envoy_cluster_bind_errors) as 'Bind errors' from Metric"

# Function used to aggregate the NRQL query value(s) for comparison to the terms.threshold (Default: SINGLE_VALUE)
valueFunction: SINGLE_VALUE

# List of Critical and Warning thresholds for the condition
terms:
  - priority: CRITICAL
    # Operator used to compare against the threshold.
    operator: ABOVE
    # Value that triggers a violation.
    # ABOVE is a strict comparison, so 0 is required for "at least one"
    # bind error to open a violation (a threshold of 1 would need two).
    threshold: 0
    # Time in seconds; 120 - 3600
    thresholdDuration: 300
    # How many data points must be in violation for the duration
    thresholdOccurrences: ALL

# Duration after which a violation automatically closes
# Time in seconds; 300 - 2592000 (Default: 86400 [1 day])
violationTimeLimitSeconds: 86400
32 changes: 32 additions & 0 deletions alert-policies/envoy/ClusterUpdateFailed.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,32 @@
# Name of the alert
name: Cluster update failed

# Description and details
# NOTE: `|+` keeps trailing blank lines as part of the value, so the next
# comment must follow the text directly (no blank line in between).
description: |+
  This alert is triggered when at least one cluster update has failed for 5 minutes.
# Type of alert
type: STATIC

# NRQL query
nrql:
  # Reads the most recent value of the envoy_cluster_update_failure metric
  query: "SELECT latest(envoy_cluster_update_failure) as 'Cluster update failed' from Metric"

# Function used to aggregate the NRQL query value(s) for comparison to the terms.threshold (Default: SINGLE_VALUE)
valueFunction: SINGLE_VALUE

# List of Critical and Warning thresholds for the condition
terms:
  - priority: CRITICAL
    # Operator used to compare against the threshold.
    operator: ABOVE
    # Value that triggers a violation.
    # ABOVE is a strict comparison, so 0 is required for "at least one"
    # failed update to open a violation (a threshold of 1 would need two).
    threshold: 0
    # Time in seconds; 120 - 3600
    thresholdDuration: 300
    # How many data points must be in violation for the duration
    thresholdOccurrences: ALL

# Duration after which a violation automatically closes
# Time in seconds; 300 - 2592000 (Default: 86400 [1 day])
violationTimeLimitSeconds: 86400
41 changes: 41 additions & 0 deletions alert-policies/envoy/DownstreamTimedoutRequests.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,41 @@
# Alert condition: downstream request timeouts reported by Envoy.
name: Downstream timed out requests

# Human-readable summary shown with the condition.
# `|+` keeps trailing blank lines, so the following comment sits directly
# under the text to leave the value unchanged.
description: |+
  This alert is triggered when the number of downstream timed out requests exceeds 5 for 5 minutes.
# Static condition: the query result is compared against the fixed thresholds below.
type: STATIC

# Signal evaluated by the condition.
nrql:
  query: "SELECT latest(envoy_http_downstream_rq_timeout) as 'Downstream timed out requests' from Metric"

# How the query value(s) are reduced before comparison with terms.threshold
# (Default: SINGLE_VALUE).
valueFunction: SINGLE_VALUE

# Thresholds, most severe first. Both terms share the same 5-minute window.
terms:
  # Critical: value stays above 5 for every data point in 300 seconds.
  - priority: CRITICAL
    operator: ABOVE
    threshold: 5
    # Seconds; 120 - 3600
    thresholdDuration: 300
    thresholdOccurrences: ALL
  # Warning: value stays above 3 for every data point in 300 seconds.
  - priority: WARNING
    operator: ABOVE
    threshold: 3
    # Seconds; 120 - 3600
    thresholdDuration: 300
    thresholdOccurrences: ALL

# Open violations close automatically after this many seconds.
# Allowed range 300 - 2592000 (Default: 86400 [1 day]).
violationTimeLimitSeconds: 86400
32 changes: 32 additions & 0 deletions alert-policies/envoy/DrainingListener.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,32 @@
# Name of the alert
name: Draining listener

# Description and details
# NOTE: `|+` keeps trailing blank lines as part of the value, so the next
# comment must follow the text directly (no blank line in between).
description: |+
  This alert is triggered when there is at least one draining listener for 5 minutes.
# Type of alert
type: STATIC

# NRQL query
nrql:
  # Reads the most recent value of the
  # envoy_listener_manager_total_listeners_draining metric
  query: "SELECT latest(envoy_listener_manager_total_listeners_draining) as 'Draining listener' from Metric"

# Function used to aggregate the NRQL query value(s) for comparison to the terms.threshold (Default: SINGLE_VALUE)
valueFunction: SINGLE_VALUE

# List of Critical and Warning thresholds for the condition
terms:
  - priority: CRITICAL
    # Operator used to compare against the threshold.
    operator: ABOVE
    # Value that triggers a violation.
    # ABOVE is a strict comparison, so 0 is required for "at least one"
    # draining listener to open a violation (a threshold of 1 would need two).
    threshold: 0
    # Time in seconds; 120 - 3600
    thresholdDuration: 300
    # How many data points must be in violation for the duration
    thresholdOccurrences: ALL

# Duration after which a violation automatically closes
# Time in seconds; 300 - 2592000 (Default: 86400 [1 day])
violationTimeLimitSeconds: 86400
Loading

0 comments on commit b04c4d5

Please sign in to comment.