9 Updating Alert Config Details
This section shares the content of the UDRAlertrules.yaml file.
Note:
The default namespace for UDR is ocudr (the value used in the kubernetes_namespace selectors of the rules below). You can change it to match your deployment.
# Manifest fragment: an `apiVersion: v1` object whose `data` map has an
# `alertsudr` entry. That entry is a literal block (`|`) carrying the
# alerting-rule definitions: one group named OcudrAlerts with a `rules` list.
# NOTE(review): presumably a ConfigMap consumed by Prometheus; `kind` and
# `metadata` are not visible here - confirm against the full file.
# NOTE(review): nesting indentation appears to have been lost in this copy;
# restore it (data > alertsudr > groups > rules) before applying the manifest.
apiVersion: v1
data:
alertsudr: |
groups:
- name: OcudrAlerts
rules:
# Minor traffic alert: matches while the summed 20m request rate of the
# ingress gateway in namespace "ocudr" is >= 800 and < 900.
- alert: OcudrTrafficRateAboveMinorThreshold
  expr: >-
    sum(rate(oc_ingressgateway_http_requests_total{app_kubernetes_io_name=
    "ingressgateway",kubernetes_namespace="ocudr"}[20m]))
    >= 800 < 900
  labels:
    severity: Minor
  annotations:
    summary: 'Traffic Rate is above 80 Percent of Max requests per second(1000)'
    description: >-
      Ingress traffic Rate is above minor threshold i.e. 800
      requests per second (current value is: {{ $value }})
# Major traffic alert: matches while the summed 20m request rate of the
# ingress gateway in namespace "ocudr" is >= 900 and < 950.
- alert: OcudrTrafficRateAboveMajorThreshold
  expr: >-
    sum(rate(oc_ingressgateway_http_requests_total{app_kubernetes_io_name=
    "ingressgateway",kubernetes_namespace="ocudr"}[20m]))
    >= 900 < 950
  labels:
    severity: Major
  annotations:
    summary: 'Traffic Rate is above 90 Percent of Max requests per second(1000)'
    description: >-
      Ingress traffic Rate is above major threshold i.e. 900
      requests per second (current value is: {{ $value }})
# Critical traffic alert: matches once the summed 20m request rate of the
# ingress gateway in namespace "ocudr" is >= 950 (no upper bound).
- alert: OcudrTrafficRateAboveCriticalThreshold
  expr: >-
    sum(rate(oc_ingressgateway_http_requests_total{app_kubernetes_io_name=
    "ingressgateway",kubernetes_namespace="ocudr"}[20m]))
    >= 950
  labels:
    severity: Critical
  annotations:
    summary: 'Traffic Rate is above 95 Percent of Max requests per second(1000)'
    description: >-
      Ingress traffic Rate is above critical threshold i.e. 950
      requests per second (current value is: {{ $value }})
# Error-rate alert, 0.1% band: percentage of ingress-gateway responses whose
# Status does not match "2.*", over 20m; matches while >= 0.1 and < 1.
# The `or (up * 0)` term supplies zero-valued series to the numerator sum.
- alert: OcudrTransactionErrorRateAbove0.1Percent
  expr: >-
    (sum(rate(oc_ingressgateway_http_responses_total{Status!~"2.*",
    app_kubernetes_io_name="ingressgateway",kubernetes_namespace="ocudr"}[20m])
    or (up * 0 ) ) )/sum(rate(oc_ingressgateway_http_responses_total
    {app_kubernetes_io_name="ingressgateway",kubernetes_namespace="ocudr"}[20m]))
    * 100 >= 0.1 < 1
  labels:
    severity: Warning
  annotations:
    summary: 'Transaction Error Rate detected above 0.1 Percent of Total Transactions'
    description: >-
      Transaction Error rate is above 0.1 Percent of Total Transactions
      (current value is {{ $value }})
# Error-rate alert, 1% band: percentage of ingress-gateway responses whose
# Status does not match "2.*", over 20m; matches while >= 1 and < 10.
# The `or (up * 0)` term supplies zero-valued series to the numerator sum.
- alert: OcudrTransactionErrorRateAbove1Percent
  expr: >-
    (sum(rate(oc_ingressgateway_http_responses_total{Status!~"2.*",
    app_kubernetes_io_name="ingressgateway",kubernetes_namespace="ocudr"}[20m])
    or (up * 0 ) ) )/sum(rate(oc_ingressgateway_http_responses_total
    {app_kubernetes_io_name="ingressgateway",kubernetes_namespace="ocudr"}[20m]))
    * 100 >= 1 < 10
  labels:
    severity: Warning
  annotations:
    summary: 'Transaction Error Rate detected above 1 Percent of Total Transactions'
    description: >-
      Transaction Error rate is above 1 Percent of Total Transactions
      (current value is {{ $value }})
# Error-rate alert, 10% band: percentage of ingress-gateway responses whose
# Status does not match "2.*", over 20m; matches while >= 10 and < 25.
# The `or (up * 0)` term supplies zero-valued series to the numerator sum.
- alert: OcudrTransactionErrorRateAbove10Percent
  expr: >-
    (sum(rate(oc_ingressgateway_http_responses_total{Status!~"2.*",
    app_kubernetes_io_name="ingressgateway",kubernetes_namespace="ocudr"}[20m])
    or (up * 0 ) ) )/sum(rate(oc_ingressgateway_http_responses_total
    {app_kubernetes_io_name="ingressgateway",kubernetes_namespace="ocudr"}[20m]))
    * 100 >= 10 < 25
  labels:
    severity: Minor
  annotations:
    summary: 'Transaction Error Rate detected above 10 Percent of Total Transactions'
    description: >-
      Transaction Error rate is above 10 Percent of Total Transactions
      (current value is {{ $value }})
# Error-rate alert, 25% band: percentage of ingress-gateway responses whose
# Status does not match "2.*", over 20m; matches while >= 25 and < 50.
# The `or (up * 0)` term supplies zero-valued series to the numerator sum.
- alert: OcudrTransactionErrorRateAbove25Percent
  expr: >-
    (sum(rate(oc_ingressgateway_http_responses_total
    {Status!~"2.*",app_kubernetes_io_name="ingressgateway",
    kubernetes_namespace="ocudr"}[20m])
    or (up * 0 ) ) )/sum
    (rate(oc_ingressgateway_http_responses_total
    {app_kubernetes_io_name="ingressgateway",kubernetes_namespace="ocudr"}[20m]))
    * 100 >= 25 < 50
  labels:
    severity: Major
  annotations:
    summary: 'Transaction Error Rate detected above 25 Percent of Total Transactions'
    description: >-
      Transaction Error Rate detected above 25 Percent of Total Transactions
      (current value is {{ $value }})
# Error-rate alert, top band: percentage of ingress-gateway responses whose
# Status does not match "2.*", over 20m; matches once >= 50 (no upper bound).
# The `or (up * 0)` term supplies zero-valued series to the numerator sum.
- alert: OcudrTransactionErrorRateAbove50Percent
  expr: >-
    (sum(rate(oc_ingressgateway_http_responses_total{Status!~"2.*",
    app_kubernetes_io_name="ingressgateway",kubernetes_namespace="ocudr"}[20m])
    or (up * 0 ) ) )/sum(rate(oc_ingressgateway_http_responses_total
    {app_kubernetes_io_name="ingressgateway",kubernetes_namespace="ocudr"}[20m]))
    * 100 >= 50
  labels:
    severity: Critical
  annotations:
    summary: 'Transaction Error Rate detected above 50 Percent of Total Transactions'
    description: >-
      Transaction Error Rate detected above 50 Percent of Total Transactions
      (current value is {{ $value }})
# Subscriber-not-found alert, 1% band: 10m rate of udr_subscriber_not_found_total
# as a percentage of the 10m ingress request rate in namespace "ocudr";
# matches while >= 1 and < 10.
# Annotation text corrected ("about" -> "above", grammar) and the description
# now reports the measured value.
# NOTE(review): the numerator has no kubernetes_namespace selector while the
# denominator does - confirm whether the metric should be filtered as well.
- alert: OcudrSubscriberNotFoundAbove1Percent
  expr: >-
    (sum(rate(udr_subscriber_not_found_total[10m]))
    / sum(rate(oc_ingressgateway_http_requests_total{kubernetes_namespace="ocudr"}[10m])))
    * 100 >= 1 < 10
  labels:
    severity: Warning
  annotations:
    summary: 'Subscriber not found responses are above 1% of ingress traffic'
    description: >-
      Total number of subscriber not found responses is above 1% of
      ingress traffic (current value is {{ $value }})
# Subscriber-not-found alert, 10% band: 10m rate of udr_subscriber_not_found_total
# as a percentage of the 10m ingress request rate in namespace "ocudr";
# matches while >= 10 and < 25.
# Annotation text corrected ("about" -> "above", grammar) and the description
# now reports the measured value.
# NOTE(review): the numerator has no kubernetes_namespace selector while the
# denominator does - confirm whether the metric should be filtered as well.
- alert: OcudrSubscriberNotFoundAbove10Percent
  expr: >-
    (sum(rate(udr_subscriber_not_found_total[10m]))
    / sum(rate(oc_ingressgateway_http_requests_total{kubernetes_namespace="ocudr"}[10m])))
    * 100 >= 10 < 25
  labels:
    severity: Minor
  annotations:
    summary: 'Subscriber not found responses are above 10% of ingress traffic'
    description: >-
      Total number of subscriber not found responses is above 10% of
      ingress traffic (current value is {{ $value }})
# Subscriber-not-found alert, 25% band: 10m rate of udr_subscriber_not_found_total
# as a percentage of the 10m ingress request rate in namespace "ocudr";
# matches while >= 25 and < 50.
# Annotation text corrected ("about" -> "above", grammar) and the description
# now reports the measured value.
# NOTE(review): the numerator has no kubernetes_namespace selector while the
# denominator does - confirm whether the metric should be filtered as well.
- alert: OcudrSubscriberNotFoundAbove25Percent
  expr: >-
    (sum(rate(udr_subscriber_not_found_total[10m]))
    / sum(rate(oc_ingressgateway_http_requests_total{kubernetes_namespace="ocudr"}[10m])))
    * 100 >= 25 < 50
  labels:
    severity: Major
  annotations:
    summary: 'Subscriber not found responses are above 25% of ingress traffic'
    description: >-
      Total number of subscriber not found responses is above 25% of
      ingress traffic (current value is {{ $value }})
# Subscriber-not-found alert, top band: 10m rate of udr_subscriber_not_found_total
# as a percentage of the 10m ingress request rate in namespace "ocudr";
# matches once >= 50 (no upper bound).
# Annotation text corrected ("about" -> "above", grammar) and the description
# now reports the measured value.
# NOTE(review): the numerator has no kubernetes_namespace selector while the
# denominator does - confirm whether the metric should be filtered as well.
- alert: OcudrSubscriberNotFoundAbove50Percent
  expr: >-
    (sum(rate(udr_subscriber_not_found_total[10m]))
    / sum(rate(oc_ingressgateway_http_requests_total{kubernetes_namespace="ocudr"}[10m])))
    * 100 >= 50
  labels:
    severity: Critical
  annotations:
    summary: 'Subscriber not found responses are above 50% of ingress traffic'
    description: >-
      Total number of subscriber not found responses is above 50% of
      ingress traffic (current value is {{ $value }})