9 Updating Alert Config Details

This section shares the content of the UDRAlertrules.yaml file.

Note:

The default namespace for UDR is OCUDR. You can change it as per deployment.
language: sql

# Alert-rule payload (presumably a Kubernetes ConfigMap; the `kind` and
# `metadata` fields are not visible in this excerpt).
apiVersion: v1
data:
  # `alertsudr` stores the alert rule file as a literal block scalar: everything
  # indented below the `|` is kept verbatim as text and is parsed later as its
  # own YAML document, which appears to follow the Prometheus rule-file layout.
  alertsudr: |
    groups:
    - name: OcudrAlerts
      rules:
      # Minor band: fires while the per-second ingress-gateway request rate
      # (20m window, "ocudr" namespace) is >= 800 and < 900.
      - alert: OcudrTrafficRateAboveMinorThreshold
        annotations:
          description: 'Ingress traffic Rate is above minor threshold i.e. 800
            requests per second (current value is: {{ $value }})'
          summary: 'Traffic Rate is above 80 Percent of Max requests per second(1000)'
        # Folded scalar: the lines below are joined with single spaces, so the
        # expression may be wrapped without breaking the YAML structure.
        expr: >-
          sum(rate(oc_ingressgateway_http_requests_total{app_kubernetes_io_name="ingressgateway",
          kubernetes_namespace="ocudr"}[20m])) >= 800 < 900
        labels:
          severity: Minor
      # Major band: fires while the per-second ingress-gateway request rate
      # (20m window, "ocudr" namespace) is >= 900 and < 950.
      - alert: OcudrTrafficRateAboveMajorThreshold
        annotations:
          description: 'Ingress traffic Rate is above major threshold i.e. 900 requests
            per second (current value is: {{ $value }})'
          summary: 'Traffic Rate is above 90 Percent of Max requests per second(1000)'
        # Folded scalar: the lines below are joined with single spaces, so the
        # expression may be wrapped without breaking the YAML structure.
        expr: >-
          sum(rate(oc_ingressgateway_http_requests_total{app_kubernetes_io_name="ingressgateway",
          kubernetes_namespace="ocudr"}[20m])) >= 900 < 950
        labels:
          severity: Major
      # Critical: fires while the per-second ingress-gateway request rate
      # (20m window, "ocudr" namespace) is >= 950; there is no upper bound.
      - alert: OcudrTrafficRateAboveCriticalThreshold
        annotations:
          description: 'Ingress traffic Rate is above critical threshold i.e. 950 requests
            per second (current value is: {{ $value }})'
          summary: 'Traffic Rate is above 95 Percent of Max requests per second(1000)'
        # Folded scalar: the lines below are joined with single spaces, so the
        # expression may be wrapped without breaking the YAML structure.
        expr: >-
          sum(rate(oc_ingressgateway_http_requests_total{app_kubernetes_io_name="ingressgateway",
          kubernetes_namespace="ocudr"}[20m])) >= 950
        labels:
          severity: Critical
      # Warning band: fires while the percentage of ingress-gateway responses
      # whose Status does not match "2.*" (20m rate window) is >= 0.1 and < 1.
      - alert: OcudrTransactionErrorRateAbove0.1Percent
        annotations:
          description: 'Transaction Error rate is above 0.1 Percent of Total Transactions
            (current value is {{ $value }})'
          summary: 'Transaction Error Rate detected above 0.1 Percent of Total Transactions'
        # `or (up * 0)` adds zero-valued series, presumably so the numerator
        # still evaluates when no non-2xx series exist — confirm.
        # Folded scalar: the lines below are joined with single spaces.
        expr: >-
          (sum(rate(oc_ingressgateway_http_responses_total{Status!~"2.*",
          app_kubernetes_io_name="ingressgateway",kubernetes_namespace="ocudr"}[20m])
          or (up * 0)))
          / sum(rate(oc_ingressgateway_http_responses_total{app_kubernetes_io_name="ingressgateway",
          kubernetes_namespace="ocudr"}[20m]))
          * 100 >= 0.1 < 1
        labels:
          severity: Warning
      # Warning band: fires while the percentage of ingress-gateway responses
      # whose Status does not match "2.*" (20m rate window) is >= 1 and < 10.
      - alert: OcudrTransactionErrorRateAbove1Percent
        annotations:
          description: 'Transaction Error rate is above 1 Percent of Total Transactions
            (current value is {{ $value }})'
          summary: 'Transaction Error Rate detected above 1 Percent of Total Transactions'
        # `or (up * 0)` adds zero-valued series, presumably so the numerator
        # still evaluates when no non-2xx series exist — confirm.
        # Folded scalar: the lines below are joined with single spaces.
        expr: >-
          (sum(rate(oc_ingressgateway_http_responses_total{Status!~"2.*",
          app_kubernetes_io_name="ingressgateway",kubernetes_namespace="ocudr"}[20m])
          or (up * 0)))
          / sum(rate(oc_ingressgateway_http_responses_total{app_kubernetes_io_name="ingressgateway",
          kubernetes_namespace="ocudr"}[20m]))
          * 100 >= 1 < 10
        labels:
          severity: Warning
      # Minor band: fires while the percentage of ingress-gateway responses
      # whose Status does not match "2.*" (20m rate window) is >= 10 and < 25.
      - alert: OcudrTransactionErrorRateAbove10Percent
        annotations:
          description: 'Transaction Error rate is above 10 Percent of Total Transactions
            (current value is {{ $value }})'
          summary: 'Transaction Error Rate detected above 10 Percent of Total Transactions'
        # `or (up * 0)` adds zero-valued series, presumably so the numerator
        # still evaluates when no non-2xx series exist — confirm.
        # Folded scalar: the lines below are joined with single spaces.
        expr: >-
          (sum(rate(oc_ingressgateway_http_responses_total{Status!~"2.*",
          app_kubernetes_io_name="ingressgateway",kubernetes_namespace="ocudr"}[20m])
          or (up * 0)))
          / sum(rate(oc_ingressgateway_http_responses_total{app_kubernetes_io_name="ingressgateway",
          kubernetes_namespace="ocudr"}[20m]))
          * 100 >= 10 < 25
        labels:
          severity: Minor
      # Major band: fires while the percentage of ingress-gateway responses
      # whose Status does not match "2.*" (20m rate window) is >= 25 and < 50.
      - alert: OcudrTransactionErrorRateAbove25Percent
        annotations:
          description: 'Transaction Error Rate detected above 25 Percent of
            Total Transactions (current value is {{ $value }})'
          summary: 'Transaction Error Rate detected above 25 Percent of Total Transactions'
        # `or (up * 0)` adds zero-valued series, presumably so the numerator
        # still evaluates when no non-2xx series exist — confirm.
        # Folded scalar: the lines below are joined with single spaces.
        expr: >-
          (sum(rate(oc_ingressgateway_http_responses_total{Status!~"2.*",
          app_kubernetes_io_name="ingressgateway",kubernetes_namespace="ocudr"}[20m])
          or (up * 0)))
          / sum(rate(oc_ingressgateway_http_responses_total{app_kubernetes_io_name="ingressgateway",
          kubernetes_namespace="ocudr"}[20m]))
          * 100 >= 25 < 50
        labels:
          severity: Major
      # Critical: fires while the percentage of ingress-gateway responses whose
      # Status does not match "2.*" (20m rate window) is >= 50; no upper bound.
      - alert: OcudrTransactionErrorRateAbove50Percent
        annotations:
          description: 'Transaction Error Rate detected above 50 Percent of
            Total Transactions (current value is {{ $value }})'
          summary: 'Transaction Error Rate detected above 50 Percent of Total Transactions'
        # `or (up * 0)` adds zero-valued series, presumably so the numerator
        # still evaluates when no non-2xx series exist — confirm.
        # Folded scalar: the lines below are joined with single spaces.
        expr: >-
          (sum(rate(oc_ingressgateway_http_responses_total{Status!~"2.*",
          app_kubernetes_io_name="ingressgateway",kubernetes_namespace="ocudr"}[20m])
          or (up * 0)))
          / sum(rate(oc_ingressgateway_http_responses_total{app_kubernetes_io_name="ingressgateway",
          kubernetes_namespace="ocudr"}[20m]))
          * 100 >= 50
        labels:
          severity: Critical
      # Warning band: fires while the udr_subscriber_not_found_total rate, as a
      # percentage of the ingress-gateway request rate in the "ocudr" namespace
      # (10m windows), is >= 1 and < 10.
      # NOTE(review): the numerator has no namespace matcher, unlike the
      # denominator — confirm this is intended.
      - alert: OcudrSubscriberNotFoundAbove1Percent
        annotations:
          description: 'Total number of response if subscriber not found is above 1% of
            ingress traffic'
          summary: 'Total number of response if subscriber not found is above 1% of
            ingress traffic'
        # Folded scalar: the lines below are joined with single spaces.
        expr: >-
          (sum(rate(udr_subscriber_not_found_total[10m]))
          / sum(rate(oc_ingressgateway_http_requests_total{kubernetes_namespace="ocudr"}[10m])))
          * 100 >= 1 < 10
        labels:
          severity: Warning
      # Minor band: fires while the udr_subscriber_not_found_total rate, as a
      # percentage of the ingress-gateway request rate in the "ocudr" namespace
      # (10m windows), is >= 10 and < 25.
      # NOTE(review): the numerator has no namespace matcher, unlike the
      # denominator — confirm this is intended.
      - alert: OcudrSubscriberNotFoundAbove10Percent
        annotations:
          description: 'Total number of response if subscriber not found is above 10% of
            ingress traffic'
          summary: 'Total number of response if subscriber not found is above 10% of
            ingress traffic'
        # Folded scalar: the lines below are joined with single spaces.
        expr: >-
          (sum(rate(udr_subscriber_not_found_total[10m]))
          / sum(rate(oc_ingressgateway_http_requests_total{kubernetes_namespace="ocudr"}[10m])))
          * 100 >= 10 < 25
        labels:
          severity: Minor
      # Major band: fires while the udr_subscriber_not_found_total rate, as a
      # percentage of the ingress-gateway request rate in the "ocudr" namespace
      # (10m windows), is >= 25 and < 50.
      # NOTE(review): the numerator has no namespace matcher, unlike the
      # denominator — confirm this is intended.
      - alert: OcudrSubscriberNotFoundAbove25Percent
        annotations:
          description: 'Total number of response if subscriber not found is above 25% of
            ingress traffic'
          summary: 'Total number of response if subscriber not found is above 25% of
            ingress traffic'
        # Folded scalar: the lines below are joined with single spaces.
        expr: >-
          (sum(rate(udr_subscriber_not_found_total[10m]))
          / sum(rate(oc_ingressgateway_http_requests_total{kubernetes_namespace="ocudr"}[10m])))
          * 100 >= 25 < 50
        labels:
          severity: Major
      # Critical: fires while the udr_subscriber_not_found_total rate, as a
      # percentage of the ingress-gateway request rate in the "ocudr" namespace
      # (10m windows), is >= 50; there is no upper bound.
      # NOTE(review): the numerator has no namespace matcher, unlike the
      # denominator — confirm this is intended.
      - alert: OcudrSubscriberNotFoundAbove50Percent
        annotations:
          description: 'Total number of response if subscriber not found is above 50% of
            ingress traffic'
          summary: 'Total number of response if subscriber not found is above 50% of
            ingress traffic'
        # Folded scalar: the lines below are joined with single spaces.
        expr: >-
          (sum(rate(udr_subscriber_not_found_total[10m]))
          / sum(rate(oc_ingressgateway_http_requests_total{kubernetes_namespace="ocudr"}[10m])))
          * 100 >= 50
        labels:
          severity: Critical